summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--rts/RetainerProfile.c232
1 files changed, 137 insertions, 95 deletions
diff --git a/rts/RetainerProfile.c b/rts/RetainerProfile.c
index c9b42956a1..d42de2e72d 100644
--- a/rts/RetainerProfile.c
+++ b/rts/RetainerProfile.c
@@ -158,8 +158,10 @@ typedef union {
} srt;
} nextPos;
-// Tagged stack element, that keeps information how to process
-// the next element in the traverse stack.
+/**
+ * Position pointer into a closure. Determines what the next element to return
+ * for a stackElement is.
+ */
typedef struct {
nextPosType type;
nextPos next;
@@ -172,29 +174,48 @@ typedef union {
retainer c_child_r;
} stackData;
-// Element in the traverse stack, keeps the element, information
-// how to continue processing the element, and it's retainer set.
+/**
+ * An element of the traversal work-stack. Besides the closure itself this also
+ * stores it's parent and associated data.
+ *
+ * When 'info.type == posTypeFresh' a 'stackElement' represents just one
+ * closure, namely 'c' and 'cp' being it's parent. Otherwise 'info' specifies an
+ * offset into the children of 'c'. This is to support returning a closure's
+ * children one-by-one without pushing one element per child onto the stack. See
+ * traversePushChildren() and traversePop().
+ *
+ */
typedef struct {
stackPos info;
StgClosure *c;
- StgClosure *cp; // parent of 'c'
+ StgClosure *cp; // parent of 'c'. Only used when info.type == posTypeFresh.
stackData data;
} stackElement;
typedef struct {
/*
Invariants:
+
firstStack points to the first block group.
+
currentStack points to the block group currently being used.
+
currentStack->free == stackLimit.
+
stackTop points to the topmost byte in the stack of currentStack.
+
Unless the whole stack is empty, stackTop must point to the topmost
object (or byte) in the whole stack. Thus, it is only when the whole stack
- is empty that stackTop == stackLimit (not during the execution of push()
- and pop()).
+ is empty that stackTop == stackLimit (not during the execution of
+ pushStackElement() and popStackElement()).
+
stackBottom == currentStack->start.
+
stackLimit == currentStack->start + BLOCK_SIZE_W * currentStack->blocks.
+
+
Note:
+
When a current stack becomes empty, stackTop is set to point to
the topmost element on the previous block group so as to satisfy
the invariants described above.
@@ -226,7 +247,8 @@ typedef struct {
int stackSize, maxStackSize;
} traverseState;
-/* Callback called when heap traversal visits a closure.
+/**
+ * Callback called when heap traversal visits a closure.
*
* Before this callback is called the profiling header of the visited closure
* 'c' is zero'd with 'setTravDataToZero' if this closure hasn't been visited in
@@ -298,9 +320,9 @@ returnToOldStack( traverseState *ts, bdescr *bd )
bd->free = (StgPtr)ts->stackLimit;
}
-/* -----------------------------------------------------------------------------
- * Initializes the traverse stack.
- * -------------------------------------------------------------------------- */
+/**
+ * Initializes the traversal work-stack.
+ */
static void
initializeTraverseStack( traverseState *ts )
{
@@ -315,11 +337,12 @@ initializeTraverseStack( traverseState *ts )
newStackBlock(ts, ts->firstStack);
}
-/* -----------------------------------------------------------------------------
- * Frees all the block groups in the traverse stack.
+/**
+ * Frees all the block groups in the traversal works-stack.
+ *
* Invariants:
* firstStack != NULL
- * -------------------------------------------------------------------------- */
+ */
static void
closeTraverseStack( traverseState *ts )
{
@@ -433,15 +456,17 @@ find_srt( stackPos *info )
}
}
-/* -----------------------------------------------------------------------------
- * Pushes an element onto traverse stack
- * -------------------------------------------------------------------------- */
+/**
+ * Push a set of closures, represented by a single 'stackElement', onto the
+ * traversal work-stack.
+ */
static void
pushStackElement(traverseState *ts, stackElement *se)
{
bdescr *nbd; // Next Block Descriptor
if (ts->stackTop - 1 < ts->stackBottom) {
- debug("pop() to the next stack.\n");
+ debug("pushStackElement() to the next stack.\n");
+
// currentStack->free is updated when the active stack is switched
// to the next stack.
ts->currentStack->free = (StgPtr)ts->stackTop;
@@ -471,13 +496,12 @@ pushStackElement(traverseState *ts, stackElement *se)
debug("stackSize = %d\n", ts->stackSize);
}
-/* Push an object onto traverse stack. This method can be used anytime
- * instead of calling retainClosure(), it exists in order to use an
- * explicit stack instead of direct recursion.
+/**
+ * Push a single closure onto the traversal work-stack.
*
- * *cp - object's parent
- * *c - closure
- * c_child_r - closure retainer.
+ * cp - object's parent
+ * c - closure
+ * data - data associated with closure.
*/
static INLINE void
traversePushClosure(traverseState *ts, StgClosure *c, StgClosure *cp, stackData data) {
@@ -491,28 +515,34 @@ traversePushClosure(traverseState *ts, StgClosure *c, StgClosure *cp, stackData
pushStackElement(ts, &se);
};
-/* -----------------------------------------------------------------------------
- * push() pushes a stackElement representing the next child of *c
- * onto the traverse stack. If *c has no child, *first_child is set
- * to NULL and nothing is pushed onto the stack. If *c has only one
- * child, *c_child is set to that child and nothing is pushed onto
- * the stack. If *c has more than two children, *first_child is set
- * to the first child and a stackElement representing the second
- * child is pushed onto the stack.
-
- * Invariants:
- * *c_child_r is the most recent retainer of *c's children.
- * *c is not any of TSO, AP, PAP, AP_STACK, which means that
- * there cannot be any stack objects.
- * Note: SRTs are considered to be children as well.
- * -------------------------------------------------------------------------- */
+/**
+ * traversePushChildren() extracts the first child of 'c' in 'first_child' and
+ * conceptually pushes all remaining children of 'c' onto the traversal stack
+ * while associating 'data' with the pushed elements to be returned upon poping.
+ *
+ * If 'c' has no children, 'first_child' is set to NULL and nothing is pushed
+ * onto the stack.
+ *
+ * If 'c' has only one child, 'first_child' is set to that child and nothing is
+ * pushed onto the stack.
+ *
+ * Invariants:
+ *
+ * - 'c' is not any of TSO, AP, PAP, AP_STACK, which means that there cannot
+ * be any stack objects.
+ *
+ * Note: SRTs are considered to be children as well.
+ *
+ * Note: When pushing onto the stack we only really push one 'stackElement'
+ * representing all children onto the stack. See traversePop()
+ */
static INLINE void
traversePushChildren(traverseState *ts, StgClosure *c, stackData data, StgClosure **first_child)
{
stackElement se;
bdescr *nbd; // Next Block Descriptor
- debug("push(): stackTop = 0x%x, currentStackBoundary = 0x%x\n", ts->stackTop, ts->currentStackBoundary);
+ debug("traversePushChildren(): stackTop = 0x%x, currentStackBoundary = 0x%x\n", ts->stackTop, ts->currentStackBoundary);
ASSERT(get_itbl(c)->type != TSO);
ASSERT(get_itbl(c)->type != AP_STACK);
@@ -523,7 +553,7 @@ traversePushChildren(traverseState *ts, StgClosure *c, stackData data, StgClosur
se.c = c;
se.data = data;
- // Note: se.cp ommitted on purpose, only retainPushClosure uses that.
+ // Note: se.cp ommitted on purpose, only traversePushClosure uses that.
// fill in se.info
switch (get_itbl(c)->type) {
@@ -712,19 +742,14 @@ traversePushChildren(traverseState *ts, StgClosure *c, stackData data, StgClosur
pushStackElement(ts, &se);
}
-/* -----------------------------------------------------------------------------
- * popOff() and popOffReal(): Pop a stackElement off the traverse stack.
+/**
+ * popStackElement(): Remove a depleted stackElement from the top of the
+ * traversal work-stack.
+ *
* Invariants:
* stackTop cannot be equal to stackLimit unless the whole stack is
- * empty, in which case popOff() is not allowed.
- * Note:
- * You can think of popOffReal() as a part of popOff() which is
- * executed at the end of popOff() in necessary. Since popOff() is
- * likely to be executed quite often while popOffReal() is not, we
- * separate popOffReal() from popOff(), which is declared as an
- * INLINE function (for the sake of execution speed). popOffReal()
- * is called only within popOff() and nowhere else.
- * -------------------------------------------------------------------------- */
+ * empty, in which case popStackElement() is not allowed.
+ */
static void
popStackElement(traverseState *ts) {
debug("popStackElement(): stackTop = 0x%x, currentStackBoundary = 0x%x\n", ts->stackTop, ts->currentStackBoundary);
@@ -746,7 +771,7 @@ popStackElement(traverseState *ts) {
bdescr *pbd; // Previous Block Descriptor
- debug("pop() to the previous stack.\n");
+ debug("popStackElement() to the previous stack.\n");
ASSERT(ts->stackTop + 1 == ts->stackLimit);
ASSERT(ts->stackBottom == (stackElement *)ts->currentStack->start);
@@ -780,9 +805,10 @@ popStackElement(traverseState *ts) {
debug("stackSize = %d\n", ts->stackSize);
}
-/* -----------------------------------------------------------------------------
+/**
* Finds the next object to be considered for retainer profiling and store
* its pointer to *c.
+ *
* If the unprocessed object was stored in the stack (posTypeFresh), the
* this object is returned as-is. Otherwise Test if the topmost stack
* element indicates that more objects are left,
@@ -790,20 +816,23 @@ popStackElement(traverseState *ts) {
* set *cp and *data appropriately, both of which are stored in the stack
* element. The topmost stack element then is overwritten so as for it to now
* denote the next object.
+ *
* If the topmost stack element indicates no more objects are left, pop
* off the stack element until either an object can be retrieved or
* the current stack chunk becomes empty, indicated by true returned by
* isOnBoundary(), in which case *c is set to NULL.
+ *
* Note:
+ *
* It is okay to call this function even when the current stack chunk
* is empty.
- * -------------------------------------------------------------------------- */
+ */
static INLINE void
traversePop(traverseState *ts, StgClosure **c, StgClosure **cp, stackData *data)
{
stackElement *se;
- debug("pop(): stackTop = 0x%x currentStackBoundary = 0x%x\n", ts->stackTop, ts->currentStackBoundary);
+ debug("traversePop(): stackTop = 0x%x currentStackBoundary = 0x%x\n", ts->stackTop, ts->currentStackBoundary);
// Is this the last internal element? If so instead of modifying the current
// stackElement in place we actually remove it from the stack.
@@ -816,7 +845,8 @@ traversePop(traverseState *ts, StgClosure **c, StgClosure **cp, stackData *data)
}
// Note: Below every `break`, where the loop condition is true, must be
- // accompanied by a popOff() otherwise this is an infinite loop.
+ // accompanied by a popStackElement() otherwise this is an infinite
+ // loop.
se = ts->stackTop;
// If this is a top-level element, you should pop that out.
@@ -845,7 +875,7 @@ traversePop(traverseState *ts, StgClosure **c, StgClosure **cp, stackData *data)
if (se->info.next.step == 2) {
*c = (StgClosure *)((StgMVar *)se->c)->tail;
se->info.next.step++; // move to the next step
- // no popOff
+ // no popStackElement
} else {
*c = ((StgMVar *)se->c)->value;
last = true;
@@ -857,7 +887,7 @@ traversePop(traverseState *ts, StgClosure **c, StgClosure **cp, stackData *data)
if (se->info.next.step == 2) {
*c = ((StgWeak *)se->c)->value;
se->info.next.step++;
- // no popOff
+ // no popStackElement
} else {
*c = ((StgWeak *)se->c)->finalizer;
last = true;
@@ -982,7 +1012,7 @@ traversePop(traverseState *ts, StgClosure **c, StgClosure **cp, stackData *data)
case IND:
case INVALID_OBJECT:
default:
- barf("Invalid object *c in pop(): %d", get_itbl(se->c)->type);
+ barf("Invalid object *c in traversePop(): %d", get_itbl(se->c)->type);
return;
}
} while (*c == NULL);
@@ -1194,7 +1224,7 @@ associate( StgClosure *c, RetainerSet *s )
}
/* -----------------------------------------------------------------------------
- Call retainPushClosure for each of the closures covered by a large bitmap.
+ Call traversePushClosure for each of the closures covered by a large bitmap.
-------------------------------------------------------------------------- */
static void
@@ -1236,24 +1266,32 @@ traverseSmallBitmap (traverseState *ts, StgPtr p, uint32_t size, StgWord bitmap,
return p;
}
-/* -----------------------------------------------------------------------------
- * Process all the objects in the stack chunk from stackStart to stackEnd
- * with *c and *c_child_r being their parent and their most recent retainer,
- * respectively. Treat stackOptionalFun as another child of *c if it is
- * not NULL.
+/**
+ * traversePushStack(ts, cp, data, stackStart, stackEnd) pushes all the objects
+ * in the STG stack-chunk from stackStart to stackEnd onto the traversal
+ * work-stack with 'c' and 'data' being their parent and associated data,
+ * respectively.
+ *
* Invariants:
- * *c is one of the following: TSO, AP_STACK.
- * If *c is TSO, c == c_child_r.
+ *
+ * *cp is one of the following: TSO, AP_STACK.
+ *
+ * If *cp is TSO, c == c_child_r.
+ *
* stackStart < stackEnd.
+ *
* RSET(c) and RSET(c_child_r) are valid, i.e., their
* interpretation conforms to the current value of flip (even when they
* are interpreted to be NULL).
+ *
* If *c is TSO, its state is not ThreadComplete,or ThreadKilled,
* which means that its stack is ready to process.
+ *
* Note:
+ *
* This code was almost plagiarzied from GC.c! For each pointer,
- * retainPushClosure() is invoked instead of evacuate().
- * -------------------------------------------------------------------------- */
+ * traversePushClosure() is invoked instead of evacuate().
+ */
static void
traversePushStack(traverseState *ts, StgClosure *cp, stackData data,
StgPtr stackStart, StgPtr stackEnd)
@@ -1265,7 +1303,7 @@ traversePushStack(traverseState *ts, StgClosure *cp, stackData data,
uint32_t size;
/*
- Each invocation of retainStack() creates a new virtual
+ Each invocation of traversePushStack() creates a new virtual
stack. Since all such stacks share a single common stack, we
record the current currentStackBoundary, which will be restored
at the exit.
@@ -1273,7 +1311,7 @@ traversePushStack(traverseState *ts, StgClosure *cp, stackData data,
oldStackBoundary = ts->currentStackBoundary;
ts->currentStackBoundary = ts->stackTop;
- debug("retainStack() called: oldStackBoundary = 0x%x, currentStackBoundary = 0x%x\n",
+ debug("traversePushStack() called: oldStackBoundary = 0x%x, currentStackBoundary = 0x%x\n",
oldStackBoundary, ts->currentStackBoundary);
ASSERT(get_itbl(cp)->type == STACK);
@@ -1360,19 +1398,19 @@ traversePushStack(traverseState *ts, StgClosure *cp, stackData data,
}
default:
- barf("Invalid object found in retainStack(): %d",
+ barf("Invalid object found in traversePushStack(): %d",
(int)(info->i.type));
}
}
// restore currentStackBoundary
ts->currentStackBoundary = oldStackBoundary;
- debug("retainStack() finished: currentStackBoundary = 0x%x\n",
+ debug("traversePushStack() finished: currentStackBoundary = 0x%x\n",
ts->currentStackBoundary);
}
/* ----------------------------------------------------------------------------
- * Call retainPushClosure for each of the children of a PAP/AP
+ * Call traversePushClosure for each of the children of a PAP/AP
* ------------------------------------------------------------------------- */
static INLINE StgPtr
@@ -1495,22 +1533,10 @@ retainVisitClosure( const StgClosure *c, const StgClosure *cp, const stackData d
return 0;
}
-/* -----------------------------------------------------------------------------
- * Compute the retainer set of *c0 and all its desecents by traversing.
- * *cp0 is the parent of *c0, and *r0 is the most recent retainer of *c0.
- * Invariants:
- * c0 = cp0 = r0 holds only for root objects.
- * RSET(cp0) and RSET(r0) are valid, i.e., their
- * interpretation conforms to the current value of flip (even when they
- * are interpreted to be NULL).
- * However, RSET(c0) may be corrupt, i.e., it may not conform to
- * the current value of flip. If it does not, during the execution
- * of this function, RSET(c0) must be initialized as well as all
- * its descendants.
- * Note:
- * stackTop must be the same at the beginning and the exit of this function.
- * *c0 can be TSO (as well as AP_STACK).
- * -------------------------------------------------------------------------- */
+/**
+ * Traverse all closures on the traversal work-stack, calling 'visit_cb'
+ * on each closure. See 'visitClosure_cb' for details.
+ */
static void
traverseWorkStack(traverseState *ts, visitClosure_cb visit_cb)
{
@@ -1541,7 +1567,7 @@ inner_loop:
case TSO:
if (((StgTSO *)c)->what_next == ThreadComplete ||
((StgTSO *)c)->what_next == ThreadKilled) {
- debug("ThreadComplete or ThreadKilled encountered in retainClosure()\n");
+ debug("ThreadComplete or ThreadKilled encountered in traverseWorkStack()\n");
goto loop;
}
break;
@@ -1673,7 +1699,8 @@ inner_loop:
// If first_child is null, c has no child.
// If first_child is not null, the top stack element points to the next
- // object. push() may or may not push a stackElement on the stack.
+ // object. traversePushChildren() may or may not push a stackElement on the
+ // stack.
if (first_child == NULL)
goto loop;
@@ -1684,9 +1711,24 @@ inner_loop:
goto inner_loop;
}
-/* -----------------------------------------------------------------------------
+/**
* Compute the retainer set for every object reachable from *tl.
- * -------------------------------------------------------------------------- */
+ *
+ * Compute the retainer set of *c0 and all its desecents by traversing.
+ * *cp0 is the parent of *c0, and *r0 is the most recent retainer of *c0.
+ * Invariants:
+ * c0 = cp0 = r0 holds only for root objects.
+ * RSET(cp0) and RSET(r0) are valid, i.e., their
+ * interpretation conforms to the current value of flip (even when they
+ * are interpreted to be NULL).
+ * However, RSET(c0) may be corrupt, i.e., it may not conform to
+ * the current value of flip. If it does not, during the execution
+ * of this function, RSET(c0) must be initialized as well as all
+ * its descendants.
+ * Note:
+ * stackTop must be the same at the beginning and the exit of this function.
+ * *c0 can be TSO (as well as AP_STACK).
+ */
static void
retainRoot(void *user, StgClosure **tl)
{