diff options
author | Simon Marlow <marlowsd@gmail.com> | 2009-08-02 21:32:04 +0000 |
---|---|---|
committer | Simon Marlow <marlowsd@gmail.com> | 2009-08-02 21:32:04 +0000 |
commit | a2a67cd520b9841114d69a87a423dabcb3b4368e (patch) | |
tree | 3dc6bbf53dff5421c14fbeb2d812c1424f2718c0 /rts/parallel | |
parent | 5d379cbe65e406d5c3a848fe7fcd090cafbfeb78 (diff) | |
download | haskell-a2a67cd520b9841114d69a87a423dabcb3b4368e.tar.gz |
RTS tidyup sweep, first phase
The first phase of this tidyup is focussed on the header files, and in
particular making sure we are exposinng publicly exactly what we need
to, and no more.
- Rts.h now includes everything that the RTS exposes publicly,
rather than a random subset of it.
- Most of the public header files have moved into subdirectories, and
many of them have been renamed. But clients should not need to
include any of the other headers directly, just #include the main
public headers: Rts.h, HsFFI.h, RtsAPI.h.
- All the headers needed for via-C compilation have moved into the
stg subdirectory, which is self-contained. Most of the headers for
the rest of the RTS APIs have moved into the rts subdirectory.
- I left MachDeps.h where it is, because it is so widely used in
Haskell code.
- I left a deprecated stub for RtsFlags.h in place. The flag
structures are now exposed by Rts.h.
- Various internal APIs are no longer exposed by public header files.
- Various bits of dead code and declarations have been removed
- More gcc warnings are turned on, and the RTS code is more
warning-clean.
- More source files #include "PosixSource.h", and hence only use
standard POSIX (1003.1c-1995) interfaces.
There is a lot more tidying up still to do, this is just the first
pass. I also intend to standardise the names for external RTS APIs
(e.g use the rts_ prefix consistently), and declare the internal APIs
as hidden for shared libraries.
Diffstat (limited to 'rts/parallel')
-rw-r--r-- | rts/parallel/GranSim.c | 6 | ||||
-rw-r--r-- | rts/parallel/WSDeque.c | 285 | ||||
-rw-r--r-- | rts/parallel/WSDeque.h | 126 |
3 files changed, 3 insertions, 414 deletions
diff --git a/rts/parallel/GranSim.c b/rts/parallel/GranSim.c index 1b26bb9dff..7f7ad4424f 100644 --- a/rts/parallel/GranSim.c +++ b/rts/parallel/GranSim.c @@ -1,5 +1,5 @@ /* - Time-stamp: <2006-10-19 15:12:58 simonmar> + Time-stamp: <2009-07-06 21:48:36 simonmar> Variables and functions specific to GranSim the parallelism simulator for GPH. @@ -40,6 +40,8 @@ //@node Includes, Prototypes and externs, GranSim specific code, GranSim specific code //@subsection Includes +#if defined(GRAN) + #include "Rts.h" #include "RtsFlags.h" #include "RtsUtils.h" @@ -58,8 +60,6 @@ //@node Prototypes and externs, Constants and Variables, Includes, GranSim specific code //@subsection Prototypes and externs -#if defined(GRAN) - /* Prototypes */ static inline PEs ga_to_proc(StgWord); static inline rtsBool any_idle(void); diff --git a/rts/parallel/WSDeque.c b/rts/parallel/WSDeque.c deleted file mode 100644 index acecb85e5f..0000000000 --- a/rts/parallel/WSDeque.c +++ /dev/null @@ -1,285 +0,0 @@ -/* ----------------------------------------------------------------------------- - * - * (c) The GHC Team, 2009 - * - * Work-stealing Deque data structure - * - * The implementation uses Double-Ended Queues with lock-free access - * (thereby often called "deque") as described in - * - * D.Chase and Y.Lev, Dynamic Circular Work-Stealing Deque. - * SPAA'05, July 2005, Las Vegas, USA. - * ACM 1-58113-986-1/05/0007 - * - * Author: Jost Berthold MSRC 07-09/2008 - * - * The DeQue is held as a circular array with known length. Positions - * of top (read-end) and bottom (write-end) always increase, and the - * array is accessed with indices modulo array-size. While this bears - * the risk of overflow, we assume that (with 64 bit indices), a - * program must run very long to reach that point. - * - * The write end of the queue (position bottom) can only be used with - * mutual exclusion, i.e. by exactly one caller at a time. At this - * end, new items can be enqueued using pushBottom()/newSpark(), and - * removed using popBottom()/reclaimSpark() (the latter implying a cas - * synchronisation with potential concurrent readers for the case of - * just one element). - * - * Multiple readers can steal from the read end (position top), and - * are synchronised without a lock, based on a cas of the top - * position. One reader wins, the others return NULL for a failure. - * - * Both popWSDeque and stealWSDeque also return NULL when the queue is empty. - * - * Testing: see testsuite/tests/ghc-regress/rts/testwsdeque.c. If - * there's anything wrong with the deque implementation, this test - * will probably catch it. - * - * ---------------------------------------------------------------------------*/ - -#include "Rts.h" -#include "RtsUtils.h" -#include "WSDeque.h" -#include "SMP.h" // for cas - -#define CASTOP(addr,old,new) ((old) == cas(((StgPtr)addr),(old),(new))) - -/* ----------------------------------------------------------------------------- - * newWSDeque - * -------------------------------------------------------------------------- */ - -/* internal helpers ... */ - -static StgWord -roundUp2(StgWord val) -{ - StgWord rounded = 1; - - /* StgWord is unsigned anyway, only catch 0 */ - if (val == 0) { - barf("DeQue,roundUp2: invalid size 0 requested"); - } - /* at least 1 bit set, shift up to its place */ - do { - rounded = rounded << 1; - } while (0 != (val = val>>1)); - return rounded; -} - -WSDeque * -newWSDeque (nat size) -{ - StgWord realsize; - WSDeque *q; - - realsize = roundUp2(size); /* to compute modulo as a bitwise & */ - - q = (WSDeque*) stgMallocBytes(sizeof(WSDeque), /* admin fields */ - "newWSDeque"); - q->elements = stgMallocBytes(realsize * sizeof(StgClosurePtr), /* dataspace */ - "newWSDeque:data space"); - q->top=0; - q->bottom=0; - q->topBound=0; /* read by writer, updated each time top is read */ - - q->size = realsize; /* power of 2 */ - q->moduloSize = realsize - 1; /* n % size == n & moduloSize */ - - ASSERT_WSDEQUE_INVARIANTS(q); - return q; -} - -/* ----------------------------------------------------------------------------- - * freeWSDeque - * -------------------------------------------------------------------------- */ - -void -freeWSDeque (WSDeque *q) -{ - stgFree(q->elements); - stgFree(q); -} - -/* ----------------------------------------------------------------------------- - * - * popWSDeque: remove an element from the write end of the queue. - * Returns the removed spark, and NULL if a race is lost or the pool - * empty. - * - * If only one spark is left in the pool, we synchronise with - * concurrently stealing threads by using cas to modify the top field. - * This routine should NEVER be called by a task which does not own - * this deque. - * - * -------------------------------------------------------------------------- */ - -void * -popWSDeque (WSDeque *q) -{ - /* also a bit tricky, has to avoid concurrent steal() calls by - accessing top with cas, when there is only one element left */ - StgWord t, b; - long currSize; - void * removed; - - ASSERT_WSDEQUE_INVARIANTS(q); - - b = q->bottom; - - // "decrement b as a test, see what happens" - b--; - q->bottom = b; - - // very important that the following read of q->top does not occur - // before the earlier write to q->bottom. - store_load_barrier(); - - t = q->top; /* using topBound would give an *upper* bound, we - need a lower bound. We use the real top here, but - can update the topBound value */ - q->topBound = t; - currSize = (long)b - (long)t; - if (currSize < 0) { /* was empty before decrementing b, set b - consistently and abort */ - q->bottom = t; - return NULL; - } - - // read the element at b - removed = q->elements[b & q->moduloSize]; - - if (currSize > 0) { /* no danger, still elements in buffer after b-- */ - // debugBelch("popWSDeque: t=%ld b=%ld = %ld\n", t, b, removed); - return removed; - } - /* otherwise, has someone meanwhile stolen the same (last) element? - Check and increment top value to know */ - if ( !(CASTOP(&(q->top),t,t+1)) ) { - removed = NULL; /* no success, but continue adjusting bottom */ - } - q->bottom = t+1; /* anyway, empty now. Adjust bottom consistently. */ - q->topBound = t+1; /* ...and cached top value as well */ - - ASSERT_WSDEQUE_INVARIANTS(q); - ASSERT(q->bottom >= q->top); - - // debugBelch("popWSDeque: t=%ld b=%ld = %ld\n", t, b, removed); - - return removed; -} - -/* ----------------------------------------------------------------------------- - * stealWSDeque - * -------------------------------------------------------------------------- */ - -void * -stealWSDeque_ (WSDeque *q) -{ - void * stolen; - StgWord b,t; - -// Can't do this on someone else's spark pool: -// ASSERT_WSDEQUE_INVARIANTS(q); - - // NB. these loads must be ordered, otherwise there is a race - // between steal and pop. - t = q->top; - load_load_barrier(); - b = q->bottom; - - // NB. b and t are unsigned; we need a signed value for the test - // below, because it is possible that t > b during a - // concurrent popWSQueue() operation. - if ((long)b - (long)t <= 0 ) { - return NULL; /* already looks empty, abort */ - } - - /* now access array, see pushBottom() */ - stolen = q->elements[t & q->moduloSize]; - - /* now decide whether we have won */ - if ( !(CASTOP(&(q->top),t,t+1)) ) { - /* lost the race, someon else has changed top in the meantime */ - return NULL; - } /* else: OK, top has been incremented by the cas call */ - - // debugBelch("stealWSDeque_: t=%d b=%d\n", t, b); - -// Can't do this on someone else's spark pool: -// ASSERT_WSDEQUE_INVARIANTS(q); - - return stolen; -} - -void * -stealWSDeque (WSDeque *q) -{ - void *stolen; - - do { - stolen = stealWSDeque_(q); - } while (stolen == NULL && !looksEmptyWSDeque(q)); - - return stolen; -} - -/* ----------------------------------------------------------------------------- - * pushWSQueue - * -------------------------------------------------------------------------- */ - -#define DISCARD_NEW - -/* enqueue an element. Should always succeed by resizing the array - (not implemented yet, silently fails in that case). */ -rtsBool -pushWSDeque (WSDeque* q, void * elem) -{ - StgWord t; - StgWord b; - StgWord sz = q->moduloSize; - - ASSERT_WSDEQUE_INVARIANTS(q); - - /* we try to avoid reading q->top (accessed by all) and use - q->topBound (accessed only by writer) instead. - This is why we do not just call empty(q) here. - */ - b = q->bottom; - t = q->topBound; - if ( (StgInt)b - (StgInt)t >= (StgInt)sz ) { - /* NB. 1. sz == q->size - 1, thus ">=" - 2. signed comparison, it is possible that t > b - */ - /* could be full, check the real top value in this case */ - t = q->top; - q->topBound = t; - if (b - t >= sz) { /* really no space left :-( */ - /* reallocate the array, copying the values. Concurrent steal()s - will in the meantime use the old one and modify only top. - This means: we cannot safely free the old space! Can keep it - on a free list internally here... - - Potential bug in combination with steal(): if array is - replaced, it is unclear which one concurrent steal operations - use. Must read the array base address in advance in steal(). - */ -#if defined(DISCARD_NEW) - ASSERT_WSDEQUE_INVARIANTS(q); - return rtsFalse; // we didn't push anything -#else - /* could make room by incrementing the top position here. In - * this case, should use CASTOP. If this fails, someone else has - * removed something, and new room will be available. - */ - ASSERT_WSDEQUE_INVARIANTS(q); -#endif - } - } - - q->elements[b & sz] = elem; - q->bottom = b + 1; - - ASSERT_WSDEQUE_INVARIANTS(q); - return rtsTrue; -} diff --git a/rts/parallel/WSDeque.h b/rts/parallel/WSDeque.h deleted file mode 100644 index d85567c38a..0000000000 --- a/rts/parallel/WSDeque.h +++ /dev/null @@ -1,126 +0,0 @@ -/* ----------------------------------------------------------------------------- - * - * (c) The GHC Team, 2009 - * - * Work-stealing Deque data structure - * - * ---------------------------------------------------------------------------*/ - -#ifndef WSDEQUE_H -#define WSDEQUE_H - -typedef struct WSDeque_ { - // Size of elements array. Used for modulo calculation: we round up - // to powers of 2 and use the dyadic log (modulo == bitwise &) - StgWord size; - StgWord moduloSize; /* bitmask for modulo */ - - // top, index where multiple readers steal() (protected by a cas) - volatile StgWord top; - - // bottom, index of next free place where one writer can push - // elements. This happens unsynchronised. - volatile StgWord bottom; - - // both top and bottom are continuously incremented, and used as - // an index modulo the current array size. - - // lower bound on the current top value. This is an internal - // optimisation to avoid unnecessarily accessing the top field - // inside pushBottom - volatile StgWord topBound; - - // The elements array - void ** elements; - - // Please note: the dataspace cannot follow the admin fields - // immediately, as it should be possible to enlarge it without - // disposing the old one automatically (as realloc would)! - -} WSDeque; - -/* INVARIANTS, in this order: reasonable size, - topBound consistent, space pointer, space accessible to us. - - NB. This is safe to use only (a) on a spark pool owned by the - current thread, or (b) when there's only one thread running, or no - stealing going on (e.g. during GC). -*/ -#define ASSERT_WSDEQUE_INVARIANTS(p) \ - ASSERT((p)->size > 0); \ - ASSERT((p)->topBound <= (p)->top); \ - ASSERT((p)->elements != NULL); \ - ASSERT(*((p)->elements) || 1); \ - ASSERT(*((p)->elements - 1 + ((p)->size)) || 1); - -// No: it is possible that top > bottom when using pop() -// ASSERT((p)->bottom >= (p)->top); -// ASSERT((p)->size > (p)->bottom - (p)->top); - -/* ----------------------------------------------------------------------------- - * Operations - * - * A WSDeque has an *owner* thread. The owner can perform any operation; - * other threads are only allowed to call stealWSDeque_(), - * stealWSDeque(), looksEmptyWSDeque(), and dequeElements(). - * - * -------------------------------------------------------------------------- */ - -// Allocation, deallocation -WSDeque * newWSDeque (nat size); -void freeWSDeque (WSDeque *q); - -// Take an element from the "write" end of the pool. Can be called -// by the pool owner only. -void* popWSDeque (WSDeque *q); - -// Push onto the "write" end of the pool. Return true if the push -// succeeded, or false if the deque is full. -rtsBool pushWSDeque (WSDeque *q, void *elem); - -// Removes all elements from the deque -INLINE_HEADER void discardElements (WSDeque *q); - -// Removes an element of the deque from the "read" end, or returns -// NULL if the pool is empty, or if there was a collision with another -// thief. -void * stealWSDeque_ (WSDeque *q); - -// Removes an element of the deque from the "read" end, or returns -// NULL if the pool is empty. -void * stealWSDeque (WSDeque *q); - -// "guesses" whether a deque is empty. Can return false negatives in -// presence of concurrent steal() calls, and false positives in -// presence of a concurrent pushBottom(). -INLINE_HEADER rtsBool looksEmptyWSDeque (WSDeque* q); - -INLINE_HEADER long dequeElements (WSDeque *q); - -/* ----------------------------------------------------------------------------- - * PRIVATE below here - * -------------------------------------------------------------------------- */ - -INLINE_HEADER long -dequeElements (WSDeque *q) -{ - StgWord t = q->top; - StgWord b = q->bottom; - // try to prefer false negatives by reading top first - return ((long)b - (long)t); -} - -INLINE_HEADER rtsBool -looksEmptyWSDeque (WSDeque *q) -{ - return (dequeElements(q) <= 0); -} - -INLINE_HEADER void -discardElements (WSDeque *q) -{ - q->top = q->bottom; -// pool->topBound = pool->top; -} - -#endif // WSDEQUE_H |