diff options
author | Tamar Christina <tamar@zhox.com> | 2019-06-01 10:56:31 +0100 |
---|---|---|
committer | Ben Gamari <ben@smart-cactus.org> | 2020-07-15 16:41:01 -0400 |
commit | 459e1c5f7c71e37ed8bb239c57bdec441d278fff (patch) | |
tree | e049c6429afef505fcd65af9eb0a785be78aa200 /rts | |
parent | 00a23bfda4840546075ec2b2e18f61380b360dfc (diff) | |
download | haskell-459e1c5f7c71e37ed8bb239c57bdec441d278fff.tar.gz |
winio: Use SlimReaderLocks and ConditonalVariables provided by the OS instead of emulated ones
Diffstat (limited to 'rts')
-rw-r--r-- | rts/HeapStackCheck.cmm | 4 | ||||
-rw-r--r-- | rts/PrimOps.cmm | 4 | ||||
-rw-r--r-- | rts/StgMiscClosures.cmm | 4 | ||||
-rw-r--r-- | rts/win32/IOManager.c | 60 | ||||
-rw-r--r-- | rts/win32/OSMem.c | 19 | ||||
-rw-r--r-- | rts/win32/OSThreads.c | 176 | ||||
-rw-r--r-- | rts/win32/WorkQueue.c | 14 | ||||
-rw-r--r-- | rts/win32/WorkQueue.h | 4 |
8 files changed, 117 insertions, 168 deletions
diff --git a/rts/HeapStackCheck.cmm b/rts/HeapStackCheck.cmm index 1c1de089dc..b8df323c8b 100644 --- a/rts/HeapStackCheck.cmm +++ b/rts/HeapStackCheck.cmm @@ -17,8 +17,8 @@ #if defined(__PIC__) import pthread_mutex_unlock; #endif -import EnterCriticalSection; -import LeaveCriticalSection; +import AcquireSRWLockExclusive; +import ReleaseSRWLockExclusives; /* Stack/Heap Check Failure * ------------------------ diff --git a/rts/PrimOps.cmm b/rts/PrimOps.cmm index 1fd746edf6..e13e89b98c 100644 --- a/rts/PrimOps.cmm +++ b/rts/PrimOps.cmm @@ -31,8 +31,8 @@ import pthread_mutex_unlock; #endif import CLOSURE base_ControlziExceptionziBase_nestedAtomically_closure; import CLOSURE base_GHCziIOziException_heapOverflow_closure; -import EnterCriticalSection; -import LeaveCriticalSection; +import AcquireSRWLockExclusive; +import ReleaseSRWLockExclusive; import CLOSURE ghczmprim_GHCziTypes_False_closure; #if defined(PROFILING) import CLOSURE CCS_MAIN; diff --git a/rts/StgMiscClosures.cmm b/rts/StgMiscClosures.cmm index 4293dfb787..7a8f20dded 100644 --- a/rts/StgMiscClosures.cmm +++ b/rts/StgMiscClosures.cmm @@ -15,8 +15,8 @@ import pthread_mutex_lock; import ghczmprim_GHCziTypes_Czh_info; import ghczmprim_GHCziTypes_Izh_info; -import EnterCriticalSection; -import LeaveCriticalSection; +import AcquireSRWLockExclusive; +import ReleaseSRWLockExclusive; /* ---------------------------------------------------------------------------- Stack underflow diff --git a/rts/win32/IOManager.c b/rts/win32/IOManager.c index f155180ef3..e5da32b982 100644 --- a/rts/win32/IOManager.c +++ b/rts/win32/IOManager.c @@ -22,7 +22,7 @@ * Internal state maintained by the IO manager. */ typedef struct IOManagerState { - CritSection manLock; + Mutex manLock; WorkQueue* workQueue; int queueSize; int numWorkers; @@ -30,7 +30,7 @@ typedef struct IOManagerState { HANDLE hExitEvent; unsigned int requestID; /* fields for keeping track of active WorkItems */ - CritSection active_work_lock; + Mutex active_work_lock; WorkItem* active_work_items; UINT sleepResolution; } IOManagerState; @@ -65,7 +65,7 @@ IOWorkerProc(PVOID param) // The error code is communicated back on completion of request; reset. errCode = 0; - EnterCriticalSection(&iom->manLock); + OS_ACQUIRE_LOCK(&iom->manLock); /* Signal that the worker is idle. * * 'workersIdle' is used when determining whether or not to @@ -73,7 +73,7 @@ IOWorkerProc(PVOID param) * (see addIORequest().) */ iom->workersIdle++; - LeaveCriticalSection(&iom->manLock); + OS_RELEASE_LOCK(&iom->manLock); /* * A possible future refinement is to make long-term idle threads @@ -85,19 +85,19 @@ IOWorkerProc(PVOID param) if (rc == WAIT_OBJECT_0) { // we received the exit event - EnterCriticalSection(&iom->manLock); + OS_ACQUIRE_LOCK(&iom->manLock); ioMan->numWorkers--; - LeaveCriticalSection(&iom->manLock); + OS_RELEASE_LOCK(&iom->manLock); return 0; } - EnterCriticalSection(&iom->manLock); + OS_ACQUIRE_LOCK(&iom->manLock); /* Signal that the thread is 'non-idle' and about to consume * a work item. */ iom->workersIdle--; iom->queueSize--; - LeaveCriticalSection(&iom->manLock); + OS_RELEASE_LOCK(&iom->manLock); if ( rc == (WAIT_OBJECT_0 + 1) ) { /* work item available, fetch it. */ @@ -266,17 +266,17 @@ IOWorkerProc(PVOID param) } else { fprintf(stderr, "unable to fetch work; fatal.\n"); fflush(stderr); - EnterCriticalSection(&iom->manLock); + OS_ACQUIRE_LOCK(&iom->manLock); ioMan->numWorkers--; - LeaveCriticalSection(&iom->manLock); + OS_RELEASE_LOCK(&iom->manLock); return 1; } } else { fprintf(stderr, "waiting failed (%lu); fatal.\n", rc); fflush(stderr); - EnterCriticalSection(&iom->manLock); + OS_ACQUIRE_LOCK(&iom->manLock); ioMan->numWorkers--; - LeaveCriticalSection(&iom->manLock); + OS_RELEASE_LOCK(&iom->manLock); return 1; } } @@ -334,13 +334,13 @@ StartIOManager(void) } ioMan->hExitEvent = hExit; - InitializeCriticalSection(&ioMan->manLock); + OS_INIT_LOCK(&ioMan->manLock); ioMan->workQueue = wq; ioMan->numWorkers = 0; ioMan->workersIdle = 0; ioMan->queueSize = 0; ioMan->requestID = 1; - InitializeCriticalSection(&ioMan->active_work_lock); + OS_INIT_LOCK(&ioMan->active_work_lock); ioMan->active_work_items = NULL; ioMan->sleepResolution = sleepResolution; @@ -360,7 +360,7 @@ int depositWorkItem( unsigned int reqID, WorkItem* wItem ) { - EnterCriticalSection(&ioMan->manLock); + OS_ACQUIRE_LOCK(&ioMan->manLock); #if 0 fprintf(stderr, "depositWorkItem: %d/%d\n", @@ -397,9 +397,9 @@ depositWorkItem( unsigned int reqID, if ( (ioMan->workersIdle < ioMan->queueSize) ) { /* see if giving up our quantum ferrets out some idle threads. */ - LeaveCriticalSection(&ioMan->manLock); + OS_RELEASE_LOCK(&ioMan->manLock); Sleep(0); - EnterCriticalSection(&ioMan->manLock); + OS_ACQUIRE_LOCK(&ioMan->manLock); if ( (ioMan->workersIdle < ioMan->queueSize) ) { /* No, go ahead and create another. */ ioMan->numWorkers++; @@ -408,7 +408,7 @@ depositWorkItem( unsigned int reqID, } } } - LeaveCriticalSection(&ioMan->manLock); + OS_RELEASE_LOCK(&ioMan->manLock); if (SubmitWork(ioMan->workQueue,wItem)) { /* Note: the work item has potentially been consumed by a worker thread @@ -522,17 +522,17 @@ void ShutdownIOManager ( bool wait_threads ) if (wait_threads) { /* Wait for all worker threads to die. */ for (;;) { - EnterCriticalSection(&ioMan->manLock); + OS_ACQUIRE_LOCK(&ioMan->manLock); num = ioMan->numWorkers; - LeaveCriticalSection(&ioMan->manLock); + OS_RELEASE_LOCK(&ioMan->manLock); if (num == 0) break; Sleep(10); } FreeWorkQueue(ioMan->workQueue); CloseHandle(ioMan->hExitEvent); - DeleteCriticalSection(&ioMan->active_work_lock); - DeleteCriticalSection(&ioMan->manLock); + OS_CLOSE_LOCK(&ioMan->active_work_lock); + OS_CLOSE_LOCK(&ioMan->manLock); mmresult = timeEndPeriod(ioMan->sleepResolution); if (mmresult != MMSYSERR_NOERROR) { @@ -550,10 +550,10 @@ void RegisterWorkItem(IOManagerState* ioMan, WorkItem* wi) { - EnterCriticalSection(&ioMan->active_work_lock); + OS_ACQUIRE_LOCK(&ioMan->active_work_lock); wi->link = ioMan->active_work_items; ioMan->active_work_items = wi; - LeaveCriticalSection(&ioMan->active_work_lock); + OS_RELEASE_LOCK(&ioMan->active_work_lock); } static @@ -563,7 +563,7 @@ DeregisterWorkItem(IOManagerState* ioMan, { WorkItem *ptr, *prev; - EnterCriticalSection(&ioMan->active_work_lock); + OS_ACQUIRE_LOCK(&ioMan->active_work_lock); for(prev=NULL,ptr=ioMan->active_work_items;ptr;prev=ptr,ptr=ptr->link) { if (wi->requestID == ptr->requestID) { if (prev==NULL) { @@ -571,13 +571,13 @@ DeregisterWorkItem(IOManagerState* ioMan, } else { prev->link = ptr->link; } - LeaveCriticalSection(&ioMan->active_work_lock); + OS_RELEASE_LOCK(&ioMan->active_work_lock); return; } } fprintf(stderr, "DeregisterWorkItem: unable to locate work item %d\n", wi->requestID); - LeaveCriticalSection(&ioMan->active_work_lock); + OS_RELEASE_LOCK(&ioMan->active_work_lock); } @@ -596,11 +596,11 @@ void abandonWorkRequest ( int reqID ) { WorkItem *ptr; - EnterCriticalSection(&ioMan->active_work_lock); + OS_ACQUIRE_LOCK(&ioMan->active_work_lock); for(ptr=ioMan->active_work_items;ptr;ptr=ptr->link) { if (ptr->requestID == (unsigned int)reqID ) { ptr->abandonOp = 1; - LeaveCriticalSection(&ioMan->active_work_lock); + OS_RELEASE_LOCK(&ioMan->active_work_lock); return; } } @@ -608,7 +608,7 @@ abandonWorkRequest ( int reqID ) * finished sometime since awaitRequests() last drained the completed * request table; i.e., not an error. */ - LeaveCriticalSection(&ioMan->active_work_lock); + OS_RELEASE_LOCK(&ioMan->active_work_lock); } #endif diff --git a/rts/win32/OSMem.c b/rts/win32/OSMem.c index dd0f60ff0a..fd26d06c4e 100644 --- a/rts/win32/OSMem.c +++ b/rts/win32/OSMem.c @@ -37,28 +37,11 @@ static alloc_rec* allocs = NULL; /* free_blocks are kept in ascending order, and adjacent blocks are merged */ static block_rec* free_blocks = NULL; -/* Mingw-w64 does not currently have this in their header. So we have to import it.*/ -typedef LPVOID(WINAPI *VirtualAllocExNumaProc)(HANDLE, LPVOID, SIZE_T, DWORD, DWORD, DWORD); - -/* Cache NUMA API call. */ -VirtualAllocExNumaProc _VirtualAllocExNuma; - void osMemInit(void) { allocs = NULL; free_blocks = NULL; - - /* Resolve and cache VirtualAllocExNuma. */ - if (osNumaAvailable() && RtsFlags.GcFlags.numa) - { - _VirtualAllocExNuma = (VirtualAllocExNumaProc)(void*)GetProcAddress(GetModuleHandleW(L"kernel32"), "VirtualAllocExNuma"); - if (!_VirtualAllocExNuma) - { - sysErrorBelch( - "osBindMBlocksToNode: VirtualAllocExNuma does not exist. How did you get this far?"); - } - } } static @@ -569,7 +552,7 @@ void osBindMBlocksToNode( On windows also -xb is broken, it does nothing so that can't be used to tweak it (see #12577). So for now, just let the OS decide. */ - temp = _VirtualAllocExNuma( + temp = VirtualAllocExNuma( GetCurrentProcess(), NULL, // addr? See base memory size, diff --git a/rts/win32/OSThreads.c b/rts/win32/OSThreads.c index fe35f35e82..706237363a 100644 --- a/rts/win32/OSThreads.c +++ b/rts/win32/OSThreads.c @@ -27,69 +27,6 @@ static uint32_t* cpuGroupCumulativeCache = NULL; /* Processor group dist cache. */ static uint8_t* cpuGroupDistCache = NULL; -/* Win32 threads and synchronisation objects */ - -/* A Condition is represented by a Win32 Event object; - * a Mutex by a Mutex kernel object. - * - * ToDo: go through the defn and usage of these to - * make sure the semantics match up with that of - * the (assumed) pthreads behaviour. This is really - * just a first pass at getting something compilable. - */ - -void -initCondition( Condition* pCond ) -{ - HANDLE h = CreateEvent(NULL, - FALSE, /* auto reset */ - FALSE, /* initially not signalled */ - NULL); /* unnamed => process-local. */ - - if ( h == NULL ) { - sysErrorBelch("initCondition: unable to create"); - stg_exit(EXIT_FAILURE); - } - *pCond = h; - return; -} - -void -closeCondition( Condition* pCond ) -{ - if ( CloseHandle(*pCond) == 0 ) { - sysErrorBelch("closeCondition: failed to close"); - } - return; -} - -bool -broadcastCondition ( Condition* pCond ) -{ - PulseEvent(*pCond); - return true; -} - -bool -signalCondition ( Condition* pCond ) -{ - if (SetEvent(*pCond) == 0) { - sysErrorBelch("SetEvent"); - stg_exit(EXIT_FAILURE); - } - return true; -} - -bool -waitCondition ( Condition* pCond, Mutex* pMut ) -{ - RELEASE_LOCK(pMut); - WaitForSingleObject(*pCond, INFINITE); - /* Hmm..use WaitForMultipleObjects() ? */ - ACQUIRE_LOCK(pMut); - return true; -} - void yieldThread() { @@ -150,35 +87,6 @@ osThreadIsAlive(OSThreadId id) return (exit_code == STILL_ACTIVE); } -#if defined(USE_CRITICAL_SECTIONS) -void -initMutex (Mutex* pMut) -{ - InitializeCriticalSectionAndSpinCount(pMut,4000); -} -void -closeMutex (Mutex* pMut) -{ - DeleteCriticalSection(pMut); -} -#else -void -initMutex (Mutex* pMut) -{ - HANDLE h = CreateMutex ( NULL, /* default sec. attributes */ - TRUE, /* not owned => initially signalled */ - NULL - ); - *pMut = h; - return; -} -void -closeMutex (Mutex* pMut) -{ - CloseHandle(*pMut); -} -#endif - void newThreadLocalKey (ThreadLocalKey *key) { @@ -252,6 +160,13 @@ forkOS_createThread ( HsStablePtr entry ) (unsigned*)&pId) == 0); } +#if defined(x86_64_HOST_ARCH) + +#if !defined(ALL_PROCESSOR_GROUPS) +#define ALL_PROCESSOR_GROUPS 0xffff +#endif +#endif + void freeThreadingResources (void) { if (cpuGroupCache) @@ -426,12 +341,15 @@ getNumberOfProcessors (void) if (nproc) { - IF_DEBUG(scheduler, debugBelch("[*] Total number of active processors detected: %u\n", nproc)); + IF_DEBUG(scheduler, debugBelch("[*] Total number of active " + "processors detected: %u\n", nproc)); return nproc; } - IF_DEBUG(scheduler, debugBelch("Could not determine Max number of logical processors.\n" - "Falling back to old code which limits to 64 logical processors.\n")); + IF_DEBUG(scheduler, debugBelch("Could not determine Max number of " + "logical processors.\n" + "Falling back to old code which limits " + "to 64 logical processors.\n")); } #endif @@ -484,7 +402,6 @@ setThreadAffinity (uint32_t n, uint32_t m) // cap N of M for (i = 0; i < n_groups; i++) { #if defined(x86_64_HOST_ARCH) - // If we support the new API, use it. if (mask[i] > 0) { GROUP_AFFINITY hGroup; @@ -515,24 +432,15 @@ setThreadAffinity (uint32_t n, uint32_t m) // cap N of M free(mask); } -typedef BOOL (WINAPI *PCSIO)(HANDLE); - void interruptOSThread (OSThreadId id) { HANDLE hdl; - PCSIO pCSIO; if (!(hdl = OpenThread(THREAD_TERMINATE,FALSE,id))) { sysErrorBelch("interruptOSThread: OpenThread"); stg_exit(EXIT_FAILURE); } - pCSIO = (PCSIO)(void*)GetProcAddress(GetModuleHandle(TEXT("Kernel32.dll")), - "CancelSynchronousIo"); - if ( NULL != pCSIO ) { - pCSIO(hdl); - } else { - // Nothing to do, unfortunately - } + CancelSynchronousIo(hdl); CloseHandle(hdl); } @@ -600,3 +508,59 @@ KernelThreadId kernelThreadId (void) DWORD tid = GetCurrentThreadId(); return tid; } + +/* Win32 threads and synchronisation objects */ + +/* A Condition is represented by a Win32 Event object; + * a Mutex by a Mutex kernel object. + * + * ToDo: go through the defn and usage of these to + * make sure the semantics match up with that of + * the (assumed) pthreads behaviour. This is really + * just a first pass at getting something compilable. + */ + +void +initCondition( Condition* pCond ) +{ + InitializeConditionVariable(pCond); + return; +} + +void +closeCondition( Condition* pCond STG_UNUSED) +{ + return; +} + +bool +broadcastCondition ( Condition* pCond ) +{ + WakeAllConditionVariable(pCond); + return true; +} + +bool +signalCondition ( Condition* pCond ) +{ + WakeConditionVariable(pCond); + return true; +} + +bool +waitCondition ( Condition* pCond, Mutex* pMut ) +{ + SleepConditionVariableSRW(pCond, pMut, INFINITE, 0); + return true; +} + +void +initMutex (Mutex* pMut) +{ + InitializeSRWLock(pMut); +} +void +closeMutex (Mutex* pMut) +{ + (void)pMut; +} diff --git a/rts/win32/WorkQueue.c b/rts/win32/WorkQueue.c index e560bd24cd..dba20c668b 100644 --- a/rts/win32/WorkQueue.c +++ b/rts/win32/WorkQueue.c @@ -3,11 +3,13 @@ * * (c) sof, 2002-2003. */ +#include "Rts.h" #include "WorkQueue.h" #include <stdbool.h> #include <stdio.h> #include <stdlib.h> #include <string.h> +#include <windows.h> static void queue_error_rc( char* loc, DWORD err); static void queue_error( char* loc, char* reason); @@ -48,7 +50,7 @@ NewWorkQueue() memset(wq, 0, sizeof *wq); - InitializeCriticalSection(&wq->queueLock); + OS_INIT_LOCK(&wq->queueLock); wq->workAvailable = newSemaphore(0, WORKQUEUE_SIZE); wq->roomAvailable = newSemaphore(WORKQUEUE_SIZE, WORKQUEUE_SIZE); @@ -83,7 +85,7 @@ FreeWorkQueue ( WorkQueue* pq ) if ( pq->roomAvailable ) { CloseHandle(pq->roomAvailable); } - DeleteCriticalSection(&pq->queueLock); + OS_CLOSE_LOCK(&pq->queueLock); free(pq); return; } @@ -147,13 +149,13 @@ FetchWork ( WorkQueue* pq, void** ppw ) return false; } - EnterCriticalSection(&pq->queueLock); + OS_ACQUIRE_LOCK(&pq->queueLock); *ppw = pq->items[pq->head]; /* For sanity's sake, zero out the pointer. */ pq->items[pq->head] = NULL; pq->head = (pq->head + 1) % WORKQUEUE_SIZE; rc = ReleaseSemaphore(pq->roomAvailable,1, NULL); - LeaveCriticalSection(&pq->queueLock); + OS_RELEASE_LOCK(&pq->queueLock); if ( 0 == rc ) { queue_error_rc("FetchWork.ReleaseSemaphore()", GetLastError()); return false; @@ -191,11 +193,11 @@ SubmitWork ( WorkQueue* pq, void* pw ) return false; } - EnterCriticalSection(&pq->queueLock); + OS_ACQUIRE_LOCK(&pq->queueLock); pq->items[pq->tail] = pw; pq->tail = (pq->tail + 1) % WORKQUEUE_SIZE; rc = ReleaseSemaphore(pq->workAvailable,1, NULL); - LeaveCriticalSection(&pq->queueLock); + OS_RELEASE_LOCK(&pq->queueLock); if ( 0 == rc ) { queue_error_rc("SubmitWork.ReleaseSemaphore()", GetLastError()); return false; diff --git a/rts/win32/WorkQueue.h b/rts/win32/WorkQueue.h index 4dbfcd40d3..569a7b4445 100644 --- a/rts/win32/WorkQueue.h +++ b/rts/win32/WorkQueue.h @@ -14,12 +14,12 @@ #define WORKQUEUE_SIZE 16 typedef HANDLE Semaphore; -typedef CRITICAL_SECTION CritSection; +typedef SRWLOCK Mutex; typedef struct WorkQueue { /* the master lock, need to be grabbed prior to using any of the other elements of the struct. */ - CritSection queueLock; + Mutex queueLock; /* consumers/workers block waiting for 'workAvailable' */ Semaphore workAvailable; Semaphore roomAvailable; |