summaryrefslogtreecommitdiff
path: root/rts
diff options
context:
space:
mode:
authorTamar Christina <tamar@zhox.com>2019-06-01 10:56:31 +0100
committerBen Gamari <ben@smart-cactus.org>2020-07-15 16:41:01 -0400
commit459e1c5f7c71e37ed8bb239c57bdec441d278fff (patch)
treee049c6429afef505fcd65af9eb0a785be78aa200 /rts
parent00a23bfda4840546075ec2b2e18f61380b360dfc (diff)
downloadhaskell-459e1c5f7c71e37ed8bb239c57bdec441d278fff.tar.gz
winio: Use SlimReaderLocks and ConditonalVariables provided by the OS instead of emulated ones
Diffstat (limited to 'rts')
-rw-r--r--rts/HeapStackCheck.cmm4
-rw-r--r--rts/PrimOps.cmm4
-rw-r--r--rts/StgMiscClosures.cmm4
-rw-r--r--rts/win32/IOManager.c60
-rw-r--r--rts/win32/OSMem.c19
-rw-r--r--rts/win32/OSThreads.c176
-rw-r--r--rts/win32/WorkQueue.c14
-rw-r--r--rts/win32/WorkQueue.h4
8 files changed, 117 insertions, 168 deletions
diff --git a/rts/HeapStackCheck.cmm b/rts/HeapStackCheck.cmm
index 1c1de089dc..b8df323c8b 100644
--- a/rts/HeapStackCheck.cmm
+++ b/rts/HeapStackCheck.cmm
@@ -17,8 +17,8 @@
#if defined(__PIC__)
import pthread_mutex_unlock;
#endif
-import EnterCriticalSection;
-import LeaveCriticalSection;
+import AcquireSRWLockExclusive;
+import ReleaseSRWLockExclusives;
/* Stack/Heap Check Failure
* ------------------------
diff --git a/rts/PrimOps.cmm b/rts/PrimOps.cmm
index 1fd746edf6..e13e89b98c 100644
--- a/rts/PrimOps.cmm
+++ b/rts/PrimOps.cmm
@@ -31,8 +31,8 @@ import pthread_mutex_unlock;
#endif
import CLOSURE base_ControlziExceptionziBase_nestedAtomically_closure;
import CLOSURE base_GHCziIOziException_heapOverflow_closure;
-import EnterCriticalSection;
-import LeaveCriticalSection;
+import AcquireSRWLockExclusive;
+import ReleaseSRWLockExclusive;
import CLOSURE ghczmprim_GHCziTypes_False_closure;
#if defined(PROFILING)
import CLOSURE CCS_MAIN;
diff --git a/rts/StgMiscClosures.cmm b/rts/StgMiscClosures.cmm
index 4293dfb787..7a8f20dded 100644
--- a/rts/StgMiscClosures.cmm
+++ b/rts/StgMiscClosures.cmm
@@ -15,8 +15,8 @@
import pthread_mutex_lock;
import ghczmprim_GHCziTypes_Czh_info;
import ghczmprim_GHCziTypes_Izh_info;
-import EnterCriticalSection;
-import LeaveCriticalSection;
+import AcquireSRWLockExclusive;
+import ReleaseSRWLockExclusive;
/* ----------------------------------------------------------------------------
Stack underflow
diff --git a/rts/win32/IOManager.c b/rts/win32/IOManager.c
index f155180ef3..e5da32b982 100644
--- a/rts/win32/IOManager.c
+++ b/rts/win32/IOManager.c
@@ -22,7 +22,7 @@
* Internal state maintained by the IO manager.
*/
typedef struct IOManagerState {
- CritSection manLock;
+ Mutex manLock;
WorkQueue* workQueue;
int queueSize;
int numWorkers;
@@ -30,7 +30,7 @@ typedef struct IOManagerState {
HANDLE hExitEvent;
unsigned int requestID;
/* fields for keeping track of active WorkItems */
- CritSection active_work_lock;
+ Mutex active_work_lock;
WorkItem* active_work_items;
UINT sleepResolution;
} IOManagerState;
@@ -65,7 +65,7 @@ IOWorkerProc(PVOID param)
// The error code is communicated back on completion of request; reset.
errCode = 0;
- EnterCriticalSection(&iom->manLock);
+ OS_ACQUIRE_LOCK(&iom->manLock);
/* Signal that the worker is idle.
*
* 'workersIdle' is used when determining whether or not to
@@ -73,7 +73,7 @@ IOWorkerProc(PVOID param)
* (see addIORequest().)
*/
iom->workersIdle++;
- LeaveCriticalSection(&iom->manLock);
+ OS_RELEASE_LOCK(&iom->manLock);
/*
* A possible future refinement is to make long-term idle threads
@@ -85,19 +85,19 @@ IOWorkerProc(PVOID param)
if (rc == WAIT_OBJECT_0) {
// we received the exit event
- EnterCriticalSection(&iom->manLock);
+ OS_ACQUIRE_LOCK(&iom->manLock);
ioMan->numWorkers--;
- LeaveCriticalSection(&iom->manLock);
+ OS_RELEASE_LOCK(&iom->manLock);
return 0;
}
- EnterCriticalSection(&iom->manLock);
+ OS_ACQUIRE_LOCK(&iom->manLock);
/* Signal that the thread is 'non-idle' and about to consume
* a work item.
*/
iom->workersIdle--;
iom->queueSize--;
- LeaveCriticalSection(&iom->manLock);
+ OS_RELEASE_LOCK(&iom->manLock);
if ( rc == (WAIT_OBJECT_0 + 1) ) {
/* work item available, fetch it. */
@@ -266,17 +266,17 @@ IOWorkerProc(PVOID param)
} else {
fprintf(stderr, "unable to fetch work; fatal.\n");
fflush(stderr);
- EnterCriticalSection(&iom->manLock);
+ OS_ACQUIRE_LOCK(&iom->manLock);
ioMan->numWorkers--;
- LeaveCriticalSection(&iom->manLock);
+ OS_RELEASE_LOCK(&iom->manLock);
return 1;
}
} else {
fprintf(stderr, "waiting failed (%lu); fatal.\n", rc);
fflush(stderr);
- EnterCriticalSection(&iom->manLock);
+ OS_ACQUIRE_LOCK(&iom->manLock);
ioMan->numWorkers--;
- LeaveCriticalSection(&iom->manLock);
+ OS_RELEASE_LOCK(&iom->manLock);
return 1;
}
}
@@ -334,13 +334,13 @@ StartIOManager(void)
}
ioMan->hExitEvent = hExit;
- InitializeCriticalSection(&ioMan->manLock);
+ OS_INIT_LOCK(&ioMan->manLock);
ioMan->workQueue = wq;
ioMan->numWorkers = 0;
ioMan->workersIdle = 0;
ioMan->queueSize = 0;
ioMan->requestID = 1;
- InitializeCriticalSection(&ioMan->active_work_lock);
+ OS_INIT_LOCK(&ioMan->active_work_lock);
ioMan->active_work_items = NULL;
ioMan->sleepResolution = sleepResolution;
@@ -360,7 +360,7 @@ int
depositWorkItem( unsigned int reqID,
WorkItem* wItem )
{
- EnterCriticalSection(&ioMan->manLock);
+ OS_ACQUIRE_LOCK(&ioMan->manLock);
#if 0
fprintf(stderr, "depositWorkItem: %d/%d\n",
@@ -397,9 +397,9 @@ depositWorkItem( unsigned int reqID,
if ( (ioMan->workersIdle < ioMan->queueSize) ) {
/* see if giving up our quantum ferrets out some idle threads.
*/
- LeaveCriticalSection(&ioMan->manLock);
+ OS_RELEASE_LOCK(&ioMan->manLock);
Sleep(0);
- EnterCriticalSection(&ioMan->manLock);
+ OS_ACQUIRE_LOCK(&ioMan->manLock);
if ( (ioMan->workersIdle < ioMan->queueSize) ) {
/* No, go ahead and create another. */
ioMan->numWorkers++;
@@ -408,7 +408,7 @@ depositWorkItem( unsigned int reqID,
}
}
}
- LeaveCriticalSection(&ioMan->manLock);
+ OS_RELEASE_LOCK(&ioMan->manLock);
if (SubmitWork(ioMan->workQueue,wItem)) {
/* Note: the work item has potentially been consumed by a worker thread
@@ -522,17 +522,17 @@ void ShutdownIOManager ( bool wait_threads )
if (wait_threads) {
/* Wait for all worker threads to die. */
for (;;) {
- EnterCriticalSection(&ioMan->manLock);
+ OS_ACQUIRE_LOCK(&ioMan->manLock);
num = ioMan->numWorkers;
- LeaveCriticalSection(&ioMan->manLock);
+ OS_RELEASE_LOCK(&ioMan->manLock);
if (num == 0)
break;
Sleep(10);
}
FreeWorkQueue(ioMan->workQueue);
CloseHandle(ioMan->hExitEvent);
- DeleteCriticalSection(&ioMan->active_work_lock);
- DeleteCriticalSection(&ioMan->manLock);
+ OS_CLOSE_LOCK(&ioMan->active_work_lock);
+ OS_CLOSE_LOCK(&ioMan->manLock);
mmresult = timeEndPeriod(ioMan->sleepResolution);
if (mmresult != MMSYSERR_NOERROR) {
@@ -550,10 +550,10 @@ void
RegisterWorkItem(IOManagerState* ioMan,
WorkItem* wi)
{
- EnterCriticalSection(&ioMan->active_work_lock);
+ OS_ACQUIRE_LOCK(&ioMan->active_work_lock);
wi->link = ioMan->active_work_items;
ioMan->active_work_items = wi;
- LeaveCriticalSection(&ioMan->active_work_lock);
+ OS_RELEASE_LOCK(&ioMan->active_work_lock);
}
static
@@ -563,7 +563,7 @@ DeregisterWorkItem(IOManagerState* ioMan,
{
WorkItem *ptr, *prev;
- EnterCriticalSection(&ioMan->active_work_lock);
+ OS_ACQUIRE_LOCK(&ioMan->active_work_lock);
for(prev=NULL,ptr=ioMan->active_work_items;ptr;prev=ptr,ptr=ptr->link) {
if (wi->requestID == ptr->requestID) {
if (prev==NULL) {
@@ -571,13 +571,13 @@ DeregisterWorkItem(IOManagerState* ioMan,
} else {
prev->link = ptr->link;
}
- LeaveCriticalSection(&ioMan->active_work_lock);
+ OS_RELEASE_LOCK(&ioMan->active_work_lock);
return;
}
}
fprintf(stderr, "DeregisterWorkItem: unable to locate work item %d\n",
wi->requestID);
- LeaveCriticalSection(&ioMan->active_work_lock);
+ OS_RELEASE_LOCK(&ioMan->active_work_lock);
}
@@ -596,11 +596,11 @@ void
abandonWorkRequest ( int reqID )
{
WorkItem *ptr;
- EnterCriticalSection(&ioMan->active_work_lock);
+ OS_ACQUIRE_LOCK(&ioMan->active_work_lock);
for(ptr=ioMan->active_work_items;ptr;ptr=ptr->link) {
if (ptr->requestID == (unsigned int)reqID ) {
ptr->abandonOp = 1;
- LeaveCriticalSection(&ioMan->active_work_lock);
+ OS_RELEASE_LOCK(&ioMan->active_work_lock);
return;
}
}
@@ -608,7 +608,7 @@ abandonWorkRequest ( int reqID )
* finished sometime since awaitRequests() last drained the completed
* request table; i.e., not an error.
*/
- LeaveCriticalSection(&ioMan->active_work_lock);
+ OS_RELEASE_LOCK(&ioMan->active_work_lock);
}
#endif
diff --git a/rts/win32/OSMem.c b/rts/win32/OSMem.c
index dd0f60ff0a..fd26d06c4e 100644
--- a/rts/win32/OSMem.c
+++ b/rts/win32/OSMem.c
@@ -37,28 +37,11 @@ static alloc_rec* allocs = NULL;
/* free_blocks are kept in ascending order, and adjacent blocks are merged */
static block_rec* free_blocks = NULL;
-/* Mingw-w64 does not currently have this in their header. So we have to import it.*/
-typedef LPVOID(WINAPI *VirtualAllocExNumaProc)(HANDLE, LPVOID, SIZE_T, DWORD, DWORD, DWORD);
-
-/* Cache NUMA API call. */
-VirtualAllocExNumaProc _VirtualAllocExNuma;
-
void
osMemInit(void)
{
allocs = NULL;
free_blocks = NULL;
-
- /* Resolve and cache VirtualAllocExNuma. */
- if (osNumaAvailable() && RtsFlags.GcFlags.numa)
- {
- _VirtualAllocExNuma = (VirtualAllocExNumaProc)(void*)GetProcAddress(GetModuleHandleW(L"kernel32"), "VirtualAllocExNuma");
- if (!_VirtualAllocExNuma)
- {
- sysErrorBelch(
- "osBindMBlocksToNode: VirtualAllocExNuma does not exist. How did you get this far?");
- }
- }
}
static
@@ -569,7 +552,7 @@ void osBindMBlocksToNode(
On windows also -xb is broken, it does nothing so that can't
be used to tweak it (see #12577). So for now, just let the OS decide.
*/
- temp = _VirtualAllocExNuma(
+ temp = VirtualAllocExNuma(
GetCurrentProcess(),
NULL, // addr? See base memory
size,
diff --git a/rts/win32/OSThreads.c b/rts/win32/OSThreads.c
index fe35f35e82..706237363a 100644
--- a/rts/win32/OSThreads.c
+++ b/rts/win32/OSThreads.c
@@ -27,69 +27,6 @@ static uint32_t* cpuGroupCumulativeCache = NULL;
/* Processor group dist cache. */
static uint8_t* cpuGroupDistCache = NULL;
-/* Win32 threads and synchronisation objects */
-
-/* A Condition is represented by a Win32 Event object;
- * a Mutex by a Mutex kernel object.
- *
- * ToDo: go through the defn and usage of these to
- * make sure the semantics match up with that of
- * the (assumed) pthreads behaviour. This is really
- * just a first pass at getting something compilable.
- */
-
-void
-initCondition( Condition* pCond )
-{
- HANDLE h = CreateEvent(NULL,
- FALSE, /* auto reset */
- FALSE, /* initially not signalled */
- NULL); /* unnamed => process-local. */
-
- if ( h == NULL ) {
- sysErrorBelch("initCondition: unable to create");
- stg_exit(EXIT_FAILURE);
- }
- *pCond = h;
- return;
-}
-
-void
-closeCondition( Condition* pCond )
-{
- if ( CloseHandle(*pCond) == 0 ) {
- sysErrorBelch("closeCondition: failed to close");
- }
- return;
-}
-
-bool
-broadcastCondition ( Condition* pCond )
-{
- PulseEvent(*pCond);
- return true;
-}
-
-bool
-signalCondition ( Condition* pCond )
-{
- if (SetEvent(*pCond) == 0) {
- sysErrorBelch("SetEvent");
- stg_exit(EXIT_FAILURE);
- }
- return true;
-}
-
-bool
-waitCondition ( Condition* pCond, Mutex* pMut )
-{
- RELEASE_LOCK(pMut);
- WaitForSingleObject(*pCond, INFINITE);
- /* Hmm..use WaitForMultipleObjects() ? */
- ACQUIRE_LOCK(pMut);
- return true;
-}
-
void
yieldThread()
{
@@ -150,35 +87,6 @@ osThreadIsAlive(OSThreadId id)
return (exit_code == STILL_ACTIVE);
}
-#if defined(USE_CRITICAL_SECTIONS)
-void
-initMutex (Mutex* pMut)
-{
- InitializeCriticalSectionAndSpinCount(pMut,4000);
-}
-void
-closeMutex (Mutex* pMut)
-{
- DeleteCriticalSection(pMut);
-}
-#else
-void
-initMutex (Mutex* pMut)
-{
- HANDLE h = CreateMutex ( NULL, /* default sec. attributes */
- TRUE, /* not owned => initially signalled */
- NULL
- );
- *pMut = h;
- return;
-}
-void
-closeMutex (Mutex* pMut)
-{
- CloseHandle(*pMut);
-}
-#endif
-
void
newThreadLocalKey (ThreadLocalKey *key)
{
@@ -252,6 +160,13 @@ forkOS_createThread ( HsStablePtr entry )
(unsigned*)&pId) == 0);
}
+#if defined(x86_64_HOST_ARCH)
+
+#if !defined(ALL_PROCESSOR_GROUPS)
+#define ALL_PROCESSOR_GROUPS 0xffff
+#endif
+#endif
+
void freeThreadingResources (void)
{
if (cpuGroupCache)
@@ -426,12 +341,15 @@ getNumberOfProcessors (void)
if (nproc)
{
- IF_DEBUG(scheduler, debugBelch("[*] Total number of active processors detected: %u\n", nproc));
+ IF_DEBUG(scheduler, debugBelch("[*] Total number of active "
+ "processors detected: %u\n", nproc));
return nproc;
}
- IF_DEBUG(scheduler, debugBelch("Could not determine Max number of logical processors.\n"
- "Falling back to old code which limits to 64 logical processors.\n"));
+ IF_DEBUG(scheduler, debugBelch("Could not determine Max number of "
+ "logical processors.\n"
+ "Falling back to old code which limits "
+ "to 64 logical processors.\n"));
}
#endif
@@ -484,7 +402,6 @@ setThreadAffinity (uint32_t n, uint32_t m) // cap N of M
for (i = 0; i < n_groups; i++)
{
#if defined(x86_64_HOST_ARCH)
- // If we support the new API, use it.
if (mask[i] > 0)
{
GROUP_AFFINITY hGroup;
@@ -515,24 +432,15 @@ setThreadAffinity (uint32_t n, uint32_t m) // cap N of M
free(mask);
}
-typedef BOOL (WINAPI *PCSIO)(HANDLE);
-
void
interruptOSThread (OSThreadId id)
{
HANDLE hdl;
- PCSIO pCSIO;
if (!(hdl = OpenThread(THREAD_TERMINATE,FALSE,id))) {
sysErrorBelch("interruptOSThread: OpenThread");
stg_exit(EXIT_FAILURE);
}
- pCSIO = (PCSIO)(void*)GetProcAddress(GetModuleHandle(TEXT("Kernel32.dll")),
- "CancelSynchronousIo");
- if ( NULL != pCSIO ) {
- pCSIO(hdl);
- } else {
- // Nothing to do, unfortunately
- }
+ CancelSynchronousIo(hdl);
CloseHandle(hdl);
}
@@ -600,3 +508,59 @@ KernelThreadId kernelThreadId (void)
DWORD tid = GetCurrentThreadId();
return tid;
}
+
+/* Win32 threads and synchronisation objects */
+
+/* A Condition is represented by a Win32 Event object;
+ * a Mutex by a Mutex kernel object.
+ *
+ * ToDo: go through the defn and usage of these to
+ * make sure the semantics match up with that of
+ * the (assumed) pthreads behaviour. This is really
+ * just a first pass at getting something compilable.
+ */
+
+void
+initCondition( Condition* pCond )
+{
+ InitializeConditionVariable(pCond);
+ return;
+}
+
+void
+closeCondition( Condition* pCond STG_UNUSED)
+{
+ return;
+}
+
+bool
+broadcastCondition ( Condition* pCond )
+{
+ WakeAllConditionVariable(pCond);
+ return true;
+}
+
+bool
+signalCondition ( Condition* pCond )
+{
+ WakeConditionVariable(pCond);
+ return true;
+}
+
+bool
+waitCondition ( Condition* pCond, Mutex* pMut )
+{
+ SleepConditionVariableSRW(pCond, pMut, INFINITE, 0);
+ return true;
+}
+
+void
+initMutex (Mutex* pMut)
+{
+ InitializeSRWLock(pMut);
+}
+void
+closeMutex (Mutex* pMut)
+{
+ (void)pMut;
+}
diff --git a/rts/win32/WorkQueue.c b/rts/win32/WorkQueue.c
index e560bd24cd..dba20c668b 100644
--- a/rts/win32/WorkQueue.c
+++ b/rts/win32/WorkQueue.c
@@ -3,11 +3,13 @@
*
* (c) sof, 2002-2003.
*/
+#include "Rts.h"
#include "WorkQueue.h"
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
+#include <windows.h>
static void queue_error_rc( char* loc, DWORD err);
static void queue_error( char* loc, char* reason);
@@ -48,7 +50,7 @@ NewWorkQueue()
memset(wq, 0, sizeof *wq);
- InitializeCriticalSection(&wq->queueLock);
+ OS_INIT_LOCK(&wq->queueLock);
wq->workAvailable = newSemaphore(0, WORKQUEUE_SIZE);
wq->roomAvailable = newSemaphore(WORKQUEUE_SIZE, WORKQUEUE_SIZE);
@@ -83,7 +85,7 @@ FreeWorkQueue ( WorkQueue* pq )
if ( pq->roomAvailable ) {
CloseHandle(pq->roomAvailable);
}
- DeleteCriticalSection(&pq->queueLock);
+ OS_CLOSE_LOCK(&pq->queueLock);
free(pq);
return;
}
@@ -147,13 +149,13 @@ FetchWork ( WorkQueue* pq, void** ppw )
return false;
}
- EnterCriticalSection(&pq->queueLock);
+ OS_ACQUIRE_LOCK(&pq->queueLock);
*ppw = pq->items[pq->head];
/* For sanity's sake, zero out the pointer. */
pq->items[pq->head] = NULL;
pq->head = (pq->head + 1) % WORKQUEUE_SIZE;
rc = ReleaseSemaphore(pq->roomAvailable,1, NULL);
- LeaveCriticalSection(&pq->queueLock);
+ OS_RELEASE_LOCK(&pq->queueLock);
if ( 0 == rc ) {
queue_error_rc("FetchWork.ReleaseSemaphore()", GetLastError());
return false;
@@ -191,11 +193,11 @@ SubmitWork ( WorkQueue* pq, void* pw )
return false;
}
- EnterCriticalSection(&pq->queueLock);
+ OS_ACQUIRE_LOCK(&pq->queueLock);
pq->items[pq->tail] = pw;
pq->tail = (pq->tail + 1) % WORKQUEUE_SIZE;
rc = ReleaseSemaphore(pq->workAvailable,1, NULL);
- LeaveCriticalSection(&pq->queueLock);
+ OS_RELEASE_LOCK(&pq->queueLock);
if ( 0 == rc ) {
queue_error_rc("SubmitWork.ReleaseSemaphore()", GetLastError());
return false;
diff --git a/rts/win32/WorkQueue.h b/rts/win32/WorkQueue.h
index 4dbfcd40d3..569a7b4445 100644
--- a/rts/win32/WorkQueue.h
+++ b/rts/win32/WorkQueue.h
@@ -14,12 +14,12 @@
#define WORKQUEUE_SIZE 16
typedef HANDLE Semaphore;
-typedef CRITICAL_SECTION CritSection;
+typedef SRWLOCK Mutex;
typedef struct WorkQueue {
/* the master lock, need to be grabbed prior to
using any of the other elements of the struct. */
- CritSection queueLock;
+ Mutex queueLock;
/* consumers/workers block waiting for 'workAvailable' */
Semaphore workAvailable;
Semaphore roomAvailable;