summaryrefslogtreecommitdiff
path: root/includes
diff options
context:
space:
mode:
authorDouglas Wilson <douglas.wilson@gmail.com>2020-12-17 06:43:35 +0000
committerMarge Bot <ben+marge-bot@smart-cactus.org>2020-12-19 02:15:19 -0500
commitdf8e6e904d35e9ada4e43abf398dfb8a301f1bfa (patch)
treebf3f23b4f609a9951f226c4bb242949b441466c1 /includes
parent173112cad82630b02eb91acb1f5fb91a96fa02b9 (diff)
downloadhaskell-df8e6e904d35e9ada4e43abf398dfb8a301f1bfa.tar.gz
rts: Use weaker cas in WSDeque
The algorithm described in the referenced paper uses this slightly weaker atomic op. This is the first "exotic" cas we're using. I've added a macro in the <ORDERING>_OP style to match existing ones.
Diffstat (limited to 'includes')
-rw-r--r--includes/stg/SMP.h24
1 files changed, 24 insertions, 0 deletions
diff --git a/includes/stg/SMP.h b/includes/stg/SMP.h
index 389dd95c88..589bde8266 100644
--- a/includes/stg/SMP.h
+++ b/includes/stg/SMP.h
@@ -52,6 +52,13 @@ EXTERN_INLINE StgWord cas(StgVolatilePtr p, StgWord o, StgWord n);
EXTERN_INLINE StgWord8 cas_word8(StgWord8 *volatile p, StgWord8 o, StgWord8 n);
/*
+ * Compare-and-swap
+ * this uses a seq_cst success memory order and a relaxed failure memory order
+ */
+EXTERN_INLINE StgWord cas_seq_cst_relaxed(StgVolatilePtr p, StgWord o, StgWord n);
+
+
+/*
* Atomic addition by the provided quantity
*
* atomic_inc(p, n) {
@@ -304,6 +311,17 @@ cas_word8(StgWord8 *volatile p, StgWord8 o, StgWord8 n)
#endif
}
+EXTERN_INLINE StgWord
+cas_seq_cst_relaxed(StgVolatilePtr p, StgWord o, StgWord n) {
+#if defined(HAVE_C11_ATOMICS)
+ __atomic_compare_exchange_n(p, &o, n, 0, __ATOMIC_SEQ_CST, __ATOMIC_RELAXED);
+ return o;
+#else
+ return __sync_val_compare_and_swap(p, o, n);
+#endif
+
+}
+
// RRN: Generalized to arbitrary increments to enable fetch-and-add in
// Haskell code (fetchAddIntArray#).
// PT: add-and-fetch, returns new value
@@ -454,6 +472,9 @@ load_load_barrier(void) {
// Non-atomic addition for "approximate" counters that can be lossy
#define NONATOMIC_ADD(ptr,val) RELAXED_STORE(ptr, RELAXED_LOAD(ptr) + val)
+// compare-and-swap atomic operations
+#define SEQ_CST_RELAXED_CAS(p,o,n) cas_seq_cst_relaxed(p,o,n)
+
// Explicit fences
//
// These are typically necessary only in very specific cases (e.g. WSDeque)
@@ -489,6 +510,9 @@ EXTERN_INLINE void load_load_barrier () {} /* nothing */
// Non-atomic addition for "approximate" counters that can be lossy
#define NONATOMIC_ADD(ptr,val) *ptr += val
+// compare-and-swap atomic operations
+#define SEQ_CST_RELAXED_CAS(p,o,n) cas(p,o,n)
+
// Fences
#define RELEASE_FENCE()
#define SEQ_CST_FENCE()