summaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
authorBen Wagner <bungeman@chromium.org>2021-11-14 17:28:09 -0500
committerBen Wagner <bungeman@chromium.org>2021-11-16 15:48:56 -0500
commit8d3425b8b80bd661efe6763bab508af2d8a265ef (patch)
treeb06ec2d7d694b0e3502668e0aaab2063da08e154 /src
parentbe453bd1590b545d490aa024ef267948419b4d3a (diff)
downloadfontconfig-8d3425b8b80bd661efe6763bab508af2d8a265ef.tar.gz
Back FcSerialize with open addressing hash table.
Instead of fixed number of buckets with chaining use an open addressing hash table with linear probing, max load factor 0.75, and a power of two number of buckets.
Diffstat (limited to 'src')
-rw-r--r--src/fcint.h13
-rw-r--r--src/fcserialize.c194
2 files changed, 170 insertions, 37 deletions
diff --git a/src/fcint.h b/src/fcint.h
index d6d44b0..c615b66 100644
--- a/src/fcint.h
+++ b/src/fcint.h
@@ -438,8 +438,6 @@ struct _FcCache {
* Used while constructing a directory cache object
*/
-#define FC_SERIALIZE_HASH_SIZE 8191
-
typedef union _FcAlign {
double d;
int i;
@@ -449,9 +447,9 @@ typedef union _FcAlign {
} FcAlign;
typedef struct _FcSerializeBucket {
- struct _FcSerializeBucket *next;
- const void *object;
- intptr_t offset;
+ const void *object; /* key */
+ uintptr_t hash; /* hash of key */
+ intptr_t offset; /* value */
} FcSerializeBucket;
typedef struct _FcCharSetFreezer FcCharSetFreezer;
@@ -460,7 +458,10 @@ typedef struct _FcSerialize {
intptr_t size;
FcCharSetFreezer *cs_freezer;
void *linear;
- FcSerializeBucket *buckets[FC_SERIALIZE_HASH_SIZE];
+ FcSerializeBucket *buckets;
+ size_t buckets_count;
+ size_t buckets_used;
+ size_t buckets_used_max;
} FcSerialize;
/*
diff --git a/src/fcserialize.c b/src/fcserialize.c
index d2f221d..2388dcd 100644
--- a/src/fcserialize.c
+++ b/src/fcserialize.c
@@ -47,50 +47,187 @@ FcSerializeCreate (void)
serialize->size = 0;
serialize->linear = NULL;
serialize->cs_freezer = NULL;
- memset (serialize->buckets, '\0', sizeof (serialize->buckets));
+ serialize->buckets = NULL;
+ serialize->buckets_count = 0;
+ serialize->buckets_used = 0;
+ serialize->buckets_used_max = 0;
return serialize;
}
void
FcSerializeDestroy (FcSerialize *serialize)
{
- uintptr_t bucket;
+ free (serialize->buckets);
+ if (serialize->cs_freezer)
+ FcCharSetFreezerDestroy (serialize->cs_freezer);
+ free (serialize);
+}
- for (bucket = 0; bucket < FC_SERIALIZE_HASH_SIZE; bucket++)
- {
- FcSerializeBucket *buck, *next;
+static size_t
+FcSerializeNextBucketIndex (const FcSerialize *serialize, size_t index)
+{
+ if (index == 0)
+ index = serialize->buckets_count;
+ --index;
+ return index;
+}
+
+#if ((SIZEOF_VOID_P) * (CHAR_BIT)) == 32
+
+/*
+ * Based on triple32
+ * https://github.com/skeeto/hash-prospector
+ */
+static uintptr_t
+FcSerializeHashPtr (const void *object)
+{
+ uintptr_t x = (uintptr_t)object;
+ x ^= x >> 17;
+ x *= 0xed5ad4bbU;
+ x ^= x >> 11;
+ x *= 0xac4c1b51U;
+ x ^= x >> 15;
+ x *= 0x31848babU;
+ x ^= x >> 14;
+ return x ? x : 1; /* 0 reserved to mark empty, x starts out 0 */
+}
- for (buck = serialize->buckets[bucket]; buck; buck = next) {
- next = buck->next;
- free (buck);
+
+#elif ((SIZEOF_VOID_P) * (CHAR_BIT)) == 64
+
+/*
+ * Based on splittable64/splitmix64 from Mix13
+ * https://zimbry.blogspot.com/2011/09/better-bit-mixing-improving-on.html
+ * https://prng.di.unimi.it/splitmix64.c
+ */
+static uintptr_t
+FcSerializeHashPtr (const void *object)
+{
+ uintptr_t x = (uintptr_t)object;
+ x ^= x >> 30;
+ x *= 0xbf58476d1ce4e5b9U;
+ x ^= x >> 27;
+ x *= 0x94d049bb133111ebU;
+ x ^= x >> 31;
+ return x ? x : 1; /* 0 reserved to mark empty, x starts out 0 */
+}
+
+#endif
+
+static FcSerializeBucket*
+FcSerializeFind (const FcSerialize *serialize, const void *object)
+{
+ uintptr_t hash = FcSerializeHashPtr (object);
+ size_t buckets_count = serialize->buckets_count;
+ size_t index = hash & (buckets_count-1);
+ for (size_t n = 0; n < buckets_count; ++n) {
+ FcSerializeBucket* bucket = &serialize->buckets[index];
+ if (bucket->hash == 0) {
+ return NULL;
+ }
+ if (object == bucket->object) {
+ return bucket;
}
+ index = FcSerializeNextBucketIndex (serialize, index);
}
- if (serialize->cs_freezer)
- FcCharSetFreezerDestroy (serialize->cs_freezer);
- free (serialize);
+ return NULL;
+}
+
+static FcSerializeBucket*
+FcSerializeUncheckedSet (FcSerialize *serialize, FcSerializeBucket* insert) {
+ const void *object = insert->object;
+ size_t buckets_count = serialize->buckets_count;
+ size_t index = insert->hash & (buckets_count-1);
+ for (size_t n = 0; n < buckets_count; ++n) {
+ FcSerializeBucket* bucket = &serialize->buckets[index];
+ if (bucket->hash == 0) {
+ *bucket = *insert;
+ ++serialize->buckets_used;
+ return bucket;
+ }
+ if (object == bucket->object) {
+ /* FcSerializeAlloc should not allow this to happen. */
+ assert (0);
+ *bucket = *insert;
+ return bucket;
+ }
+ index = FcSerializeNextBucketIndex (serialize, index);
+ }
+ assert (0);
+ return NULL;
+}
+
+static FcBool
+FcSerializeResize (FcSerialize *serialize, size_t new_count)
+{
+ size_t old_used = serialize->buckets_used;
+ size_t old_count = serialize->buckets_count;
+ FcSerializeBucket *old_buckets = serialize->buckets;
+ FcSerializeBucket *old_buckets_end = old_buckets + old_count;
+
+ FcSerializeBucket *new_buckets = malloc (new_count * sizeof (*old_buckets));
+ if (!new_buckets)
+ return FcFalse;
+ FcSerializeBucket *new_buckets_end = new_buckets + new_count;
+ for (FcSerializeBucket *b = new_buckets; b < new_buckets_end; ++b)
+ b->hash = 0;
+
+ serialize->buckets = new_buckets;
+ serialize->buckets_count = new_count;
+ serialize->buckets_used = 0;
+ for (FcSerializeBucket *b = old_buckets; b < old_buckets_end; ++b)
+ if (b->hash != 0 && !FcSerializeUncheckedSet (serialize, b))
+ {
+ serialize->buckets = old_buckets;
+ serialize->buckets_count = old_count;
+ serialize->buckets_used = old_used;
+ free (new_buckets);
+ return FcFalse;
+ }
+ free (old_buckets);
+ return FcTrue;
+}
+
+static FcSerializeBucket*
+FcSerializeSet (FcSerialize *serialize, const void *object, intptr_t offset)
+{
+ if (serialize->buckets_used >= serialize->buckets_used_max)
+ {
+ size_t capacity = serialize->buckets_count;
+ if (capacity == 0)
+ capacity = 4;
+ else if (capacity > SIZE_MAX / 2u)
+ return NULL;
+ else
+ capacity *= 2;
+
+ if (!FcSerializeResize (serialize, capacity))
+ return NULL;
+
+ serialize->buckets_used_max = capacity / 4u * 3u;
+ }
+
+ FcSerializeBucket bucket;
+ bucket.object = object;
+ bucket.offset = offset;
+ bucket.hash = FcSerializeHashPtr (object);
+ return FcSerializeUncheckedSet (serialize, &bucket);
}
/*
* Allocate space for an object in the serialized array. Keep track
* of where the object is placed and only allocate one copy of each object
*/
-
FcBool
FcSerializeAlloc (FcSerialize *serialize, const void *object, int size)
{
- uintptr_t bucket = ((uintptr_t) object) % FC_SERIALIZE_HASH_SIZE;
- FcSerializeBucket *buck;
-
- for (buck = serialize->buckets[bucket]; buck; buck = buck->next)
- if (buck->object == object)
- return FcTrue;
- buck = malloc (sizeof (FcSerializeBucket));
- if (!buck)
+ FcSerializeBucket *bucket = FcSerializeFind (serialize, object);
+ if (bucket)
+ return FcTrue;
+
+ if (!FcSerializeSet (serialize, object, serialize->size))
return FcFalse;
- buck->object = object;
- buck->offset = serialize->size;
- buck->next = serialize->buckets[bucket];
- serialize->buckets[bucket] = buck;
+
serialize->size += FcAlignSize (size);
return FcTrue;
}
@@ -113,13 +250,8 @@ FcSerializeReserve (FcSerialize *serialize, int size)
intptr_t
FcSerializeOffset (FcSerialize *serialize, const void *object)
{
- uintptr_t bucket = ((uintptr_t) object) % FC_SERIALIZE_HASH_SIZE;
- FcSerializeBucket *buck;
-
- for (buck = serialize->buckets[bucket]; buck; buck = buck->next)
- if (buck->object == object)
- return buck->offset;
- return 0;
+ FcSerializeBucket *bucket = FcSerializeFind (serialize, object);
+ return bucket ? bucket->offset : 0;
}
/*