summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorantirez <antirez@gmail.com>2015-09-25 10:06:28 +0200
committerantirez <antirez@gmail.com>2015-10-01 13:02:25 +0200
commit7af4eeb7455b40ef73c436d7b9eb05df31eb6886 (patch)
tree45002facb662e2aeed0d8c78653101089f1cdb50
parent9253d8507320dd1d7665a55e11e2cba3ae91c78d (diff)
downloadredis-7af4eeb7455b40ef73c436d7b9eb05df31eb6886.tar.gz
Lazyfree: incremental removed, only threaded survived.
-rw-r--r--src/lazyfree.c157
-rw-r--r--src/server.c51
-rw-r--r--src/server.h7
3 files changed, 24 insertions, 191 deletions
diff --git a/src/lazyfree.c b/src/lazyfree.c
index 27f9a56e9..aae11d8ab 100644
--- a/src/lazyfree.c
+++ b/src/lazyfree.c
@@ -1,15 +1,10 @@
#include "server.h"
#include "bio.h"
-static int lazyfree_threaded = 1; /* Use a thread to reclaim objects. */
-
-/* Initialization of the lazy free engine. Must be called only once at server
- * startup. */
-void initLazyfreeEngine(void) {
- server.lazyfree_dbs = listCreate();
- server.lazyfree_obj = listCreate();
- server.lazyfree_elements = 0;
-}
+static size_t lazyfree_objects = 0;
+static size_t lazyfree_dbs = 0;
+pthread_mutex_t lazyfree_objects_mutex = PTHREAD_MUTEX_INITIALIZER;
+pthread_mutex_t lazyfree_objects_dbs = PTHREAD_MUTEX_INITIALIZER;
/* Return the amount of work needed in order to free an object.
* The return value is not always the actual number of allocations the
@@ -44,88 +39,10 @@ size_t lazyfreeGetFreeEffort(robj *obj) {
}
}
-/* This callback is used together with dictScan() in order to free a dict.c
- * hash table incrementally. */
-void lazyfreeScanCallback(void *privdata, const dictEntry *de) {
- dict *ht = privdata;
- long saved_iterators = ht->iterators;
- ht->iterators = 1; /* Make sure no rehashing happens. */
- dictDelete(ht,dictGetKey(de));
- ht->iterators = saved_iterators;
-}
-
-/* Free some object from the lazy free list. */
-#define LAZYFREE_ITER_PER_STEP 100
-size_t lazyfreeFastStep(void) {
- size_t maxiter = LAZYFREE_ITER_PER_STEP;
- size_t workdone = 0;
- robj *current = NULL;
-
- while(maxiter--) {
- if (current == NULL) {
- listNode *ln = listFirst(server.lazyfree_obj);
- if (ln == NULL) break; /* Nothing more to free. */
- current = ln->value;
- }
- if ((current->type == OBJ_SET ||
- current->type == OBJ_HASH) &&
- current->encoding == OBJ_ENCODING_HT)
- {
- dict *ht = current->ptr;
- size_t origsize = dictSize(ht);
- ht->iterators = dictScan(ht,ht->iterators,lazyfreeScanCallback,ht);
- workdone++; /* We are not sure how many elements we freed, even if
- zero, the free list is non empty so we don't return
- 0 to the caller. */
- server.lazyfree_elements -= (origsize - dictSize(ht));
- if (dictSize(ht) == 0) {
- decrRefCount(current);
- listNode *ln = listFirst(server.lazyfree_obj);
- listDelNode(server.lazyfree_obj,ln);
- current = NULL;
- }
- } else {
- /* Not handled type or encoding. Do a blocking free. */
- size_t effort = lazyfreeGetFreeEffort(current);
- server.lazyfree_elements -= effort;
- workdone += effort;
- decrRefCount(current);
- listNode *ln = listFirst(server.lazyfree_obj);
- listDelNode(server.lazyfree_obj,ln);
- current = NULL;
- }
- }
- return workdone;
-}
-
-/* Handles slow or fast collection steps. */
-size_t lazyfreeStep(int type) {
- /* Threaded implementaiton: only block for STEP_OOM. */
- if (lazyfree_threaded) {
- if (type == LAZYFREE_STEP_OOM)
- return bioWaitStepOfType(BIO_LAZY_FREE);
- return 0;
- }
-
- /* Non threaded implementation: free things incrementally avoiding
- * to block. */
- if (type == LAZYFREE_STEP_FAST ||
- type == LAZYFREE_STEP_OOM) return lazyfreeFastStep();
-
- size_t totalwork = 0;
- mstime_t end = mstime()+2;
- do {
- size_t workdone = lazyfreeFastStep();
- if (workdone == 0) break;
- totalwork += workdone;
- } while(mstime() < end);
- return totalwork;
-}
-
/* Delete a key, value, and associated expiration entry if any, from the DB.
* If there are enough allocations to free the value object may be put into
* a lazy free list instead of being freed synchronously. The lazy free list
- * will be reclaimed incrementally in a non blocking way. */
+ * will be reclaimed in a different bio.c thread. */
#define LAZYFREE_THRESHOLD 64
int dbAsyncDelete(redisDb *db, robj *key) {
/* Deleting an entry from the expires dict will not free the sds of
@@ -143,12 +60,7 @@ int dbAsyncDelete(redisDb *db, robj *key) {
/* If releasing the object is too much work, let's put it into the
* lazy free list. */
if (free_effort > LAZYFREE_THRESHOLD) {
- if (lazyfree_threaded) {
- bioCreateBackgroundJob(BIO_LAZY_FREE,val,NULL,NULL);
- } else {
- listAddNodeTail(server.lazyfree_obj,val);
- server.lazyfree_elements += free_effort;
- }
+ bioCreateBackgroundJob(BIO_LAZY_FREE,val,NULL,NULL);
dictSetVal(db->dict,de,NULL);
}
}
@@ -162,60 +74,3 @@ int dbAsyncDelete(redisDb *db, robj *key) {
return 0;
}
}
-
-/* This is the timer handler we use to incrementally perform collection
- * into the lazy free lists. We can't use serverCron since we need a
- * very high timer frequency when there are many objects to collect, while
- * we lower the frequency to just 1HZ when there is nothing to do.
- *
- * Since a slow lazy free step will take 1.5 milliseconds and we modulate
- * the timer frequency from 1 to 333 HZ in an adaptive way, the CPU
- * used is between 0% (nothing in the lazy free list) to 50%.
- *
- * The frequency is obtained as follows: if the lazy free list is empty
- * it is set to 1HZ. If the lazy free has elements the call period starts
- * at 20 (50HZ) and is decremented (up to 3 ms = 333HZ) each time the server
- * used memory raises between calls of this function. */
-int lazyfreeCron(struct aeEventLoop *eventLoop, long long id, void *clientData)
-{
- UNUSED(eventLoop);
- UNUSED(id);
- UNUSED(clientData);
-
- /* Threaded lazy free does not need a timer, unregister the timer event. */
- if (lazyfree_threaded) return AE_NOMORE;
-
- static size_t prev_mem;
- static int timer_period = 1000; /* Defauls to 1HZ */
- static double mem_trend = 0;
- size_t mem = zmalloc_used_memory();
-
- /* Compute the memory trend, biased towards thinking memory is raising
- * for a few calls every time previous and current memory raise. */
- if (prev_mem < mem) mem_trend = 1;
- mem_trend *= 0.9; /* Make it slowly forget. */
- int mem_is_raising = mem_trend > .1;
-
- /* Free a few items. */
- size_t workdone = lazyfreeStep(LAZYFREE_STEP_SLOW);
-
- /* Adjust this timer call frequency according to the current state. */
- if (workdone) {
- if (timer_period == 1000) timer_period = 20;
- if (mem_is_raising && timer_period > 3)
- timer_period--; /* Raise call frequency. */
- else if (!mem_is_raising && timer_period < 20)
- timer_period++; /* Lower call frequency. */
- } else {
- timer_period = 1000; /* 1 HZ */
- }
- prev_mem = mem;
-#if 0
- printf("%llu (%d hz) %s (%f)\n",
- (unsigned long long)server.lazyfree_elements,
- 1000/timer_period,
- mem_is_raising ? "RAISING" : "lowering",
- mem_trend);
-#endif
- return timer_period;
-}
diff --git a/src/server.c b/src/server.c
index c5ab43b73..d9470f6d7 100644
--- a/src/server.c
+++ b/src/server.c
@@ -1298,11 +1298,6 @@ void beforeSleep(struct aeEventLoop *eventLoop) {
* later in this function. */
if (server.cluster_enabled) clusterBeforeSleep();
- /* Lazy free a few objects before to return to the event loop, this way
- * if there is activity in the server (that may generate writes) we
- * reclaim memory at a faster rate. */
- lazyfreeStep(LAZYFREE_STEP_FAST);
-
/* Run a fast expire cycle (the called function will return
* ASAP if a fast cycle is not needed). */
if (server.active_expire_enabled && server.masterhost == NULL)
@@ -1812,7 +1807,6 @@ void initServer(void) {
server.system_memory_size = zmalloc_get_memory_size();
createSharedObjects();
- initLazyfreeEngine();
adjustOpenFilesLimit();
server.el = aeCreateEventLoop(server.maxclients+CONFIG_FDSET_INCR);
server.db = zmalloc(sizeof(redisDb)*server.dbnum);
@@ -1879,8 +1873,7 @@ void initServer(void) {
/* Create out timers, that's our main way to process background
* operations. */
- if(aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL) == AE_ERR ||
- aeCreateTimeEvent(server.el, 1, lazyfreeCron, NULL, NULL) == AE_ERR) {
+ if (aeCreateTimeEvent(server.el, 1, serverCron, NULL, NULL) == AE_ERR) {
serverPanic("Can't create event loop timers.");
exit(1);
}
@@ -3285,18 +3278,19 @@ void evictionPoolPopulate(dict *sampledict, dict *keydict, struct evictionPoolEn
}
int freeMemoryIfNeeded(void) {
- size_t mem_used, mem_tofree, mem_freed;
+ size_t mem_reported, mem_used, mem_tofree, mem_freed;
int slaves = listLength(server.slaves);
mstime_t latency, eviction_latency;
long long delta;
/* Check if we are over the memory usage limit. If we are not, no need
* to subtract the slaves output buffers. We can just return ASAP. */
- mem_used = zmalloc_used_memory();
- if (mem_used <= server.maxmemory) return C_OK;
+ mem_reported = zmalloc_used_memory();
+ if (mem_reported <= server.maxmemory) return C_OK;
/* Remove the size of slaves output buffers and AOF buffer from the
* count of used memory. */
+ mem_used = mem_reported;
if (slaves) {
listIter li;
listNode *ln;
@@ -3323,28 +3317,8 @@ int freeMemoryIfNeeded(void) {
mem_tofree = mem_used - server.maxmemory;
mem_freed = 0;
- /* Let's start reclaiming memory from the lazy free list: those
- * objects are logically freed so this is the first thing we want
- * to get rid of. */
- if (listLength(server.lazyfree_dbs) || listLength(server.lazyfree_obj)) {
- latencyStartMonitor(eviction_latency);
- while (mem_freed < mem_tofree) {
- delta = (long long) zmalloc_used_memory();
- size_t workdone = lazyfreeStep(LAZYFREE_STEP_OOM);
- delta -= (long long) zmalloc_used_memory();
- mem_freed += delta;
- if (!workdone) break; /* Lazy free list is empty. */
- }
- latencyEndMonitor(eviction_latency);
- latencyAddSampleIfNeeded("eviction-lazyfree",eviction_latency);
- }
-
- /* If after lazy freeing we are alraedy back to our limit, no need
- * to evict keys. Return to the caller. */
- if (mem_freed >= mem_tofree) return C_OK;
-
if (server.maxmemory_policy == MAXMEMORY_NO_EVICTION)
- return C_ERR; /* We need to free memory, but policy forbids. */
+ goto cant_free; /* We need to free memory, but policy forbids. */
latencyStartMonitor(latency);
while (mem_freed < mem_tofree) {
@@ -3465,12 +3439,23 @@ int freeMemoryIfNeeded(void) {
if (!keys_freed) {
latencyEndMonitor(latency);
latencyAddSampleIfNeeded("eviction-cycle",latency);
- return C_ERR; /* nothing to free... */
+ goto cant_free; /* nothing to free... */
}
}
latencyEndMonitor(latency);
latencyAddSampleIfNeeded("eviction-cycle",latency);
return C_OK;
+
+cant_free:
+ /* We are here if we are not able to reclaim memory. There is only one
+ * last thing we can try: check if the lazyfree thread has jobs in queue
+ * and wait... */
+ while(bioPendingJobsOfType(BIO_LAZY_FREE)) {
+ if (((mem_reported - zmalloc_used_memory()) + mem_freed) >= mem_tofree)
+ break;
+ usleep(1000);
+ }
+ return C_ERR;
}
/* =================================== Main! ================================ */
diff --git a/src/server.h b/src/server.h
index 1d97d9360..5b5bc9887 100644
--- a/src/server.h
+++ b/src/server.h
@@ -704,10 +704,6 @@ struct redisServer {
int cronloops; /* Number of times the cron function run */
char runid[CONFIG_RUN_ID_SIZE+1]; /* ID always different at every exec. */
int sentinel_mode; /* True if this instance is a Sentinel. */
- /* Lazy free */
- list *lazyfree_dbs; /* List of DBs to free in background. */
- list *lazyfree_obj; /* List of objects to free in background. */
- size_t lazyfree_elements; /* Number of logical element in obj list. */
/* Networking */
int port; /* TCP listening port */
int tcp_backlog; /* TCP listen() backlog */
@@ -1411,9 +1407,6 @@ void slotToKeyFlush(void);
#define LAZYFREE_STEP_OOM 2 /* Free a few elements at any cost if there
is something to free: we are out of memory */
int dbAsyncDelete(redisDb *db, robj *key);
-void initLazyfreeEngine(void);
-size_t lazyfreeStep(int type);
-int lazyfreeCron(struct aeEventLoop *eventLoop, long long id, void *clientData);
/* API to get key arguments from commands */
int *getKeysFromCommand(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);