summaryrefslogtreecommitdiff
path: root/src/lsm
diff options
context:
space:
mode:
authorAlex Gorrod <alexg@wiredtiger.com>2015-06-02 05:02:44 +0000
committerAlex Gorrod <alexg@wiredtiger.com>2015-06-02 05:02:44 +0000
commit5789e9b1efa636e39081355a659573e84fd33e58 (patch)
treeae23f8703b01eaa8d42fbc4949208ba7e355dda7 /src/lsm
parent0840cee04aed3d90770dd6789947ff687f34022b (diff)
downloadmongo-5789e9b1efa636e39081355a659573e84fd33e58.tar.gz
Update the merge selection algorithm for LSM.
Previously we allowed merges to span multiple levels when we didn't mean to. Track chunk generations more closely to avoid that.
Diffstat (limited to 'src/lsm')
-rw-r--r--src/lsm/lsm_merge.c32
1 files changed, 28 insertions, 4 deletions
diff --git a/src/lsm/lsm_merge.c b/src/lsm/lsm_merge.c
index 92d80e9e91f..357e5ab5462 100644
--- a/src/lsm/lsm_merge.c
+++ b/src/lsm/lsm_merge.c
@@ -127,6 +127,7 @@ __lsm_merge_span(WT_SESSION_IMPL *session, WT_LSM_TREE *lsm_tree,
uint32_t aggressive, max_gap, max_gen, max_level;
uint64_t record_count, chunk_size;
u_int end_chunk, i, merge_max, merge_min, nchunks, start_chunk;
+ u_int oldest_gen, youngest_gen;
chunk_size = 0;
nchunks = 0;
@@ -194,6 +195,8 @@ __lsm_merge_span(WT_SESSION_IMPL *session, WT_LSM_TREE *lsm_tree,
* with the most recent set of chunks and work backwards until going
* further becomes significantly less efficient.
*/
+retry_find:
+ oldest_gen = youngest_gen = lsm_tree->chunk[end_chunk]->generation;
for (start_chunk = end_chunk + 1, record_count = 0;
start_chunk > 0; ) {
chunk = lsm_tree->chunk[start_chunk - 1];
@@ -226,6 +229,15 @@ __lsm_merge_span(WT_SESSION_IMPL *session, WT_LSM_TREE *lsm_tree,
chunk_size - youngest->size > lsm_tree->chunk_max))
break;
+ /* Track chunk generations seen while looking for a merge */
+ if (chunk->generation < youngest_gen)
+ youngest_gen = chunk->generation;
+ else if (chunk->generation > oldest_gen)
+ oldest_gen = chunk->generation;
+
+ if (oldest_gen - youngest_gen > max_gap)
+ break;
+
/*
* If we have enough chunks for a merge and the next chunk is
* in too high a generation, stop.
@@ -270,19 +282,27 @@ __lsm_merge_span(WT_SESSION_IMPL *session, WT_LSM_TREE *lsm_tree,
WT_ASSERT(session,
nchunks == 0 || (chunk != NULL && youngest != NULL));
+
/*
* Don't do merges that are too small or across too many
* generations.
*/
if (nchunks < merge_min ||
- lsm_tree->chunk[end_chunk]->generation >
- youngest->generation + max_gap) {
+ oldest_gen - youngest_gen > max_gap) {
for (i = 0; i < nchunks; i++) {
chunk = lsm_tree->chunk[start_chunk + i];
WT_ASSERT(session,
F_ISSET(chunk, WT_LSM_CHUNK_MERGING));
F_CLR(chunk, WT_LSM_CHUNK_MERGING);
}
+ /*
+ * If we didn't find a merge with appropriate gaps, try again
+ * with a smaller range.
+ */
+ if (oldest_gen - youngest_gen > max_gap) {
+ --end_chunk;
+ goto retry_find;
+ }
WT_RET(__lsm_merge_aggressive_update(session, lsm_tree));
return (WT_NOTFOUND);
}
@@ -368,8 +388,12 @@ __wt_lsm_merge(WT_SESSION_IMPL *session, WT_LSM_TREE *lsm_tree, u_int id)
start_chunk, end_chunk, dest_id, record_count, generation));
for (verb = start_chunk; verb <= end_chunk; verb++)
WT_ERR(__wt_verbose(session, WT_VERB_LSM,
- "%s: Chunk[%u] id %u",
- lsm_tree->name, verb, lsm_tree->chunk[verb]->id));
+ "Merging %s: Chunk[%u] id %u, gen: %" PRIu32
+ ", size: %" PRIu64 ", records: %" PRIu64,
+ lsm_tree->name, verb, lsm_tree->chunk[verb]->id,
+ lsm_tree->chunk[verb]->generation,
+ lsm_tree->chunk[verb]->size,
+ lsm_tree->chunk[verb]->count));
}
WT_ERR(__wt_calloc_one(session, &chunk));