summaryrefslogtreecommitdiff
path: root/src/third_party
diff options
context:
space:
mode:
authorLuke Chen <luke.chen@mongodb.com>2018-01-23 15:17:52 +1100
committerLuke Chen <luke.chen@mongodb.com>2018-01-23 15:31:07 +1100
commitcf856573c0dfd0e1d2c78d2216fafaa63ac43ae8 (patch)
tree7076f4fdecaea54b9abd5b0e5adf8665891a8fc9 /src/third_party
parentf3b504948c0cef40deffb4786ebdda6797625142 (diff)
downloadmongo-cf856573c0dfd0e1d2c78d2216fafaa63ac43ae8.tar.gz
Import wiredtiger: fc383862a729667bdd4011c363601c180f848d65 from branch mongodb-3.8
ref: 357efdd4ce..fc383862a7 for: 3.7.2 WT-3074 Automate a test to stress eviction walk with many active trees WT-3799 Test/format with timestamps enabled pin cache full WT-3835 cursor remove tries to return a key that doesn't exist WT-3846 Refine operation tracking visualization tool WT-3853 LSM version 1 metadata incompatibility WT-3860 Fix a list of lint issues WT-3862 Remove invalid diagnostic assertion during reconciliation
Diffstat (limited to 'src/third_party')
-rw-r--r--src/third_party/wiredtiger/bench/wtperf/runners/evict-fairness.wtperf20
-rw-r--r--src/third_party/wiredtiger/dist/s_clang-tidy19
-rw-r--r--src/third_party/wiredtiger/import.data2
-rw-r--r--src/third_party/wiredtiger/src/btree/bt_cursor.c20
-rw-r--r--src/third_party/wiredtiger/src/evict/evict_page.c18
-rw-r--r--src/third_party/wiredtiger/src/lsm/lsm_meta.c9
-rw-r--r--src/third_party/wiredtiger/src/reconcile/rec_write.c1
-rw-r--r--src/third_party/wiredtiger/src/utilities/util_main.c2
-rw-r--r--src/third_party/wiredtiger/test/format/util.c9
-rw-r--r--src/third_party/wiredtiger/tools/optrack/arrow-left.pngbin103602 -> 0 bytes
-rw-r--r--src/third_party/wiredtiger/tools/optrack/arrow-right.pngbin108216 -> 0 bytes
-rwxr-xr-xsrc/third_party/wiredtiger/tools/optrack/find-latency-spikes.py473
12 files changed, 327 insertions, 246 deletions
diff --git a/src/third_party/wiredtiger/bench/wtperf/runners/evict-fairness.wtperf b/src/third_party/wiredtiger/bench/wtperf/runners/evict-fairness.wtperf
new file mode 100644
index 00000000000..94f55f6bea9
--- /dev/null
+++ b/src/third_party/wiredtiger/bench/wtperf/runners/evict-fairness.wtperf
@@ -0,0 +1,20 @@
+# This configuration is used to test the eviction fairness of visiting all tables.
+# Create a set of tables with uneven distribution of data
+conn_config="cache_size=1G,eviction=(threads_max=8),file_manager=(close_idle_time=100000),checkpoint=(wait=20,log_size=2GB),session_max=1000"
+table_config="type=file"
+table_count=200
+icount=0
+random_range=1000000000
+pareto=0
+range_partition=true
+report_interval=5
+
+run_ops=1000000
+populate_threads=0
+icount=0
+threads=((count=60,inserts=1))
+
+# Warn if a latency over 1 second is seen
+max_latency=1000
+sample_interval=5
+sample_rate=1
diff --git a/src/third_party/wiredtiger/dist/s_clang-tidy b/src/third_party/wiredtiger/dist/s_clang-tidy
index 209d6f7d5d5..89d3fa4112a 100644
--- a/src/third_party/wiredtiger/dist/s_clang-tidy
+++ b/src/third_party/wiredtiger/dist/s_clang-tidy
@@ -32,18 +32,14 @@ sh autogen.sh > /dev/null || exit 1
# We need a custom wiredtiger_config.h, clang-tidy doesn't know where to
# find the x86intrin.h include file.
-echo '!!!!'
-echo 'Modifying wiredtiger_config.h'
-echo '!!!!'
cp wiredtiger_config.h $t
sed '/HAVE_X86INTRIN_H/d' < $t > wiredtiger_config.h
-# XXX
-# clang-tidy doesn't like verify_build at the moment.
-echo '!!!!'
-echo 'Modifying src/include/verify_build.h'
-echo '!!!!'
-echo '#define WT_STATIC_ASSERT(a)' > src/include/verify_build.h
+# We need a custom verify_build.h, clang-tidy doesn't like the magic.
+f=src/include/verify_build.h
+rm -f $f.save
+cp $f $f.save
+echo '#define WT_STATIC_ASSERT(a)' > $f
def="-D_GNU_SOURCE"
inc="-I. -Isrc/include"
@@ -81,4 +77,9 @@ sed -e '/ warnings generated/d' \
-e '/Suppressed.*warnings/d' \
-e '/Use -header-filter/d' < $t
+# Restore verify_build.h.
+f=src/include/verify_build.h
+rm -f $f
+mv $f.save $f
+
exit 0
diff --git a/src/third_party/wiredtiger/import.data b/src/third_party/wiredtiger/import.data
index dc3e684a19f..a67a400e735 100644
--- a/src/third_party/wiredtiger/import.data
+++ b/src/third_party/wiredtiger/import.data
@@ -1,5 +1,5 @@
{
- "commit": "357efdd4ce279efc71ff618c59fe1b903ef80bb2",
+ "commit": "fc383862a729667bdd4011c363601c180f848d65",
"github": "wiredtiger/wiredtiger.git",
"vendor": "wiredtiger",
"branch": "mongodb-3.8"
diff --git a/src/third_party/wiredtiger/src/btree/bt_cursor.c b/src/third_party/wiredtiger/src/btree/bt_cursor.c
index 6e90447f18d..8c7170e6180 100644
--- a/src/third_party/wiredtiger/src/btree/bt_cursor.c
+++ b/src/third_party/wiredtiger/src/btree/bt_cursor.c
@@ -1067,13 +1067,6 @@ err: if (ret == WT_RESTART) {
goto retry;
}
- /*
- * If the cursor is configured to overwrite and the record is not found,
- * that is exactly what we want, return success.
- */
- if (F_ISSET(cursor, WT_CURSTD_OVERWRITE) && ret == WT_NOTFOUND)
- ret = 0;
-
done: if (ret == 0) {
F_CLR(cursor, WT_CURSTD_VALUE_SET);
switch (positioned) {
@@ -1104,6 +1097,19 @@ done: if (ret == 0) {
if (ret != 0) {
WT_TRET(__cursor_reset(cbt));
__cursor_state_restore(cursor, &state);
+
+ /*
+ * If the cursor is configured to overwrite and the record isn't
+ * found, that is exactly what we want, return success. Note we
+ * set clear the return value after everything else, the clause
+ * above dealing with the cursor position is only correct if we
+ * were successful. If search failed after positioned is set to
+ * SEARCH_POSITION, we cannot return a key. The only action to
+ * take is to set the cursor to its original key, which we just
+ * did.
+ */
+ if (F_ISSET(cursor, WT_CURSTD_OVERWRITE) && ret == WT_NOTFOUND)
+ ret = 0;
}
return (ret);
diff --git a/src/third_party/wiredtiger/src/evict/evict_page.c b/src/third_party/wiredtiger/src/evict/evict_page.c
index 0ff314f3484..6d904a2004b 100644
--- a/src/third_party/wiredtiger/src/evict/evict_page.c
+++ b/src/third_party/wiredtiger/src/evict/evict_page.c
@@ -306,16 +306,14 @@ __evict_page_dirty_update(WT_SESSION_IMPL *session, WT_REF *ref, bool closing)
switch (mod->rec_result) {
case WT_PM_REC_EMPTY: /* Page is empty */
/*
- * Update the parent to reference a deleted page. The fact that
- * reconciliation left the page "empty" means there's no older
- * transaction in the system that might need to see an earlier
- * version of the page. For that reason, we clear the address
- * of the page, if we're forced to "read" into that namespace,
- * we'll instantiate a new page instead of trying to read from
- * the backing store.
+ * Update the parent to reference a deleted page. Reconciliation
+ * left the page "empty", so there's no older transaction in the
+ * system that might need to see an earlier version of the page.
+ * There's no backing address, if we're forced to "read" into
+ * that namespace, we instantiate a new page instead of trying
+ * to read from the backing store.
*/
__wt_ref_out(session, ref);
- ref->addr = NULL;
WT_WITH_PAGE_INDEX(session,
ret = __evict_delete_ref(session, ref, closing));
WT_RET_BUSY_OK(ret);
@@ -354,9 +352,7 @@ __evict_page_dirty_update(WT_SESSION_IMPL *session, WT_REF *ref, bool closing)
* Publish: a barrier to ensure the structure fields are set
* before the state change makes the page available to readers.
*/
- if (mod->mod_replace.addr == NULL)
- ref->addr = NULL;
- else {
+ if (mod->mod_replace.addr != NULL) {
WT_RET(__wt_calloc_one(session, &addr));
*addr = mod->mod_replace;
mod->mod_replace.addr = NULL;
diff --git a/src/third_party/wiredtiger/src/lsm/lsm_meta.c b/src/third_party/wiredtiger/src/lsm/lsm_meta.c
index 88daca989a6..de12f19380b 100644
--- a/src/third_party/wiredtiger/src/lsm/lsm_meta.c
+++ b/src/third_party/wiredtiger/src/lsm/lsm_meta.c
@@ -201,9 +201,12 @@ __lsm_meta_read_v1(
cv.str, cv.len, &lsm_tree->collator_name));
}
- WT_ERR(__wt_config_getones(
- session, lsmconf, "lsm.merge_custom.start_generation", &cv));
- lsm_tree->custom_generation = (uint32_t)cv.val;
+ /* lsm.merge_custom does not appear in all V1 LSM metadata. */
+ lsm_tree->custom_generation = 0;
+ if ((ret = __wt_config_getones(
+ session, lsmconf, "lsm.merge_custom.start_generation", &cv)) == 0)
+ lsm_tree->custom_generation = (uint32_t)cv.val;
+ WT_ERR_NOTFOUND_OK(ret);
if (lsm_tree->custom_generation != 0) {
WT_ERR(__wt_config_getones(
session, lsmconf, "lsm.merge_custom.prefix", &cv));
diff --git a/src/third_party/wiredtiger/src/reconcile/rec_write.c b/src/third_party/wiredtiger/src/reconcile/rec_write.c
index 3ad6bdf41ea..d9b415a76cd 100644
--- a/src/third_party/wiredtiger/src/reconcile/rec_write.c
+++ b/src/third_party/wiredtiger/src/reconcile/rec_write.c
@@ -1347,7 +1347,6 @@ __rec_txn_read(WT_SESSION_IMPL *session, WT_RECONCILE *r,
(F_ISSET(r, WT_REC_VISIBLE_ALL) ?
WT_TXNID_LE(r->last_running, txnid) :
!__txn_visible_id(session, txnid))) {
- WT_ASSERT(session, upd->type != WT_UPDATE_BIRTHMARK);
uncommitted = r->update_uncommitted = true;
continue;
}
diff --git a/src/third_party/wiredtiger/src/utilities/util_main.c b/src/third_party/wiredtiger/src/utilities/util_main.c
index fb9fb433892..2d08c4c5274 100644
--- a/src/third_party/wiredtiger/src/utilities/util_main.c
+++ b/src/third_party/wiredtiger/src/utilities/util_main.c
@@ -41,7 +41,7 @@ usage(void)
"\t" "compact\t compact an object\n"
"\t" "copyright copyright information\n"
"\t" "create\t create an object\n"
- "\t" "downgrade\t downgrade an database\n"
+ "\t" "downgrade downgrade a database\n"
"\t" "drop\t drop an object\n"
"\t" "dump\t dump an object\n"
"\t" "list\t list database objects\n"
diff --git a/src/third_party/wiredtiger/test/format/util.c b/src/third_party/wiredtiger/test/format/util.c
index b8343fee1d6..aa31521c3b7 100644
--- a/src/third_party/wiredtiger/test/format/util.c
+++ b/src/third_party/wiredtiger/test/format/util.c
@@ -621,6 +621,15 @@ timestamp(void *arg)
}
/*
+ * Don't try to update until we've committed some transactions
+ * with timestamps.
+ */
+ if (oldest_timestamp == 0) {
+ __wt_sleep(1, 0);
+ continue;
+ }
+
+ /*
* If less than 100 transactions out of date, wait up to 15
* seconds before updating.
*/
diff --git a/src/third_party/wiredtiger/tools/optrack/arrow-left.png b/src/third_party/wiredtiger/tools/optrack/arrow-left.png
deleted file mode 100644
index 315983e3118..00000000000
--- a/src/third_party/wiredtiger/tools/optrack/arrow-left.png
+++ /dev/null
Binary files differ
diff --git a/src/third_party/wiredtiger/tools/optrack/arrow-right.png b/src/third_party/wiredtiger/tools/optrack/arrow-right.png
deleted file mode 100644
index e874d0f55fc..00000000000
--- a/src/third_party/wiredtiger/tools/optrack/arrow-right.png
+++ /dev/null
Binary files differ
diff --git a/src/third_party/wiredtiger/tools/optrack/find-latency-spikes.py b/src/third_party/wiredtiger/tools/optrack/find-latency-spikes.py
index 5bb557ce21b..ac80b78bc5d 100755
--- a/src/third_party/wiredtiger/tools/optrack/find-latency-spikes.py
+++ b/src/third_party/wiredtiger/tools/optrack/find-latency-spikes.py
@@ -1,9 +1,36 @@
#!/usr/bin/env python
+#
+# Public Domain 2014-2018 MongoDB, Inc.
+# Public Domain 2008-2014 WiredTiger, Inc.
+#
+# This is free and unencumbered software released into the public domain.
+#
+# Anyone is free to copy, modify, publish, use, compile, sell, or
+# distribute this software, either in source code form or as a compiled
+# binary, for any purpose, commercial or non-commercial, and by any
+# means.
+#
+# In jurisdictions that recognize copyright laws, the author or authors
+# of this software dedicate any and all copyright interest in the
+# software to the public domain. We make this dedication for the benefit
+# of the public at large and to the detriment of our heirs and
+# successors. We intend this dedication to be an overt act of
+# relinquishment in perpetuity of all present and future rights to this
+# software under copyright law.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
+# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
+# IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
+# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
+# ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+# OTHER DEALINGS IN THE SOFTWARE.
+#!/usr/bin/env python
import argparse
from bokeh.layouts import column
from bokeh.models import ColumnDataSource, CustomJS, HoverTool, FixedTicker
-from bokeh.models import Legend, LegendItem
+from bokeh.models import LabelSet, Legend, LegendItem
from bokeh.models import NumeralTickFormatter, OpenURL, Range1d, TapTool
from bokeh.models.annotations import Label
from bokeh.plotting import figure, output_file, reset_output, save, show
@@ -15,10 +42,6 @@ import pandas as pd
import sys
import traceback
-# Names of the image files we use
-arrowLeftImg = "arrow-left.png";
-arrowRightImg = "arrow-right.png";
-
# A directory where we store cross-file plots for each bucket of the outlier
# histogram.
#
@@ -30,16 +53,16 @@ colorList = [];
# Codes for various colors for printing of informational and error messages.
#
class color:
- PURPLE = '\033[95m'
- CYAN = '\033[96m'
- DARKCYAN = '\033[36m'
- BLUE = '\033[94m'
- GREEN = '\033[92m'
- YELLOW = '\033[93m'
- RED = '\033[91m'
- BOLD = '\033[1m'
- UNDERLINE = '\033[4m'
- END = '\033[0m'
+ PURPLE = '\033[95m'
+ CYAN = '\033[96m'
+ DARKCYAN = '\033[36m'
+ BLUE = '\033[94m'
+ GREEN = '\033[92m'
+ YELLOW = '\033[93m'
+ RED = '\033[91m'
+ BOLD = '\033[1m'
+ UNDERLINE = '\033[4m'
+ END = '\033[0m'
# A function name mapped to its corresponding color.
#
@@ -80,7 +103,6 @@ pixelsPerWidthUnit = 5;
#
STDEV_MULT = 2;
-
def initColorList():
global colorList;
@@ -109,7 +131,6 @@ def getColorForFunction(function):
return funcToColor[function];
-
#
# An intervalEnd is a tuple of three items.
# item #0 is the timestamp,
@@ -151,9 +172,6 @@ def getIntervalData(intervalBeginningsStack, intervalEnd, logfile):
else:
matchFound = True;
- # This value determines how deep we are in the callstack
- # stackDepth = len(intervalBeginningsStack);
-
return intervalBegin[0], intervalEnd[0], intervalEnd[2], errorOccurred;
def plotOutlierHistogram(dataframe, maxOutliers, func, durationThreshold,
@@ -179,7 +197,8 @@ def plotOutlierHistogram(dataframe, maxOutliers, func, durationThreshold,
* pixelsPerHeightUnit + \
pixelsForTitle)),
x_axis_label = "Execution timeline (CPU cycles)",
- y_axis_label = "Number of outliers", tools = TOOLS);
+ y_axis_label = "Number of outliers",
+ tools = TOOLS, toolbar_location="above");
y_ticker_max = p.plot_height / pixelsPerHeightUnit;
y_ticker_step = max(1, (maxOutliers + 1)/y_ticker_max);
@@ -316,12 +335,6 @@ def createCallstackSeries(data, logfilename):
beginIntervals.append(intervalBegin);
endIntervals.append(intervalEnd);
functionNames.append(function);
- #stackDepths.append(stackDepth);
- #stackDepthsNext.append(stackDepth + 1);
-
- #print("Begin: " + str(intervalBegin)),
- #print(" Func: " + function),
- #print(" Stack depth: " + str(stackDepth));
else:
print("Invalid event in this line:");
@@ -352,27 +365,110 @@ def createCallstackSeries(data, logfilename):
return dataframe;
-def addLegend(p, legendItems, numLegends):
-
- legend = Legend(items=legendItems, orientation = "horizontal");
- p.add_layout(legend, place='above');
- legendItems[:] = []; # Empty the list.
-
- return (numLegends + 1);
-
# For each function we only show the legend once. In this dictionary we
# keep track of colors already used.
#
colorAlreadyUsedInLegend = {};
+def createLegendFigure(legendDict):
+
+ global pixelsForTitle;
+ global plotWidth;
+
+ FUNCS_PER_ROW = 5;
+ HSPACE_BETWEEN_FUNCS = 10;
+ VSPACE_BETWEEN_FUNCS = 1;
+
+ funcs = [];
+ colors = [];
+ x_coords = [];
+ y_coords = [];
+ pixelsForLegendItem = 20;
+
+ # Get a sorted list of functions and their
+ # corresponding colors.
+ #
+ for func in sorted(legendDict.keys()):
+ funcs.append(func);
+ colors.append(legendDict[func]);
+
+ # Figure out the coordinates of functions on the plot
+ #
+ for i in range(len(funcs)):
+
+ x_coord = i % (FUNCS_PER_ROW) + 1;
+ x_coord += i % (FUNCS_PER_ROW) * HSPACE_BETWEEN_FUNCS;
+ x_coords.append(x_coord);
+
+ y_coord = (i/FUNCS_PER_ROW) + 1;
+ y_coord += (i/FUNCS_PER_ROW) * VSPACE_BETWEEN_FUNCS;
+ y_coords.append(y_coord);
+
+ data = {};
+ data['func'] = funcs;
+ data['color'] = colors;
+ data['left'] = x_coords;
+ data['bottom'] = y_coords;
+
+ df = pd.DataFrame(data=data);
+
+ max_ycoord = df['bottom'].max();
+ df['bottom'] = (max_ycoord + 1) - df['bottom'];
+
+ df['right'] = df['left'] + 1;
+ df['top'] = df['bottom'] + 1;
+
+ cds = ColumnDataSource(df);
+
+ p = figure(title="TRACKED FUNCTIONS",
+ plot_width=plotWidth,
+ plot_height = max((max_ycoord + 2) * pixelsForLegendItem, 90),
+ tools = [], toolbar_location="above",
+ x_range = (0, (FUNCS_PER_ROW + 1)* HSPACE_BETWEEN_FUNCS),
+ y_range = (0, max_ycoord + 2),
+ x_axis_label = "",
+ y_axis_label = "");
+
+ p.title.align = "center";
+ p.title.text_font_style = "normal";
+
+ p.xaxis.axis_line_color = "lightgrey";
+ p.xaxis.major_tick_line_color = None;
+ p.xaxis.minor_tick_line_color = None;
+ p.xaxis.major_label_text_font_size = '0pt';
+
+ p.yaxis.axis_line_color = "lightgrey";
+ p.yaxis.major_tick_line_color = None;
+ p.yaxis.minor_tick_line_color = None;
+ p.yaxis.major_label_text_font_size = '0pt';
+
+ p.xgrid.grid_line_color = None;
+ p.ygrid.grid_line_color = None;
+
+ p.outline_line_width = 1
+ p.outline_line_alpha = 1
+ p.outline_line_color = "lightgrey"
+
+ p.quad(left = 'left', right = 'right', bottom = 'bottom',
+ top = 'top', color = 'color', line_color = "lightgrey",
+ line_width = 0.5, source=cds);
+
+ labels = LabelSet(x='right', y='bottom', text='func', level='glyph',
+ text_font_size = "10pt",
+ x_offset=3, y_offset=0, source=cds, render_mode='canvas');
+ p.add_layout(labels);
+
+ return p;
+
def generateBucketChartForFile(figureName, dataframe, y_max, x_min, x_max):
global colorAlreadyUsedInLegend;
global funcToColor;
+ global plotWidth;
- MAX_ITEMS_PER_LEGEND = 5;
+ MAX_ITEMS_PER_LEGEND = 10;
numLegends = 0;
- legendItems = [];
+ legendItems = {};
pixelsPerStackLevel = 30;
pixelsPerLegend = 60;
pixelsForTitle = 30;
@@ -387,13 +483,12 @@ def generateBucketChartForFile(figureName, dataframe, y_max, x_min, x_max):
TOOLS = [hover];
- p = figure(title=figureName, plot_width=1200,
+ p = figure(title=figureName, plot_width=plotWidth,
x_range = (x_min, x_max),
y_range = (0, y_max+1),
x_axis_label = "Time (CPU cycles)",
y_axis_label = "Stack depth",
- tools = TOOLS
- );
+ tools = TOOLS, toolbar_location="above");
# No minor ticks or labels on the y-axis
p.yaxis.major_tick_line_color = None;
@@ -402,7 +497,8 @@ def generateBucketChartForFile(figureName, dataframe, y_max, x_min, x_max):
p.yaxis.ticker = FixedTicker(ticks = range(0, y_max+1));
p.ygrid.ticker = FixedTicker(ticks = range(0, y_max+1));
- p.xaxis.formatter = NumeralTickFormatter(format="0,")
+ p.xaxis.formatter = NumeralTickFormatter(format="0,");
+ p.title.text_font_style = "bold";
p.quad(left = 'start', right = 'end', bottom = 'stackdepth',
top = 'stackdepthNext', color = 'color', line_color = "lightgrey",
@@ -427,28 +523,13 @@ def generateBucketChartForFile(figureName, dataframe, y_max, x_min, x_max):
else:
colorAlreadyUsedInLegend[fColor] = True;
- r = p.quad(left=0, right=1, bottom=0, top=1, color=fColor);
-
- lItem = LegendItem(label = func,
- renderers = [r]);
- legendItems.append(lItem);
-
- # Cap the number of items in a legend, so it can
- # fit horizontally.
- if (len(legendItems) == MAX_ITEMS_PER_LEGEND):
- numLegends = addLegend(p, legendItems, numLegends);
-
- # Add whatever legend items did not get added
- if (len(legendItems) > 0):
- numLegends = addLegend(p, legendItems, numLegends);
+ legendItems[func] = fColor;
# Plot height is the function of the maximum call stack and the number of
# legends
- p.plot_height = (numLegends * pixelsPerLegend) \
- + max((y_max+1) * pixelsPerStackLevel, 100) \
- + pixelsForTitle;
+ p.plot_height = max((y_max+1) * pixelsPerStackLevel, 100) + pixelsForTitle;
- return p;
+ return p, legendItems;
def generateEmptyDataset():
@@ -463,26 +544,6 @@ def generateEmptyDataset():
return pd.DataFrame(data=dict);
-# When we have no data for a trace interva we generate an empty file
-# for that interval.
-#
-def createNoDataFile(filename):
-
- try:
- f = open(filename, "w");
- except:
- print(color.RED + color.BOLD),
- exc_type, exc_value, exc_traceback = sys.exc_info()
- traceback.print_exception(exc_type, exc_value, exc_traceback);
- print("Could not open file " + filename + " for writing.");
- print(color.END);
- return;
-
- f.write("<body>\n");
- f.write("<p style=\"text-align:center;\">");
- f.write("No data was generated for this trace interval.</p>\n");
- f.write("</body>\n");
- f.close()
#
# Here we generate plots that span all the input files. Each plot shows
# the timelines for all files, stacked vertically. The timeline shows
@@ -493,26 +554,33 @@ def createNoDataFile(filename):
# across the timelines for all files. We call it a bucket, because it
# corresponds to a bucket in the outlier histogram.
#
-def generateCrossFilePlotsForBucket(i, lowerBound, upperBound):
+def generateCrossFilePlotsForBucket(i, lowerBound, upperBound, navigatorDF):
global bucketDir;
global colorAlreadyUsedInLegend;
+ aggregateLegendDict = {};
figuresForAllFiles = [];
fileName = bucketDir + "/bucket-" + str(i) + ".html";
reset_output();
+ intervalTitle = "Interval #" + str(i) + ". {:,}".format(lowerBound) + \
+ " to " + "{:,}".format(upperBound) + \
+ " CPU cycles.";
+
+ # Generate a navigator chart, which shows where we are in the
+ # trace and allows moving around the trace.
+ #
+ navigatorFigure = generateNavigatorFigure(navigatorDF, i, intervalTitle);
+ figuresForAllFiles.append(navigatorFigure);
+
# The following dictionary keeps track of legends. We need
# a legend for each new HTML file. So we reset the dictionary
# before generating a new file.
#
colorAlreadyUsedInLegend = {};
- intervalTitle = "Interval " + "{:,}".format(lowerBound) + \
- " to " + "{:,}".format(upperBound) + \
- " CPU cycles";
-
# Select from the dataframe for this file the records whose 'start'
# and 'end' timestamps fall within the lower and upper bound.
#
@@ -560,159 +628,154 @@ def generateCrossFilePlotsForBucket(i, lowerBound, upperBound):
bucketDF.loc[mask, 'start'] = lowerBound;
largestStackDepth = bucketDF['stackdepthNext'].max();
- figureTitle = fname + ": " + intervalTitle;
-
- figure = generateBucketChartForFile(figureTitle, bucketDF,
- largestStackDepth,
- lowerBound, upperBound);
+ figureTitle = fname;
+ figure, legendDict = generateBucketChartForFile(figureTitle, bucketDF,
+ largestStackDepth,
+ lowerBound, upperBound);
+ aggregateLegendDict.update(legendDict);
figuresForAllFiles.append(figure);
- if (len(figuresForAllFiles) > 0):
- savedFileName = save(column(figuresForAllFiles),
- filename = fileName, title=intervalTitle,
- resources=CDN);
- else:
- createNoDataFile(fileName);
+ # Create the legend for this file and insert it after the navigator figure
+ if (len(aggregateLegendDict) > 0):
+ legendFigure = createLegendFigure(aggregateLegendDict);
+ figuresForAllFiles.insert(1, legendFigure);
+
+ save(column(figuresForAllFiles), filename = fileName,
+ title=intervalTitle, resources=CDN);
return fileName;
-# Generate plots of time series slices across all files for each bucket
-# in the outlier histogram. Save each cross-file slice to an HTML file.
+# Generate a plot that shows a view of the entire timeline in a form of
+# intervals. By clicking on an interval we can navigate to that interval.
#
-def generateTSSlicesForBuckets():
+def generateNavigatorFigure(dataframe, i, title):
- global firstTimeStamp;
- global lastTimeStamp;
+ global pixelsForTitle;
+ global pixelsPerHeightUnit;
global plotWidth;
- global pixelsPerWidthUnit;
- bucketFilenames = [];
+ # Generate the colors, such that the current interval is shown in a
+ # different color than the rest.
+ #
+ numIntervals = dataframe['intervalnumber'].size;
+ color = ["white" for x in range(numIntervals)];
+ color[i] = "salmon";
+ dataframe['color'] = color;
- numBuckets = plotWidth / pixelsPerWidthUnit;
- timeUnitsPerBucket = (lastTimeStamp - firstTimeStamp) / numBuckets;
+ cds = ColumnDataSource(dataframe);
- for i in range(numBuckets):
- lowerBound = i * timeUnitsPerBucket;
- upperBound = (i+1) * timeUnitsPerBucket;
+ title = title + " CLICK TO NAVIGATE";
- fileName = generateCrossFilePlotsForBucket(i, lowerBound,
- upperBound);
+ hover = HoverTool(tooltips = [
+ ("interval #", "@intervalnumber"),
+ ("interval start", "@intervalbegin{0,0}"),
+ ("interval end", "@intervalend{0,0}")]);
- percentComplete = float(i) / float(numBuckets) * 100;
- print(color.BLUE + color.BOLD + " Generating timeline charts... "),
- sys.stdout.write("%d%% complete \r" % (percentComplete) );
- sys.stdout.flush();
- bucketFilenames.append(fileName);
+ TOOLS = [hover, "tap"];
- print(color.END);
+ p = figure(title = title, plot_width = plotWidth,
+ x_range = (0, numIntervals),
+ plot_height = 2 * pixelsPerHeightUnit + pixelsForTitle,
+ x_axis_label = "",
+ y_axis_label = "", tools = TOOLS,
+ toolbar_location="above");
- return bucketFilenames;
+ # No minor ticks or labels on the y-axis
+ p.yaxis.major_tick_line_color = None;
+ p.yaxis.minor_tick_line_color = None;
+ p.yaxis.major_label_text_font_size = '0pt';
+ p.yaxis.ticker = FixedTicker(ticks = range(0, 1));
+ p.ygrid.ticker = FixedTicker(ticks = range(0, 1));
-# Here we are making a line that will be inserted into an HTML file for
-# a given bucket (execution slice). This line will have links to the
-# previous slice and to the next slice, so we can navigate between slices
-# by clicking those links.
-#
-def makeLineWithLinks(previous, next):
+ p.xaxis.formatter = NumeralTickFormatter(format="0,");
- global arrowLeftImg;
- global arrowRightImg;
+ p.title.align = "center";
+ p.title.text_font_style = "normal";
- previousLink = "";
- nextLink = "";
+ p.quad(left = 'intervalnumber', right = 'intervalnumbernext',
+ bottom = 0, top = 2, color = 'color', source = cds,
+ nonselection_fill_color='color',
+ nonselection_fill_alpha = 1.0,
+ line_color = "aliceblue",
+ selection_fill_color = "white",
+ selection_line_color="lightgrey"
+ );
- # Strip the directory component out of the file name.
- #
- if previous is not None:
- words = previous.split("/");
- previousStripped = words[len(words)-1];
- previousLink = "<a href=\"" + previousStripped + "\">" + \
- "<img src=\"" + arrowLeftImg + \
- "\" height=\"30\" style=\"float:left\"></a><p>&nbsp;";
+ url = "@bucketfiles";
+ taptool = p.select(type=TapTool);
+ taptool.callback = OpenURL(url=url);
+ return p;
- if next is not None:
- words = next.split("/");
- nextStripped = words[len(words)-1];
- nextLink = "<a href=\"" + nextStripped + "\">" + \
- "<img src=\"" + arrowRightImg + \
- "\" height=\"30\" style=\"float:right\"></a><p>&nbsp;";
- line = previousLink + " " + nextLink + "\n";
- return line;
+# Create a dataframe describing all time intervals, which will later be used
+# to generate a plot allowing us to navigate along the execution by clicking
+# on different intervals.
+#
+def createIntervalNavigatorDF(numBuckets, timeUnitsPerBucket):
+ global bucketDir;
-# Into the current file insert links to the previous one and to the next one.
-# The rewritten file is saved under a new file name.
-#
-def linkFiles(current, previous, next):
+ bucketFiles = [];
+ bucketID = [];
+ intervalBegin = [];
+ intervalEnd = [];
- curFile = None;
- newFile = None;
- newFileName = current + ".new";
+ for i in range(numBuckets):
- try:
- curFile = open(current, "r");
- except:
- print(color.RED + color.BOLD),
- exc_type, exc_value, exc_traceback = sys.exc_info()
- traceback.print_exception(exc_type, exc_value, exc_traceback);
- print("Could not open file " + current + " for reading.");
- print(color.END);
- return None;
+ lBound = i * timeUnitsPerBucket;
+ uBound = (i+1) * timeUnitsPerBucket;
+ fileName = "bucket-" + str(i) + ".html";
- try:
- newFile = open(newFileName, "w");
- except:
- print(color.RED + color.BOLD),
- exc_type, exc_value, exc_traceback = sys.exc_info()
- traceback.print_exception(exc_type, exc_value, exc_traceback);
- print("Could not open file " + newFileName + " for writing.");
- print(color.END);
- return None;
+ bucketID.append(i);
+ intervalBegin.append(lBound);
+ intervalEnd.append(uBound);
+ bucketFiles.append(fileName);
- curFileLines = curFile.readlines();
+ data = {};
+ data['bucketfiles'] = bucketFiles;
+ data['intervalbegin'] = intervalBegin;
+ data['intervalend'] = intervalEnd;
+ data['intervalnumber'] = bucketID;
- for i in range(len(curFileLines)):
- line = curFileLines[i];
+ dataframe = pd.DataFrame(data=data);
+ dataframe['intervalnumbernext'] = dataframe['intervalnumber'] + 1;
+ return dataframe;
- insertedLine = makeLineWithLinks(previous, next);
+# Generate plots of time series slices across all files for each bucket
+# in the outlier histogram. Save each cross-file slice to an HTML file.
+#
+def generateTSSlicesForBuckets():
- if "<body>" in line:
- curFileLines.insert(i+1, insertedLine);
- elif "</body>" in line:
- curFileLines.insert(i, insertedLine);
+ global firstTimeStamp;
+ global lastTimeStamp;
+ global plotWidth;
+ global pixelsPerWidthUnit;
- for line in curFileLines:
- newFile.write(line);
+ bucketFilenames = [];
- curFile.close();
- newFile.close();
+ numBuckets = plotWidth / pixelsPerWidthUnit;
+ timeUnitsPerBucket = (lastTimeStamp - firstTimeStamp) / numBuckets;
- os.rename(newFileName, current);
+ navigatorDF = createIntervalNavigatorDF(numBuckets, timeUnitsPerBucket);
-# We have a list of bucket files. Each one is an HTML file showing a slice of
-# the execution. To be able to easily navigate between consecutive execution
-# slices we insert links into each slice-file that take us to the previous
-# slice and to the next slice.
-#
-def interlinkFiles(fnameList):
+ for i in range(numBuckets):
+ lowerBound = i * timeUnitsPerBucket;
+ upperBound = (i+1) * timeUnitsPerBucket;
- for i in range(len(fnameList)):
- current = fnameList[i];
+ fileName = generateCrossFilePlotsForBucket(i, lowerBound, upperBound,
+ navigatorDF);
- if i > 0:
- previous = fnameList[i-1];
- else:
- previous = None;
+ percentComplete = float(i) / float(numBuckets) * 100;
+ print(color.BLUE + color.BOLD + " Generating timeline charts... "),
+ sys.stdout.write("%d%% complete \r" % (percentComplete) );
+ sys.stdout.flush();
+ bucketFilenames.append(fileName);
- if (i < len(fnameList)-1):
- next = fnameList[i+1];
- else:
- next = None;
+ print(color.END);
- linkFiles(current, previous, next);
+ return bucketFilenames;
def processFile(fname):
@@ -1011,13 +1074,6 @@ def main():
if not os.path.exists(bucketDir):
os.makedirs(bucketDir);
- # Copy the image files that we will need later into bucketDir
- scriptLocation = os.path.dirname(os.path.realpath(__file__));
- os.system("cp " + scriptLocation + "/" + arrowLeftImg + " " + bucketDir +
- "/" + arrowLeftImg);
- os.system("cp " + scriptLocation + "/" + arrowRightImg + " " + bucketDir +
- "/" + arrowRightImg);
-
# Parallelize this later, so we are working on files in parallel.
for fname in args.files:
processFile(fname);
@@ -1030,12 +1086,6 @@ def main():
#
fileNameList = generateTSSlicesForBuckets();
- # Rewrite the files, so that they have links to one another. This way
- # you can navigate from one slice to the next by clicking the link inside
- # the file.
- #
- interlinkFiles(fileNameList);
-
totalFuncs = len(perFuncDF.keys());
i = 0;
# Generate a histogram of outlier durations
@@ -1058,6 +1108,3 @@ def main():
if __name__ == '__main__':
main()
-
-
-