move to perf because it makes debug builds fail

author: agirbal <antoine@10gen.com> 2011-12-06 15:00:13 -0800
committer: agirbal <antoine@10gen.com> 2011-12-06 15:00:13 -0800
commit: 1e2b1b04ab525f6096c5ef86b0f2f4436940d862 (patch)
tree: d792236062716a33f498c7070b72bb583a36ad69 /jstests/perf
parent: 4ee458d6b490e4ba6669f2e861dcec5cbf7142d4 (diff)
download: mongo-1e2b1b04ab525f6096c5ef86b0f2f4436940d862.tar.gz
1 files changed, 83 insertions, 0 deletions
diff --git a/jstests/perf/mr_bench.js b/jstests/perf/mr_bench.js
new file mode 100644
index 00000000000..1e24c65faf4
--- /dev/null
+++ b/jstests/perf/mr_bench.js
@@ -0,0 +1,83 @@
+
+t = db.mr_bench;
+t.drop();
+
+function getRandomStr(L){
+    var s= '';
+    var randomchar=function(){
+        var n= Math.floor(Math.random()*62);
+        if(n<10) return n; //1-10
+        if(n<36) return String.fromCharCode(n+55); //A-Z
+        return String.fromCharCode(n+61); //a-z
+    }
+    while(s.length< L) s+= randomchar();
+    return s;
+}
+
+t.ensureIndex({rand: 1}, {unique: true});
+
+largeStr = "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa";
+while (largeStr.length < 512) {
+    largeStr += largeStr;
+}
+largeStr = largeStr.substr(512);
+
+for ( i = 0; i < 100000; ++i ) {
+    t.save({rand: getRandomStr(20), same: "the same string", str: largeStr});
+}
+
+emit = printjson;
+count = t.count();
+
+function d( x ){
+    printjson( x );
+}
+
+m = function(){
+    emit(this.rand, {id: this._id, str: this.str});
+};
+
+m2 = function(){
+    emit(this.same, this.rand);
+};
+
+r = function(k,vals) {
+     var tmp = {};
+     vals.forEach(function(i) {
+        if(typeof(i) == 'string') {
+          tmp[i] = true;
+        } else {
+          for(var z in i) tmp[z] = true;
+        }
+     });
+
+     return tmp;
+}
+
+// following time limits are passing fine on a laptop with a debug build
+// so should always pass in theory unless something is wrong: GC, too much reducing, etc
+
+// 1st MR just uses random unique keys, with no reduce involved
+// this should be straightforward for perf, but could lead to OOM if settings are bad
+assert.time(
+function() { 
+res = db.runCommand( { mapreduce : "mr_bench" , map : m , reduce : r , out : "mr_bench_out" } );
+d( res );
+assert.eq( count , res.counts.input , "A" );
+x = db[res.result];
+assert.eq( count , x.find().count() , "B" );
+return 1;
+}, "unique key mr", 20000);
+
+// 2nd MR emits the same key, and a unique value is added as key to same object
+// if object is kept in ram and being reduced, this can be really slow
+assert.time(
+function() { 
+res = db.runCommand( { mapreduce : "mr_bench" , map : m2 , reduce : r , out : "mr_bench_out" } );
+d( res );
+assert.eq( count , res.counts.input , "A" );
+x = db[res.result];
+assert.eq( 1 , x.find().count() , "B" );
+return 1;
+}, "single key mr", 30000);
+
author	agirbal <antoine@10gen.com>	2011-12-06 15:00:13 -0800
committer	agirbal <antoine@10gen.com>	2011-12-06 15:00:13 -0800
commit	1e2b1b04ab525f6096c5ef86b0f2f4436940d862 (patch)
tree	d792236062716a33f498c7070b72bb583a36ad69 /jstests/perf
parent	4ee458d6b490e4ba6669f2e861dcec5cbf7142d4 (diff)
download	mongo-1e2b1b04ab525f6096c5ef86b0f2f4436940d862.tar.gz