diff options
author | agirbal <antoine@10gen.com> | 2011-12-06 15:00:13 -0800 |
---|---|---|
committer | agirbal <antoine@10gen.com> | 2011-12-06 15:00:13 -0800 |
commit | 1e2b1b04ab525f6096c5ef86b0f2f4436940d862 (patch) | |
tree | d792236062716a33f498c7070b72bb583a36ad69 /jstests/perf | |
parent | 4ee458d6b490e4ba6669f2e861dcec5cbf7142d4 (diff) | |
download | mongo-1e2b1b04ab525f6096c5ef86b0f2f4436940d862.tar.gz |
move to perf because it makes debug builds fail
Diffstat (limited to 'jstests/perf')
-rw-r--r-- | jstests/perf/mr_bench.js | 83 |
1 files changed, 83 insertions, 0 deletions
diff --git a/jstests/perf/mr_bench.js b/jstests/perf/mr_bench.js new file mode 100644 index 00000000000..1e24c65faf4 --- /dev/null +++ b/jstests/perf/mr_bench.js @@ -0,0 +1,83 @@ + +t = db.mr_bench; +t.drop(); + +function getRandomStr(L){ + var s= ''; + var randomchar=function(){ + var n= Math.floor(Math.random()*62); + if(n<10) return n; //1-10 + if(n<36) return String.fromCharCode(n+55); //A-Z + return String.fromCharCode(n+61); //a-z + } + while(s.length< L) s+= randomchar(); + return s; +} + +t.ensureIndex({rand: 1}, {unique: true}); + +largeStr = "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"; +while (largeStr.length < 512) { + largeStr += largeStr; +} +largeStr = largeStr.substr(512); + +for ( i = 0; i < 100000; ++i ) { + t.save({rand: getRandomStr(20), same: "the same string", str: largeStr}); +} + +emit = printjson; +count = t.count(); + +function d( x ){ + printjson( x ); +} + +m = function(){ + emit(this.rand, {id: this._id, str: this.str}); +}; + +m2 = function(){ + emit(this.same, this.rand); +}; + +r = function(k,vals) { + var tmp = {}; + vals.forEach(function(i) { + if(typeof(i) == 'string') { + tmp[i] = true; + } else { + for(var z in i) tmp[z] = true; + } + }); + + return tmp; +} + +// following time limits are passing fine on a laptop with a debug build +// so should always pass in theory unless something is wrong: GC, too much reducing, etc + +// 1st MR just uses random unique keys, with no reduce involved +// this should be straightforward for perf, but could lead to OOM if settings are bad +assert.time( +function() { +res = db.runCommand( { mapreduce : "mr_bench" , map : m , reduce : r , out : "mr_bench_out" } ); +d( res ); +assert.eq( count , res.counts.input , "A" ); +x = db[res.result]; +assert.eq( count , x.find().count() , "B" ); +return 1; +}, "unique key mr", 20000); + +// 2nd MR emits the same key, and a unique value is added as key to same object +// if object is kept in ram and being reduced, this can be really slow +assert.time( +function() { +res = db.runCommand( { mapreduce : "mr_bench" , map : m2 , reduce : r , out : "mr_bench_out" } ); +d( res ); +assert.eq( count , res.counts.input , "A" ); +x = db[res.result]; +assert.eq( 1 , x.find().count() , "B" ); +return 1; +}, "single key mr", 30000); + |