1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
|
// mr.js
// Helper routines for map/reduce: buffering emitted values, reducing them
// in memory or into `tempcoll`, and finalizing the stored results.

// Namespace object; every helper in this file is attached to it as MR.<name>.
MR = {};
/**
 * Resets all map/reduce bookkeeping held in the enclosing scope: the
 * per-key buffer ($arr), the largest buffered value count ($max), the
 * emit/reduce counters, and the bare `emit` binding.
 *
 * The names are assigned without `var` on purpose so that they live in the
 * surrounding scope and are shared with the other MR helpers.
 */
MR.init = function(){
    // Statistics counters.
    $numEmits = 0;
    $numReduces = 0;
    $numReducesToDB = 0;

    // Buffered state: no buckets yet, so the largest bucket size is zero.
    $arr = [];
    $max = 0;

    // Make MR.emit reachable under the bare name `emit`
    // (presumably what user map functions call -- confirm against the caller).
    emit = MR.emit;

    // Collect garbage right away purely to keep the memory footprint sane.
    gc();
};
/**
 * Tears down map/reduce state: re-runs MR.init() to drop the buffers and
 * zero the counters, then requests one more garbage collection.
 */
MR.cleanup = function(){
    // Resetting through init() releases the references held in the buffer.
    MR.init();

    // Explicit collection after the reset.
    gc();
};
/**
 * Buffers one emitted value under its key.
 *
 * @param k  key being emitted
 * @param v  value appended to that key's pending values
 *
 * Side effects: increments $numEmits, may create a new bucket in $arr, and
 * raises $max when this bucket becomes the largest one.
 */
MR.emit = function(k,v){
    $numEmits++;

    // get_num_ is invoked through nativeHelper; its result is used as the
    // index of this key's bucket in $arr (presumably stable per key -- the
    // helper itself is defined outside this file).
    var slot = nativeHelper.apply( get_num_ , [ k ] );
    var bucket = $arr[slot];

    if ( ! bucket ){
        // First value seen for this slot: start a bucket with a values
        // array pre-sized to 1000 entries.
        bucket = $arr[slot] = { key : k , values : new Array(1000) , count : 0 };
    }

    // Append at the current fill position, then advance it.
    bucket.values[bucket.count] = v;
    bucket.count++;

    $max = Math.max( $max , bucket.count );
};
/**
 * Runs the user-supplied $reduce over every buffered key and stores the
 * result back into that key's bucket.
 *
 * @param useDB  when truthy, the value previously saved for the key in
 *               tempcoll is added to the reduce input, and the new result
 *               is written back to tempcoll.
 *
 * A non-empty array returned by $reduce is kept as several pending values
 * for the key; anything else (including an empty array) is kept as a single
 * value.
 *
 * Side effects: increments $numReduces (and $numReducesToDB when useDB is
 * set) and recomputes $max as the largest per-key value count afterwards.
 */
MR.doReduce = function( useDB ){
    $numReduces++;
    if ( useDB )
        $numReducesToDB++;

    $max = 0;

    for ( var i=0; i<$arr.length; i++){
        var data = $arr[i];
        if ( ! data )
            continue; // slot never used

        if ( useDB ){
            // Fold the previously persisted value into this round's input.
            // NOTE(review): a multi-value array saved earlier is appended
            // here as ONE element rather than spread -- confirm that is the
            // intended contract for $reduce.
            var x = tempcoll.findOne( { _id : data.key } );
            if ( x ){
                data.values[data.count++] = x.value;
            }
        }

        var r = $reduce( data.key , data.values.slice( 0 , data.count ) );

        // Use a real array test. The former duck-typed check
        // (r && r.length && r[0]) mistook non-empty strings and other
        // array-likes for arrays, which replaced data.values with a
        // primitive and silently dropped later writes. It also treated
        // arrays whose first element is falsy (e.g. [0, 5]) as scalars.
        // Object.prototype.toString keeps this working on engines that
        // lack Array.isArray.
        var isArray = Object.prototype.toString.call( r ) === "[object Array]";

        if ( isArray && r.length > 0 ){
            data.values = r;
            data.count = r.length;
        }
        else {
            data.values[0] = r;
            data.count = 1;
        }

        $max = Math.max( $max , data.count );

        if ( useDB ){
            if ( data.count === 1 ){
                // A single value is stored bare, not wrapped in an array.
                tempcoll.save( { _id : data.key , value : data.values[0] } );
            }
            else {
                tempcoll.save( { _id : data.key , value : data.values.slice( 0 , data.count ) } );
            }
        }
    }
};
/**
 * Checks the size of the in-memory buffer and reduces or flushes it when it
 * has grown past the limits.
 *
 * @return 0 when the buffer was within limits and nothing was done,
 *         1 when an in-memory reduce brought it back within limits,
 *         2 when it was reduced into tempcoll and the buffer was cleared.
 */
MR.check = function(){
    // Within limits: the largest bucket holds fewer than 2000 values and
    // $arr has fewer than 1000 slots.
    var withinLimits = function(){
        return $max < 2000 && $arr.length < 1000;
    };

    if ( withinLimits() )
        return 0;

    // First try to shrink the buckets purely in memory.
    MR.doReduce();
    if ( withinLimits() )
        return 1;

    // Still too large: reduce into tempcoll, then start over with an
    // empty buffer.
    MR.doReduce( true );

    $max = 0;
    $arr = [];
    reset_num();
    gc();

    return 2;
};
/**
 * Applies the user-supplied $finalize to every document in tempcoll and
 * saves each document back with its finalized value.
 */
MR.finalize = function(){
    // Replace the stored value with $finalize(key, value) and persist it.
    var finalizeDoc = function( doc ){
        doc.value = $finalize( doc._id , doc.value );
        tempcoll.save( doc );
    };

    var cursor = tempcoll.find();
    cursor.forEach( finalizeDoc );
};
|