// extsort.h
/**
* Copyright (C) 2008 10gen Inc.
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License, version 3,
* as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see .
*/
#pragma once
#include "../pch.h"
#include "jsobj.h"
#include "namespace-inl.h"
#include "curop-inl.h"
#include "../util/array.h"
namespace mongo {
/**
for external (disk) sorting by BSONObj and attaching a value
*/
class BSONObjExternalSorter : boost::noncopyable {
public:
BSONObjExternalSorter( IndexInterface &i, const BSONObj & order = BSONObj() , long maxFileSize = 1024 * 1024 * 100 );
~BSONObjExternalSorter();
typedef pair Data;
private:
IndexInterface& _idxi;
static int _compare(IndexInterface& i, const Data& l, const Data& r, const Ordering& order) {
RARELY killCurrentOp.checkForInterrupt();
_compares++;
int x = i.keyCompare(l.first, r.first, order);
if ( x )
return x;
return l.second.compare( r.second );
}
class MyCmp {
public:
MyCmp( IndexInterface& i, BSONObj order = BSONObj() ) : _i(i), _order( Ordering::make(order) ) {}
bool operator()( const Data &l, const Data &r ) const {
return _compare(_i, l, r, _order) < 0;
};
private:
IndexInterface& _i;
const Ordering _order;
};
static IndexInterface *extSortIdxInterface;
static Ordering extSortOrder;
static int extSortComp( const void *lv, const void *rv ) {
DEV RARELY {
dbMutex.assertWriteLocked(); // must be as we use a global var
}
Data * l = (Data*)lv;
Data * r = (Data*)rv;
return _compare(*extSortIdxInterface, *l, *r, extSortOrder);
};
class FileIterator : boost::noncopyable {
public:
FileIterator( string file );
~FileIterator();
bool more();
Data next();
private:
MemoryMappedFile _file;
char * _buf;
char * _end;
};
public:
typedef FastArray InMemory;
class Iterator : boost::noncopyable {
public:
Iterator( BSONObjExternalSorter * sorter );
~Iterator();
bool more();
Data next();
private:
MyCmp _cmp;
vector _files;
vector< pair > _stash;
InMemory * _in;
InMemory::iterator _it;
};
void add( const BSONObj& o , const DiskLoc & loc );
void add( const BSONObj& o , int a , int b ) {
add( o , DiskLoc( a , b ) );
}
/* call after adding values, and before fetching the iterator */
void sort();
auto_ptr iterator() {
uassert( 10052 , "not sorted" , _sorted );
return auto_ptr( new Iterator( this ) );
}
int numFiles() {
return _files.size();
}
long getCurSizeSoFar() { return _curSizeSoFar; }
void hintNumObjects( long long numObjects ) {
if ( numObjects < _arraySize )
_arraySize = (int)(numObjects + 100);
}
private:
void _sortInMem();
void sort( string file );
void finishMap();
BSONObj _order;
long _maxFilesize;
path _root;
int _arraySize;
InMemory * _cur;
long _curSizeSoFar;
list _files;
bool _sorted;
static unsigned long long _compares;
};
}