/**
* Copyright (C) 2008 10gen Inc.
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License, version 3,
* as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see .
*/
#include "mongo/pch.h"
#include "mongo/db/btreecursor.h"
#include "mongo/db/btree.h"
#include "mongo/db/curop-inl.h"
#include "mongo/db/kill_current_op.h"
#include "mongo/db/pdfile.h"
#include "mongo/db/queryutil.h"
namespace mongo {
template< class V >
class BtreeCursorImpl : public BtreeCursor {
public:
typedef typename BucketBasics::KeyNode KeyNode;
typedef typename V::Key Key;
typedef typename V::_KeyNode _KeyNode;
BtreeCursorImpl( NamespaceDetails* a , int b, const IndexDetails& c )
: BtreeCursor(a,b,c){
}
void init(const BSONObj &d, const BSONObj &e, bool f, int g) {
BtreeCursor::init(d,e,f,g);
}
void init( const shared_ptr< FieldRangeVector >& bounds, int singleIntervalLimit, int direction ) {
BtreeCursor::init(bounds,singleIntervalLimit,direction );
pair< DiskLoc, int > noBestParent;
indexDetails.head.btree()->customLocate( bucket, keyOfs, startKey, 0, false, _boundsIterator->cmp(), _boundsIterator->inc(), _ordering, direction, noBestParent );
skipAndCheck();
dassert( _dups.size() == 0 );
}
virtual DiskLoc currLoc() {
if( bucket.isNull() ) return DiskLoc();
return currKeyNode().recordLoc;
}
virtual BSONObj keyAt(int ofs) const {
verify( !bucket.isNull() );
const BtreeBucket *b = bucket.btree();
int n = b->getN();
if( n == b->INVALID_N_SENTINEL ) {
throw UserException(15850, "keyAt bucket deleted");
}
dassert( n >= 0 && n < 10000 );
return ofs >= n ? BSONObj() : b->keyNode(ofs).key.toBson();
}
virtual BSONObj currKey() const {
verify( !bucket.isNull() );
return bucket.btree()->keyNode(keyOfs).key.toBson();
}
virtual bool curKeyHasChild() {
return !currKeyNode().prevChildBucket.isNull();
}
bool skipUnusedKeys() {
int u = 0;
while ( 1 ) {
if ( !ok() )
break;
const _KeyNode& kn = keyNode(keyOfs);
if ( kn.isUsed() )
break;
bucket = _advance(bucket, keyOfs, _direction, "skipUnusedKeys");
u++;
//don't include unused keys in nscanned
//++_nscanned;
}
if ( u > 10 )
OCCASIONALLY log() << "btree unused skipped:" << u << endl;
return u;
}
/* Since the last noteLocation(), our key may have moved around, and that old cached
information may thus be stale and wrong (although often it is right). We check
that here; if we have moved, we have to search back for where we were at.
i.e., after operations on the index, the BtreeCursor's cached location info may
be invalid. This function ensures validity, so you should call it before using
the cursor if other writers have used the database since the last noteLocation
call.
*/
void checkLocation() {
if ( eof() )
return;
_multikey = d->isMultikey(idxNo);
if ( keyOfs >= 0 ) {
verify( !keyAtKeyOfs.isEmpty() );
try {
// Note keyAt() returns an empty BSONObj if keyOfs is now out of range,
// which is possible as keys may have been deleted.
int x = 0;
while( 1 ) {
// if ( b->keyAt(keyOfs).woEqual(keyAtKeyOfs) &&
// b->k(keyOfs).recordLoc == locAtKeyOfs ) {
if ( keyAt(keyOfs).binaryEqual(keyAtKeyOfs) ) {
const _KeyNode& kn = keyNode(keyOfs);
if( kn.recordLoc == locAtKeyOfs ) {
if ( !kn.isUsed() ) {
// we were deleted but still exist as an unused
// marker key. advance.
skipUnusedKeys();
}
return;
}
}
// we check one key earlier too, in case a key was just deleted. this is
// important so that multi updates are reasonably fast.
if( keyOfs == 0 || x++ )
break;
keyOfs--;
}
}
catch(UserException& e) {
if( e.getCode() != 15850 )
throw;
// hack: fall through if bucket was just deleted. should only happen under deleteObjects()
DEV log() << "debug info: bucket was deleted" << endl;
}
}
/* normally we don't get to here. when we do, old position is no longer
valid and we must refind where we left off (which is expensive)
*/
/* TODO: Switch to keep indexdetails and do idx.head! */
bucket = _locate(keyAtKeyOfs, locAtKeyOfs);
RARELY log() << "key seems to have moved in the index, refinding. " << bucket.toString() << endl;
if ( ! bucket.isNull() )
skipUnusedKeys();
}
protected:
virtual void _advanceTo(DiskLoc &thisLoc, int &keyOfs, const BSONObj &keyBegin, int keyBeginLen, bool afterKey, const vector< const BSONElement * > &keyEnd, const vector< bool > &keyEndInclusive, const Ordering &order, int direction ) {
thisLoc.btree()->advanceTo(thisLoc, keyOfs, keyBegin, keyBeginLen, afterKey, keyEnd, keyEndInclusive, order, direction);
}
virtual DiskLoc _advance(const DiskLoc& thisLoc, int& keyOfs, int direction, const char *caller) {
return thisLoc.btree()->advance(thisLoc, keyOfs, direction, caller);
}
virtual void _audit() {
out() << "BtreeCursor(). dumping head bucket" << endl;
indexDetails.head.btree()->dump();
}
virtual DiskLoc _locate(const BSONObj& key, const DiskLoc& loc) {
bool found;
return indexDetails.head.btree()->
locate(indexDetails, indexDetails.head, key, _ordering, keyOfs, found, loc, _direction);
}
const _KeyNode& keyNode(int keyOfs) const {
return bucket.btree()->k(keyOfs);
}
private:
const KeyNode currKeyNode() const {
verify( !bucket.isNull() );
const BtreeBucket *b = bucket.btree();
return b->keyNode(keyOfs);
}
};
template class BtreeCursorImpl;
template class BtreeCursorImpl;
BtreeCursor* BtreeCursor::make( NamespaceDetails * nsd , int idxNo , const IndexDetails& indexDetails ) {
int v = indexDetails.version();
if( v == 1 )
return new BtreeCursorImpl( nsd , idxNo , indexDetails );
if( v == 0 )
return new BtreeCursorImpl( nsd , idxNo , indexDetails );
dassert( IndexDetails::isASupportedIndexVersionNumber(v) );
uasserted(14800, str::stream() << "unsupported index version " << v);
return 0; // not reachable
}
BtreeCursor* BtreeCursor::make( NamespaceDetails* namespaceDetails,
const IndexDetails& id,
const BSONObj& startKey,
const BSONObj& endKey,
bool endKeyInclusive,
int direction ) {
auto_ptr c( make( namespaceDetails, namespaceDetails->idxNo( id ), id ) );
c->init(startKey,endKey,endKeyInclusive,direction);
c->initWithoutIndependentFieldRanges();
dassert( c->_dups.size() == 0 );
return c.release();
}
BtreeCursor* BtreeCursor::make( NamespaceDetails* namespaceDetails,
const IndexDetails& id,
const shared_ptr& bounds,
int singleIntervalLimit,
int direction )
{
auto_ptr c( make( namespaceDetails, namespaceDetails->idxNo( id ), id ) );
c->init(bounds,singleIntervalLimit,direction);
return c.release();
}
BtreeCursor::BtreeCursor( NamespaceDetails* nsd, int theIndexNo, const IndexDetails& id ) :
d( nsd ),
idxNo( theIndexNo ),
indexDetails( id ),
_ordering( Ordering::make( BSONObj() ) ),
_boundsMustMatch( true ),
_nscanned() {
}
void BtreeCursor::_finishConstructorInit() {
_multikey = d->isMultikey( idxNo );
_order = indexDetails.keyPattern();
_ordering = Ordering::make( _order );
}
void BtreeCursor::init( const BSONObj& sk, const BSONObj& ek, bool endKeyInclusive, int direction ) {
_finishConstructorInit();
startKey = sk;
endKey = ek;
_endKeyInclusive = endKeyInclusive;
_direction = direction;
_independentFieldRanges = false;
audit();
}
void BtreeCursor::init( const shared_ptr< FieldRangeVector > &bounds, int singleIntervalLimit, int direction ) {
_finishConstructorInit();
_bounds = bounds;
verify( _bounds );
_direction = direction;
_endKeyInclusive = true;
_boundsIterator.reset( new FieldRangeVectorIterator( *_bounds , singleIntervalLimit ) );
_independentFieldRanges = true;
audit();
startKey = _bounds->startKey();
_boundsIterator->advance( startKey ); // handles initialization
_boundsIterator->prepDive();
bucket = indexDetails.head;
keyOfs = 0;
}
/** Properly destroy forward declared class members. */
BtreeCursor::~BtreeCursor() {}
void BtreeCursor::audit() {
dassert( d->idxNo((IndexDetails&) indexDetails) == idxNo );
}
void BtreeCursor::initWithoutIndependentFieldRanges() {
if ( indexDetails.getSpec().getType() ) {
startKey = indexDetails.getSpec().getType()->fixKey( startKey );
endKey = indexDetails.getSpec().getType()->fixKey( endKey );
}
bucket = _locate(startKey, _direction > 0 ? minDiskLoc : maxDiskLoc);
if ( ok() ) {
_nscanned = 1;
}
skipUnusedKeys();
checkEnd();
}
void BtreeCursor::skipAndCheck() {
long long startNscanned = _nscanned;
skipUnusedKeys();
while( 1 ) {
if ( !skipOutOfRangeKeysAndCheckEnd() ) {
break;
}
do {
// If nscanned is increased by more than 20 before a matching key is found, abort
// skipping through the btree to find a matching key. This iteration cutoff
// prevents unbounded internal iteration within BtreeCursor::init() and
// BtreeCursor::advance() (the callers of skipAndCheck()). See SERVER-3448.
if ( _nscanned > startNscanned + 20 ) {
skipUnusedKeys();
// If iteration is aborted before a key matching _bounds is identified, the
// cursor may be left pointing at a key that is not within bounds
// (_bounds->matchesKey( currKey() ) may be false). Set _boundsMustMatch to
// false accordingly.
_boundsMustMatch = false;
return;
}
} while( skipOutOfRangeKeysAndCheckEnd() );
if ( !skipUnusedKeys() ) {
break;
}
}
}
bool BtreeCursor::skipOutOfRangeKeysAndCheckEnd() {
if ( !ok() ) {
return false;
}
int ret = _boundsIterator->advance( currKey() );
if ( ret == -2 ) {
bucket = DiskLoc();
return false;
}
else if ( ret == -1 ) {
++_nscanned;
return false;
}
++_nscanned;
advanceTo( currKey(), ret, _boundsIterator->after(), _boundsIterator->cmp(), _boundsIterator->inc() );
return true;
}
// Return a value in the set {-1, 0, 1} to represent the sign of parameter i.
int sgn( int i ) {
if ( i == 0 )
return 0;
return i > 0 ? 1 : -1;
}
// Check if the current key is beyond endKey.
void BtreeCursor::checkEnd() {
if ( bucket.isNull() )
return;
if ( !endKey.isEmpty() ) {
int cmp = sgn( endKey.woCompare( currKey(), _order ) );
if ( ( cmp != 0 && cmp != _direction ) ||
( cmp == 0 && !_endKeyInclusive ) )
bucket = DiskLoc();
}
}
void BtreeCursor::advanceTo( const BSONObj &keyBegin, int keyBeginLen, bool afterKey, const vector< const BSONElement * > &keyEnd, const vector< bool > &keyEndInclusive) {
_advanceTo( bucket, keyOfs, keyBegin, keyBeginLen, afterKey, keyEnd, keyEndInclusive, _ordering, _direction );
}
bool BtreeCursor::advance() {
// Reset this flag at the start of a new iteration.
_boundsMustMatch = true;
killCurrentOp.checkForInterrupt();
if ( bucket.isNull() )
return false;
bucket = _advance(bucket, keyOfs, _direction, "BtreeCursor::advance");
if ( !_independentFieldRanges ) {
skipUnusedKeys();
checkEnd();
if ( ok() ) {
++_nscanned;
}
}
else {
skipAndCheck();
}
return ok();
}
void BtreeCursor::noteLocation() {
if ( !eof() ) {
BSONObj o = currKey().getOwned();
keyAtKeyOfs = o;
locAtKeyOfs = currLoc();
}
}
string BtreeCursor::toString() {
string s = string("BtreeCursor ") + indexDetails.indexName();
if ( _direction < 0 ) s += " reverse";
if ( _bounds.get() && _bounds->size() > 1 ) s += " multi";
return s;
}
BSONObj BtreeCursor::prettyIndexBounds() const {
if ( !_independentFieldRanges ) {
return BSON( "start" << prettyKey( startKey ) << "end" << prettyKey( endKey ) );
}
else {
return _bounds->obj();
}
}
bool BtreeCursor::currentMatches( MatchDetails* details ) {
// If currKey() might not match the specified _bounds, check whether or not it does.
if ( !_boundsMustMatch && _bounds && !_bounds->matchesKey( currKey() ) ) {
// If the key does not match _bounds, it does not match the query.
return false;
}
// Forward to the base class implementation, which may utilize a Matcher.
return Cursor::currentMatches( details );
}
/* ----------------------------------------------------------------------------- */
struct BtreeCursorUnitTest {
BtreeCursorUnitTest() {
verify( minDiskLoc.compare(maxDiskLoc) < 0 );
}
} btut;
} // namespace mongo