1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
|
/**
* Copyright (C) 2008 10gen Inc.
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License, version 3,
* as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
* As a special exception, the copyright holders give permission to link the
* code of portions of this program with the OpenSSL library under certain
* conditions as described in each individual source file and distribute
* linked combinations including the program with the OpenSSL library. You
* must comply with the GNU Affero General Public License in all respects for
* all of the code used other than as permitted herein. If you modify file(s)
* with this exception, you may extend this exception to your version of the
* file(s), but you are not obligated to do so. If you do not wish to do so,
* delete this exception statement from your version. If you delete this
* exception statement from all source files in the program, then also delete
* it in the license file.
*/
#pragma once
#include <boost/optional.hpp>
#include "mongo/client/dbclientinterface.h"
#include "mongo/db/auth/user_name.h"
#include "mongo/db/cursor_id.h"
#include "mongo/db/jsobj.h"
#include "mongo/db/logical_session_id.h"
#include "mongo/db/query/plan_executor.h"
#include "mongo/db/record_id.h"
#include "mongo/stdx/functional.h"
#include "mongo/util/net/message.h"
namespace mongo {
class Collection;
class CursorManager;
class RecoveryUnit;
/**
* Parameters used for constructing a ClientCursor. Makes an owned copy of 'originatingCommandObj'
* to be used across getMores.
*
* ClientCursors cannot be constructed in isolation, but rather must be
* constructed and managed using a CursorManager. See cursor_manager.h for more details.
*/
struct ClientCursorParams {
ClientCursorParams(std::unique_ptr<PlanExecutor, PlanExecutor::Deleter> planExecutor,
NamespaceString nss,
UserNameIterator authenticatedUsersIter,
bool isReadCommitted,
BSONObj originatingCommandObj)
: exec(std::move(planExecutor)),
nss(std::move(nss)),
isReadCommitted(isReadCommitted),
queryOptions(exec->getCanonicalQuery()
? exec->getCanonicalQuery()->getQueryRequest().getOptions()
: 0),
originatingCommandObj(originatingCommandObj.getOwned()) {
while (authenticatedUsersIter.more()) {
authenticatedUsers.emplace_back(authenticatedUsersIter.next());
}
}
void setTailable(bool tailable) {
if (tailable)
queryOptions |= QueryOption_CursorTailable;
else
queryOptions &= ~QueryOption_CursorTailable;
}
void setAwaitData(bool awaitData) {
if (awaitData)
queryOptions |= QueryOption_AwaitData;
else
queryOptions &= ~QueryOption_AwaitData;
}
std::unique_ptr<PlanExecutor, PlanExecutor::Deleter> exec;
const NamespaceString nss;
std::vector<UserName> authenticatedUsers;
bool isReadCommitted = false;
int queryOptions = 0;
BSONObj originatingCommandObj;
};
/**
* A ClientCursor is the server-side state associated with a particular cursor id. A cursor id is a
* handle that we return to the client for queries which require results to be returned in multiple
* batches. The client can manage the server-side cursor state by passing the cursor id back to the
* server for certain supported operations.
*
* For instance, a client can retrieve the next batch of results from the cursor by issuing a
* getMore on this cursor id. It can also request that server-side resources be freed by issuing a
* killCursors on a particular cursor id. This is useful if the client wishes to abandon the cursor
* without retrieving all results.
*
* ClientCursors cannot exist in isolation and must be created, accessed, and destroyed via a
* CursorManager. See cursor_manager.h for more details. Unless the ClientCursor is marked by the
* caller as "no timeout", it will be automatically destroyed by its cursor manager after a period
* of inactivity.
*/
class ClientCursor {
MONGO_DISALLOW_COPYING(ClientCursor);
public:
CursorId cursorid() const {
return _cursorid;
}
const NamespaceString& nss() const {
return _nss;
}
UserNameIterator getAuthenticatedUsers() const {
return makeUserNameIterator(_authenticatedUsers.begin(), _authenticatedUsers.end());
}
boost::optional<LogicalSessionId> getSessionId() const {
return _lsid;
}
bool isReadCommitted() const {
return _isReadCommitted;
}
/**
* Returns a pointer to the underlying query plan executor. All cursors manage a PlanExecutor,
* so this method never returns a null pointer.
*/
PlanExecutor* getExecutor() const {
return _exec.get();
}
/**
* Returns the query options bitmask. If you'd like to know if the cursor is tailable or
* awaitData, prefer using the specific methods isTailable() and isAwaitData() over using this
* method.
*/
int queryOptions() const {
return _queryOptions;
}
bool isTailable() const {
return _queryOptions & QueryOption_CursorTailable;
}
bool isAwaitData() const {
return _queryOptions & QueryOption_AwaitData;
}
const BSONObj& getOriginatingCommandObj() const {
return _originatingCommand;
}
/**
* Returns the total number of query results returned by the cursor so far.
*/
long long pos() const {
return _pos;
}
/**
* Increments the cursor's tracked number of query results returned so far by 'n'.
*/
void incPos(long long n) {
_pos += n;
}
/**
* Sets the cursor's tracked number of query results returned so far to 'n'.
*/
void setPos(long long n) {
_pos = n;
}
//
// Timing.
//
/**
* Returns the amount of time execution time available to this cursor. Only valid at the
* beginning of a getMore request, and only really for use by the maxTime tracking code.
*
* Microseconds::max() == infinity, values less than 1 mean no time left.
*/
Microseconds getLeftoverMaxTimeMicros() const {
return _leftoverMaxTimeMicros;
}
/**
* Sets the amount of execution time available to this cursor. This is only called when an
* operation that uses a cursor is finishing, to update its remaining time.
*
* Microseconds::max() == infinity, values less than 1 mean no time left.
*/
void setLeftoverMaxTimeMicros(Microseconds leftoverMaxTimeMicros) {
_leftoverMaxTimeMicros = leftoverMaxTimeMicros;
}
//
// Replication-related methods.
//
// Used to report replication position only in master-slave, so we keep them as TimeStamp rather
// than OpTime.
void updateSlaveLocation(OperationContext* opCtx);
void slaveReadTill(const Timestamp& t) {
_slaveReadTill = t;
}
/** Just for testing. */
Timestamp getSlaveReadTill() const {
return _slaveReadTill;
}
/**
* Returns the server-wide the count of living cursors. Such a cursor is called an "open
* cursor".
*/
static long long totalOpen();
friend std::size_t partitionOf(const ClientCursor* cursor) {
return cursor->cursorid();
}
private:
friend class CursorManager;
friend class ClientCursorPin;
/**
* Since the client cursor destructor is private, this is needed for using client cursors with
* smart pointers.
*/
struct Deleter {
void operator()(ClientCursor* cursor) {
delete cursor;
}
};
/**
* Constructs a ClientCursor. Since cursors must come into being registered and pinned, this is
* private. See cursor_manager.h for more details.
*/
ClientCursor(ClientCursorParams params,
CursorManager* cursorManager,
CursorId cursorId,
OperationContext* operationUsingCursor,
Date_t now);
/**
* Destroys a ClientCursor. This is private, since only the CursorManager or the ClientCursorPin
* is allowed to destroy a cursor.
*
* Cursors must be unpinned and deregistered from the CursorManager before they can be
* destroyed.
*/
~ClientCursor();
/**
* Marks this cursor as killed, so any future uses will return 'killStatus'. It is an error to
* call this method with Status::OK.
*/
void markAsKilled(Status killStatus);
/**
* Disposes this ClientCursor's PlanExecutor. Must be called before deleting a ClientCursor to
* ensure it has a chance to clean up any resources it is using. Can be called multiple times.
* It is an error to call any other method after calling dispose().
*/
void dispose(OperationContext* opCtx);
bool isNoTimeout() const {
return (_queryOptions & QueryOption_NoCursorTimeout);
}
// The ID of the ClientCursor. A value of 0 is used to mean that no cursor id has been assigned.
CursorId _cursorid = 0;
// Threads may read from this field even if they don't have the cursor pinned, as long as they
// have the correct partition of the CursorManager locked (just like _authenticatedUsers).
const NamespaceString _nss;
// The set of authenticated users when this cursor was created. Threads may read from this
// field (using the getter) even if they don't have the cursor pinned as long as they hold the
// correct partition's lock in the CursorManager. They must hold the lock to prevent the cursor
// from being freed by another thread during the read.
const std::vector<UserName> _authenticatedUsers;
// A logical session id for this cursor, if it is running inside of a session.
const boost::optional<LogicalSessionId> _lsid;
const bool _isReadCommitted = false;
CursorManager* _cursorManager;
// Tracks whether dispose() has been called, to make sure it happens before destruction. It is
// an error to use a ClientCursor once it has been disposed.
bool _disposed = false;
// Tracks the number of results returned by this cursor so far.
long long _pos = 0;
// Holds an owned copy of the command specification received from the client.
const BSONObj _originatingCommand;
// See the QueryOptions enum in dbclientinterface.h.
const int _queryOptions = 0;
// The replication position only used in master-slave.
Timestamp _slaveReadTill;
// Unused maxTime budget for this cursor.
Microseconds _leftoverMaxTimeMicros = Microseconds::max();
// The underlying query execution machinery. Must be non-null.
std::unique_ptr<PlanExecutor, PlanExecutor::Deleter> _exec;
//
// The following fields are used by the CursorManager and the ClientCursorPin. In most
// conditions, they can only be used while holding the CursorManager's mutex. Exceptions
// include:
// - If the ClientCursor is pinned, the CursorManager will never change '_isPinned' until
// asked to by the ClientCursorPin.
// - It is safe to read '_killed' while holding a collection lock, which must be held when
// interacting with a ClientCursorPin.
// - A ClientCursorPin can access these members after deregistering the cursor from the
// CursorManager, at which point it has sole ownership of the ClientCursor.
//
// While a cursor is being used by a client, it is marked as "pinned" by setting
// _operationUsingCursor to the current OperationContext.
//
// Cursors always come into existence in a pinned state (this must be non-null at construction).
//
// To write to this field one of the following must be true:
// 1) You have a lock on the appropriate partition in CursorManager and the cursor is unpinned
// (the field is null).
// 2) You own the cursor and the cursor manager it was associated with is gone (this can only
// happen in ClientCursorPin). In this case, nobody else will try to pin the cursor.
//
// To read this field one of the following must be true:
// 1) You have a lock on the appropriate partition in CursorManager.
// 2) You know you have the cursor pinned.
OperationContext* _operationUsingCursor;
Date_t _lastUseDate;
};
/**
* ClientCursorPin is an RAII class which must be used in order to access a cursor. On
* construction, the ClientCursorPin marks its cursor as in use, which is called "pinning" the
* cursor. On destruction, the ClientCursorPin marks its cursor as no longer in use, which is
* called "unpinning" the cursor. Pinning is used to prevent multiple concurrent uses of the same
* cursor--- pinned cursors cannot be deleted or timed out and cannot be used concurrently by other
* operations such as getMore. They can however, be marked as interrupted and instructed to destroy
* themselves through killCursors.
*
* A pin is obtained using the CursorManager. See cursor_manager.h for more details.
*
* A pin extends the lifetime of a ClientCursor object until the pin's release. Pinned ClientCursor
* objects cannot not be killed due to inactivity, and cannot be immediately erased by user kill
* requests (though they can be marked as interrupted). When a CursorManager is destroyed (e.g. by
* a collection drop), ownership of any still-pinned ClientCursor objects is transferred to their
* managing ClientCursorPin objects.
*
* Example usage:
* {
* StatusWith<ClientCursorPin> pin = cursorManager->pinCursor(opCtx, cursorid);
* if (!pin.isOK()) {
* // No cursor with id 'cursorid' exists, or it was killed while inactive. Handle the error
* here.
* return pin.getStatus();
* }
*
* ClientCursor* cursor = pin.getValue().getCursor();
* // Use cursor. Pin automatically released on block exit.
* }
*
* Clients that wish to access ClientCursor objects owned by collection cursor managers must hold
* the collection lock while calling any pin method, including pin acquisition by the RAII
* constructor and pin release by the RAII destructor. This guards from a collection drop (which
* requires an exclusive lock on the collection) occurring concurrently with the pin request or
* unpin request.
*
* Clients that wish to access ClientCursor objects owned by the global cursor manager need not
* hold any locks; the global cursor manager can only be destroyed by a process exit.
*/
class ClientCursorPin {
MONGO_DISALLOW_COPYING(ClientCursorPin);
public:
/**
* Moves 'other' into 'this'. The 'other' pin must have a pinned cursor. Moving an empty pin
* into 'this' is illegal.
*/
ClientCursorPin(ClientCursorPin&& other);
/**
* Moves 'other' into 'this'. 'other' must have a pinned cursor and 'this' must have no pinned
* cursor.
*/
ClientCursorPin& operator=(ClientCursorPin&& other);
/**
* Calls release().
*/
~ClientCursorPin();
/**
* Releases the pin. It does not delete the underlying cursor unless ownership has passed
* to us after kill. Turns into a no-op if release() or deleteUnderlying() have already
* been called on this pin.
*/
void release();
/**
* Deletes the underlying cursor. Cannot be called if release() or deleteUnderlying() have
* already been called on this pin.
*/
void deleteUnderlying();
/**
* Returns a pointer to the pinned cursor.
*/
ClientCursor* getCursor() const;
private:
friend class CursorManager;
ClientCursorPin(OperationContext* opCtx, ClientCursor* cursor);
OperationContext* _opCtx = nullptr;
ClientCursor* _cursor = nullptr;
};
void startClientCursorMonitor();
} // namespace mongo
|