1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
|
#!/usr/bin/env python
#
# Public Domain 2014-2016 MongoDB, Inc.
# Public Domain 2008-2014 WiredTiger, Inc.
#
# This is free and unencumbered software released into the public domain.
#
# Anyone is free to copy, modify, publish, use, compile, sell, or
# distribute this software, either in source code form or as a compiled
# binary, for any purpose, commercial or non-commercial, and by any
# means.
#
# In jurisdictions that recognize copyright laws, the author or authors
# of this software dedicate any and all copyright interest in the
# software to the public domain. We make this dedication for the benefit
# of the public at large and to the detriment of our heirs and
# successors. We intend this dedication to be an overt act of
# relinquishment in perpetuity of all present and future rights to this
# software under copyright law.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
# ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
# OTHER DEALINGS IN THE SOFTWARE.
import wiredtiger, wttest
from wtdataset import SimpleDataSet
from wtscenario import make_scenarios
# test_cursor_random02.py
# Cursor next_random operations
class test_cursor_random02(wttest.WiredTigerTestCase):
    """Check that next_random cursors return a reasonably random key spread.

    The scenario lists below are combined by make_scenarios(); the test
    method reads the selected values back as self.type, self.records and
    self.config.
    """

    # Data sources to exercise.
    types = [
        ('lsm', dict(type='lsm:random')),
        ('table', dict(type='table:random')),
    ]
    # Cursor configuration under test.
    config = [
        ('not-sample', dict(config='next_random=true')),
    ]
    # Number of records to load before sampling.
    records = [
        ('1', dict(records=1)),
        ('250', dict(records=250)),
        ('500', dict(records=500)),
        ('5000', dict(records=5000)),
        ('10000', dict(records=10000)),
        ('50000', dict(records=50000)),
    ]
    scenarios = make_scenarios(config, records, types)

    # Check that next_random works in the presence of a larger set of values,
    # where the values are in an insert list.
    def test_cursor_random_reasonable_distribution(self):
        """Sample as many random keys as there are records and sanity-check
        that the results are neither sequential nor heavily concentrated.

        Two properties are asserted:
          * not every returned key is the successor of the previous one
            (only checked when there is more than one record);
          * more than a quarter of the records were returned at least once.
        """
        uri = self.type
        num_entries = self.records

        # Set the leaf-page-max value, otherwise the page might split.
        if uri == 'table:random':
            create_config = 'leaf_page_max=100MB'
        else:
            create_config = ''
        ds = SimpleDataSet(self, uri, num_entries, config=create_config)
        ds.populate()

        # Per-key hit counters, indexed by the integer value of the key.
        # One extra slot is allocated, presumably because SimpleDataSet keys
        # start at 1 rather than 0 -- confirm against wtdataset.
        visited_keys = [0] * (num_entries + 1)
        # Number of times a returned key was exactly the previous key + 1.
        sequential_keys = 0

        # Use the scenario's cursor configuration ('next_random=true') so the
        # 'config' scenario list actually drives the test.
        cursor = self.session.open_cursor(uri, None, self.config)
        last_key = None
        for _ in range(num_entries):
            self.assertEqual(cursor.next(), 0)
            current = int(cursor.get_key())
            visited_keys[current] += 1
            if last_key is not None and current == last_key + 1:
                sequential_keys += 1
            last_key = current
        # Release the cursor explicitly rather than leaving it to teardown.
        cursor.close()

        different_keys = sum(1 for hits in visited_keys if hits > 0)

        # Can't test for non-sequential data when there is 1 item in the table
        if num_entries > 1:
            self.assertGreater(num_entries - 1, sequential_keys,
                'cursor is returning sequential data')
        self.assertGreater(different_keys, num_entries / 4,
            'next_random random distribution not adequate')
# When executed directly (rather than imported), hand control to the
# wttest runner.
if __name__ == '__main__':
    wttest.run()
|