1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
|
#!/usr/bin/env python
#
# Public Domain 2014-2016 MongoDB, Inc.
# Public Domain 2008-2014 WiredTiger, Inc.
#
# This is free and unencumbered software released into the public domain.
#
# Anyone is free to copy, modify, publish, use, compile, sell, or
# distribute this software, either in source code form or as a compiled
# binary, for any purpose, commercial or non-commercial, and by any
# means.
#
# In jurisdictions that recognize copyright laws, the author or authors
# of this software dedicate any and all copyright interest in the
# software to the public domain. We make this dedication for the benefit
# of the public at large and to the detriment of our heirs and
# successors. We intend this dedication to be an overt act of
# relinquishment in perpetuity of all present and future rights to this
# software under copyright law.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
# ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
# OTHER DEALINGS IN THE SOFTWARE.
import os
import wiredtiger, wttest, run
from wtscenario import make_scenarios
# test_join09.py
# Join bloom filters with false positives
class test_join09(wttest.WiredTigerTestCase):
    """Join bloom filters with false positives.

    A table with two string value columns, each indexed, is populated and
    then read through a join cursor that combines both indices.  The same
    test body is run once per entry in ``bloomscen``.
    """

    # Number of rows inserted by populate(); keys are 0 .. nentries - 1.
    nentries = 1000

    # Each scenario supplies the two settings that test_join reads as
    # self.false_positives and self.config (presumably attached to the test
    # instance by the scenario machinery -- confirm in wtscenario/wttest):
    #   false_positives - whether results outside the expected set are
    #                     tolerated (and in fact required to occur)
    #   config          - extra configuration appended to the second join
    bloomscen = [
        ('nobloom', dict(false_positives=False, config='')),
        ('bloom1000', dict(false_positives=False,
            config='strategy=bloom,count=1000')),
        ('bloom10fp', dict(false_positives=True,
            config='strategy=bloom,count=10,bloom_false_positives=true'))
    ]

    scenarios = make_scenarios(bloomscen)

    def gen_values(self, i):
        """Return the two column values stored under integer key ``i``.

        The first value is the decimal string form of ``i``; the second is
        the first character of that string repeated three times.
        """
        s = str(i)          # 345 => "345"
        f = s[0:1] * 3      # 345 => "333"
        return [s, f]

    def populate(self, s, gen_values):
        """Insert ``self.nentries`` rows into ``table:join09``.

        ``s`` is the session used to open the cursor and ``gen_values`` is
        a callable mapping a key to the list of values for that row.
        """
        c = s.open_cursor('table:join09', None, None)
        for i in range(0, self.nentries):
            c.set_key(i)
            c.set_value(*gen_values(i))
            c.insert()
        c.close()

    # Common function for testing the most basic functionality
    # of joins.
    #
    # NOTE: this description is deliberately a comment and not a docstring,
    # because unittest uses a test method's docstring in place of its name
    # in verbose output.
    def test_join(self):
        self.session.create('table:join09',
            'columns=(k,v0,v1),key_format=i,value_format=SS')
        self.session.create('index:join09:index0', 'columns=(v0)')
        self.session.create('index:join09:index1', 'columns=(v1)')

        self.populate(self.session, self.gen_values)

        jc = self.session.open_cursor('join:table:join09', None, None)

        # First join condition: v0 >= '520'.
        c0 = self.session.open_cursor('index:join09:index0', None, None)
        c0.set_key('520')
        self.assertEqual(0, c0.search())
        self.session.join(jc, c0, 'compare=ge')

        # Second join condition: v1 == '555', optionally backed by the
        # bloom filter settings of the current scenario.
        joinconfig = 'compare=eq,' + self.config
        c1 = self.session.open_cursor('index:join09:index1', None, None)
        c1.set_key('555')
        self.assertEqual(0, c1.search())
        self.session.join(jc, c1, joinconfig)

        # Keys expected from the join.  v1 == '555' selects keys whose
        # first digit is 5.  NOTE(review): the v0 column is a string, so
        # the 'ge' comparison is presumably lexicographic, which is why
        # 53..59 ('53' >= '520') qualify alongside 520..599 -- confirm.
        mbr = set(range(520, 600)) | set(range(53, 60))

        fp_count = 0
        while jc.next() == 0:
            [k] = jc.get_keys()
            [v0, v1] = jc.get_values()
            self.assertEqual(self.gen_values(k), [v0, v1])
            if k not in mbr:
                # With false positives, we can see extra values
                if self.false_positives:
                    fp_count += 1
                    continue
                self.tty('**** ERROR: result ' + str(k) + ' is not in: ' +
                         str(mbr))
            self.assertTrue(k in mbr)
            # Removing the key means a duplicate result fails the
            # membership assertion above on its second appearance.
            mbr.remove(k)

        if mbr:
            self.tty('**** ERROR: did not see these: ' + str(mbr))
        self.assertEqual(0, len(mbr))

        # Turning on false positives does not guarantee we'll see extra
        # values, but we've configured our test with a low count to
        # make sure it happens.
        if self.false_positives:
            self.assertTrue(fp_count > 0)

        # The join cursor is closed before the index cursors joined to it.
        jc.close()
        c1.close()
        c0.close()
        self.session.drop('table:join09')
# Run the tests through the wttest runner when this file is executed
# directly as a script (and not imported as a module).
if __name__ == '__main__':
    wttest.run()
|