-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathbktree.py
66 lines (49 loc) · 1.68 KB
/
bktree.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
from collections import deque
from operator import itemgetter
# Key function that returns element 0 of a sequence, e.g. the distance in a
# (distance, item) pair; built once at import time so it can be reused.
_getitem0 = itemgetter(0)
def hamming_distance(x, y):
    """Return the number of bit positions in which integers *x* and *y* differ.

    The count is the number of ``'1'`` characters in ``bin(x ^ y)``.
    """
    differing_bits = x ^ y
    return bin(differing_bits).count('1')
class BKTree(object):
    """BK-tree index for "everything within distance n" queries.

    Each node is an ``(item, children)`` tuple, where ``children`` is a dict
    mapping a distance ``d`` to the child node whose item lies exactly ``d``
    away from ``item``.  ``self.tree`` holds the root node, or ``None`` while
    the tree is empty.

    Items are compared with ``hamming_distance`` unless another metric is
    supplied through ``distance_func``.
    """

    def __init__(self, distance_func=None):
        """Create an empty tree.

        Args:
            distance_func: Optional callable ``f(a, b)`` returning the
                distance between two items.  The returned values are used as
                dict keys and compared with ``<=`` after ``+``/``-``
                arithmetic, so they should be hashable numbers (normally
                non-negative integers).  The function should satisfy the
                triangle inequality; otherwise ``find`` may prune subtrees
                that contain matches.  Defaults to the module-level
                ``hamming_distance``.
        """
        if distance_func is None:
            # Resolved lazily so that ``BKTree()`` keeps its original
            # Hamming-distance behaviour.
            distance_func = hamming_distance
        self.distance_func = distance_func
        self.tree = None

    def add(self, item):
        """Insert *item* into the tree.

        An item at distance 0 from an existing one is not merged with it; it
        is stored as a separate node, so duplicates are reported by ``find``
        and ``__iter__`` once per insertion.
        """
        node = self.tree
        if node is None:
            self.tree = (item, {})
            return

        distance_func = self.distance_func
        while True:
            parent, children = node
            distance = distance_func(item, parent)
            node = children.get(distance)
            if node is None:
                # No child at this distance yet: the new item becomes it.
                children[distance] = (item, {})
                break

    def find(self, item, n):
        """Return every stored item whose distance to *item* is at most *n*.

        Args:
            item: The query item.
            n: Maximum distance (inclusive) for a stored item to match.

        Returns:
            A list of ``(distance, stored_item)`` tuples sorted by ascending
            distance.  The list is empty when the tree is empty or nothing
            is close enough.
        """
        if self.tree is None:
            return []

        distance_func = self.distance_func
        candidates = deque([self.tree])
        found = []

        # Bound methods are cached in locals to keep the search loop tight.
        _candidates_popleft = candidates.popleft
        _candidates_extend = candidates.extend
        _found_append = found.append

        while candidates:
            candidate, children = _candidates_popleft()
            distance = distance_func(candidate, item)
            if distance <= n:
                _found_append((distance, candidate))

            if children:
                # Only children hanging off an edge whose distance is within
                # n of this node's distance can contain matches (triangle
                # inequality), so the rest of the subtrees are skipped.
                lower = distance - n
                upper = distance + n
                _candidates_extend(
                    child for d, child in children.items()
                    if lower <= d <= upper
                )

        # Sort on the distance only: the stored items themselves are never
        # compared, and equal-distance results keep their discovery order.
        found.sort(key=itemgetter(0))
        return found

    def __iter__(self):
        """Yield every stored item, breadth-first starting from the root."""
        if self.tree is None:
            return

        candidates = deque([self.tree])
        _candidates_popleft = candidates.popleft
        _candidates_extend = candidates.extend

        while candidates:
            candidate, children = _candidates_popleft()
            yield candidate
            _candidates_extend(children.values())