-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathordered_hash_table.py
76 lines (61 loc) · 2.47 KB
/
ordered_hash_table.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
from typing import Hashable, Any, NoReturn, List
from collections import namedtuple
from bisect import bisect_left
Element = namedtuple('Node', ['key_hash', 'item'])
# list.index doesn't assume ordering.. This does and consequently performs better..
def ordered_index(arr: List[int], x: int) -> int:
i = bisect_left(arr, x)
if i == len(arr) or arr[i] != x:
raise ValueError('key not found')
return i
class OrderedHashTable:
def __init__(self, capacity=1000):
self.capacity = capacity
# not using defaultdict because it is a dict which is what we're trying to build here..
self.buckets = [[] for _ in range(capacity)]
def get(self, key: Hashable) -> Any:
key_hash = hash(key)
bucket_num = self._get_bucket_num(key_hash)
return self.buckets[bucket_num][ordered_index(self._get_hashes(bucket_num), key_hash)].item
def put(self, key: Hashable, item: Any) -> NoReturn:
key_hash = hash(key)
bucket_num = self._get_bucket_num(key_hash)
new_node = Element(key_hash, item)
i = bisect_left(self._get_hashes(bucket_num), key_hash)
if i == len(self.buckets[bucket_num]):
self.buckets[bucket_num].append(new_node)
elif key_hash < self.buckets[bucket_num][i].key_hash:
self.buckets[bucket_num].insert(i, new_node)
elif key_hash == self.buckets[bucket_num][i].key_hash:
self.buckets[bucket_num][i] = new_node
def remove(self, key: Hashable) -> Element:
key_hash = hash(key)
bucket_num = self._get_bucket_num(key_hash)
return self.buckets[bucket_num].pop(ordered_index(self._get_hashes(bucket_num), key_hash))
def _get_bucket_num(self, key_hash: int) -> int:
return key_hash % self.capacity
def _get_hashes(self, bucket_num: int) -> List[int]:
return list(map(lambda n: n.key_hash, self.buckets[bucket_num]))
if __name__ == '__main__':
# basic tests
ht = OrderedHashTable()
try:
ht.get('not_available')
raise AssertionError('Found non existent')
except ValueError:
pass
ht.put('new_key', 100)
assert ht.get('new_key') == 100
ht.put('new_key', 120)
assert ht.get('new_key') == 120
ht.remove('new_key')
try:
ht.get('new_key')
raise AssertionError('Found non existent')
except ValueError:
pass
try:
ht.remove('new_key')
raise AssertionError('Found non existent')
except ValueError:
pass