def test_prune_with_four_buckets(self): """ Tests prune with a stupid table of 4 buckets, this can store at most 3 elements at once. """ ht = HashTable(buckets=4) # Adds elements one by one. d replaces 'e', then 'e' replaces 'b' ht.update({'e': 1, 'a': 3, 'b': 2}) ht.update({'d': 5}) ht.update({'e': 4}) self.assertEqual(set(ht.items()), set({ 'a': 3, 'd': 5, 'e': 4 }.items())) self.assertEqual(len(ht), 3, "The number of elements after pruning should be 3") # Increment existing 'a', then add 'b' which evicts 2 elements with the lowest value of 4 ht.increment('a') self.assertEqual(len(ht), 3) self.assertEqual(set(ht.items()), set({ 'a': 4, 'd': 5, 'e': 4 }.items())) ht.increment('b') self.assertEqual(len(ht), 2, "The number of elements after pruning should be 3") self.assertEqual(set(ht.items()), set({'b': 1, 'd': 5}.items()))
def test_update_with_hashtable(self): """ Update with a dictionary and test against it using set representation """ data1 = {'a': 1, 'b': 3, 'c': 2, 'd': 5} data2 = {'a': 18, 'b': 4, 'c': 6, 'e': 13} expected = {'a': 19, 'b': 7, 'c': 8, 'd': 5, 'e': 13} self.ht.update(data1) ht2 = HashTable(64) ht2.update(data2) self.ht.update(ht2) self.assertEqual(set(self.ht.items()), set(expected.items()))
class HashTableIterTypeTest(unittest.TestCase): """ Functional tests for HashTable use_unicode parameter """ def setUp(self): self.ht = HashTable(buckets=64) def test_itertype_default_unicode(self): self.ht.update([b'bytes', u'Unicode', 'String']) for key in self.ht: self.assertEqual(type(key), uni_type) for key, _ in self.ht.items(): self.assertEqual(type(key), uni_type) def test_itertype_use_unicode_true(self): self.ht = HashTable(buckets=64, use_unicode=True) self.ht.update([b'bytes', u'Unicode', 'String']) for key in self.ht: self.assertEqual(type(key), uni_type) for key, _ in self.ht.items(): self.assertEqual(type(key), uni_type) def test_itertype_use_unicode_false(self): self.ht = HashTable(buckets=64, use_unicode=False) self.ht.update([b'bytes', u'Unicode', 'String']) for key in self.ht: self.assertEqual(type(key), bytes) for key, _ in self.ht.items(): self.assertEqual(type(key), bytes)
def test_prune_with_eight_buckets(self): """ Tests prune with table of 8 buckets, which stores at most 6 elements and prunes itself down to 4 or less. """ ht = HashTable(buckets=8) # Init ht.update({'a': 3, 'b': 2, 'c': 4, 'd': 1, 'e': 5, 'f': 6}) self.assertEqual( set(ht.items()), set({ 'd': 1, 'b': 2, 'a': 3, 'c': 4, 'e': 5, 'f': 6 }.items())) self.assertEqual(len(ht), 6) # Evicts 2 elements (so that half of the table is free) before adding x ht.update(['x']) self.assertEqual(set(ht.items()), set({ 'x': 1, 'a': 3, 'c': 4, 'e': 5, 'f': 6 }.items())) self.assertEqual(len(ht), 5) # Evicts 3 elements because 'a' and 'b' share the count which needs to be included in the limit ht.update(['b', 'b', 'b']) self.assertEqual( set(ht.items()), set({ 'x': 1, 'b': 3, 'a': 3, 'c': 4, 'e': 5, 'f': 6 }.items())) ht['d'] += 1 self.assertEqual(set(ht.items()), set({ 'd': 1, 'c': 4, 'e': 5, 'f': 6 }.items()))
class HashTablePickleTest(unittest.TestCase): """ Functional tests for determining size (cardinality) of hashtable and iterations. """ def setUp(self): self.ht = HashTable(buckets=64) def tearDown(self): if os.path.isfile(filename): os.remove(filename) def check_hashtable(self, reloaded): self.assertEqual(len(reloaded), len(self.ht)) self.assertEqual(reloaded.buckets(), self.ht.buckets()) self.assertEqual(reloaded.total(), self.ht.total()) self.assertEqual(set(reloaded.items()), set(self.ht.items())) self.assertEqual(reloaded.quality(), self.ht.quality()) self.assertEqual(reloaded.cardinality(), self.ht.cardinality()) def store_and_load(self): with open(filename, 'wb') as outfile: pickle.dump(self.ht, outfile) with open(filename, 'rb') as outfile: reloaded = pickle.load(outfile) return reloaded def test_pickle_empty(self): reloaded = self.store_and_load() self.check_hashtable(reloaded) def test_pickle_simple(self): self.ht.update("boss") self.ht.update("pickling") reloaded = self.store_and_load() self.check_hashtable(reloaded) def test_pickle_deleted(self): self.ht.update("boss") self.ht.update("pickling") del self.ht['g'] del self.ht['s'] reloaded = self.store_and_load() self.check_hashtable(reloaded) def test_pickle_pruned(self): for i in range(120): self.ht.increment(str(i), 1 + ((i * 27) % 17)) reloaded = self.store_and_load() self.check_hashtable(reloaded) def test_pickle_large(self): self.ht = HashTable(buckets=2 ** 25) self.ht.update("boss") self.ht.update("pickling") self.ht.update("verylargetable") reloaded = self.store_and_load() self.check_hashtable(reloaded)
class HashTableTotalTest(unittest.TestCase): """ Functional tests for HashTable.total method """ def setUp(self): self.ht = HashTable(buckets=64) def test_simple_total(self): self.assertEqual(self.ht.total(), 0) self.ht.update("foo") self.assertEqual(self.ht.total(), 3) def test_set_reset_total(self): self.ht.update("foo") self.assertEqual(self.ht.total(), 3) self.ht['o'] += 2 self.assertEqual(self.ht.total(), 5) self.ht['f'] = 0 self.assertEqual(self.ht.total(), 4) def test_increment_total(self): self.ht.update("foo") self.ht.increment("f", 5) self.assertEqual(self.ht.total(), 8) self.ht.increment("a", 2) self.assertEqual(self.ht.total(), 10) self.ht.increment("r", 0) self.assertEqual(self.ht.total(), 10) def test_delete_total(self): self.ht.update("foo") del self.ht['o'] self.assertEqual(self.ht.total(), 1) def test_prune_total(self): self.ht = HashTable(buckets=4) self.ht.update("223334444") self.assertEqual(self.ht.total(), 9) self.ht.update("1") self.assertEqual(self.ht.total(), 10)
def test_prune_total(self): ht = HashTable(buckets=8) ht.update({'a': 3, 'b': 2, 'c': 4, 'd': 1, 'e': 5, 'f': 6}) ht.update("xbbbd") self.assertEqual(ht.total(), 26)
def test_prune_cardinality(self): ht = HashTable(buckets=8) ht.update({'a': 3, 'b': 2, 'c': 4, 'd': 1, 'e': 5, 'f': 6}) ht.update("xbgbbd") self.assertEqual(ht.cardinality(), 8)
class HashTableUpdateTest(unittest.TestCase): """ Functional tests for HashTable.update method, which adds another counter, dictionary, hashtable, tuple or list """ def setUp(self): self.ht = HashTable(buckets=64) def test_update_numbers(self): """ Negative test: calling update using numeric values as parameter yields TypeError """ with self.assertRaises(TypeError): self.ht.update(1) with self.assertRaises(TypeError): self.ht.update(1.0) def test_update_string(self): self.ht.update("foo") self.assertEqual(self.ht['f'], 1) self.assertEqual(self.ht['o'], 2) def test_update_tuple(self): tuple = ('foo', 'bar', 'foo') self.ht.update(tuple) self.assertEqual(self.ht['foo'], 2) self.assertEqual(self.ht['bar'], 1) def test_update_list(self): self.ht.update([str(i % 3) for i in range(5)]) self.assertEqual(self.ht['0'], 2) self.assertEqual(self.ht['1'], 2) self.assertEqual(self.ht['2'], 1) def test_update_split(self): self.ht.update("This is a sentence".split()) self.assertEqual(self.ht['is'], 1) self.assertEqual(self.ht['this'], 0) # lowercase def test_update_twice(self): tuple = ('foo', 'bar', 'foo') self.ht.update(tuple) self.ht.update(('foo', 'bar', 'foo')) self.assertEqual(self.ht['foo'], 4) self.assertEqual(self.ht['bar'], 2) def test_update_bytes(self): tuple = ('foo', 'bar', b'foo') self.ht.update(tuple) self.assertEqual(self.ht['foo'], 2) self.assertEqual(self.ht[b'foo'], 2) def test_update_unicode(self): tuple = ('foo', 'bar', u'foo') self.ht.update(tuple) self.assertEqual(self.ht['foo'], 2) self.assertEqual(self.ht[u'foo'], 2) def test_update_with_dictionary(self): """ Update with a dictionary and test against it using set representation """ data = {'a': 1, 'b': 3, 'c': 2, 'd': 5} self.ht.update(data) self.assertEqual(self.ht['b'], 3) self.assertEqual(set(self.ht.items()), set(data.items())) def test_update_with_hashtable(self): """ Update with a dictionary and test against it using set representation """ data1 = {'a': 1, 'b': 3, 'c': 2, 'd': 5} data2 = {'a': 18, 'b': 4, 'c': 6, 'e': 13} expected = {'a': 19, 'b': 7, 'c': 8, 'd': 5, 'e': 13} self.ht.update(data1) ht2 = HashTable(64) ht2.update(data2) self.ht.update(ht2) self.assertEqual(set(self.ht.items()), set(expected.items()))
class HashTableItemsTest(unittest.TestCase): """ Functional tests for determining size (cardinality) of hashtable and iterations. """ def setUp(self): self.ht = HashTable(buckets=64) def test_simple_length_test(self): self.assertEqual(len(self.ht), 0) self.ht.update("boss") self.assertEqual(len(self.ht), 3) self.ht.update("sad") self.assertEqual(len(self.ht), 5) def test_simple_cardinality_test(self): self.assertEqual(self.ht.cardinality(), 0) self.ht.update("boss") self.assertEqual(self.ht.cardinality(), 3) self.ht.update("sad") self.assertEqual(self.ht.cardinality(), 5) def test_delete_length_test(self): self.ht.update("boss") self.assertEqual(len(self.ht), 3) del self.ht['s'] self.assertEqual(len(self.ht), 2) del self.ht['s'] self.assertEqual(len(self.ht), 2) def test_delete_prune_length_iteration_test(self): self.ht = HashTable(buckets=8) self.ht.update("bbboss") self.assertEqual(len(self.ht), 3) del self.ht['s'] self.assertEqual(len(self.ht), 2) self.ht.update("122333") self.assertEqual(len(self.ht), 5) # should iterate over 5 elements self.assertEqual(set(self.ht.items()), set({ 'b': 3, 'o': 1, '1': 1, '2': 2, '3': 3 }.items())) # the next add will overflow because the deleted bucket is still physically there so the 'real' size is 5 self.ht.update("!") # overflow removes '1', 'o', and the empty bucket self.assertEqual(len(self.ht), 4) # should iterate over 4 elements self.assertEqual(set(self.ht.items()), set({ 'b': 3, '!': 1, '2': 2, '3': 3 }.items())) self.assertEqual(self.ht.cardinality(), 7)