def test_unicode(self): trie = Trie() trie.insert("hýždě", 0) trie.insert("hárá", 1) serialized = trie.serialize() self.compare( serialized, """ h0xc3 0xbd 0xc5 | 0xbe | d0xc4 | 0x9b | [0] 0xa1 r0xc3 | 0xa1 | [1] """) self.assertEqual(len(serialized), 82)
from _search import Trie, ResultMap, ResultFlag, serialize_search_data, Serializer basedir = pathlib.Path(os.path.dirname( os.path.realpath(__file__))) / 'js-test-data' def type_size_suffix(*, name_size_bytes, result_id_bytes, file_offset_bytes): return f'ns{name_size_bytes}-ri{result_id_bytes}-fo{file_offset_bytes}' # Basic error handling min_size = len( serialize_search_data( Serializer(name_size_bytes=1, result_id_bytes=2, file_offset_bytes=3), Trie(), ResultMap(), [], 0)) with open(basedir / 'short.bin', 'wb') as f: f.write(b'#' * (min_size - 1)) with open(basedir / 'wrong-magic.bin', 'wb') as f: f.write(b'MOS\2') f.write(b'\0' * (min_size - 4)) with open(basedir / 'wrong-version.bin', 'wb') as f: f.write(b'MCS\1') f.write(b'\0' * (min_size - 4)) with open(basedir / 'wrong-result-id-bytes.bin', 'wb') as f: f.write(Serializer.header_struct.pack(b'MCS', 2, 3 << 1, 0, 0, 0)) f.write(b'\0' * (min_size - Serializer.header_struct.size)) # Empty file, in all possible type size combinations
def test_multiple(self): trie = Trie() trie.insert("math", 0) trie.insert("math::vector", 1, lookahead_barriers=[4]) trie.insert("vector", 1) trie.insert("math::range", 2) trie.insert("range", 2) trie.insert("math::min", 3) trie.insert("min", 3) trie.insert("math::max", 4) trie.insert("max", 4) trie.insert("math::minmax", 5) trie.insert("minmax", 5) trie.insert("math::vector::minmax", 6, lookahead_barriers=[4, 12]) trie.insert("vector::minmax", 6, lookahead_barriers=[6]) trie.insert("minmax", 6) trie.insert("math::vector::min", 7) trie.insert("vector::min", 7) trie.insert("min", 7) trie.insert("math::vector::max", 8) trie.insert("vector::max", 8) trie.insert("max", 8) trie.insert("math::range::min", 9, lookahead_barriers=[4, 11]) trie.insert("range::min", 9, lookahead_barriers=[5]) trie.insert("min", 9) trie.insert("math::range::max", 10) trie.insert("range::max", 10) trie.insert("max", 10) serialized = trie.serialize() self.compare( serialized, """ math [0] ||| :$ ||| :vector [1] ||| | :$ ||| | :min [7] ||| | | max [6] ||| | ax [8] ||| range [2] ||| | :$ ||| | :min [9] ||| | ax [10] ||| min [3] ||| || max [5] ||| |ax [4] ||x [4, 8, 10] |in [3, 7, 9] || max [5, 6] vector [1] | :$ | :min [7] | | max [6] | ax [8] range [2] | :$ | :min [9] | ax [10] """) self.assertEqual(len(serialized), 340)
def test_empty(self): trie = Trie() serialized = trie.serialize() self.compare(serialized, "") self.assertEqual(len(serialized), 6)
def test(self): trie = Trie() map = ResultMap() trie.insert( "math", map.add("Math", "namespaceMath.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.NAMESPACE))) index = map.add("Math::Vector", "classMath_1_1Vector.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.CLASS)) trie.insert("math::vector", index) trie.insert("vector", index) index = map.add("Math::Range", "classMath_1_1Range.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.CLASS)) trie.insert("math::range", index) trie.insert("range", index) serialized = serialize_search_data(trie, map, search_type_map, 3) self.compare( serialized, """ 3 symbols math [0] | ::vector [1] | range [2] vector [1] range [2] 0: Math [type=NAMESPACE] -> namespaceMath.html 1: ::Vector [prefix=0[:0], type=CLASS] -> classMath_1_1Vector.html 2: ::Range [prefix=0[:0], type=CLASS] -> classMath_1_1Range.html (EntryType.PAGE, CssClass.SUCCESS, 'page'), (EntryType.NAMESPACE, CssClass.PRIMARY, 'namespace'), (EntryType.CLASS, CssClass.PRIMARY, 'class'), (EntryType.FUNC, CssClass.INFO, 'func') """) self.assertEqual(len(serialized), 277)
def test_multiple(self): trie = Trie() trie.insert("math", 0) trie.insert("math::vector", 1, lookahead_barriers=[4]) trie.insert("vector", 1) trie.insert("math::range", 2) trie.insert("range", 2) trie.insert("math::min", 3) trie.insert("min", 3) trie.insert("math::max", 4) trie.insert("max", 4) trie.insert("math::minmax", 5) trie.insert("minmax", 5) trie.insert("math::vector::minmax", 6, lookahead_barriers=[4, 12]) trie.insert("vector::minmax", 6, lookahead_barriers=[6]) trie.insert("minmax", 6) trie.insert("math::vector::min", 7) trie.insert("vector::min", 7) trie.insert("min", 7) trie.insert("math::vector::max", 8) trie.insert("vector::max", 8) trie.insert("max", 8) trie.insert("math::range::min", 9, lookahead_barriers=[4, 11]) trie.insert("range::min", 9, lookahead_barriers=[5]) trie.insert("min", 9) trie.insert("math::range::max", 10) trie.insert("range::max", 10) trie.insert("max", 10) for i in trie_type_sizes: with self.subTest(**i): serialized = trie.serialize(Serializer(**i)) self.compare( Deserializer(**i), serialized, """ math [0] ||| :$ ||| :vector [1] ||| | :$ ||| | :min [7] ||| | | max [6] ||| | ax [8] ||| range [2] ||| | :$ ||| | :min [9] ||| | ax [10] ||| min [3] ||| || max [5] ||| |ax [4] ||x [4, 8, 10] |in [3, 7, 9] || max [5, 6] vector [1] | :$ | :min [7] | | max [6] | ax [8] range [2] | :$ | :min [9] | ax [10] """) # Verify just the smallest and largest size, everything else # should fit in between if i['file_offset_bytes'] == 3 and i['result_id_bytes'] == 2: self.assertEqual(len(serialized), 340) elif i['file_offset_bytes'] == 4 and i['result_id_bytes'] == 4: self.assertEqual(len(serialized), 428) else: self.assertGreater(len(serialized), 340) self.assertLess(len(serialized), 428)
def test(self): trie = Trie() map = ResultMap() trie.insert( "math", map.add("Math", "namespaceMath.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.NAMESPACE))) index = map.add("Math::Vector", "classMath_1_1Vector.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.CLASS)) trie.insert("math::vector", index) trie.insert("vector", index) index = map.add("Math::Range", "classMath_1_1Range.html", flags=ResultFlag.from_type(ResultFlag.NONE, EntryType.CLASS)) trie.insert("math::range", index) trie.insert("range", index) for i in type_sizes: with self.subTest(**i): serialized = serialize_search_data(Serializer(**i), trie, map, search_type_map, 3) self.compare( serialized, """ 3 symbols math [0] | ::vector [1] | range [2] vector [1] range [2] 0: Math [type=NAMESPACE] -> namespaceMath.html 1: ::Vector [prefix=0[:0], type=CLASS] -> classMath_1_1Vector.html 2: ::Range [prefix=0[:0], type=CLASS] -> classMath_1_1Range.html (EntryType.PAGE, CssClass.SUCCESS, 'page'), (EntryType.NAMESPACE, CssClass.PRIMARY, 'namespace'), (EntryType.CLASS, CssClass.PRIMARY, 'class'), (EntryType.FUNC, CssClass.INFO, 'func') """) # Verify just the smallest and largest size, everything else # should fit in between if i['file_offset_bytes'] == 3 and i[ 'result_id_bytes'] == 2 and i['name_size_bytes'] == 1: self.assertEqual(len(serialized), 282) elif i['file_offset_bytes'] == 4 and i[ 'result_id_bytes'] == 4 and i['name_size_bytes'] == 2: self.assertEqual(len(serialized), 317) else: self.assertGreater(len(serialized), 282) self.assertLess(len(serialized), 317)