예제 #1
0
class SplitterTest(unittest.TestCase):

    def setUp(self):
        self.oktavia = Oktavia()
        self.splitter = self.oktavia.add_splitter('document')
        self.oktavia.add_word("abracadabra")
        self.splitter.split()
        self.oktavia.add_word("mississippi")
        self.splitter.split()
        self.oktavia.add_word("abracadabra mississippi")
        self.splitter.split()
        self.oktavia.build(5)

    def test_count(self):
        self.assertEqual(3, self.splitter.size())

    def test_get_splitter_index(self):
        self.assertEqual(0, self.splitter.get_index(0))
        self.assertEqual(0, self.splitter.get_index(10))
        self.assertEqual(1, self.splitter.get_index(11))
        self.assertEqual(1, self.splitter.get_index(21))
        self.assertEqual(2, self.splitter.get_index(22))
        self.assertEqual(2, self.splitter.get_index(44))

    def test_get_splitter_index_boundary(self):
        try:
            self.splitter.get_index(-1)
            self.fail("fm.get_index()")
        except:
            pass
        try:
            self.splitter.get_index(45)
            self.fail("fm.get_index()")
        except:
            pass

    def test_get_splitter_content(self):
        self.assertEqual("abracadabra mississippi", self.splitter.get_content(2))
        self.assertEqual("mississippi", self.splitter.get_content(1))
        self.assertEqual("abracadabra", self.splitter.get_content(0))

    def test_get_splitter_content_boundary(self):
        try:
            self.splitter.get_content(3)
            self.fail("fm.get_content()")
        except:
            pass
        try:
            self.splitter.get_content(-1)
            self.fail("fm.get_content()")
        except:
            pass

    def test_load_dump_and_count(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')
        self.assertEqual(3, self.splitter.size())

    def test_load_dump_and_get_splitter_index(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        self.assertEqual(0, self.splitter.get_index(0))
        self.assertEqual(0, self.splitter.get_index(10))
        self.assertEqual(1, self.splitter.get_index(11))
        self.assertEqual(1, self.splitter.get_index(21))
        self.assertEqual(2, self.splitter.get_index(22))
        self.assertEqual(2, self.splitter.get_index(44))

    def test_load_dump_and_get_splitter_index_boundary(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        try:
            self.splitter.get_index(-1)
            self.fail("fm.get_index()")
        except:
            pass
        try:
            self.splitter.get_index(45)
            self.fail("fm.get_index()")
        except:
            pass

    def test_load_dump_and_get_splitter_content(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        self.assertEqual("abracadabra mississippi", self.splitter.get_content(2))
        self.assertEqual("mississippi", self.splitter.get_content(1))
        self.assertEqual("abracadabra", self.splitter.get_content(0))

    def test_load_dump_and_get_splitter_content_boundary(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        try:
            self.splitter.get_content(3)
            self.fail("fm.get_content()")
        except:
            pass
        try:
            self.splitter.get_content(-1)
            self.fail("fm.get_content()")
        except:
            pass
예제 #2
0
class SplitterTest(unittest.TestCase):
    def setUp(self):
        self.oktavia = Oktavia()
        self.splitter = self.oktavia.add_splitter('document')
        self.oktavia.add_word("abracadabra")
        self.splitter.split()
        self.oktavia.add_word("mississippi")
        self.splitter.split()
        self.oktavia.add_word("abracadabra mississippi")
        self.splitter.split()
        self.oktavia.build(5)

    def test_count(self):
        self.assertEqual(3, self.splitter.size())

    def test_get_splitter_index(self):
        self.assertEqual(0, self.splitter.get_index(0))
        self.assertEqual(0, self.splitter.get_index(10))
        self.assertEqual(1, self.splitter.get_index(11))
        self.assertEqual(1, self.splitter.get_index(21))
        self.assertEqual(2, self.splitter.get_index(22))
        self.assertEqual(2, self.splitter.get_index(44))

    def test_get_splitter_index_boundary(self):
        try:
            self.splitter.get_index(-1)
            self.fail("fm.get_index()")
        except:
            pass
        try:
            self.splitter.get_index(45)
            self.fail("fm.get_index()")
        except:
            pass

    def test_get_splitter_content(self):
        self.assertEqual("abracadabra mississippi",
                         self.splitter.get_content(2))
        self.assertEqual("mississippi", self.splitter.get_content(1))
        self.assertEqual("abracadabra", self.splitter.get_content(0))

    def test_get_splitter_content_boundary(self):
        try:
            self.splitter.get_content(3)
            self.fail("fm.get_content()")
        except:
            pass
        try:
            self.splitter.get_content(-1)
            self.fail("fm.get_content()")
        except:
            pass

    def test_load_dump_and_count(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')
        self.assertEqual(3, self.splitter.size())

    def test_load_dump_and_get_splitter_index(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        self.assertEqual(0, self.splitter.get_index(0))
        self.assertEqual(0, self.splitter.get_index(10))
        self.assertEqual(1, self.splitter.get_index(11))
        self.assertEqual(1, self.splitter.get_index(21))
        self.assertEqual(2, self.splitter.get_index(22))
        self.assertEqual(2, self.splitter.get_index(44))

    def test_load_dump_and_get_splitter_index_boundary(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        try:
            self.splitter.get_index(-1)
            self.fail("fm.get_index()")
        except:
            pass
        try:
            self.splitter.get_index(45)
            self.fail("fm.get_index()")
        except:
            pass

    def test_load_dump_and_get_splitter_content(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        self.assertEqual("abracadabra mississippi",
                         self.splitter.get_content(2))
        self.assertEqual("mississippi", self.splitter.get_content(1))
        self.assertEqual("abracadabra", self.splitter.get_content(0))

    def test_load_dump_and_get_splitter_content_boundary(self):
        dump = self.oktavia.dump()
        self.oktavia.load(dump)
        self.splitter = self.oktavia.get_splitter('document')

        try:
            self.splitter.get_content(3)
            self.fail("fm.get_content()")
        except:
            pass
        try:
            self.splitter.get_content(-1)
            self.fail("fm.get_content()")
        except:
            pass