Ejemplo n.º 1
0
class StemmingTest(unittest.TestCase):
    """Exercise ``Oktavia.raw_search`` with the ``stemming`` flag on and off.

    Every test runs against the index built in ``setUp`` (configured with
    an English snowball stemmer), either directly or after the index has
    been passed through a ``dump()`` / ``load()`` round trip.
    """

    def setUp(self):
        # A fresh index per test: one 'document' section and two add_word
        # calls, each followed by set_tail with its own label.
        index = self.oktavia = Oktavia()
        index.set_stemmer(snowballstemmer.EnglishStemmer())
        section = self.section = index.add_section(u'document')
        entries = (
            (u"stemming baby", u"doc1"),
            (u"stemmed babies", u"doc2"),
        )
        for text, tail in entries:
            index.add_word(text, stemming=True)
            section.set_tail(tail)
        index.build()

    def _round_trip(self):
        """Return a new Oktavia loaded from a dump of ``self.oktavia``."""
        dumped = self.oktavia.dump()
        restored = Oktavia()
        # The stemmer is set on the new instance before load(), exactly as
        # on the original index.
        restored.set_stemmer(snowballstemmer.EnglishStemmer())
        restored.load(dumped)
        return restored

    def _hit_count(self, index, stemming):
        """Return how many results ``index`` yields for the query 'baby'."""
        hits = index.raw_search(u'baby', stemming=stemming)
        return len(hits)

    def test_search_without_stemming(self):
        # Query the freshly built index with stemming disabled.
        self.assertEqual(1, self._hit_count(self.oktavia, stemming=False))

    def test_search_with_stemming(self):
        # Query the freshly built index with stemming enabled.
        self.assertEqual(1, self._hit_count(self.oktavia, stemming=True))

    def test_load_dump_and_search_without_stemming(self):
        # Same expectation as the direct search, after dump/load.
        restored = self._round_trip()
        self.assertEqual(1, self._hit_count(restored, stemming=False))

    def test_load_dump_and_search_with_stemming(self):
        # Same expectation as the direct search, after dump/load.
        restored = self._round_trip()
        self.assertEqual(1, self._hit_count(restored, stemming=True))
Ejemplo n.º 2
0
 def test_load_dump_and_search_with_stemming(self):
     # Serialize the index held by the fixture, then rebuild a second
     # instance from that dump.
     snapshot = self.oktavia.dump()
     restored = Oktavia()
     stemmer = snowballstemmer.EnglishStemmer()
     restored.set_stemmer(stemmer)
     restored.load(snapshot)
     # The restored index is expected to yield exactly one result for
     # 'baby' when stemming is enabled.
     hits = restored.raw_search(u'baby', stemming=True)
     hit_count = len(hits)
     self.assertEqual(1, hit_count)