class  PySearcherTestCases(unittest.TestCase):
    def setUp(self):
        self.reader = WordReader()
        self.finder = Trie(self.reader)
        self.searcher = Searcher(self.finder, '')

    def tearDown(self):
        self.reader = None
        self.finder = None
        self.searcher = None

    def testRandomWord(self):
       """ Tests that non-empty words are found and they are not the same """
       word1 = self.searcher.randomWord()
       word2 = self.searcher.randomWord()
       self.assertTrue(len(word1) > 1, 'Word length too short')
       self.assertTrue(len(word2) > 1, 'Word length too short')
       self.assertNotEqual(word1, word2, 'Found the same word')

    def testRandomWords(self):
       """ Tests that a set of random words do not contain the same words """
       words = self.searcher.randomWord(5)
       self.assertTrue(len(set(words)) == 5, 'Did not find 5 unique words')

    def testBinaryOperationsAreWorking(self):
        """
        Checks that operations are not identic and that correct number of hits
        is returned for every known result.
        """
        self.reader.addFileName(MaterialFilePath, readNow=True)
        self.finder.addFromReader()

        results = []
        for operation in operations:
            results.append(self.searcher.search(operations[operation],
                                                returnCount=True))
        self.assertTrue(len(set(results)) == 6, #i.e. operations are not identic
                        'Searcher failed binary operation check')
        for searchTerm in binaryOperationsSearch:
            self.assertEqual(self.searcher.search(searchTerm, returnCount=True),
                             binaryOperationsSearch[searchTerm],
                            'Searcher found wrong number of hits on some search')
Example #2
0
        print '%25s\t%10d\t\t%14.3f ms' % ('trie:findWordCount', 2**(index+2), runtime)
        trieFindWordCountFile.write('%10d\t%14.3f\n' % (2**(index+2), runtime))

    runtimes = []
    for i in range(2,17):
        runtime = addWordsToEmptyList(punamusta, 2**i, repeats, '%25s\t%10d\t' % ('punamusta:addToEmpty', 2**i), False)
        print '%25s\t%10d\t\t%14.3f ms' % ('punamusta:addToEmpty', 2**i, runtime)
        punamustaAddFile.write('%10d\t%8.3f\n' % (2**i, runtime))
        runtimes.append(findWords(punamusta, words[7], repeats, printout=False))
    for index, runtime in enumerate(runtimes):
        print '%25s\t%10d\t%8.3f ms' % ('punamusta:findWordCount', 2**(index+2), runtime)
        punamustaFindWordCountFile.write('%10d\t%14.3f\n' % (2**(index+2), runtime))

    print 'Adding all words to Punamusta'
    punamusta.addFromReader()
    print 'Adding all words to Trie'
    trie.addFromReader()


    for i in range(4,10+1):
        runtime = findWords(trie, words[i], repeats, printout=False)
        print '%25s\t%10d\t\t%14.3f ms' % ('trie:findWordLength', i, runtime)
        trieFindLengthFile.write('%10d\t%14.3f\n' % (i, runtime))
    for i in range(4,10+1):
        runtime = findWords(punamusta, words[i], repeats, printout=False)
        print '%25s\t%10d\t\t%14.3f ms' % ('punamusta:findWordLength', i, runtime)
        punamustaFindLengthFile.write('%10d\t%14.3f\n' % (i, runtime))