def test_run_trigram(self):
    """Check the tag sequence written by ``ViterbiMath.run`` when called with 3.

    Builds a tagger from the fixture count tables, runs it on
    ``self._testFile`` writing to ``self._outputFile``, and compares the
    file's full contents against the expected "TAG word" lines.
    """
    viterbi = ViterbiMath(
        self._unigramCount,
        self._bigramCount,
        self._trigramCount,
        self._tagWordCount,
    )
    expected_tag_seq = "FW <s>\nFW the\nFW cat\nFW is\nIN pretty\n. .\n"

    # NOTE(review): the final argument is presumably the n-gram order
    # (3 = trigram) -- confirm against ViterbiMath.run.
    viterbi.run(self._testFile, self._outputFile, 3)

    # Read through a context manager so the handle is closed even when the
    # assertion below fails (a bare open().read() leaks the descriptor).
    with open(self._outputFile, 'r') as output:
        actual_tag_seq = output.read()

    # assertEqual replaces the deprecated assertEquals alias, which was
    # removed in Python 3.12.
    self.assertEqual(expected_tag_seq, actual_tag_seq, "run trigram test")
def test_run_bigram(self):
    """Check the tag sequence written by ``ViterbiMath.run`` when called with 2.

    Builds a tagger from the fixture count tables, runs it on
    ``self._testFile`` writing to ``self._outputFile``, and compares the
    file's full contents against the expected "TAG word" lines.
    """
    viterbi = ViterbiMath(
        self._unigramCount,
        self._bigramCount,
        self._trigramCount,
        self._tagWordCount,
    )
    expected_tag_seq = "<s> <s>\nDT the\nNN cat\nVBZ is\nRB pretty\n. .\n"

    # NOTE(review): the final argument is presumably the n-gram order
    # (2 = bigram) -- confirm against ViterbiMath.run.
    viterbi.run(self._testFile, self._outputFile, 2)

    # Read through a context manager so the handle is closed even when the
    # assertion below fails (a bare open().read() leaks the descriptor).
    with open(self._outputFile, 'r') as output:
        actual_tag_seq = output.read()

    # assertEqual replaces the deprecated assertEquals alias, which was
    # removed in Python 3.12.
    self.assertEqual(expected_tag_seq, actual_tag_seq, "run bigram test")
def test_run(self):
    """Run the tagger on ``data/test.pos``, writing ``data/outputtest.txt``.

    Makes no assertions; it only exercises construction and ``run`` with 2
    as the final argument, so it fails only if one of those calls raises.
    """
    # NOTE(review): this passes self._vocabDict as a fifth constructor
    # argument, unlike the other tests in this file -- confirm which
    # ViterbiMath signature is current.
    constructor_args = (
        self._unigramCount,
        self._bigramCount,
        self._trigramCount,
        self._tagWordCount,
        self._vocabDict,
    )
    tagger = ViterbiMath(*constructor_args)
    tagger.run("data/test.pos", "data/outputtest.txt", 2)