def test_BigramsApplyStopwords(self):
    """Verify getBigrams() when the tokenizer is built with applyStopwords=True.

    For the sample sentence, the test expects the bigram list to contain
    only 'cats birds'.
    """
    # Fixture: the input sentence and the bigrams the test expects back.
    sentence = 'I like cats and birds.'
    expected = ['cats birds']

    # Exercise: construct the tokenizer with the stopword option enabled.
    tokenizer = TokenizeOnWhitespacePunctuation(sentence, applyStopwords=True)
    actual = tokenizer.getBigrams()

    # Expected value goes first, matching the original argument order.
    self.assertEqual(expected, actual)
def test_TokenizeOnWhitespacePunctuationBigrams(self):
    """Verify getBigrams() for a tokenizer built with default arguments.

    For the sample sentence, the test expects four lowercase bigrams of
    adjacent words, with no trailing period on the last one.
    """
    # Fixture: the input sentence and the bigrams the test expects back.
    sentence = 'I like cats and birds.'
    expected = [
        'i like',
        'like cats',
        'cats and',
        'and birds',
    ]

    # Exercise: only the text is passed, so every option keeps its default.
    tokenizer = TokenizeOnWhitespacePunctuation(sentence)
    actual = tokenizer.getBigrams()

    # Expected value goes first, matching the original argument order.
    self.assertEqual(expected, actual)