def test_get_ngrams_example12(self):
    """get_ngrams with min_n=1 and max_n=2 on the tokens 'Dies' and 'ist'.

    The expected values are every 1-character and every 2-character
    substring of each token, duplicates included.
    """
    words = ['Dies', 'ist']

    # Expected n-grams, grouped by length for readability.
    one_char = ['D', 'i', 'e', 's', 'i', 's', 't']
    two_char = ['Di', 'ie', 'es', 'is', 'st']
    expected = one_char + two_char

    actual = get_ngrams(tokens=words, min_n=1, max_n=2)

    # assertCountEqual compares elements and their multiplicities only;
    # the order in which get_ngrams returns them is not checked here.
    self.assertCountEqual(actual, expected)
def test_get_ngrams_example4(self):
    """get_ngrams with min_n=max_n=4 on 'Regenbogen' and 'Feuerwehr'.

    The expected values are the 4-character sliding windows of each
    token, listed token by token from left to right.
    """
    # Expected 4-grams, grouped by the token they come from.
    from_regenbogen = [
        'Rege', 'egen', 'genb', 'enbo', 'nbog', 'boge', 'ogen',
    ]
    from_feuerwehr = [
        'Feue', 'euer', 'uerw', 'erwe', 'rweh', 'wehr',
    ]
    expected = from_regenbogen + from_feuerwehr

    actual = get_ngrams(
        tokens=['Regenbogen', 'Feuerwehr'],
        min_n=4,
        max_n=4,
    )

    # Plain equality: unlike assertCountEqual, this is order-sensitive.
    self.assertEqual(actual, expected)