Пример #1
0
 def test_get_ngrams_example12(self):
     """get_ngrams with min_n=1, max_n=2 on the tokens 'Dies' and 'ist'.

     The expected list holds every 1- and 2-character substring of each
     token; assertCountEqual compares the lists without regard to order.
     """
     # Single characters of both tokens (duplicates kept on purpose).
     expected = ['D', 'i', 'e', 's', 'i', 's', 't']
     # Two-character substrings, taken within each token separately.
     expected += ['Di', 'ie', 'es', 'is', 'st']

     actual = get_ngrams(tokens=['Dies', 'ist'], min_n=1, max_n=2)

     self.assertCountEqual(actual, expected)
Пример #2
0
 def test_get_ngrams_example4(self):
     """get_ngrams with min_n=4, max_n=4 on 'Regenbogen' and 'Feuerwehr'.

     The expected list holds the 4-character substrings of each token in
     left-to-right order; assertEqual makes the comparison order-sensitive.
     """
     expected = [
         # 4-character windows over 'Regenbogen'
         'Rege', 'egen', 'genb', 'enbo', 'nbog', 'boge', 'ogen',
         # 4-character windows over 'Feuerwehr'
         'Feue', 'euer', 'uerw', 'erwe', 'rweh', 'wehr',
     ]

     actual = get_ngrams(
         tokens=['Regenbogen', 'Feuerwehr'], min_n=4, max_n=4
     )

     self.assertEqual(actual, expected)