def test_get_token_offsets_simple(self):
    """Check the offsets returned for one sentence built by ``sentence_factory``.

    The fixture is passed to ``get_token_offsets`` wrapped in a
    single-element list, and the result must equal ``[1, 4, 8, 3]``.
    """
    # NOTE(review): the fixture text is reproduced exactly as it appears in
    # this file; it may originally have been laid out one token per line --
    # confirm against what sentence_factory expects.
    fixture = sentence_factory(""" x 1 x x 4 x x 8 x x 3 x """)
    expected_offsets = [1, 4, 8, 3]

    offsets = get_token_offsets([fixture])

    self.assertEqual(offsets, expected_offsets)
def test_get_token_offsets_invalid_data(self):
    """Check that ``get_token_offsets`` raises ``KeyError`` on malformed input.

    The input is a list containing one list, which holds a single dict whose
    only key is ``"aaa"``.
    """
    malformed_input = [[{"aaa": "bbb"}]]

    # Only the call under test sits inside the context manager, so a
    # KeyError can only come from get_token_offsets itself.
    with self.assertRaises(KeyError):
        get_token_offsets(malformed_input)
def test_get_token_offsets_empty(self):
    """Check that ``get_token_offsets`` returns an empty list for an empty list."""
    offsets = get_token_offsets([])

    self.assertEqual(offsets, [])