Пример #1
0
 def test_addition_is_unique(self):
     """Check that selected word pairs map to different indices.

     The vocabulary is filled from ``self.example_line`` before the
     lookups are compared.
     """
     v = vocab.Vocabulary('<unk>', 0)
     v.add_from_text(self.example_line)
     # Pairs are compared in this exact order; the first equal pair fails
     # the test.
     word_pairs = (
         ('world', 'hello'),
         ('of', 'hello'),
         ('of', '!'),
         ('world', '!'),
     )
     for first, second in word_pairs:
         self.assertNotEqual(v[first], v[second])
Пример #2
0
 def test_backward_translation_consistent(self):
     """Check that ``i2w`` applied to the index of 'hi' returns 'hi'."""
     word = 'hi'
     v = vocab.Vocabulary('<unk>', 0)
     v.add_word(word)
     index = v[word]
     round_tripped = v.i2w(index)
     self.assertEqual(round_tripped, 'hi')
Пример #3
0
 def test_add_already_known_word(self):
     """Check that adding '<unk>' to a '<unk>' vocabulary keeps length 1."""
     v = vocab.Vocabulary('<unk>', 0)
     v.add_word('<unk>')
     size = len(v)
     self.assertEqual(size, 1)
Пример #4
0
 def test_unk_ind(self):
     """Check that ``unk_ind`` is 2, the second constructor argument.

     The attribute is read after one word has been added.
     """
     v = vocab.Vocabulary('<bla>', 2)
     v.add_word('hi')
     observed = v.unk_ind
     self.assertEqual(observed, 2)
Пример #5
0
 def test_add_word(self):
     """Check that the length is 2 after adding the single word 'hi'."""
     v = vocab.Vocabulary('<unk>', 0)
     v.add_word('hi')
     size = len(v)
     self.assertEqual(size, 2)
Пример #6
0
 def test_lenght_after_addition(self):
     """Check that the length is 6 after loading ``self.example_line``."""
     v = vocab.Vocabulary('<unk>', 0)
     v.add_from_text(self.example_line)
     size = len(v)
     self.assertEqual(size, 6)
Пример #7
0
 def test_lenght_of_empty(self):
     """Check that a freshly constructed vocabulary reports length 1."""
     fresh = vocab.Vocabulary('<unk>', 0)
     size = len(fresh)
     self.assertEqual(size, 1)
Пример #8
0
    def test_addition_un_unks(self):
        """Check that 'world' stops resolving to 0 once the text is added.

        Before ``self.example_line`` is loaded the lookup must yield 0;
        afterwards it must yield something else.
        """
        v = vocab.Vocabulary('<unk>', 0)
        before = v['world']
        self.assertEqual(before, 0)

        v.add_from_text(self.example_line)
        after = v['world']
        self.assertNotEqual(after, 0)
Пример #9
0
 def test_getitem_for_unknown(self):
     """Check that looking up 'a', which was never added, yields 0."""
     v = vocab.Vocabulary('<unk>', 0)
     looked_up = v['a']
     self.assertEqual(looked_up, 0)
Пример #10
0
 def test_is_mapping(self):
     """Check that a ``Vocabulary`` instance is a ``Mapping``."""
     vocabulary = vocab.Vocabulary('<unk>', 0)
     # assertIsInstance names the object and the expected type on failure,
     # unlike assertTrue(isinstance(...)), which only says "False is not true".
     self.assertIsInstance(vocabulary, Mapping)
Пример #11
0
 def test_getitem(self):
     """Check that looking up '<unk>' yields 0 on a new vocabulary."""
     v = vocab.Vocabulary('<unk>', 0)
     looked_up = v['<unk>']
     self.assertEqual(looked_up, 0)