Ejemplo n.º 1
0
    def test_source_data_files(self):
        """Check the 8k and 32k WMT problems report identical source files.

        For the EVAL split and then the TRAIN split, both problems must
        return the same list from `source_data_files`, and that list must
        not be empty.
        """
        small_vocab_problem = translate_ende.TranslateEndeWmt8k()
        large_vocab_problem = translate_ende.TranslateEndeWmt32k()
        # Resolve both split constants up front, EVAL first, then TRAIN.
        splits = (problem.DatasetSplit.EVAL, problem.DatasetSplit.TRAIN)

        for split in splits:
            small_files = small_vocab_problem.source_data_files(split)
            large_files = large_vocab_problem.source_data_files(split)
            # Vocabulary size must not influence which raw files are used.
            self.assertListEqual(small_files, large_files)
            self.assertGreater(len(small_files), 0)
Ejemplo n.º 2
0
 def test_vocab_size(self):
     """Check `approx_vocab_size` of the 8k and 32k WMT problems.

     The 8k problem must report 8192 and the 32k problem 32768.
     """
     small_vocab_problem = translate_ende.TranslateEndeWmt8k()
     large_vocab_problem = translate_ende.TranslateEndeWmt32k()
     expectations = (
         (small_vocab_problem, 8192),
         (large_vocab_problem, 32768),
     )
     for candidate, expected_size in expectations:
         self.assertEqual(candidate.approx_vocab_size, expected_size)
Ejemplo n.º 3
0
 def test_additional_datasets(self):
     """Check neither WMT problem declares additional training datasets.

     `additional_training_datasets` must be an empty list on both the 8k
     and the 32k problem.
     """
     small_vocab_problem = translate_ende.TranslateEndeWmt8k()
     large_vocab_problem = translate_ende.TranslateEndeWmt32k()
     for candidate in (small_vocab_problem, large_vocab_problem):
         self.assertListEqual(candidate.additional_training_datasets, [])
Ejemplo n.º 4
0
 def vocab_problem(self):
     """Return a newly constructed `translate_ende.TranslateEndeWmt32k`.

     A new instance is created on every call.
     """
     wmt_32k_problem = translate_ende.TranslateEndeWmt32k()
     return wmt_32k_problem