def test_batched(self):
    valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests:chunky',
            model='parlai.agents.test_agents.test_agents:MockTorchAgent',
            batchsize=32,
        ),
        valid_datatype='valid:stream',
        test_datatype='test:stream',
    )
    assert valid['exs'] == 100
    assert test['exs'] == 100
def test_stream_only(self):
    # the chunky teacher only supports streaming, so non-stream datatypes
    # ('valid', 'test') should raise
    with self.assertRaises(ValueError):
        valid, test = testing_utils.eval_model(
            dict(
                task='integration_tests:chunky',
                model='parlai.agents.test_agents.test_agents:MockTorchAgent',
                batchsize=32,
            ),
            valid_datatype='valid',
        )
    with self.assertRaises(ValueError):
        valid, test = testing_utils.eval_model(
            dict(
                task='integration_tests:chunky',
                model='parlai.agents.test_agents.test_agents:MockTorchAgent',
                batchsize=32,
            ),
            valid_datatype='valid:stream',
            test_datatype='test',
        )
def test_multitasking_metrics_macro(self):
    valid, test = testing_utils.eval_model(
        {
            'task': 'integration_tests:candidate,'
            'integration_tests:multiturnCandidate',
            'model': 'random_candidate',
            'aggregate_micro': False,
        }
    )
    task1_acc = valid['integration_tests:candidate/accuracy']
    task2_acc = valid['integration_tests:multiturnCandidate/accuracy']
    total_acc = valid['accuracy']
    # task 2 is 4 times the size of task 1, but macro aggregation weights
    # the two tasks equally
    self.assertEqual(
        total_acc.value(),
        (task1_acc.value() + task2_acc.value()) * 0.5,
        'Task accuracy is averaged incorrectly',
    )
def test_multitasking_metrics(self):
    valid, test = testing_utils.eval_model(
        {
            'task': 'integration_tests:candidate,'
            'integration_tests:multiturnCandidate',
            'model': 'random_candidate',
            'num_epochs': 0.5,
        }
    )
    task1_acc = valid['integration_tests:candidate/accuracy']
    task2_acc = valid['integration_tests:multiturnCandidate/accuracy']
    total_acc = valid['accuracy']
    # task 2 is 4 times the size of task 1; summing AverageMetrics pools
    # numerators and denominators, so this checks micro-averaged accuracy
    self.assertEqual(
        total_acc,
        task1_acc + task2_acc,
        'Task accuracy is averaged incorrectly',
    )
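# --- Illustrative sketch (not part of the original tests) ---
# Assuming ParlAI's AverageMetric semantics (parlai.core.metrics): summing
# metrics pools numerators and denominators (micro average), while averaging
# the .value() results weights each task equally (macro average). This is the
# distinction the two multitasking tests above assert.
def _demo_micro_vs_macro_averaging():
    from parlai.core.metrics import AverageMetric

    task1 = AverageMetric(1, 2)  # 1 correct out of 2 examples -> 0.5
    task2 = AverageMetric(6, 8)  # 6 correct out of 8 examples -> 0.75
    micro = (task1 + task2).value()  # (1 + 6) / (2 + 8) = 0.7
    macro = (task1.value() + task2.value()) * 0.5  # (0.5 + 0.75) / 2 = 0.625
    assert micro == 0.7 and macro == 0.625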
def test_short_pacer_pretrain(self):
    opt = {
        'model': 'projects.light_whoami.agents.pacer:PacerPartialOnlyAgent',
        'model_file': VANILLA_128,
        'predictor_model_file': RPA_RERANKER,
        'pacer_n_tokens': 10,
        'pacer_frequency_ratio': 0.1,
        'beam_min_length': 10,
        **COMMON_OPT,
    }
    testing_utils.eval_model(opt, skip_test=True)
    opt = {
        'model': 'projects.light_whoami.agents.pacer:PacerAgent',
        'model_file': VANILLA_128,
        'predictor_model_file': RPA_RERANKER,
        'pacer_n_tokens': 10,
        'pacer_frequency_ratio': 0.1,
        'beam_min_length': 10,
        **COMMON_OPT,
    }
    testing_utils.eval_model(opt, skip_test=True)
def test_multi_task(self):
    """
    Test model trained multi-task on dialogue datasets.
    """
    valid, _ = testing_utils.eval_model(
        opt={
            **SHARED_OPTS,
            'model_file': 'zoo:blended_skill_talk/multi_task/model',
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['accuracy'], 0.9062, delta=0.005)
def test_multi_task_bst_tuned(self):
    """
    Test model trained multi-task and then tuned on BlendedSkillTalk.
    """
    valid, _ = testing_utils.eval_model(
        opt={
            **SHARED_OPTS,
            'model_file': 'zoo:blended_skill_talk/multi_task_bst_tuned/model',
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['accuracy'], 0.9219, delta=0.005)
def test_wizard_single_task(self):
    """
    Test model trained single-task on Wizard of Wikipedia.
    """
    valid, _ = testing_utils.eval_model(
        opt={
            **SHARED_OPTS,
            'model_file': 'zoo:blended_skill_talk/wizard_single_task/model',
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['accuracy'], 0.7500, delta=0.005)
def test_ed_single_task(self):
    """
    Test model trained single-task on EmpatheticDialogues.
    """
    valid, _ = testing_utils.eval_model(
        opt={
            **SHARED_OPTS,
            'model_file': 'zoo:blended_skill_talk/ed_single_task/model',
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['accuracy'], 0.7656, delta=0.005)
def test_convai2_single_task(self):
    """
    Test model trained single-task on ConvAI2.
    """
    valid, _ = testing_utils.eval_model(
        opt={
            **SHARED_OPTS,
            'model_file': 'zoo:blended_skill_talk/convai2_single_task/model',
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['accuracy'], 0.8438, delta=0.005)
def test_long_pacer(self):
    opt = {
        'model': 'projects.light_whoami.agents.pacer:LongPacerPartialOnlyAgent',
        'model_file': TEST_TGA,
        'predictor_model_file': TEST_RPA_RERANKER,
        'pacer_n_tokens': 10,
        'pacer_frequency_ratio': 0.1,
        'beam_min_length': 10,
        **COMMON_OPT,
    }
    testing_utils.eval_model(opt, skip_test=True)
    opt = {
        'model': 'projects.light_whoami.agents.pacer:LongPacerAgent',
        'model_file': TEST_TGA,
        'predictor_model_file': TEST_RPA_RERANKER,
        'pacer_n_tokens': 10,
        'pacer_frequency_ratio': 0.1,
        'beam_min_length': 10,
        **COMMON_OPT,
    }
    testing_utils.eval_model(opt, skip_test=True)
def test_world_logging(self):
    with testing_utils.tempdir() as tmpdir:
        save_report = os.path.join(tmpdir, 'report')
        testing_utils.eval_model(
            dict(
                model_file='zoo:unittest/transformer_generator2/model',
                task='integration_tests:multiturn_candidate',
                world_logs=save_report,
                report_filename=save_report,
                truncate=1024,
                dynamic_batching='full',
                batchsize=4,
            )
        )
        convo_file = str(save_report) + '.jsonl'
        convos = Conversations(convo_file)
        for convo in convos:
            # each episode is 4 turns, with a teacher and a model message per turn
            self.assertEqual(len(convo), 2 * 4)
            # now assert that all turns come from the same dynamic batch index
            dyn_batch_idx = convo[0]['dyn_batch_idx']
            for i, turn in enumerate(convo):
                if i % 2 == 0 and i > 0:
                    # we log the batch index in the teacher acts only
                    self.assertEqual(dyn_batch_idx, turn['dyn_batch_idx'])
def test_ppl(self):
    valid, _ = testing_utils.eval_model(
        {
            'model': 'transformer/generator',
            'model_file': 'zoo:tutorial_transformer_generator/model',
            'task': 'dailydialog',
            'skip_generation': 'true',
            'num_examples': 512,
            'batchsize': 32,
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['ppl'], 19.59, places=2)
    self.assertAlmostEqual(valid['token_acc'], 0.4234, places=4)
def test_hogwild_eval(self):
    """
    Test eval with numthreads > 1 and batchsize in [1,2,3].
    """
    opt = dict(
        task='integration_tests:repeat:{}'.format(NUM_EXS), model='repeat_label'
    )
    for nt in NUM_THREADS_CHOICES:
        for bs in BATCHSIZE_CHOICES:
            opt['numthreads'] = nt
            opt['batchsize'] = bs
            valid, test = testing_utils.eval_model(opt)
            self.assertEqual(valid['exs'], NUM_EXS)
            self.assertEqual(test['exs'], NUM_EXS)
def test_hogwild_eval(self):
    """Test eval with numthreads > 1 and batchsize in [1,2,3]."""
    opt = dict(
        task='tasks.repeat:RepeatTeacher:{}'.format(NUM_EXS), model='repeat_label'
    )
    for nt in NUM_THREADS_CHOICES:
        for bs in BATCHSIZE_CHOICES:
            opt['numthreads'] = nt
            opt['batchsize'] = bs
            stdout, valid, test = testing_utils.eval_model(opt)
            self.assertEqual(valid['exs'], NUM_EXS, 'LOG:\n{}'.format(stdout))
            self.assertEqual(test['exs'], NUM_EXS, 'LOG:\n{}'.format(stdout))
def test_set_model_file_without_dict_file(self):
    """Check that moving a model without moving the dictfile raises an error."""
    # Download model, then remove its dict file
    datapath = ParlaiParser().parse_args(print_args=False)['datapath']
    try:
        # remove unittest models if there before
        shutil.rmtree(os.path.join(datapath, 'models/unittest'))
    except FileNotFoundError:
        pass
    testing_utils.download_unittest_models()
    zoo_path = 'zoo:unittest/seq2seq/model'
    model_path = modelzoo_path(datapath, zoo_path)
    os.remove(model_path + '.dict')
    # Test that eval model fails
    with self.assertRaises(RuntimeError):
        testing_utils.eval_model(dict(task='babi:task1k:1', model_file=model_path))
    try:
        # remove unittest models if there after
        shutil.rmtree(os.path.join(datapath, 'models/unittest'))
    except FileNotFoundError:
        pass
def test_set_model_file_without_dict_file(self):
    """
    Check that moving a model without moving the dictfile raises an error.
    """
    # Download model into a temporary datapath, then remove its dict file
    with testing_utils.tempdir() as datapath:
        try:
            # remove unittest models if there before
            shutil.rmtree(os.path.join(datapath, 'models/unittest'))
        except FileNotFoundError:
            pass
        zoo_path = 'zoo:unittest/seq2seq/model'
        model_path = modelzoo_path(datapath, zoo_path)
        PathManager.rm(model_path + '.dict')
        # Test that eval model fails
        with self.assertRaises(RuntimeError):
            testing_utils.eval_model(
                dict(task='babi:task1k:1', model_file=model_path)
            )
        try:
            # remove unittest models if there after
            shutil.rmtree(os.path.join(datapath, 'models/unittest'))
        except FileNotFoundError:
            pass
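# --- Illustrative sketch (not from the original test files) ---
# modelzoo_path (parlai.core.build_data) resolves a 'zoo:' alias to a local
# path under the datapath (downloading the model on first use), which is why
# both tests above clean up <datapath>/models/unittest. A minimal demo,
# assuming the standard '<datapath>/models/...' layout:
def _demo_modelzoo_path(datapath: str) -> str:
    from parlai.core.build_data import modelzoo_path

    # e.g. '/tmp/data' -> '/tmp/data/models/unittest/seq2seq/model'
    return modelzoo_path(datapath, 'zoo:unittest/seq2seq/model')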
def test_backwards_compatibility(self):
    valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests:multiturn_candidate',
            model='seq2seq',
            model_file='zoo:unittest/seq2seq/model',
            dict_file='zoo:unittest/seq2seq/model.dict',
        )
    )
    self.assertLessEqual(valid['ppl'], 1.01)
    self.assertGreaterEqual(valid['accuracy'], 0.999)
    self.assertGreaterEqual(valid['f1'], 0.999)
    self.assertLessEqual(test['ppl'], 1.01)
    self.assertGreaterEqual(test['accuracy'], 0.999)
    self.assertGreaterEqual(test['f1'], 0.999)
def _test_zoo_file(mf: str, fid: bool = False, fid_rag: bool = False):
    opt = copy.deepcopy(common_opt)
    if fid:
        opt['model'] = 'fid'
    if fid_rag:
        opt['dpr_model_file'] = RAG_TOKEN_ZOO_MODEL
    opt.update(GENERATION_OPTS['bart'])
    opt['model_file'] = mf
    opt['generation_model'] = 'bart'
    opt['task'] = 'wizard_of_wikipedia'
    opt['label_truncate'] = 10
    valid, _ = testing_utils.eval_model(opt, skip_test=True)
    assert valid['ppl'] < 15.0
    assert (100 * float(valid['f1'])) > 10.0
    torch.cuda.empty_cache()
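# Hypothetical invocations of the helper above (the model-file constants here
# are placeholders for illustration, not names taken from the original file):
#
#     _test_zoo_file(RAG_ZOO_MODEL)
#     _test_zoo_file(FID_ZOO_MODEL, fid=True)
#     _test_zoo_file(FID_RAG_ZOO_MODEL, fid=True, fid_rag=True)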
def test_generator_backcomp(self):
    """
    Tests that the generator model files work over time.
    """
    testing_utils.download_unittest_models()
    stdout, valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests:multipass',
            model='transformer/generator',
            model_file='zoo:unittest/transformer_generator2/model',
            dict_file='zoo:unittest/transformer_generator2/model.dict',
            rank_candidates=True,
            batchsize=64,
        )
    )
    self.assertGreaterEqual(
        valid['hits@1'],
        0.95,
        'valid hits@1 = {}\nLOG:\n{}'.format(valid['hits@1'], stdout),
    )
    self.assertLessEqual(
        valid['ppl'], 1.01, 'valid ppl = {}\nLOG:\n{}'.format(valid['ppl'], stdout)
    )
    self.assertGreaterEqual(
        valid['accuracy'],
        0.99,
        'valid accuracy = {}\nLOG:\n{}'.format(valid['accuracy'], stdout),
    )
    self.assertGreaterEqual(
        valid['f1'], 0.99, 'valid f1 = {}\nLOG:\n{}'.format(valid['f1'], stdout)
    )
    self.assertGreaterEqual(
        test['hits@1'],
        0.95,
        'test hits@1 = {}\nLOG:\n{}'.format(test['hits@1'], stdout),
    )
    self.assertLessEqual(
        test['ppl'], 1.01, 'test ppl = {}\nLOG:\n{}'.format(test['ppl'], stdout)
    )
    self.assertGreaterEqual(
        test['accuracy'],
        0.99,
        'test accuracy = {}\nLOG:\n{}'.format(test['accuracy'], stdout),
    )
    self.assertGreaterEqual(
        test['f1'], 0.99, 'test f1 = {}\nLOG:\n{}'.format(test['f1'], stdout)
    )
def test_save_report(self):
    """
    Test that we can save a report from eval model.
    """
    with testing_utils.tempdir() as tmpdir:
        save_report = os.path.join(tmpdir, 'report')
        opt = dict(
            task='integration_tests',
            model='repeat_label',
            datatype='valid',
            num_examples=5,
            display_examples=False,
            save_world_logs=True,
            report_filename=save_report,
        )
        valid, test = testing_utils.eval_model(opt)
def test_released_model(self):
    """
    Check the pretrained model produces correct results.
    """
    _, test = testing_utils.eval_model(
        {
            'model_file': 'zoo:self_feeding/hh131k_hb60k_fb60k_st1k/model',
            'task': 'self_feeding:all',
            'batchsize': 20,
        },
        skip_valid=True,
    )
    self.assertAlmostEqual(test['dia_acc'], 0.506, delta=0.001)
    self.assertAlmostEqual(test['fee_acc'], 0.744, delta=0.001)
    self.assertAlmostEqual(test['sat_f1'], 0.8343, delta=0.0001)
def test_beamsearch(self):
    """
    Ensures beam search can generate the correct response.
    """
    valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests:multiturn_nocandidate',
            model='seq2seq',
            model_file='zoo:unittest/seq2seq/model',
            dict_file='zoo:unittest/seq2seq/model.dict',
            skip_generation=False,
            inference='beam',
            beam_size=5,
        )
    )
    self.assertGreater(valid['accuracy'], 0.95)
    self.assertGreater(test['accuracy'], 0.95)
def test_convai2_finetuned_greedy(self):
    """
    Check the greedy model produces correct results.
    """
    valid, _ = testing_utils.eval_model(
        {
            'model_file': 'zoo:controllable_dialogue/convai2_finetuned_baseline',
            'task': 'projects.controllable_dialogue.tasks.agents',
            'beam_size': 1,
            'batchsize': 64,
        },
        skip_test=True,
    )
    self.assertAlmostEqual(valid['ppl'], 22.86, delta=0.1)
    self.assertAlmostEqual(valid['f1'], 0.1702, delta=0.0002)
def test_greedy(self):
    """
    Test a simple multiturn task.
    """
    valid, test = testing_utils.eval_model(
        dict(
            task="integration_tests:multiturn_candidate",
            model="hred",
            model_file="zoo:unittest/hred_model/model",
            dict_file="zoo:unittest/hred_model/model.dict",
            skip_generation=False,
            batchsize=32,
        )
    )
    self.assertLess(valid["ppl"], 1.2)
    self.assertLess(test["ppl"], 1.2)
def _check_losses(
    self, opt: Opt, test_name: str, data_regression: DataRegressionFixture
):
    """
    Calculate and check distillation loss terms.

    Given the input opt, run eval and check each of the loss terms to make sure
    that they match what is expected.
    """
    valid, _ = testing_utils.eval_model(opt, skip_test=True)
    losses = {}
    loss_types = self.LOSS_TYPES[test_name]
    for loss_type in loss_types:
        losses[loss_type] = round_sig(valid[loss_type].value(), sig=6)
    basename = self._get_model_identifier() + '_' + test_name
    data_regression.check(losses, basename=basename)
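# --- Illustrative sketch (not from the original test file) ---
# `round_sig` above is a helper from the distillation test module; a plausible
# implementation that rounds to `sig` significant figures (an assumption for
# illustration, not necessarily the original) looks like this:
import math

def _round_sig_sketch(x: float, sig: int = 6) -> float:
    if x == 0:
        return 0.0
    # shift the rounding position so that `sig` significant digits survive
    return round(x, sig - int(math.floor(math.log10(abs(x)))) - 1)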
def test_transresnet(self):
    """
    Test pretrained model.
    """
    stdout, _, test = testing_utils.eval_model(MODEL_OPTIONS, skip_valid=True)
    # Overall
    self.assertEqual(
        test['accuracy'],
        0.3667,
        'test accuracy = {}\nLOG:\n{}'.format(test['accuracy'], stdout),
    )
    self.assertEqual(
        test['hits@5'],
        0.633,
        'test hits@5 = {}\nLOG:\n{}'.format(test['hits@5'], stdout),
    )
    self.assertEqual(
        test['hits@10'],
        0.767,
        'test hits@10 = {}\nLOG:\n{}'.format(test['hits@10'], stdout),
    )
    # First round
    self.assertEqual(
        test['first_round']['hits@1/100'],
        0.2,
        'test first round hits@1/100 = {}\nLOG:\n{}'.format(
            test['first_round']['hits@1/100'], stdout
        ),
    )
    # Second round
    self.assertEqual(
        test['second_round']['hits@1/100'],
        0.5,
        'test second round hits@1/100 = {}\nLOG:\n{}'.format(
            test['second_round']['hits@1/100'], stdout
        ),
    )
    # Third round
    self.assertEqual(
        test['third_round+']['hits@1/100'],
        0.4,
        'test third round hits@1/100 = {}\nLOG:\n{}'.format(
            test['third_round+']['hits@1/100'], stdout
        ),
    )
def test_retrieval(self):
    stdout, _, test = testing_utils.eval_model(RETRIEVAL_OPTIONS)
    self.assertGreaterEqual(
        test['accuracy'],
        0.86,
        'test acc = {}\nLOG:\n{}'.format(test['accuracy'], stdout),
    )
    self.assertGreaterEqual(
        test['hits@5'],
        0.98,
        'test hits@5 = {}\nLOG:\n{}'.format(test['hits@5'], stdout),
    )
    self.assertGreaterEqual(
        test['hits@10'],
        0.99,
        'test hits@10 = {}\nLOG:\n{}'.format(test['hits@10'], stdout),
    )
def test_backcomp(self):
    """
    Tests that the memnn model files continue to work over time.
    """
    valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests',
            model='memnn',
            model_file='zoo:unittest/memnn/model',
            dict_file='zoo:unittest/memnn/model.dict',
            batchsize=16,
        )
    )
    self.assertGreaterEqual(valid['accuracy'], 0.88)
    self.assertGreaterEqual(valid['f1'], 0.999)
    self.assertGreaterEqual(test['accuracy'], 0.84)
    self.assertGreaterEqual(test['f1'], 0.999)
def test_generation(self):
    """
    This test uses a multi-turn sequence repetition task.
    """
    valid, test = testing_utils.eval_model(
        dict(
            task='integration_tests:multiturn_nocandidate',
            model='seq2seq',
            model_file='zoo:unittest/seq2seq/model',
            dict_file='zoo:unittest/seq2seq/model.dict',
            skip_generation=False,
            inference='greedy',
            batchsize=8,
            num_examples=32,
        )
    )
    self.assertLess(valid['ppl'], 1.2)
    self.assertLess(test['ppl'], 1.2)