Exemplo n.º 1
0
    def test_with_single_namespace_and_single_model(self, model_name):
        """Check the size of a single namespace built from a single model.

        Builds a vocabulary from ``self.single_namespace_dataset`` with
        ``"namespace_1"`` mapped to ``model_name`` and asserts that the size
        of that namespace equals the value returned by
        ``self._get_expected_vocab_size`` for the same inputs.

        Args:
            model_name: Name of the pretrained transformer mapped to the
                namespace (presumably supplied by test parametrization --
                confirm against the decorators on this method).
        """
        target_namespace = "namespace_1"
        instances = self.single_namespace_dataset

        # The reference size is computed before the vocabulary under test
        # is constructed, mirroring the order the helper is expected to run.
        wanted_size = self._get_expected_vocab_size(
            instances, target_namespace, model_name
        )

        namespace_to_model = {target_namespace: model_name}
        built_vocab = Vocabulary.from_pretrained_transformer_and_instances(
            instances, namespace_to_model
        )

        actual_size = built_vocab.get_vocab_size(target_namespace)
        assert actual_size == wanted_size
Exemplo n.º 2
0
    def test_only_updates_single_namespace_when_multiple_present(
        self, model_name
    ):
        """Check that only the mapped namespace is affected by the model.

        Uses ``self.multiple_namespace_dataset`` and maps only
        ``"namespace_1"`` to ``model_name``. The first namespace must match
        the value from ``self._get_expected_vocab_size``; the second must
        match the size reported by a vocabulary built with
        ``Vocabulary.from_instances`` on the same dataset.

        Args:
            model_name: Name of the pretrained transformer mapped to the
                first namespace (presumably supplied by test
                parametrization -- confirm against the decorators).
        """
        extended_ns = "namespace_1"
        untouched_ns = "namespace_2"
        instances = self.multiple_namespace_dataset

        # Reference sizes: the helper's value for the mapped namespace, and
        # the plain instance-derived size for the namespace left unmapped.
        extended_expected = self._get_expected_vocab_size(
            instances, extended_ns, model_name
        )
        baseline_vocab = Vocabulary.from_instances(instances)
        untouched_expected = baseline_vocab.get_vocab_size(untouched_ns)

        built_vocab = Vocabulary.from_pretrained_transformer_and_instances(
            instances, {extended_ns: model_name}
        )

        # Make sure only the desired namespace is extended.
        assert built_vocab.get_vocab_size(extended_ns) == extended_expected
        assert built_vocab.get_vocab_size(untouched_ns) == untouched_expected
Exemplo n.º 3
0
    def test_with_different_models_per_namespace(
        self, namespace1_model_name, namespace2_model_name
    ):
        """Check namespace sizes when each namespace maps to its own model.

        Uses ``self.multiple_namespace_dataset`` and maps ``"namespace_1"``
        and ``"namespace_2"`` to their respective model names. Each
        namespace's size must equal the value returned by
        ``self._get_expected_vocab_size`` for that namespace and model.

        Args:
            namespace1_model_name: Model name mapped to ``"namespace_1"``.
            namespace2_model_name: Model name mapped to ``"namespace_2"``.
        """
        first_ns = "namespace_1"
        second_ns = "namespace_2"
        instances = self.multiple_namespace_dataset

        # Both reference sizes are computed (first namespace, then second)
        # before the vocabulary under test is constructed.
        first_expected = self._get_expected_vocab_size(
            instances, first_ns, namespace1_model_name
        )
        second_expected = self._get_expected_vocab_size(
            instances, second_ns, namespace2_model_name
        )

        namespace_to_model = {
            first_ns: namespace1_model_name,
            second_ns: namespace2_model_name,
        }
        built_vocab = Vocabulary.from_pretrained_transformer_and_instances(
            instances, namespace_to_model
        )

        assert built_vocab.get_vocab_size(first_ns) == first_expected
        assert built_vocab.get_vocab_size(second_ns) == second_expected