def setUp(self):
     self.data_handler = JointModelDataHandler.from_config(
         JointModelDataHandler.Config(),
         FeatureConfig(),
         [DocLabelConfig(), WordLabelConfig()],
         featurizer=SimpleFeaturizer.from_config(SimpleFeaturizer.Config(),
                                                 FeatureConfig()),
     )
Beispiel #2
0
    def test_intializing_embeds_from_config(self):
        feature_config = FeatureConfig(
            word_feat=WordFeatConfig(
                embedding_init_strategy=EmbedInitStrategy.RANDOM,
                embed_dim=5,
                pretrained_embeddings_path=tests_module.TEST_BASE_DIR,
            )
        )
        data_handler = JointModelDataHandler.from_config(
            JointModelDataHandler.Config(),
            feature_config,
            [DocLabelConfig(), WordLabelConfig()],
            featurizer=SimpleFeaturizer.from_config(
                SimpleFeaturizer.Config(), feature_config
            ),
        )

        data_handler.init_metadata_from_path(TRAIN_FILE, EVAL_FILE, TEST_FILE)

        pretrained_embeds = data_handler.metadata.features[
            DatasetFieldName.TEXT_FIELD
        ].pretrained_embeds_weight
        # test random initialization (values should be non-0)
        np.testing.assert_array_less(
            [0, 0, 0, 0, 0], np.absolute(pretrained_embeds[11].numpy())
        )

        feature_config = FeatureConfig(
            word_feat=WordFeatConfig(
                embedding_init_strategy=EmbedInitStrategy.ZERO,
                embed_dim=5,
                pretrained_embeddings_path=tests_module.TEST_BASE_DIR,
            )
        )
        data_handler = JointModelDataHandler.from_config(
            JointModelDataHandler.Config(),
            feature_config,
            [DocLabelConfig(), WordLabelConfig()],
            featurizer=SimpleFeaturizer.from_config(
                SimpleFeaturizer.Config(), feature_config
            ),
        )
        data_handler.init_metadata_from_path(TRAIN_FILE, EVAL_FILE, TEST_FILE)

        pretrained_embeds = data_handler.metadata.features[
            DatasetFieldName.TEXT_FIELD
        ].pretrained_embeds_weight
        # test zero initialization (values should all be 0)
        np.testing.assert_array_equal([0, 0, 0, 0, 0], pretrained_embeds[11].numpy())
Beispiel #3
0
 class Config(Task.Config):
     labels: List[TargetConfigBase]
     model: JointModel.Config = JointModel.Config()
     trainer: Trainer.Config = Trainer.Config()
     data_handler: JointModelDataHandler.Config = JointModelDataHandler.Config(
     )
     metric_reporter: IntentSlotMetricReporter.Config = (
         IntentSlotMetricReporter.Config())
Beispiel #4
0
 class Config(Task.Config):
     model: WordTaggingModel.Config = WordTaggingModel.Config()
     trainer: Trainer.Config = Trainer.Config()
     labels: WordLabelConfig = WordLabelConfig()
     data_handler: JointModelDataHandler.Config = JointModelDataHandler.Config(
     )
     metric_reporter: WordTaggingMetricReporter.Config = (
         WordTaggingMetricReporter.Config())
Beispiel #5
0
 class Config(Task.Config):
     model: Union[BaggingDocEnsemble.Config, BaggingIntentSlotEnsemble.Config]
     trainer: EnsembleTrainer.Config = EnsembleTrainer.Config()
     labels: List[TargetConfigBase]
     data_handler: JointModelDataHandler.Config = JointModelDataHandler.Config()
     metric_reporter: Union[
         ClassificationMetricReporter.Config, IntentSlotMetricReporter.Config
     ]