Python LabelModel.save примеры использования

Язык программирования: Python

Пространство имен/Пакет: snorkel.labeling.model

Класс/Тип: LabelModel

Метод/Функция: save

Примеров на hotexamples.com: 3

Python LabelModel.save - 3 примера найдено. Это лучшие примеры Python кода для snorkel.labeling.model.LabelModel.save, полученные из open source проектов. Вы можете ставить оценку каждому примеру, чтобы помочь нам улучшить качество примеров.

Основные методы

Показать Скрыть

LabelModel(30)

fit(30)

predict(25)

predict_proba(19)

score(12)

_set_constants(7)

get_conditional_probs(6)

mu(5)

_set_class_balance(4)

save(3)

_generate_O(3)

_create_tree(3)

_create_L_ind(3)

_loss_mu(2)

_break_col_permutation_symmetry(2)

_get_augmented_label_matrix(2)

load(2)

m(2)

_generate_O_from_L_aug(1)

train_config(1)

_build_mask(1)

get_weights(1)

_loss_l2(1)

_init_params(1)

train_model(1)

Пример #1

Показать файл

    def train_model(self,
                    df_train: pd.DataFrame,
                    application_area_lfs: list,
                    analysis_path: str = "output",
                    label_output_path: str = "labels.jsonl",
                    save_model_path: str = None):
        """Train a Label Model from labeling functions and write out its weak labels.

        The labeling functions are applied to ``df_train``, a binary
        ``LabelModel`` is fitted on the resulting label matrix, and two files
        are written: a JSON-lines file with one record per data point kept by
        ``filter_unlabeled_dataframe`` and a CSV with the labeling function
        summary sorted by coverage.

        :param df_train: The training data for the model; its ``paperid`` column is used as the record id
        :type df_train: pd.DataFrame
        :param application_area_lfs: A list of labeling functions to use in training the Label Model
        :type application_area_lfs: list
        :param analysis_path: File name prefix of the LF analysis CSV, which is written to
            ``{self.PROJECT_ROOT}/output/{analysis_path}_{timestamp}.csv``, defaults to "output"
        :type analysis_path: str, optional
        :param label_output_path: Path to file where probabilistic labels generated by the model should be stored, defaults to "labels.jsonl"
        :type label_output_path: str, optional
        :param save_model_path: A path where the Label Model should be saved. If no path is provided, the model is not saved
        :type save_model_path: str, optional
        """
        file_name_timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
        applier = PandasLFApplier(lfs=application_area_lfs)
        L_train = applier.apply(df=df_train)

        model = LabelModel(cardinality=2, verbose=True)
        model.fit(L_train=L_train, n_epochs=800, log_freq=100)
        if save_model_path is not None:
            model.save(save_model_path)

        int_labels, prob_labels = model.predict(L=L_train,
                                                return_probs=True,
                                                tie_break_policy="abstain")
        # Both label kinds are filtered against the same label matrix, so the
        # surviving rows are expected to line up one-to-one.
        probs_df_train_filtered, probs_train_filtered = filter_unlabeled_dataframe(
            X=df_train, y=prob_labels, L=L_train)
        int_df_train_filtered, int_train_filtered = filter_unlabeled_dataframe(
            X=df_train, y=int_labels, L=L_train)
        paper_ids = list(probs_df_train_filtered["paperid"])
        assert paper_ids == list(int_df_train_filtered["paperid"])

        # Write out both labels. In the probability outputs, p_rel is the
        # second probability listed.
        with open(label_output_path, mode="w", encoding="utf-8") as out:
            for idx, paper_id in enumerate(paper_ids):
                record = {
                    "id": paper_id,
                    # cast to int and float to get rid of nonserializable numpy types
                    "is_rel": int(int_train_filtered[idx]),
                    "p_rel": float(probs_train_filtered[idx][1]),
                }
                out.write(json.dumps(record) + "\n")

        # Output LF analysis to a csv file sorted by coverage.
        lf_analysis = LFAnalysis(L=L_train,
                                 lfs=application_area_lfs).lf_summary()
        lf_analysis = lf_analysis.sort_values("Coverage")
        analysis_file = (
            f"{self.PROJECT_ROOT}/output/{analysis_path}_{file_name_timestamp}.csv"
        )
        # The encoding must be set on the handle: to_csv ignores its own
        # ``encoding`` argument for an already-open text file. ``newline=""``
        # stops the text layer from translating the CSV writer's line endings
        # a second time (blank rows on Windows).
        with open(analysis_file, "w", encoding="utf-8", newline="") as outfile:
            lf_analysis.to_csv(outfile, index=True)

Пример #2

Показать файл

Файл: test_label_model.py Проект: deepopinion/snorkel

    def test_save_and_load(self):
        """Check that a saved and re-loaded LabelModel predicts the same labels.

        A model is fitted on a tiny label matrix, saved into a temporary
        directory, loaded into a fresh ``LabelModel`` instance, and the
        predictions of both instances are compared for equality.
        """
        import os

        L = np.array([[0, -1, 0], [0, 1, 1]])
        label_model = LabelModel(cardinality=2, verbose=False)
        label_model.fit(L, n_epochs=1)
        original_preds = label_model.predict(L)

        # The context manager removes the directory even if save/load/predict
        # raises. Joining the path keeps the pickle inside the directory;
        # plain string concatenation would place it beside it, where the
        # cleanup never reaches.
        with tempfile.TemporaryDirectory() as dir_path:
            save_path = os.path.join(dir_path, "label_model.pkl")
            label_model.save(save_path)

            label_model_new = LabelModel(cardinality=2, verbose=False)
            label_model_new.load(save_path)
            loaded_preds = label_model_new.predict(L)

        np.testing.assert_array_equal(loaded_preds, original_preds)

Пример #3

Показать файл

Файл: weak_labels.py Проект: georgetown-cset/weak-labeling-experiments

def train_model(training_data: pd.DataFrame,
                testing_data: pd.DataFrame,
                L_train: np.ndarray,
                save_model=True,
                model_path: str = "../output/model_export/saved_label_model.pkl"
                ) -> LabelModel:
    """Train a label model using the label matrix generated by the labeling functions

    Only ``L_train`` is used for fitting; ``training_data`` and
    ``testing_data`` are accepted but not read by this function.

    :param training_data: Dataframe of training data (currently unused)
    :type training_data: pd.DataFrame
    :param testing_data: Dataframe of testing data (currently unused)
    :type testing_data: pd.DataFrame
    :param L_train: The matrix of labels generated by the labeling functions on the training data
    :type L_train: np.ndarray
    :param save_model: Set this to `True` to save the model to disk, defaults to `True`
    :type save_model: bool, optional
    :param model_path: Where the fitted model is saved when ``save_model`` is set; a relative
        path is resolved against the current working directory,
        defaults to "../output/model_export/saved_label_model.pkl"
    :type model_path: str, optional
    :return: A label model
    :rtype: LabelModel
    """
    import os

    # Build noise aware majority model. class_balance is left to the model;
    # a fixed [0.673, 0.327] balance was tried here previously.
    model = LabelModel(cardinality=2, verbose=True)
    model.fit(L_train=L_train, n_epochs=800, log_freq=100)

    if save_model:
        # Make sure the export directory exists so that saving does not fail
        # on a fresh checkout.
        export_dir = os.path.dirname(model_path)
        if export_dir:
            os.makedirs(export_dir, exist_ok=True)
        model.save(model_path)
    return model