pred = clf.predict(test)
    pred_unknow = clf.predict_unknow(test)
    #    print pred
    print "precision:", clf.metrics_precision(test_label, pred_unknow)
    print "recall:", clf.metrics_recall(test_label, pred_unknow)
    print "f1:", clf.metrics_f1(test_label, pred_unknow)
    print "accuracy:", clf.metrics_accuracy(test_label, pred_unknow)
    print "zero_one_loss:", clf.metrics_zero_one_loss(test_label, pred_unknow)
    test_proba = clf.predict_max_proba(test)
    print "my_zero_one_loss:", clf.metrics_my_zero_one_loss(test_proba)
    print
    clf.metrics_correct(test_label, pred_unknow)
    plot.get_instance()
    plot.plot_roc(test_label,
                  clf.predict_proba(test),
                  classes=clf.bayes.classes_.tolist(),
                  detail=True)
    plot.show()

    # 加载主客观分类数据集
#    feature = CHIFeature(subjective=False)
#    train_datas, class_label, _ = feature.get_key_words()
#    train = train_datas
#    if not sp.issparse(train_datas):
#        train = feature.cal_weight(train_datas)
#
#    test = Load.load_test_objective_balance()
#    test_datas, test_label, _ = feature.get_key_words(test)
#    test = test_datas
#    # 构建适合 bayes 分类的数据集
#    if not sp.issparse(train_datas):
Example #2
0
            print "origin my_zero_one_loss:", clf.metrics_my_zero_one_loss(test_proba)
            print
            clf.metrics_correct(test_label, pred_unknow)
#            plot.plot_roc(test_label, clf.predict_proba(test), classes=clf.bayes.classes_.tolist(), text='origin')

#        bayes.update(c_pred[0], test_datas[0].get("sentence"))
        incr_train_datas = Load.load_incr_datas()
        incr_train, incr_class_label, _ = feature.get_key_words(incr_train_datas)
        # 构建适合 bayes 分类的增量集
        fit_incr_train = incr_train
        if not sp.issparse(incr_train):
            fit_incr_train = feature.cal_weight_improve(incr_train, incr_class_label)

        clf.get_incr_classificator(fit_incr_train, incr_class_label, train, class_label, method=method_options[i])
        pred_unknow = clf.predict_unknow(test)

        print "incr precision:", clf.metrics_precision(test_label, pred_unknow)
        print "incr recall:", clf.metrics_recall(test_label, pred_unknow)
        print "incr f1:", clf.metrics_f1(test_label, pred_unknow)
        print "incr accuracy:", clf.metrics_accuracy(test_label, pred_unknow)
        print "incr zero_one_loss:", clf.metrics_zero_one_loss(test_label, pred_unknow)
        test_proba = clf.predict_max_proba(test)
        print "incr my_zero_one_loss:", clf.metrics_my_zero_one_loss(test_proba)
        print
        clf.metrics_correct(test_label, pred_unknow)
        plot.plot_roc(test_label, clf.predict_proba(test),
                      linestyle=linestyle[i],
                      classes=clf.bayes.classes_.tolist(),
                      text='incr ' + method_options_0[i])
    plot.show()
                          isbalance=False, minority_target=EMOTION_CLASS.keys())

    pred = clf.predict(test)
    pred_unknow = clf.predict_unknow(test)
#    print pred
    print "precision:", clf.metrics_precision(test_label, pred_unknow)
    print "recall:", clf.metrics_recall(test_label, pred_unknow)
    print "f1:", clf.metrics_f1(test_label, pred_unknow)
    print "accuracy:", clf.metrics_accuracy(test_label, pred_unknow)
    print "zero_one_loss:", clf.metrics_zero_one_loss(test_label, pred_unknow)
    test_proba = clf.predict_max_proba(test)
    print "my_zero_one_loss:", clf.metrics_my_zero_one_loss(test_proba)
    print
    clf.metrics_correct(test_label, pred_unknow)
    plot.get_instance()
    plot.plot_roc(test_label, clf.predict_proba(test), classes=clf.bayes.classes_.tolist(), detail=True)
    plot.show()

    # 加载主客观分类数据集
#    feature = CHIFeature(subjective=False)
#    train_datas, class_label, _ = feature.get_key_words()
#    train = train_datas
#    if not sp.issparse(train_datas):
#        train = feature.cal_weight(train_datas)
#
#    test = Load.load_test_objective_balance()
#    test_datas, test_label, _ = feature.get_key_words(test)
#    test = test_datas
#    # 构建适合 bayes 分类的数据集
#    if not sp.issparse(train_datas):
#        test = feature.cal_weight(test_datas)