コード例 #1
0
ファイル: train.py プロジェクト: catnlp/catnlp
import argparse
import logging.config

from catnlp.common.load_file import load_config_file
from catnlp.ner.train import NerTrain

if __name__ == "__main__":
    # Script entry point: read the command-line options, load the training
    # and logging configuration files, then build the trainer for the task.
    parser = argparse.ArgumentParser(description="训练模型")
    parser.add_argument("--task", type=str, default="NER", help="任务")
    parser.add_argument("--train_config",
                        type=str,
                        default="resources/config/ner/bert_biaffine.yaml",
                        help="训练配置")
    parser.add_argument("--log_config",
                        type=str,
                        default="resources/config/ner/logging.yaml",
                        help="日志配置")
    args = parser.parse_args()

    try:
        train_config = load_config_file(args.train_config)
        # The logging config is still loaded, so an unreadable file fails
        # here, but it is not applied while the dictConfig call below stays
        # commented out.
        log_config = load_config_file(args.log_config)
        # logging.config.dictConfig(log_config)
    except Exception as err:
        # Explicitly chain the underlying error as the cause of the
        # RuntimeError so the traceback names the real failure.
        raise RuntimeError("加载配置文件失败") from err

    # The task name is compared case-insensitively; "ner" is the only value
    # handled, anything else is rejected.
    task = args.task.lower()
    if task == "ner":
        # NOTE(review): nothing is called on ner_train afterwards, so the
        # constructor presumably runs the training itself - confirm.
        ner_train = NerTrain(train_config)
    else:
        raise RuntimeError(f"{args.task}未开发")
コード例 #2
0
        type=str,
        default="resources/data/dataset/ner/zh/ccks/cmeee/0815",
        help="结果文件")
    parser.add_argument(
        "--predict_config",
        type=str,
        default="resources/config/ner/CMeEE/fusion_biaffine_kfold.yaml",
        help="预测配置")
    parser.add_argument("--log_config",
                        type=str,
                        default="resources/config/ner/logging.yaml",
                        help="日志配置")
    args = parser.parse_args()

    try:
        predict_config = load_config_file(args.predict_config)
        log_config = load_config_file(args.log_config)
        # logging.config.dictConfig(log_config)
    except Exception:
        raise RuntimeError("加载配置文件失败")

    task = args.task.lower()
    if task == "ner":
        print(predict_config)
        ner_service = NerFusion(predict_config)

        output_file = args.output_dir + f"/test_pred.json"
        with open(args.input_file, "r", encoding="utf-8") as sf, \
                open(output_file, "w", encoding="utf-8") as tf:
            lines = sf.readlines()
            for line in tqdm(lines):