コード例 #1
0
ファイル: reproduction.py プロジェクト: rgeorgi/intent
def extract_pos(ef: ExperimentFiles, overwrite=False):
    """
    Run tagger extraction for each tagger configuration provided by *ef*.

    A configuration is processed when its tagger path does not exist yet,
    or unconditionally when *overwrite* is true. With ``USE_CONDOR`` set,
    the configuration's arguments are handed to ``condorify``; otherwise
    ``extract_from_xigt`` is called directly.

    If at least one extraction was started and ``USE_CONDOR`` is set, the
    function finishes by calling ``condor.condor_wait_notify`` (when
    ``condor_email`` is set) or ``condor.condor_wait``.

    :param ef: object whose ``tagger_configs()`` yields the configurations.
    :param overwrite: re-run extraction even if the tagger path exists.
    """
    dispatched = False

    for config in ef.tagger_configs():
        tagger_present = os.path.exists(config.tagger_path())
        if tagger_present and not overwrite:
            # Tagger is already on disk and no overwrite was requested.
            continue

        if USE_CONDOR:
            condorify(*config.extract_args(True))
        else:
            positional, keywords = config.extract_args(False)
            extract_from_xigt(positional, **keywords)

        dispatched = True

    # The Condor wait step only applies when something was actually started
    # and Condor is in use.
    if not (dispatched and USE_CONDOR):
        return

    if condor_email:
        condor.condor_wait_notify(
            "Taggers have been extracted.",
            condor_email,
            "CONDOR: POS Tagger Extraction Complete",
        )
    else:
        condor.condor_wait()
コード例 #2
0
ファイル: intent.py プロジェクト: rgeorgi/intent
# STATS: run igt_stats over the flattened FILE arguments, passing
# type='xigt' and show_filename=True.
elif args.subcommand == CMD_STATS:
    igt_stats(flatten_list(args.FILE), type='xigt', show_filename=True)

# SPLIT: hand the flattened FILE list to split_corpus together with the
# train/dev/test, prefix, overwrite and nfold options from the command line.
elif args.subcommand == CMD_SPLIT:
    split_corpus(flatten_list(args.FILE), args.train, args.dev, args.test, prefix=args.prefix, overwrite=args.overwrite,
                 nfold=args.nfold)

# FILTER: the input and output values are looked up on args by the attribute
# names held in ARG_INFILE / ARG_OUTFILE; every parsed option is additionally
# forwarded as a keyword argument.
# NOTE(review): vars(args) also contains the infile/outfile entries --
# presumably filter_corpus absorbs them via **kwargs; confirm.
elif args.subcommand == CMD_FILTER:
    filter_corpus(flatten_list(getattr(args, ARG_INFILE)), getattr(args, ARG_OUTFILE), **vars(args))

# EXTRACT: forward every parsed option as a keyword argument, with
# input_filelist supplied explicitly from the flattened FILE arguments.
# NOTE(review): this relies on args having no attribute named
# 'input_filelist', otherwise the call gets a duplicate keyword -- confirm.
elif args.subcommand == CMD_EXTRACT:
    extract_from_xigt(input_filelist=flatten_list(args.FILE), **vars(args))

# EVAL: map the parsed command-line options onto evaluate_intent's keyword
# arguments; the flattened FILE list is the only positional argument.
elif args.subcommand == CMD_EVAL:
    evaluate_intent(flatten_list(args.FILE),
                    eval_alignment=args.alignment,
                    eval_ds=args.ds_projection,
                    eval_posproj=args.pos_projection,
                    classifier_path=args.classifier,
                    classifier_feats=args.classifier_feats,
                    eval_tagger=args.pos_tagger,
                    gold_tagmap=args.tagmap_gold, trans_tagmap=args.tagmap_trans, outpath=args.output)

# TEXT CONVERT: args.FILE is passed to text_to_xigtxml as-is (not through
# flatten_list, unlike the branches above); the result is kept in xc.
elif args.subcommand == CMD_TEXT:
    xc = text_to_xigtxml(args.FILE)