# Sentencepiece ("*.sp") stage: clean-up followed by guided alignment of the
# training and validation corpora.
# NOTE(review): this chunk had been flattened onto one physical line; the
# nesting below is reconstructed from statement order -- confirm it against
# the intended layout of the surrounding script.

# Remove the target-language "eval.clean" file if it exists.
if os.path.exists("eval.clean." + TL):
    os.remove("eval.clean." + TL)

# Guided alignment of the "train.sp" corpus.
if GUIDED_ALIGNMENT:
    if VERBOSE:
        print("GUIDED ALIGNMENT TRAINING", datetime.now())
    if DELETE_EXISTING:
        # Drop any existing source-side and target-side .align files first.
        FILE = "train.sp." + SL + "." + SL + ".align"
        if os.path.exists(FILE):
            os.remove(FILE)
        FILE = "train.sp." + TL + "." + TL + ".align"
        if os.path.exists(FILE):
            os.remove(FILE)
    if ALIGNER == "fast_align":
        # The helper module is imported from the MTUOC directory, so that
        # directory has to be on sys.path before the import runs.
        sys.path.append(MTUOC)
        from MTUOC_guided_alignment_fast_align import guided_alignment_fast_align
        guided_alignment_fast_align(
            MTUOC, "train.sp", "train.sp", SL, TL, BOTH_DIRECTIONS, VERBOSE
        )
    if ALIGNER == "eflomal":
        sys.path.append(MTUOC)
        from MTUOC_guided_alignment_eflomal import guided_alignment_eflomal
        guided_alignment_eflomal(
            MTUOC, "train.sp", "train.sp", SL, TL, SPLIT_LIMIT, VERBOSE
        )

# Guided alignment of the "val.sp" corpus.
if GUIDED_ALIGNMENT_VALID:
    if VERBOSE:
        # This branch used to announce "TRAINING"; it handles the validation
        # files, so the progress message now says so.
        print("GUIDED ALIGNMENT VALIDATION", datetime.now())
    if DELETE_EXISTING:
        FILE = "val.sp." + SL + "." + SL + ".align"
        if os.path.exists(FILE):
            os.remove(FILE)
        # The statement that consumes this second FILE value lies beyond the
        # end of the visible chunk.
        FILE = "val.sp." + TL + "." + TL + ".align"
# BPE ("*.bpe") stage, flattened onto one physical line (original indentation
# is lost, so the nesting described here is inferred from statement order).
#
# - The first two statements rewrite `linia` through splitnumbers(linia, joiner)
#   and write it, newline-terminated, to `sortida`; presumably they are the tail
#   of a per-line loop whose header is above this chunk -- TODO confirm.
#   `entrada` and `sortida` are then closed.
# - GUIDED_ALIGNMENT: optionally prints a timestamped progress message
#   (VERBOSE), optionally removes "train.bpe.<SL>.<SL>.align" if it exists
#   (DELETE_EXISTING), then runs the helper selected by ALIGNER ("fast_align"
#   or "eflomal") on the "train.bpe" corpus. Each helper is imported after
#   appending MTUOC to sys.path.
# - GUIDED_ALIGNMENT_VALID: same progress message / clean-up pattern for the
#   "val.bpe" files. The statement that consumes the last FILE value lies
#   beyond the end of this chunk.
#
# NOTE(review): unlike the "train.sp" variant of this logic, only the SL-side
# training .align file is removed here, and fast_align receives a literal False
# in the position where the other call sites pass BOTH_DIRECTIONS -- confirm
# both are intentional.
linia = splitnumbers(linia, joiner) sortida.write(linia + "\n") entrada.close() sortida.close() if GUIDED_ALIGNMENT: if VERBOSE: print("GUIDED ALIGNMENT TRAINING", datetime.now()) if DELETE_EXISTING: FILE = "train.bpe." + SL + "." + SL + ".align" if os.path.exists(FILE): os.remove(FILE) if ALIGNER == "fast_align": sys.path.append(MTUOC) from MTUOC_guided_alignment_fast_align import guided_alignment_fast_align guided_alignment_fast_align(MTUOC, "train.bpe", "train.bpe", SL, TL, False, VERBOSE) if ALIGNER == "eflomal": sys.path.append(MTUOC) from MTUOC_guided_alignment_eflomal import guided_alignment_eflomal guided_alignment_eflomal(MTUOC, "train.bpe", "train.bpe", SL, TL, SPLIT_LIMIT, VERBOSE) if GUIDED_ALIGNMENT_VALID: if VERBOSE: print("GUIDED ALIGNMENT VALIDATION", datetime.now()) if DELETE_EXISTING: FILE = "val.bpe." + SL + "." + SL + ".align" if os.path.exists(FILE): os.remove(FILE) FILE = "val.bpe." + TL + "." + TL + ".align"
# Combined-corpus ("train_COMBI") guided alignment, flattened onto one physical
# line (original indentation is lost, so nesting is inferred from statement
# order).
#
# - The chunk opens in the `else` branch of a conditional whose `if` is above
#   the visible portion; presumably it is `if APPLY_BPE:`, mirroring the
#   target-side selection that follows -- TODO confirm.
# - FILE is set to "train_COMBI[.bpe].<lang>.<lang>.align" for SL and then TL
#   (the ".bpe" infix is used when APPLY_BPE is true); each file is removed if
#   it exists.
# - ALIGNER selects the helper: "fast_align" calls guided_alignment_fast_align
#   with BOTH_DIRECTIONS, "eflomal" calls guided_alignment_eflomal with
#   SPLIT_LIMIT. Each helper is imported after appending MTUOC to sys.path, and
#   the corpus prefix passed (twice) is "train_COMBI.bpe" when APPLY_BPE is
#   true, otherwise "train_COMBI".
else: FILE = "train_COMBI." + SL + "." + SL + ".align" if os.path.exists(FILE): os.remove(FILE) if APPLY_BPE: FILE = "train_COMBI.bpe." + TL + "." + TL + ".align" else: FILE = "train_COMBI." + TL + "." + TL + ".align" if os.path.exists(FILE): os.remove(FILE) if ALIGNER == "fast_align": sys.path.append(MTUOC) from MTUOC_guided_alignment_fast_align import guided_alignment_fast_align if APPLY_BPE: guided_alignment_fast_align(MTUOC, "train_COMBI.bpe", "train_COMBI.bpe", SL, TL, BOTH_DIRECTIONS, VERBOSE) else: guided_alignment_fast_align(MTUOC, "train_COMBI", "train_COMBI", SL, TL, BOTH_DIRECTIONS, VERBOSE) if ALIGNER == "eflomal": sys.path.append(MTUOC) from MTUOC_guided_alignment_eflomal import guided_alignment_eflomal if APPLY_BPE: guided_alignment_eflomal(MTUOC, "train_COMBI.bpe", "train_COMBI.bpe", SL, TL, SPLIT_LIMIT, VERBOSE) else: guided_alignment_eflomal(MTUOC, "train_COMBI", "train_COMBI", SL, TL, SPLIT_LIMIT, VERBOSE)