import argparse
import gzip
import sys

if __name__ == "__main__":
    # Script entry point: parse the command line, optionally load the synonym
    # dictionary, preload reference MWEs from a gzip file, then start reading
    # MWEs from standard input.

    parser = argparse.ArgumentParser(description='Chooses rules.')
    # Value is passed to ParallelMWE.load_synonym_dict; synonyms are skipped
    # entirely when the option is absent.
    parser.add_argument('--use_synonyms')
    parser.add_argument('--inverse_synonyms',action='store_true')
    # Path of a gzip-compressed file; every line is parsed into a ParallelMWE.
    parser.add_argument('--additional_references')
    parser.add_argument('--debug', action='store_true')
    args = parser.parse_args(sys.argv[1:])
    set_debug(args.debug)

    #read synonyms
    if args.use_synonyms:
        ParallelMWE.load_synonym_dict(args.use_synonyms, args.inverse_synonyms)

    mweset=ParallelMWESet()

    if args.additional_references:
        # The with-block guarantees the gzip handle is closed even when
        # parse() or add() raises; the previous explicit close() was skipped
        # on any exception.
        # NOTE(review): lines are handed to parse() unstripped and in
        # gzip.open's default (binary) mode, unlike the stripped stdin lines
        # below -- confirm parse() expects that.
        with gzip.open(args.additional_references) as myfile:
            for line in myfile:
                mwe=ParallelMWE()
                mwe.parse(line)
                mweset.add(mwe)

    #read mwes
    mwelist=list()
    for line in sys.stdin:
        line=line.strip()
Example #2
0
if __name__ == "__main__":
    # Script entry point. Per the parser description, the goal is to select a
    # minimum set of parallel MWEs that reproduces the bilingual expressions.
    # The part visible here parses the options, reads MWEs from stdin and
    # starts iterating over the gzip-compressed bilingual expressions file.
    parser = argparse.ArgumentParser(description='select minimum amount of parallel MWEs to reproduce the bilingual expr.')
    parser.add_argument('--only_print_scores',action='store_true')
    # Mandatory path; opened with gzip.open further down.
    parser.add_argument('--bilingual_exprs',required=True)
    # Value is passed to ParallelMWE.load_synonym_dict; skipped when absent.
    parser.add_argument('--use_synonyms')
    parser.add_argument('--inverse_synonyms',action='store_true')
    parser.add_argument('--invert_synonym_direction',action='store_true')
    # NOTE(review): no type= is given, so args.threshold is a string
    # (default '2') unless it is converted where it is used -- confirm.
    parser.add_argument('--threshold',default='2')
    parser.add_argument('--debug', action='store_true')
    args = parser.parse_args(sys.argv[1:])
    
    set_debug(args.debug)
    
    if args.use_synonyms:
        ParallelMWE.load_synonym_dict(args.use_synonyms, args.inverse_synonyms,args.invert_synonym_direction)
    
    mwes=list()
    #read MWEs
    # One ParallelMWE is built per stdin line, after stripping surrounding
    # whitespace.
    for line in sys.stdin:
        line=line.strip()
        mwe=ParallelMWE()
        mwe.parse(line)
        mwes.append(mwe)
    
    # Only the first MWE is queried for its representative.
    # NOTE(review): raises IndexError when stdin is empty -- confirm that
    # input is guaranteed to be non-empty.
    reprlistofnonleafs=mwes[0].get_representative()
    
    bilExprs=list()
    #read bilingual exprs
    # NOTE(review): the gzip handle is created inline and never explicitly
    # closed in the visible code; mode 'r' is binary for gzip.open, so under
    # Python 3 these lines would be bytes -- confirm the intended interpreter.
    for line in gzip.open(args.bilingual_exprs,'r'):
        line=line.strip()