# NOTE(review): the statements below appear collapsed onto one physical line;
# the original line breaks and indentation are not recoverable from this view.
#
# Leading fragment (tail of a generator whose definition starts above this
# chunk): adds one 'FORWARD3_<j>_<a>/<b>/<c>' feature per consecutive triple
# of sb_unit, appends (label, sorted(feats)) to feat_doc, and yields feat_doc.
#
# Script entry point: reads which (megam|crfsuite), out_dir and the
# train/dev/test input paths from sys.argv, plus optional window_back and
# window_forward (two "1" strings are appended to sys.argv as defaults).
# Any exception raised while parsing prints the usage line and exits with
# status 1.  Each input is then passed through
# iter_features(common.lazy_load_dyads(...)) and the selected writer into
# out_dir/<purpose>.<which>, and LABEL_ID is pickled to out_dir/map.<which>.
feats.update(('FORWARD3_{}_{}/{}/{}'.format(j, *w) for w in zip(sb_unit, sb_unit[1:], sb_unit[2:]))) feat_doc.append((label, sorted(feats))) yield feat_doc if __name__ == '__main__': try: which = sys.argv[1] writer = {'megam': feat_writer.megam_writer, 'crfsuite': feat_writer.crfsuite_writer}[which] out_dir = sys.argv[2] train_in, dev_in, test_in = sys.argv[3:6] sys.argv.extend(["1", "1"]) window_back = int(sys.argv[6]) window_forward = int(sys.argv[7]) except: print 'Usage: {} which(=megam|crfsuite) out_dir train dev test [window_back=1 window_forward=1]'.format(sys.argv[0]) exit(1) for (purpose, path) in zip(["train", "dev", "test"], [train_in, dev_in, test_in]): with open(path) as fi: with open(out_dir + '/' + purpose + '.' + which, 'w') as fo: writer(iter_features(common.lazy_load_dyads(fi), window_back, window_forward), fo) with open(out_dir + '/' + 'map.' + which, 'w') as f: cPickle.dump(LABEL_ID, f)
if __name__ == '__main__':
    # Script entry point.
    #
    # Usage: <prog> which out_dir train dev test [window_back [window_forward]]
    #   which          'megam' or 'crfsuite'; selects the feat_writer function
    #   out_dir        directory receiving <purpose>.<which> and map.<which>
    #   train/dev/test input paths, each read via common.lazy_load_dyads
    #   window_back / window_forward   integers forwarded to iter_features;
    #                                  each defaults to 1 when omitted
    writers = {
        'megam': feat_writer.megam_writer,
        'crfsuite': feat_writer.crfsuite_writer,
    }
    try:
        which = sys.argv[1]
        writer = writers[which]
        out_dir = sys.argv[2]
        train_in, dev_in, test_in = sys.argv[3:6]
        # Pad a copy of the optional arguments with the defaults instead of
        # mutating sys.argv in place.
        window_args = sys.argv[6:] + ["1", "1"]
        window_back = int(window_args[0])
        window_forward = int(window_args[1])
    except (IndexError, KeyError, ValueError):
        # IndexError: missing positional argument; KeyError: unknown writer
        # name; ValueError: fewer than three input paths or a non-integer
        # window size.  A bare ``except`` would also trap SystemExit and
        # KeyboardInterrupt, so only argument errors are caught here.
        sys.stderr.write(
            'Usage: {} which(=megam|crfsuite) out_dir train dev test [window_back=1 window_forward=1]'.format(
                sys.argv[0]) + '\n')
        # sys.exit rather than the site-provided ``exit`` helper, which is not
        # guaranteed to exist (e.g. under ``python -S``).
        sys.exit(1)

    for purpose, path in zip(["train", "dev", "test"],
                             [train_in, dev_in, test_in]):
        with open(path) as fi, \
                open(out_dir + '/' + purpose + '.' + which, 'w') as fo:
            writer(
                iter_features(common.lazy_load_dyads(fi), window_back,
                              window_forward), fo)

    # Written once after all three splits have been processed; pickle data
    # goes to a file opened in binary mode.
    with open(out_dir + '/' + 'map.' + which, 'wb') as f:
        cPickle.dump(LABEL_ID, f)
def useWindowFrame(fi, LABEL_ID, window_back=1, window_forward=1):
    """Return the feature iterator for the dyads read from ``fi``.

    ``fi`` is handed to ``lazy_load_dyads``; the result is forwarded, together
    with ``LABEL_ID`` and the two window sizes, to ``iter_features``, and
    whatever that call returns is returned unchanged.

    Both ``window_back`` and ``window_forward`` default to 1.
    """
    dyads = lazy_load_dyads(fi)
    return iter_features(dyads, LABEL_ID, window_back, window_forward)