# Driver script for the expe1_20120910 run: learn from the lemma/types/heads
# files, dump the state, then tag the remaining heads and dump again.
#
# Each input file is opened in a ``with`` block so that its handle is closed
# as soon as the reader returns (assumes the read_* helpers consume the file
# before returning -- confirm).  ``print(...)`` with a single argument
# behaves exactly like the Python 2 print statement used originally.

# First (step disabled in this run)
#read_blacklist(open('../data/blacklist.txt'))

# LEARNING from the mbto files (steps disabled in this run)
#read_terms(open('../data/mbto.obo'))
#read_heads(open('../data/mbto.heads'), action='learn')
#test.cleaning_helper()
print('#' * 100)
#test.cleaning_helper()

# LEARNING
print('LEARNING')
print("Reading lemma")
with open('../data/expe1_20120910/lemma') as lemma_file:
    read_lemma(lemma_file)
print("Reading types")
with open('../data/expe1_20120910/types') as types_file:
    read_types(types_file)
print("Reading heads")
with open('../data/expe1_20120910/heads_tolearn') as heads_file:
    read_heads(heads_file, action='learn')
print("Saving")
test.save(prefix='../dumps/expe1_20120910/expe1_20120910_after_learning')

# TAGGING
print("\nTAGGING")
print("Tagging heads")
with open('../data/expe1_20120910/heads_totag') as heads_file:
    read_heads(heads_file, action='tag')
print("Saving")
test.save(prefix='../dumps/expe1_20120910/expe1_20120910_after_tagging')

# Disabled counters ("trouves" / "non_trouves" are French for
# "found" / "not found"); kept as in the original.
#trouves = 0
#non_trouves = 0
#for k,v in test.terms.items():
# Script fragment (Python 2 print-statement syntax).  Visible steps, in order:
#   1. call test.cleaning_helper(), print an empty line, then save a dump
#      with prefix BASE_DUMPS + EXPE + u'_after_learning_onto';
#   2. a section introduced by `if FLAT_OK:` that reads BASE_DATA + u'types'
#      and BASE_DATA + u'heads_tolearn_dico' (both opened with codecs.open,
#      encoding='UTF-8'; heads are read with action='learn'), prints
#      len(test.terms) after each read, and saves a dump with prefix
#      BASE_DUMPS + EXPE + u'_after_learning_flat_resources';
#   3. the banner that opens the TAGGING section.
# NOTE(review): line breaks and indentation are not visible in this view, so
#   the exact extent of the `if FLAT_OK:` body cannot be determined here --
#   presumably it runs through the flat-resources save and its separator
#   line; confirm against the properly formatted file.
# NOTE(review): the codecs.open() handles are passed directly to the readers
#   and never explicitly closed; consider wrapping them in `with` blocks once
#   the block structure has been confirmed.
test.cleaning_helper() print print "Saving after learning onto" test.save(prefix=BASE_DUMPS + EXPE + u'_after_learning_onto') print '-' * 80 if FLAT_OK: ############################################################################# # LEARNING FLAT RESOURCES print 'LEARNING FLAT RESOURCES' print '-' * 80 ############################################################################# print "Reading flat resources types" read_types(codecs.open(BASE_DATA + u'types', encoding='UTF-8')) print '%d terms currently in memory.\n' % len(test.terms) print "Reading flat resources heads" read_heads(codecs.open(BASE_DATA + u'heads_tolearn_dico', encoding='UTF-8'), action='learn') print '%d terms currently in memory.\n' % len(test.terms) print "Saving after learning flat resources" test.save(prefix=BASE_DUMPS + EXPE + u'_after_learning_flat_resources') print '-' * 80 ############################################################################# # TAGGING print "TAGGING" print '-' * 80 #############################################################################
# Driver script for the 20120912 run: load the blacklist, learn from the
# OntoBiotope terms and heads, learn from the lemma/types/dictionary heads,
# dump the state, then tag the remaining heads and dump again.
#
# The absolute path prefix that was repeated in every call is factored into
# the three constants below; every resulting path is identical to the
# original literal.  Each input file is opened in a ``with`` block so that
# its handle is closed as soon as the reader returns (assumes the read_*
# helpers consume the file before returning -- confirm).  ``print(...)`` with
# a single argument behaves exactly like the Python 2 print statement.
_TYPAGE_ROOT = '/bibdev/travail/typage/typage_biotope_task3.4'
# NOTE(review): inputs live under 'expe_20120912' while dumps go under
# 'expe1_20120912'; both spellings are kept as in the original -- confirm
# the difference is intended.
_DATA_DIR = _TYPAGE_ROOT + '/data/expe_20120912/'
_DUMP_PREFIX = _TYPAGE_ROOT + '/dumps/expe1_20120912/expe1_20120912'

# First
with open(_DATA_DIR + 'blacklist.txt') as blacklist_file:
    read_blacklist(blacklist_file)

# LEARNING
with open(_DATA_DIR + 'bacteria_habitat_OntoBiotope-34') as terms_file:
    read_terms(terms_file)
with open(_DATA_DIR + 'heads_tolearn_onto') as heads_file:
    read_heads(heads_file, action='learn')
#test.cleaning_helper()
print('#' * 100)
#test.cleaning_helper()

# LEARNING
print('LEARNING')
print("Reading lemma")
with open(_DATA_DIR + 'lemma') as lemma_file:
    read_lemma(lemma_file)
print("Reading types")
with open(_DATA_DIR + 'types') as types_file:
    read_types(types_file)
print("Reading heads")
with open(_DATA_DIR + 'heads_tolearn_dico') as heads_file:
    read_heads(heads_file, action='learn')
print("Saving")
test.save(prefix=_DUMP_PREFIX + '_after_learning')

# TAGGING
print("\nTAGGING")
print("Tagging heads")
with open(_DATA_DIR + 'heads_totag') as heads_file:
    read_heads(heads_file, action='tag')
print("Saving")
test.save(prefix=_DUMP_PREFIX + '_after_tagging')

# Disabled counters ("trouves" / "non_trouves" are French for
# "found" / "not found"); kept as in the original.
#trouves = 0
#non_trouves = 0
#for k,v in test.terms.items():
# Driver script for the expe1_20120908 run: learn from the lemma/types/heads
# files, dump the state, then tag the remaining heads and dump again.
#
# Each input file is opened in a ``with`` block so that its handle is closed
# as soon as the reader returns (assumes the read_* helpers consume the file
# before returning -- confirm).  ``print(...)`` with a single argument
# behaves exactly like the Python 2 print statement used originally.

# First (step disabled in this run)
# read_blacklist(open('../data/blacklist.txt'))

# LEARNING from the mbto files (steps disabled in this run)
# read_terms(open('../data/mbto.obo'))
# read_heads(open('../data/mbto.heads'), action='learn')
# test.cleaning_helper()
print("#" * 100)
# test.cleaning_helper()

# LEARNING
print("LEARNING")
print("Reading lemma")
with open("../data/expe1_20120908/lemma") as lemma_file:
    read_lemma(lemma_file)
print("Reading types")
with open("../data/expe1_20120908/types") as types_file:
    read_types(types_file)
print("Reading heads")
with open("../data/expe1_20120908/heads_tolearn") as heads_file:
    read_heads(heads_file, action="learn")
print("Saving")
test.save(prefix="../dumps/expe1/expe1_20120908_after_learning")

# TAGGING
print("\nTAGGING")
print("Tagging heads")
with open("../data/expe1_20120908/heads_totag") as heads_file:
    read_heads(heads_file, action="tag")
print("Saving")
test.save(prefix="../dumps/expe1/expe1_20120908_after_tagging")

# Disabled counters ("trouves" / "non_trouves" are French for
# "found" / "not found"); kept as in the original.
# trouves = 0
# non_trouves = 0
# for k,v in test.terms.items():