Exemple #1
0
import test
from obo import read_terms
from onto_utils import read_heads, read_blacklist, read_types, read_lemma

# First: load the blacklist before the learning steps below.
# The handle is opened in a `with` block so it is closed deterministically.
# NOTE(review): assumes read_blacklist consumes the stream before returning
# (does not keep the handle for later use) -- confirm in onto_utils.
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/blacklist.txt') as blacklist_file:
    read_blacklist(blacklist_file)

# LEARNING (ontology): feed the ontology terms to read_terms, then pass the
# matching heads file to read_heads with action='learn'.
# Each input is opened in a `with` block so its handle is closed as soon as
# the reader returns.
# NOTE(review): assumes read_terms / read_heads consume their stream before
# returning -- confirm in obo / onto_utils.
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/bacteria_habitat_OntoBiotope-34') as onto_file:
    read_terms(onto_file)
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/heads_tolearn_onto') as onto_heads_file:
    read_heads(onto_heads_file, action='learn')
#test.cleaning_helper()
# Visual separator between the ontology pass and the dictionary pass.
print('#' * 100)
#test.cleaning_helper()

# LEARNING (dictionary): read the lemma, types and heads resources in that
# order (heads with action='learn'), then call test.save with the
# "after_learning" dump prefix.
# Inputs are opened in `with` blocks so no file handle outlives its reader.
# NOTE(review): assumes the read_* helpers consume their stream before
# returning -- confirm in onto_utils.
print('LEARNING')
print("Reading lemma")
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/lemma') as lemma_file:
    read_lemma(lemma_file)
print("Reading types")
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/types') as types_file:
    read_types(types_file)
print("Reading heads")
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/heads_tolearn_dico') as dico_heads_file:
    read_heads(dico_heads_file, action='learn')
print("Saving")
test.save(prefix='/bibdev/travail/typage/typage_biotope_task3.4/dumps/expe1_20120912/expe1_20120912_after_learning')

# TAGGING: pass the heads-to-tag file to read_heads with action='tag', then
# call test.save with the "after_tagging" dump prefix.
# The input is opened in a `with` block so the handle is closed once
# read_heads returns.
# NOTE(review): assumes read_heads consumes the stream before returning --
# confirm in onto_utils.
print("\nTAGGING")
print("Tagging heads")
with open('/bibdev/travail/typage/typage_biotope_task3.4/data/expe_20120912/heads_totag') as totag_heads_file:
    read_heads(totag_heads_file, action='tag')
print("Saving")
test.save(prefix='/bibdev/travail/typage/typage_biotope_task3.4/dumps/expe1_20120912/expe1_20120912_after_tagging')
# Report the FLAT_OK setting, then close the summary with a separator rule.
print('Expects a flat resource: %s' % FLAT_OK)
print('-' * 80)

#############################################################################
# FIRST: resources read ahead of the learning sections that follow -- the
# lemma file and, when BLACKLIST_OK is set, the blacklist.
#############################################################################
print('FIRST')
print('-' * 80)

print("Reading lemma")
# Streams are opened in `with` blocks so they are closed deterministically.
# NOTE(review): assumes read_lemma / read_blacklist consume their stream
# before returning -- confirm in onto_utils.
with codecs.open(BASE_DATA + u'lemma', encoding='UTF-8') as lemma_file:
    read_lemma(lemma_file)
print('%d lemma read.\n' % len(language.lemma))

if BLACKLIST_OK:
    print('Reading blacklist')
    with codecs.open(BASE_DATA + u'blacklist', encoding='UTF-8') as blacklist_file:
        read_blacklist(blacklist_file)
    print('Blacklist content: %s\n' % ', '.join(test.blacklist))

print('-' * 80)

# Ontology learning is optional: everything in this section is gated on
# ONTO_OK.
if ONTO_OK:
    #############################################################################
    # LEARNING ONTO
    print 'LEARNING ONTO'
    print '-' * 80
    #############################################################################

    print "Reading onto"
    # NOTE(review): unlike the lemma and blacklist reads, this codecs.open
    # call passes no encoding, so the stream is not decoded as UTF-8 --
    # confirm that read_terms expects undecoded input.
    # NOTE(review): the handle is never closed explicitly.
    read_terms(codecs.open(BASE_DATA + u'onto'))
    # Report how many entries test.terms holds after the read.
    print '%d terms currently in memory.\n' % len(test.terms)
    print 'The following inconsistencies were found in the ontology:'