# print grammar.hierarchy
grammar.makeMapping(topLevel)
# print grammar.pennToLevel

# One pass per index of ec05.  Each pass reads every training tree and every
# validation tree, converts it with grammar.transform at `level + 1`, and
# records it into fresh per-pass accumulators.  The training statistics are
# then normalized and learnLambdas() is run against the validation events.
# NOTE(review): `level + 1` suggests grammar.transform takes 1-based levels;
# confirm against its definition.
for level in range(len(ec05)):
    gstats = GrammarStats()
    vstats = ValidationEvents()

    # open() inside `with` closes the handle as soon as the pass over the
    # file ends; the previous bare file(...) call left closing to the
    # garbage collector on every iteration of the outer loop.
    with open(trees) as treeFile:
        for ct, line in enumerate(treeFile):
            if ct % 100 == 0:
                # Progress report every 100 training trees.
                print("read trees %d" % ct)

            tree = grammar.transform(
                level + 1,
                zeroSplit(binarizeTree(treeToTuple(line.strip()))))
            # print treeToStr(tree)
            gstats.record(tree)

    with open(validation) as validationFile:
        for ct, line in enumerate(validationFile):
            if ct % 1000 == 0:
                # Progress report every 1000 validation trees.
                print("read validation trees %d" % ct)

            tree = grammar.transform(
                level + 1,
                zeroSplit(binarizeTree(treeToTuple(line.strip()))))
            vstats.record(tree)

    gstats.normalize()
    gstats.learnLambdas(vstats)