Exemplo n.º 1
0
    def __init__(self, outdir):
        """Initialise both base classes and the per-instance bookkeeping.

        ``outdir`` is passed to ``OutputPrefacedPTBDerivation.__init__`` and
        also stored on the instance. A second, independent
        ``OutputPrefacedPTBDerivation`` is created on the ``failed`` path
        below ``outdir`` and kept as ``self.bad``. ``self.bad_freqs`` is a
        counter mapping whose missing keys start at zero.
        """
        # The bases are initialised by explicit calls, Filter first; the
        # order is preserved exactly.
        Filter.__init__(self)
        OutputPrefacedPTBDerivation.__init__(self, outdir)

        self.outdir = outdir
        failed_dir = os.path.join(outdir, 'failed')
        self.bad = OutputPrefacedPTBDerivation(failed_dir)
        self.bad_freqs = defaultdict(int)
Exemplo n.º 2
0
class BadAtom(Filter, OutputPrefacedPTBDerivation):
    """Filter that splits derivations on whether they contain a bad category.

    A derivation is rejected as soon as ``has_bad_subcat`` is true for the
    ``cat`` of any node yielded by ``nodes``. Accepted derivations are
    written through this object's own ``write_derivation``; rejected ones
    are written through a second ``OutputPrefacedPTBDerivation`` created on
    the ``failed`` path below ``outdir``. The categories that triggered a
    rejection are tallied and written out by ``output``.
    """

    def __init__(self, outdir):
        """Initialise both bases and the rejection bookkeeping.

        ``outdir`` is passed to ``OutputPrefacedPTBDerivation.__init__`` and
        also stored on the instance for use by ``output``.
        """
        # Bases are initialised by explicit calls, Filter first.
        Filter.__init__(self)
        OutputPrefacedPTBDerivation.__init__(self, outdir)

        self.outdir = outdir
        # Separate writer that receives every rejected derivation.
        self.bad = OutputPrefacedPTBDerivation(os.path.join(outdir, 'failed'))
        # str(category) -> number of rejections it triggered.
        self.bad_freqs = defaultdict(int)

    def accept(self, root):
        """Return True when no node under ``root`` has a bad category.

        Stops at the first offending node: only that node's category is
        counted in ``self.bad_freqs`` before False is returned.
        """
        for node in nodes(root):
            cat = node.cat

            if has_bad_subcat(cat):
                self.bad_freqs[str(cat)] += 1
                return False
        return True

    # NOTE(review): not referenced anywhere in this class as shown; kept
    # because code outside this view may read it.
    MergedTags = {'VCD', 'VNV', 'VPT'}

    def accept_derivation(self, bundle):
        """Write ``bundle`` to the main or the 'failed' writer.

        The choice is made by ``accept(bundle.derivation)``.
        """
        if self.accept(bundle.derivation):
            self.write_derivation(bundle)
        else:
            self.bad.write_derivation(bundle)

    def output(self):
        """Write the rejection tally to the ``failed_freqs`` file in outdir.

        One line per category, formatted as ``'% 5d | %s'`` (count,
        category), in the order produced by ``sorted_by_value_desc``.
        """
        # open()/write() replace the Python-2-only file() builtin and the
        # `print >>f` statement: the bytes written are the same, and the
        # method no longer fails under Python 3.
        with open(os.path.join(self.outdir, 'failed_freqs'), 'w') as f:
            for badcat, freq in sorted_by_value_desc(self.bad_freqs):
                f.write('% 5d | %s\n' % (freq, badcat))

    # NOTE(review): presumably the argument placeholder the surrounding
    # framework shows for this filter; confirm against its caller.
    arg_names = 'OUTDIR'
Exemplo n.º 3
0
    def __init__(self, outdir):
        """Initialise both base classes and the per-instance bookkeeping.

        ``outdir`` is passed to ``OutputPrefacedPTBDerivation.__init__`` and
        also stored on the instance. A second, independent
        ``OutputPrefacedPTBDerivation`` is created on the ``failed`` path
        below ``outdir`` and kept as ``self.bad``. ``self.bad_freqs`` is a
        counter mapping whose missing keys start at zero.
        """
        # The bases are initialised by explicit calls, Filter first; the
        # order is preserved exactly.
        Filter.__init__(self)
        OutputPrefacedPTBDerivation.__init__(self, outdir)

        self.outdir = outdir
        failed_dir = os.path.join(outdir, 'failed')
        self.bad = OutputPrefacedPTBDerivation(failed_dir)
        self.bad_freqs = defaultdict(int)
Exemplo n.º 4
0
class BadAtom(Filter, OutputPrefacedPTBDerivation):
    """Filter that splits derivations on whether they contain a bad category.

    A derivation is rejected as soon as ``has_bad_subcat`` is true for the
    ``cat`` of any node yielded by ``nodes``. Accepted derivations are
    written through this object's own ``write_derivation``; rejected ones
    are written through a second ``OutputPrefacedPTBDerivation`` created on
    the ``failed`` path below ``outdir``. The categories that triggered a
    rejection are tallied and written out by ``output``.
    """

    def __init__(self, outdir):
        """Initialise both bases and the rejection bookkeeping.

        ``outdir`` is passed to ``OutputPrefacedPTBDerivation.__init__`` and
        also stored on the instance for use by ``output``.
        """
        # Bases are initialised by explicit calls, Filter first.
        Filter.__init__(self)
        OutputPrefacedPTBDerivation.__init__(self, outdir)

        self.outdir = outdir
        # Separate writer that receives every rejected derivation.
        self.bad = OutputPrefacedPTBDerivation(os.path.join(outdir, 'failed'))
        # str(category) -> number of rejections it triggered.
        self.bad_freqs = defaultdict(int)

    def accept(self, root):
        """Return True when no node under ``root`` has a bad category.

        Stops at the first offending node: only that node's category is
        counted in ``self.bad_freqs`` before False is returned.
        """
        for node in nodes(root):
            cat = node.cat

            if has_bad_subcat(cat):
                self.bad_freqs[str(cat)] += 1
                return False
        return True

    # NOTE(review): not referenced anywhere in this class as shown; kept
    # because code outside this view may read it.
    MergedTags = {'VCD', 'VNV', 'VPT'}

    def accept_derivation(self, bundle):
        """Write ``bundle`` to the main or the 'failed' writer.

        The choice is made by ``accept(bundle.derivation)``.
        """
        if self.accept(bundle.derivation):
            self.write_derivation(bundle)
        else:
            self.bad.write_derivation(bundle)

    def output(self):
        """Write the rejection tally to the ``failed_freqs`` file in outdir.

        One line per category, formatted as ``'% 5d | %s'`` (count,
        category), in the order produced by ``sorted_by_value_desc``.
        """
        # open()/write() replace the Python-2-only file() builtin and the
        # `print >> f` statement: the bytes written are the same, and the
        # method no longer fails under Python 3.
        with open(os.path.join(self.outdir, 'failed_freqs'), 'w') as f:
            for badcat, freq in sorted_by_value_desc(self.bad_freqs):
                f.write('% 5d | %s\n' % (freq, badcat))

    # NOTE(review): presumably the argument placeholder the surrounding
    # framework shows for this filter; confirm against its caller.
    arg_names = 'OUTDIR'
Exemplo n.º 5
0
 def __init__(self, outdir):
     """Initialise the two base classes by explicit calls.

     ``Filter.__init__`` takes no extra arguments; ``outdir`` is passed on
     to ``OutputPrefacedPTBDerivation.__init__``.
     """
     # NOTE(review): the enclosing class is not visible here; presumably it
     # inherits from both Filter and OutputPrefacedPTBDerivation.
     Filter.__init__(self)
     OutputPrefacedPTBDerivation.__init__(self, outdir)
Exemplo n.º 6
0
 def __init__(self, outdir):
     """Initialise the two base classes by explicit calls.

     ``Filter.__init__`` takes no extra arguments; ``outdir`` is passed on
     to ``OutputPrefacedPTBDerivation.__init__``.
     """
     # NOTE(review): the enclosing class is not visible here; presumably it
     # inherits from both Filter and OutputPrefacedPTBDerivation.
     Filter.__init__(self)
     OutputPrefacedPTBDerivation.__init__(self, outdir)