Beispiel #1
0
    def __init__(self,
                 nnet_fname,
                 scaler_fname,
                 labels_fname,
                 ngram_fname,
                 logbase=1,
                 loglevel=logging.INFO,):
        self.nnet_fname = nnet_fname
        self.scaler_fname = scaler_fname
        self.labels_fname = labels_fname
        self.ngram_fname = ngram_fname
        self.logbase = logbase
        self.loglevel = loglevel
        self.loglevelname = logging._levelToName[loglevel].lower()

        Bantry.scaler = ScalerFactory(scaler_fname)
        Bantry.classifier = Classifier(nnet_fname, labels_fname,
                                       logbase=logbase)
        self.ng = Ngram(ngram_fname)
        Bantry.ngram = self.ng
        GramGraph.set_ngram(self.ng)
Beispiel #2
0
    def __init__(
        self,
        nnet_fname,
        scaler_fname,
        labels_fname,
        ngram_fname,
        logbase=1,
        loglevel=logging.INFO,
    ):
        self.nnet_fname = nnet_fname
        self.scaler_fname = scaler_fname
        self.labels_fname = labels_fname
        self.ngram_fname = ngram_fname
        self.logbase = logbase
        self.loglevel = loglevel
        self.loglevelname = logging._levelToName[loglevel].lower()

        Bantry.scaler = ScalerFactory(scaler_fname)
        Bantry.classifier = Classifier(nnet_fname,
                                       labels_fname,
                                       logbase=logbase)
        self.ng = Ngram(ngram_fname)
        Bantry.ngram = self.ng
        GramGraph.set_ngram(self.ng)
Beispiel #3
0
}.get(sys.argv[-1][:2].lower(), logging.INFO)

replace = lambda s: banti_fname.replace('.box', s)
log_fname = replace('.{}.log'.format(logging._levelToName[loglevel]).lower())
asis_fname = replace('.ml.txt')
nogram_out_fname = replace('.nogram.txt')
ngram_out_fname = replace('.gram.txt')

logging.basicConfig(filename=log_fname, level=loglevel, filemode="w")

############################## Set-up scaler, classifier, ngram etc.
Bantry.scaler = ScalerFactory(scaler_fname)
Bantry.classifier = Classifier(nnet_fname, labels_fname, logbase=1)
ng = Ngram(ngram_fname)
Bantry.ngram = ng
GramGraph.set_ngram(ng)

############################## Read Bantries & get Most likely output
bf = BantryFile(banti_fname)
with open(asis_fname, 'w', encoding='utf-8') as f:
    f.write(post_process(bf.text))

############################## Process using ngrams
ngrammed_lines, notgrammed_lines = [], []

for linenum in range(bf.num_lines):
    print("Line ", linenum)
    line_bantries = bf.get_line_bantires(linenum)
    gramgraph = GramGraph(line_bantries)
    gramgraph.process_tree()
    notgrammed_lines.append(gramgraph.get_best_apriori_str())