コード例 #1
0
    def __init__(self, data_path: str = "../data/ngrams/", load_type: str = "memory") -> None:
        """Set up empty n-gram tables and bind the count lookups.

        Args:
            data_path: Prefix for the n-gram data location. It is joined to
                the database file name by plain string concatenation
                (``data_path + "ngrams.db"``), so it needs to end with a
                path separator.
            load_type: Selects where the count lookups come from. The exact
                value ``"memory"`` binds them from an ``NgramMem`` instance;
                any other value binds them from the ``NgramDB`` handler.
        """
        self.load_type = load_type
        # One (initially empty) ordered mapping per n-gram order, 1 through 4.
        self.unigrams = OrderedDict()
        self.bigrams = OrderedDict()
        self.trigrams = OrderedDict()
        self.quadgrams = OrderedDict()

        # Handler for the n-gram database; it is created for every load_type,
        # not only when the database is used as the count backend.
        self.ngramdb = NgramDB(data_path + "ngrams.db")
        #self.ngramdb.create_table_all()
        if load_type == "memory":
            # Bind the count lookups from an NgramMem built on the same
            # data_path.
            # NOTE(review): load_all(pickle=True) presumably reads pickled
            # data under data_path; confirm those files are trusted.
            ngram_mem = NgramMem(data_path=data_path)
            ngram_mem.load_all(pickle=True)
            # Double-underscore names are name-mangled by Python to
            # _<ClassName>__count / _<ClassName>__count_vocab.
            self.__count = ngram_mem.count
            self.__count_vocab = ngram_mem.count_vocab
        else:
            # Any other load_type takes the count lookup from the database
            # handler.
            # NOTE(review): the "memory" branch also binds __count_vocab;
            # confirm this path binds it as well.
            self.__count = self.ngramdb.count