Ejemplo n.º 1
0
def prepare_kiwi(train_file):
    """Create a Kiwi instance, run word extraction over a corpus, and prepare it.

    Args:
        train_file: The training corpus file; passed unchanged to
            ``ReaderExam``.

    Returns:
        The ``Kiwi`` object after ``extractWords`` and ``prepare`` have been
        called on it.
    """
    # Extraction thresholds, handed positionally to ``extractWords`` below.
    min_count, max_word_length, min_score = 5, 6, 0.25
    thread_count = 4

    # Construct the analyzer first, then the reader (same order as before).
    analyzer = Kiwi(thread_count)
    corpus_reader = ReaderExam(train_file)

    # The reader's bound ``read`` method serves as the line-supplying callback;
    # whatever ``extractWords`` returns is intentionally discarded.
    analyzer.extractWords(
        corpus_reader.read,
        min_count,
        max_word_length,
        min_score,
    )
    analyzer.prepare()
    return analyzer
Ejemplo n.º 2
0
        self.input.close()
        self.output.close()

# Demo script: build a Kiwi instance, register user vocabulary, then analyze
# one sentence and print the result.
kiwi = Kiwi()
# Load entries from a user dictionary file, then register one extra word with
# the tag 'NNP'. The 3.0 is presumably a score/weight for that word -- confirm
# against the Kiwi API.
kiwi.load_user_dictionary(r'./server_project/test/userDict.txt')
kiwi.add_user_word('iXVDR', 'NNP', 3.0)

# prepare() is called after the dictionary changes and before analyze();
# presumably it finalizes the model for analysis -- confirm against the Kiwi API.
kiwi.prepare()
# Disabled alternative: file-to-file analysis driven by IOHandler's read/write
# callbacks instead of a single in-memory string.
# handle = IOHandler(r'./server_project/test/input.txt', r'./server_project/test/result.txt')
# kiwi.analyze(handle.read, handle.write)


# Analyze a single Korean sentence. The second argument (1) is presumably the
# number of candidate analyses requested -- TODO confirm.
result = kiwi.analyze('강남에서 먹었던 오늘의 스파게티는 맛있었다.', 1)
# Print each element of the result on its own line.
for i in result:
    print(i)


class ReaderExam:
    """Line-by-line reader over a UTF-8 text file.

    The bound ``read`` method is meant to be passed as a callback (for example
    to Kiwi's word-extraction call), which pulls one line per invocation.

    The file is opened on construction. Call ``close()`` when finished, or use
    the instance as a context manager, so the handle is released
    deterministically instead of whenever the object is garbage-collected.
    """

    def __init__(self, filePath):
        """Open *filePath* for reading as UTF-8 text.

        Raises:
            OSError: If the file cannot be opened.
        """
        self.file = open(filePath, encoding='UTF8')

    def __enter__(self):
        """Return the reader itself so it can be used in a ``with`` block."""
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        """Close the file on leaving the ``with`` block; never suppress errors."""
        self.close()
        return False

    def close(self) -> None:
        """Close the underlying file. Safe to call more than once."""
        self.file.close()

    def read(self, id) -> str:
        """Return the next line of the file, rewinding first when *id* is 0.

        Args:
            id: Value supplied by the caller of the callback. Only ``0`` is
                special-cased: it rewinds the file to the beginning so a new
                pass starts from the first line. The name shadows the builtin
                but is kept for compatibility with existing callers.

        Returns:
            The next line including its trailing newline, or ``''`` once the
            end of the file has been reached.
        """
        if id == 0:
            # A request for id 0 marks the start of a (new) pass over the file.
            self.file.seek(0)
        return self.file.readline()

# Run word extraction over the sample input file, feeding lines through
# ReaderExam.read, and print whatever extractWords returns.
# The positional arguments 1, 10, 0.25 presumably correspond to min_cnt,
# max_word_len and min_score, by analogy with the keyword names in the
# disabled call below -- confirm against the Kiwi API.
# NOTE(review): this call is camelCase (extractWords) while the other Kiwi
# calls in this script are snake_case (load_user_dictionary, add_user_word) --
# confirm the method name against the installed Kiwi binding.
reader = ReaderExam(r'./server_project/test/input.txt')
print(kiwi.extractWords(reader.read, 1, 10, 0.25))
# Disabled alternative that passes the thresholds as keyword arguments:
#kiwi.extract_add_words(reader.read, min_cnt = 1, max_word_len = 10, min_score = 0.25, pos_score = -3)