Пример #1
0
def Compute_Overlap(syns, sent):
    """Count the content words shared by a sense's gloss and a sentence.

    The gloss is the set of word tokens taken from ``syns.definition()``
    and from every string in ``syns.examples()``.  Entries of the
    module-level ``functionwords`` collection are removed from both the
    gloss and the sentence before the two are intersected.

    Args:
        syns: Object exposing ``definition()`` (returns a string) and
            ``examples()`` (returns an iterable of strings) -- presumably
            an NLTK WordNet ``Synset``; confirm against the caller.
        sent: The context to compare against.  Either a string, which is
            split on whitespace, or a list/tuple/set/frozenset of tokens.

    Returns:
        The number of distinct tokens present in both the gloss and the
        sentence.

    Raises:
        TypeError: If ``sent`` is not one of the supported types.

    Side effects:
        Prints each example, the ``syns`` object, and the definition
        together with the overlap count to stdout.
    """
    definition = syns.definition()

    # Accumulate tokens from *every* sentence of the definition; starting
    # from an empty set also keeps ``gloss`` a set when the definition is
    # empty.
    gloss = set()
    for gloss_sentence in PunktSentenceTokenizer().tokenize(definition):
        gloss.update(nltk.word_tokenize(gloss_sentence))

    for example in syns.examples():
        print("example", example)
        gloss.update(nltk.word_tokenize(example))

    # Strip function words unconditionally, not only when the sense
    # happens to have usage examples.
    gloss.difference_update(functionwords)

    if isinstance(sent, str):
        # split() without an argument also handles tabs, newlines and
        # repeated spaces, and never yields empty tokens.
        sentence = set(sent.split())
    elif isinstance(sent, (list, tuple, set, frozenset)):
        # Copy so the caller's collection is never mutated below.
        sentence = set(sent)
    else:
        raise TypeError(
            "sent must be a str or a list/tuple/set of tokens, got "
            + type(sent).__name__
        )
    sentence.difference_update(functionwords)

    length = len(gloss & sentence)
    print(syns)
    print("Definition:", definition, " Overlap:", length)
    return length