Esempio n. 1
0
    def test_similarity(self):
        """Print two similarity scores for a fixed set of Chinese sentence pairs.

        Each sentence of a pair is segmented with ``synonym_cut(..., 'wf')``.
        The two segmentations are scored with ``similarity`` and the raw
        sentences are scored with ``similarity2``. Nothing is asserted: the
        method only writes the inputs, segmentations and scores to stdout.
        """
        sentence_pairs = (
            ("黄克功", "王怀安"),
            ("黄克功", "黄克功"),
            ("宋朝的历史", "明朝的历史"),
            ("电脑", "打印机"),
            ("怎么了?,。。。。", "怎么了?..,#$"),
            ("我喜欢你", "你喜欢我"),
            ("我要取票", "我要取票"),
            ("存钱", "取钱"),
            ("中国", "中华人民共和国"),
            ("喧闹的大街上人山人海", "热闹的街道上人来人往"),
            ("专心致志", "全神贯注"),
            ("爷爷爱吃土豆", "祖父喜欢吃马铃薯"),
            ("联想电脑多少钱", "联想笔记本价格"),
            ("今天天气怎么样", "我想去上海"),
            ("怎么花呗不能支付", "花呗付款不了怎么回事"),
            ("蚂蚁借呗的额度为什么会下降", "为什么借呗额度被降低了,没有不良记录"),
            ("蚂蚁借呗的额度为什么会下降", "为什么借呗额度被降低了"),
            ("花呗自动还款需要手续费ma", "花呗自动还款还要收手续费吗"),
            ("花呗怎么付款不鸟了", "帮忙看一下我花呗怎么用不了"),
            ("花呗被冻结怎么恢复", "花呗被封了怎么解除"),
            ("我借呗能不能开通", "如何开启借呗"),
        )
        for left, right in sentence_pairs:
            # Segment both sentences first, then echo inputs and segmentations.
            left_cut = synonym_cut(left, 'wf')
            right_cut = synonym_cut(right, 'wf')
            print(left, 'VS', right)
            print(left_cut, 'VS', right_cut)

            # Score on the segmentations, then on the raw sentences.
            cut_score = similarity(left_cut, right_cut)
            print("similarity1: ", cut_score)
            raw_score = similarity2(left, right)
            print('similarity2: ', raw_score, '\n')
Esempio n. 2
0
 def test_similarity(self):
     """Print two similarity scores for each hard-coded sentence pair.

     Both sentences are segmented with ``synonym_cut(..., 'wf')``; the
     segmentations go to ``similarity`` and the raw sentences go to
     ``similarity2``. The method only prints; it asserts nothing.
     """
     cases = [
         ("电脑", "打印机"),
         ("怎么了?,。。。。", "怎么了?..,#$"),
         ("我喜欢你", "你喜欢我"),
         ("我要取票", "我要取票"),
         ("存钱", "取钱"),
         ("中国", "中华人民共和国"),
         ("喧闹的大街上人山人海", "热闹的街道上人来人往"),
         ("专心致志", "全神贯注"),
         ("爷爷爱吃土豆", "祖父喜欢吃马铃薯"),
         ("联想电脑多少钱", "联想笔记本价格"),
         ("今天天气怎么样", "我想去上海"),
     ]
     for case in cases:
         first, second = case
         first_cut = synonym_cut(first, 'wf')
         second_cut = synonym_cut(second, 'wf')
         print(first, 'VS', second)
         print(first_cut, 'VS', second_cut)
         # Score the segmentations before the raw-sentence comparison runs.
         print("similarity1: ", similarity(first_cut, second_cut))
         print('similarity2: ', similarity2(first, second), '\n')
Esempio n. 3
0
 def test_similarity(self):
     """Print the segmentation and similarity score of fixed sentence pairs.

     Each sentence is segmented with ``synonym_cut(..., 'wf')`` and the two
     segmentations are passed to ``similarity``. Output goes to stdout only;
     no assertion is made on the score.
     """
     pairs = (
         ("中国", "中华人民共和国"),
         ("喧闹的大街上人山人海", "热闹的街道上人来人往"),
         ("专心致志", "全神贯注"),
         ("爷爷爱吃土豆", "祖父喜欢吃马铃薯"),
         ("联想电脑多少钱", "联想笔记本价格"),
         ("今天天气怎么样", "我想去上海"),
     )
     for text_a, text_b in pairs:
         # Segment both sentences (first, then second) before printing anything.
         cut_a, cut_b = [synonym_cut(text, 'wf') for text in (text_a, text_b)]
         print(text_a, cut_a)
         print(text_b, cut_b)
         score = similarity(cut_a, cut_b)
         print("words similarity: ", str(score), '\n')
Esempio n. 4
0
 def test_jaccard(self):
     """Interactively score sentence pairs and log the session to a file.

     Repeatedly reads two sentences from stdin, segments each with
     ``synonym_cut(..., 'wf')``, scores the segmentations with
     ``similarity``, prints the result and appends the inputs and the score
     to a Markdown log file.

     NOTE(review): despite the method name, the visible code calls
     ``similarity``; whether that helper is Jaccard-based cannot be
     confirmed from here.
     """
     print("语义相似度测试......")
     # Log file name is built from the value returned by get_current_time();
     # the path is relative and uses Windows-style separators.
     filename = ".\\log\\SemanticSimilarity_" + get_current_time() + ".md"
     # NOTE(review): no encoding is passed, so the platform default is used
     # for the Chinese text written below -- confirm this is intended.
     file = open(filename, "w")
     # Header of the Markdown log.
     file.write(
         "标签:测试文档\n#向量语义相似度测试:\n>Enter the SemanticSimilarity mode...\n")
     while True:
         try:
             sentence1 = input("\nsentence1\n>>")
             sentence2 = input("sentence2\n>>")
             sv1 = synonym_cut(sentence1, 'wf')
             sv2 = synonym_cut(sentence2, 'wf')
             print(sv1, sv2)
             sim = similarity(sv1, sv2)
             # Record both inputs and the score as inline-code Markdown lines.
             file.write("`>>" + sentence1 + "`\n")
             file.write("`>>" + sentence2 + "`\n")
             print("words similarity: " + str(sim))
             file.write("`" + "words similarity: " + str(sim) + "`\n")
         except KeyboardInterrupt:
             # Ctrl-C closes the log file.
             # NOTE(review): as visible here the handler does not leave the
             # `while True` loop, so a later iteration would write to a
             # closed file -- confirm whether a break/exit follows.
             file.close()