Python most_similar示例

编程语言: Python

命名空间/包名称: texthero.representation

方法/功能: most_similar

hotexamples.com的示例: 5

Python most_similar - 共找到5个示例。以下是从开源项目中提取的、评分最高的 texthero.representation.most_similar 真实 Python 代码示例。您可以为示例评分，帮助我们提高示例质量。

示例#1

显示文件

    def test_most_similar_simple(self):
        """Embed the tokenized text "one one one" with word2vec and check
        that the most_similar result for "one" has shape (1,)."""
        tokens = preprocessing.tokenize(pd.Series(["one one one"]))
        embeddings = representation.word2vec(tokens, min_count=1, seed=1)

        result = representation.most_similar(embeddings, "one")

        self.assertEqual(result.shape, (1,))

示例#2

显示文件

文件： test_indexes.py 项目： wurentidai/texthero

 def test_incorrect_index_most_similar(self):
     """The index of the most_similar result must differ from the default
     index of a DataFrame rebuilt from the same values with index=None."""
     embeddings = pd.DataFrame([[1.0], [2.0]], index=["word1", "word2"])
     similar = representation.most_similar(embeddings, "word1")
     # Rebuilding from raw values with index=None discards the word labels.
     default_index = pd.DataFrame(embeddings.values, index=None).index
     self.assertFalse(similar.index.equals(default_index))

示例#3

显示文件

文件： test_indexes.py 项目： wurentidai/texthero

 def test_correct_index_most_similar(self):
     """The index of the most_similar result must equal the index of a
     DataFrame rebuilt from the input's values and the input's index."""
     embeddings = pd.DataFrame([[1.0], [2.0]], index=["word1", "word2"])
     similar = representation.most_similar(embeddings, "word1")
     # Rebuild with the same word labels to obtain the reference index.
     expected_index = pd.DataFrame(
         embeddings.values, index=embeddings.index
     ).index
     self.assertTrue(similar.index.equals(expected_index))

示例#4

显示文件

 def test_most_similar_raise_with_not_in_index(self):
     """most_similar must raise a ValueError whose message matches "index"
     when queried with a word absent from the DataFrame's index."""
     embeddings = pd.DataFrame(data=[1], index=["one"])
     missing_word = "two"  # not present in the index above
     with self.assertRaisesRegex(ValueError, r"index"):
         representation.most_similar(embeddings, missing_word)

示例#5

显示文件

    def test_most_similar_raise_with_series(self):
        """most_similar must raise a ValueError whose message matches
        "Pandas" or "pandas" when it is given a Series."""
        series_input = pd.Series({"one": 1})

        with self.assertRaisesRegex(ValueError, r"Pandas|pandas"):
            representation.most_similar(series_input, "one")