예제 #1
0
 def test_top_words_digits_punctuation(self):
     s = pd.Series("123. .321 -h1n1 -cov2")
     s_true = pd.Series([1, 1, 1, 1], index=["123", "321", "cov2", "h1n1"])
     self.assertEqual(visualization.top_words(s).sort_index(), s_true)
예제 #2
0
 def test_top_words_digits(self):
     s = pd.Series("123 hello h1n1")
     s_true = pd.Series([1, 1, 1], index=["123", "h1n1", "hello"])
     self.assertEqual(visualization.top_words(s).sort_index(), s_true)
예제 #3
0
 def test_top_words_remove_external_punctuation(self):
     s = pd.Series("stop. please!")
     s_true = pd.Series([1, 1], index=["please", "stop"])
     self.assertEqual(visualization.top_words(s).sort_index(), s_true)
예제 #4
0
 def test_top_words_punctuation_between(self):
     s = pd.Series("can't hello-world u.s.a")
     s_true = pd.Series([1, 1, 1], index=["can't", "hello-world", "u.s.a"])
     self.assertEqual(visualization.top_words(s).sort_index(), s_true)
예제 #5
0
 def test_top_words_space_char(self):
     s = pd.Series("one \n\t")
     s_true = pd.Series([1], index=["one"])
     self.assertEqual(visualization.top_words(s), s_true)
예제 #6
0
 def test_top_words(self):
     s = pd.Series("one two two three three three")
     s_true = pd.Series([1, 3, 2], index=["one", "three", "two"])
     self.assertEqual(visualization.top_words(s).sort_index(), s_true)