Beispiel #1
0
    def test_reverse_transform_maxval(self):
        # test on static example texts
        vectorizer = CharVectorizer("abc", map_unknown_chars_to="X")
        texts = ["aaa", "bbb", "ccc", "abc", "???", "a?a"]
        expected = ["aaa", "bbb", "ccc", "abc", "XXX", "aXa"]

        matrix = vectorizer.transform(texts, len(texts[0]))
        rand = np.random.random_sample(matrix.shape)
        matrix = matrix + rand

        reverse_transformed = vectorizer.reverse_transform_maxval(matrix)
        for text_is, text_exp in zip(reverse_transformed, expected):
            self.assertEqual(text_is, text_exp)

        # test on 1000 random texts
        vectorizer = CharVectorizer(ALPHABET_LOWERCASE,
                                    map_unknown_chars_to="X")
        texts = create_random_texts(ALPHABET_LOWERCASE, 20, 1000)
        expected = texts

        matrix = vectorizer.transform(texts, len(texts[0]))
        rand = np.random.random_sample(matrix.shape)
        matrix = matrix + rand

        reverse_transformed = vectorizer.reverse_transform_maxval(matrix)
        for text_is, text_exp in zip(reverse_transformed, expected):
            self.assertEqual(text_is, text_exp)
 def test_reverse_transform_maxval(self):
     # test on static example texts
     vectorizer = CharVectorizer("abc", map_unknown_chars_to="X")
     texts = ["aaa", "bbb", "ccc", "abc", "???", "a?a"]
     expected = ["aaa", "bbb", "ccc", "abc", "XXX", "aXa"]
     
     matrix = vectorizer.transform(texts, len(texts[0]))
     rand = np.random.random_sample(matrix.shape)
     matrix = matrix + rand
     
     reverse_transformed = vectorizer.reverse_transform_maxval(matrix)
     for text_is, text_exp in zip(reverse_transformed, expected):
         self.assertEqual(text_is, text_exp)
     
     # test on 1000 random texts
     vectorizer = CharVectorizer(ALPHABET_LOWERCASE,
                                 map_unknown_chars_to="X")
     texts = create_random_texts(ALPHABET_LOWERCASE, 20, 1000)
     expected = texts
     
     matrix = vectorizer.transform(texts, len(texts[0]))
     rand = np.random.random_sample(matrix.shape)
     matrix = matrix + rand
     
     reverse_transformed = vectorizer.reverse_transform_maxval(matrix)
     for text_is, text_exp in zip(reverse_transformed, expected):
         self.assertEqual(text_is, text_exp)