def test_vector_lengths(self):
    """Check the vector lengths reported by a small CharVectorizer.

    The vectorizer is built from the characters "abc" plus three extra
    characters ("1" for unknown chars, "2" and "3" as left/right fill
    chars). The test expects the one-char vector length to equal the
    number of those six characters, and ``get_vector_length(2)`` to be
    twice that.
    """
    vectorizer = CharVectorizer("abc", map_unknown_chars_to="1",
                                fill_left_char="2", fill_right_char="3")
    # "abc" plus the three special characters passed above.
    expected_chars = len("abc123")
    # assertEqual instead of assertEquals: the latter is a deprecated
    # alias that no longer exists in Python 3.12+.
    self.assertEqual(vectorizer.get_one_char_vector_length(), expected_chars)
    self.assertEqual(vectorizer.get_vector_length(2), expected_chars * 2)
Beispiel #2
0
 def test_vector_lengths(self):
     """Check the vector lengths reported by a small CharVectorizer.

     The vectorizer is built from the characters "abc" plus three extra
     characters ("1" for unknown chars, "2" and "3" as left/right fill
     chars). The test expects the one-char vector length to equal the
     number of those six characters, and ``get_vector_length(2)`` to be
     twice that.
     """
     vectorizer = CharVectorizer("abc",
                                 map_unknown_chars_to="1",
                                 fill_left_char="2",
                                 fill_right_char="3")
     # "abc" plus the three special characters passed above.
     expected_chars = len("abc123")
     # assertEqual instead of assertEquals: the latter is a deprecated
     # alias that no longer exists in Python 3.12+.
     self.assertEqual(vectorizer.get_one_char_vector_length(),
                      expected_chars)
     self.assertEqual(vectorizer.get_vector_length(2), expected_chars * 2)
 def test_sanity(self):
     """Sanity-check the cell counts of a transformed text matrix.

     Random texts are generated via ``create_random_texts`` and passed
     through ``CharVectorizer.transform``. The test then verifies that
     the number of cells equal to 1 is ``count_chars * count_texts`` and
     that the total number of cells equals the one-char vector length
     times ``count_chars * count_texts``.
     """
     chars_per_text = 20
     text_count = 10
     vectorizer = CharVectorizer(ALPHABET_LOWERCASE)
     texts = create_random_texts(
         ALPHABET_LOWERCASE, chars_per_text, text_count)
     matrix = vectorizer.transform(texts, chars_per_text)

     # One flag per matrix cell: True where the cell equals 1.
     is_one = [bool(cell == 1) for cell in np.nditer(matrix)]
     hot_cells = sum(is_one)
     other_cells = len(is_one) - hot_cells

     expected_hot = chars_per_text * text_count
     self.assertEqual(hot_cells, expected_hot)

     expected_total = (vectorizer.get_one_char_vector_length()
                       * chars_per_text * text_count)
     self.assertEqual(hot_cells + other_cells, expected_total)
Beispiel #4
0
    def test_sanity(self):
        """Sanity-check the cell counts of a transformed text matrix.

        Random texts are generated via ``create_random_texts`` and passed
        through ``CharVectorizer.transform``. The test then verifies that
        the number of cells equal to 1 is ``count_chars * count_texts``
        and that the total number of cells equals the one-char vector
        length times ``count_chars * count_texts``.
        """
        n_chars = 20
        n_texts = 10
        vectorizer = CharVectorizer(ALPHABET_LOWERCASE)
        texts = create_random_texts(ALPHABET_LOWERCASE, n_chars, n_texts)
        matrix = vectorizer.transform(texts, n_chars)

        # Tally cells by whether they equal 1 (True) or not (False).
        tally = {True: 0, False: 0}
        for cell in np.nditer(matrix):
            tally[bool(cell == 1)] += 1

        self.assertEqual(tally[True], n_chars * n_texts)

        total_cells = tally[True] + tally[False]
        self.assertEqual(
            total_cells,
            vectorizer.get_one_char_vector_length() * n_chars * n_texts)