def test_vectorizer6():
    """Compare transform output on the fitted corpus against unseen text.

    A ``PooledVectorizer(2, sent_start='<s>')`` is fitted on a two-document
    corpus and then used to transform both that corpus and a second corpus
    containing words that were not present at fit time.  The test asserts
    that the largest value in the first result is at least as large as the
    largest value in the second.

    NOTE(review): presumably this guards against unseen tokens being
    assigned ids beyond the fitted vocabulary -- confirm against
    ``PooledVectorizer``.
    """
    train_docs = ['foo bar', 'baz']
    unseen_docs = ['foo alpha', 'foo bravo', 'foo charlie', 'foo delta']

    vectorizer = PooledVectorizer(2, sent_start='<s>')
    vectorizer.fit(train_docs)

    # Only the second element of each result is inspected here.
    _, seen_matrix = vectorizer.transform(train_docs)
    _, unseen_matrix = vectorizer.transform(unseen_docs)

    seen_peak = seen_matrix.max()
    unseen_peak = unseen_matrix.max()
    assert seen_peak >= unseen_peak
def test_vectorizer5():
    """Check the exact ``(bounds, X)`` output for a small two-document corpus.

    A ``PooledVectorizer(2)`` is fitted on, and then applied to, the same
    two documents; both returned arrays are compared against hard-coded
    expectations.

    NOTE(review): the expected values look like one row per adjacent word
    pair, with ``bounds`` giving each document's [start, end) row range and
    ids foo=2, bar=3, baz=4 -- confirm against ``PooledVectorizer``.
    """
    docs = ['foo bar baz foo', 'foo baz']
    expected_bounds = [[0, 3], [3, 4]]
    expected_rows = [[2, 3], [3, 4], [4, 2], [2, 4]]

    vectorizer = PooledVectorizer(2)
    # transform() is called on whatever fit() returns, as in the original.
    doc_bounds, matrix = vectorizer.fit(docs).transform(docs)

    assert_array_equal(doc_bounds, expected_bounds)
    assert_array_equal(matrix, expected_rows)