示例#1
0
def test_pickle_ngram_vectorizer():
    """
    A transformer restored from a pickle round trip should map the same
    input to the same feature matrix as the one returned alongside it.
    """
    expected_features, transformer = features.make_unlabeled_ngram_dataset(
        A, max_ngram=1, return_transformer=True)

    # Serialize and immediately restore the fitted transformer.
    restored = cPickle.loads(cPickle.dumps(transformer))

    # Re-transforming the same input must reproduce every entry.
    actual_features = restored.transform(A)
    assert (expected_features == actual_features).all()
示例#2
0
def test_unlabeled_unigrams():
    """
    Unigram amino acid counts: expect one vector per input, each of
    length 20, arranged as a two-dimensional result.
    """
    expected_count = len(A)
    dataset = features.make_unlabeled_ngram_dataset(A, max_ngram=1)

    # One feature vector per input.
    actual_count = len(dataset)
    assert actual_count == expected_count, \
        "Expected %d vectors but got %d" % (expected_count, actual_count)

    # The result must be two-dimensional with 20 columns.
    dims = dataset.shape
    assert len(dims) == 2
    n_columns = dims[1]
    assert n_columns == 20, \
        "Expected feature vectors to be of length 20, got %d" % n_columns