Esempio n. 1
0
def ngram_tuples(n, string, minlen=3, maxlen=25):
    """Run ``string`` through the token pipeline and window the result.

    The input is passed, in order, through ``utils.lower``,
    ``utils.splitter_of_words``, ``utils.filter_whitespace``,
    ``utils.filter_shorter_than(minlen)``,
    ``utils.filter_longer_than(maxlen)``, ``utils.filter_stopwords`` and
    finally ``sliding_window_c(n)``.

    Args:
        n: Argument handed to ``sliding_window_c``; presumably the n-gram
            size (confirm against that helper).
        string: Value fed into the first stage of the pipeline.
        minlen: Argument handed to ``utils.filter_shorter_than``.
        maxlen: Argument handed to ``utils.filter_longer_than``.

    Returns:
        Whatever the last stage, ``sliding_window_c(n)``, produces.
    """
    # Collect the stages first so the processing order reads top to bottom.
    stages = (
        utils.lower,
        utils.splitter_of_words,
        utils.filter_whitespace,
        utils.filter_shorter_than(minlen),
        utils.filter_longer_than(maxlen),
        utils.filter_stopwords,
        sliding_window_c(n),
    )
    return tlz.pipe(string, *stages)
Esempio n. 2
0
def test__filter_shorter_than(tokenset, mintokenlen, count):
    """Check how many items ``utils.filter_shorter_than`` lets through.

    ``tokenset``, ``mintokenlen`` and ``count`` are presumably supplied by a
    pytest parametrisation or fixtures defined outside this snippet.
    """
    token_filter = utils.filter_shorter_than(mintokenlen)
    # Materialise the filtered output so the surviving items can be counted.
    survivors = tlz.pipe(tokenset, token_filter, list)
    assert len(survivors) == count
def test__filter_shorter_than(tokenset, mintokenlen, count):
    """Assert the number of items left after ``utils.filter_shorter_than``.

    The arguments are presumably injected by pytest (parametrisation or
    fixtures that are not visible in this snippet).
    """
    # Filter, materialise to a list, then count -- all in a single pipe.
    steps = (utils.filter_shorter_than(mintokenlen), list, len)
    remaining = tlz.pipe(tokenset, *steps)
    assert remaining == count
Esempio n. 4
0
def ngram_tuples(n, string, minlen=3, maxlen=25):
    """Pipe ``string`` through the ``utils`` stages, then window it.

    Stages, in order: ``utils.lower``, ``utils.splitter_of_words``,
    ``utils.filter_whitespace``, the ``minlen`` and ``maxlen`` length
    filters, ``utils.filter_stopwords`` and ``sliding_window_c(n)``.

    Args:
        n: Passed to ``sliding_window_c``; presumably the window (n-gram)
            size -- confirm against that helper.
        string: Input handed to the first pipeline stage.
        minlen: Passed to ``utils.filter_shorter_than``.
        maxlen: Passed to ``utils.filter_longer_than``.

    Returns:
        The output of the final ``sliding_window_c(n)`` stage.
    """
    # Bind the parametrised stages to names so the pipe below stays flat.
    min_length_filter = utils.filter_shorter_than(minlen)
    max_length_filter = utils.filter_longer_than(maxlen)
    windower = sliding_window_c(n)
    return tlz.pipe(
        string,
        utils.lower,
        utils.splitter_of_words,
        utils.filter_whitespace,
        min_length_filter,
        max_length_filter,
        utils.filter_stopwords,
        windower,
    )