Python ngrams示例

编程语言: Python

命名空间/包名称: nvtext

方法/功能: ngrams

hotexamples.com的示例: 2

Python ngrams - 共找到2个示例。以下是从开源项目中提取的、评分最高的 nvtext.ngrams 真实 Python 代码示例。您可以为这些示例评分，以帮助我们提高示例质量。

示例#1

显示文件

文件： test_text.py 项目： williamBlazing/cudf

def test_ngrams():
    """Check nvtext.ngrams output for bigrams ("_") and trigrams ("-").

    Every case sends the same two sentences to the device, tokenizes them,
    builds n-grams of the requested size and separator, and compares the
    host copy of the result with the expected list. The expected n-grams
    run across the boundary between the two sentences
    (e.g. "favorite_book").
    """
    cases = (
        # (n-gram size, separator, expected n-grams)
        (
            2,
            "_",
            [
                "this_is",
                "is_my",
                "my_favorite",
                "favorite_book",
                "book_on",
                "on_my",
                "my_bookshelf",
            ],
        ),
        (
            3,
            "-",
            [
                "this-is-my",
                "is-my-favorite",
                "my-favorite-book",
                "favorite-book-on",
                "book-on-my",
                "on-my-bookshelf",
            ],
        ),
    )

    for size, joiner, expected in cases:
        # Rebuild the input for each case so the cases stay independent.
        sentences = ["this is my favorite", "book on my bookshelf"]
        device_strings = nvstrings.to_device(sentences)
        tokens = nvtext.tokenize(device_strings)
        result = nvtext.ngrams(tokens, N=size, sep=joiner)
        assert result.to_host() == expected

示例#2

显示文件

def test_ngrams():
    """Verify nvtext.ngrams for N=2 (sep '_') and N=3 (sep '-').

    Both checks use the same two input sentences; the expected n-grams
    include ones that span the boundary between the two sentences.
    """

    def ngrams_on_host(size, joiner):
        # Send the fixed input to the device, tokenize it, build the
        # n-grams and bring the result back to the host for comparison.
        device_strings = nvstrings.to_device(
            ['this is my favorite', 'book on my bookshelf']
        )
        tokens = nvtext.tokenize(device_strings)
        return nvtext.ngrams(tokens, N=size, sep=joiner).to_host()

    # bigrams
    assert ngrams_on_host(2, '_') == [
        'this_is',
        'is_my',
        'my_favorite',
        'favorite_book',
        'book_on',
        'on_my',
        'my_bookshelf'
    ]

    # trigrams
    assert ngrams_on_host(3, '-') == [
        'this-is-my',
        'is-my-favorite',
        'my-favorite-book',
        'favorite-book-on',
        'book-on-my',
        'on-my-bookshelf'
    ]