Python sgrank示例

编程语言: Python

命名空间/包名称: textacy.extract.keyterms

方法/功能: sgrank

hotexamples.com的示例: 10

Python sgrank - 共找到10个示例。以下是从开源项目中提取的、评分最高的 textacy.extract.keyterms.sgrank 真实 Python 代码示例。您可以为这些示例评分，帮助我们提高示例质量。

示例#1

显示文件

def test_window_size(spacy_doc):
    """Window sizes 10 and 100 give non-empty, differing results; size 1 raises.

    ``spacy_doc`` is a fixture defined outside this snippet (presumably a
    parsed spaCy document -- confirm against the test module's fixtures).
    """
    narrow = kt.sgrank(spacy_doc, window_size=10)
    wide = kt.sgrank(spacy_doc, window_size=100)

    # Both window sizes must produce at least one key term ...
    assert len(narrow) > 0
    assert len(wide) > 0
    # ... and the window size must actually influence the outcome.
    assert narrow != wide

    # A window of a single token is expected to be rejected.
    with pytest.raises(ValueError):
        kt.sgrank(spacy_doc, window_size=1)

示例#2

显示文件

def test_empty_doc(empty_spacy_doc):
    """Calling sgrank on the empty-document fixture returns an empty list.

    ``empty_spacy_doc`` is a fixture defined outside this snippet.
    """
    keyterms = kt.sgrank(empty_spacy_doc)
    assert isinstance(keyterms, list)
    # An empty list is falsy, so this is the same check as ``len(...) == 0``.
    assert not keyterms

示例#3

显示文件

def test_normalize_callable(spacy_doc):
    """A callable ``normalize`` that upper-cases token text yields upper-case terms.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """

    def to_upper(tok):
        # Normalizer handed to sgrank: upper-cased text of the given token.
        return tok.text.upper()

    keyterms = kt.sgrank(spacy_doc, normalize=to_upper)
    assert len(keyterms) > 0
    # Each result is unpacked as a (term, score) pair; only the term matters.
    for term, _score in keyterms:
        assert term == term.upper()

示例#4

显示文件

def test_normalize_lower(spacy_doc):
    """With ``normalize="lower"`` every returned term equals its lower-cased form.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """
    keyterms = kt.sgrank(spacy_doc, normalize="lower")
    assert len(keyterms) > 0
    # Each result is unpacked as a (term, score) pair; only the term matters.
    for term, _score in keyterms:
        assert term == term.lower()

示例#5

显示文件

def test_normalize_none(spacy_doc):
    """With ``normalize=None`` at least one returned term is not all lower-case.

    ``spacy_doc`` is a fixture defined outside this snippet; the check relies
    on that document containing some cased text.
    """
    keyterms = kt.sgrank(spacy_doc, normalize=None)
    assert len(keyterms) > 0
    # Collect the terms that differ from their lower-cased form; one is enough.
    cased_terms = [term for term, _score in keyterms if term != term.lower()]
    assert cased_terms

示例#6

显示文件

def test_topn_float(spacy_doc):
    """A float ``topn`` of 0.2 gives results, while 2.0 raises ValueError.

    ``spacy_doc`` is a fixture defined outside this snippet. Presumably a
    float ``topn`` is read as a fraction of candidates -- confirm in the
    sgrank documentation.
    """
    keyterms = kt.sgrank(spacy_doc, topn=0.2)
    assert len(keyterms) > 0

    # The float value 2.0 is expected to be rejected.
    with pytest.raises(ValueError):
        kt.sgrank(spacy_doc, topn=2.0)

示例#7

显示文件

def test_topn(spacy_doc):
    """An integer ``topn`` caps the number of results, which must be non-empty.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """
    for limit in (5, 25):
        keyterms = kt.sgrank(spacy_doc, topn=limit)
        count = len(keyterms)
        # At least one term, and never more than requested.
        assert count > 0
        assert count <= limit

示例#8

显示文件

def test_ngrams_2_3(spacy_doc):
    """With ``ngrams=(2, 3)`` every returned term has two or three words.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """
    keyterms = kt.sgrank(spacy_doc, ngrams=(2, 3))
    assert len(keyterms) > 0
    for term, _score in keyterms:
        # Word count is measured by splitting the term on whitespace.
        assert len(term.split()) in (2, 3)

示例#9

显示文件

def test_ngrams_1(spacy_doc):
    """With ``ngrams=1`` every returned term is a single word.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """
    keyterms = kt.sgrank(spacy_doc, ngrams=1)
    assert len(keyterms) > 0
    for term, _score in keyterms:
        # Word count is measured by splitting the term on whitespace.
        assert len(term.split()) == 1

示例#10

显示文件

def test_default(spacy_doc):
    """Default call returns a non-empty list of ``(str, float)`` 2-tuples.

    ``spacy_doc`` is a fixture defined outside this snippet.
    """
    keyterms = kt.sgrank(spacy_doc)
    assert isinstance(keyterms, list)
    assert len(keyterms) > 0

    # First pass: every entry must be a 2-tuple.
    for entry in keyterms:
        assert isinstance(entry, tuple) and len(entry) == 2

    # Second pass: element 0 must be a string and element 1 a float.
    for entry in keyterms:
        assert isinstance(entry[0], str) and isinstance(entry[1], float)