Python Document_Index示例

编程语言: Python

命名空间/包名称: osp.corpus.models

类/类型: Document_Index

hotexamples.com的示例: 17

Python Document_Index - 已找到17个示例。这些是从开源项目中提取的、最受好评的 osp.corpus.models.Document_Index 真实 Python 示例。您可以对示例进行评分，以帮助我们提高示例质量。

常用方法

显示 / 隐藏

es_insert(5)

es_count(1)

es_create(1)

es_delete(1)

es_reset(1)

示例#1

显示文件

文件： corpus_index.py 项目： MichaelEdage/open-syllabus-project

def reset():
    """Reset the index."""
    # Pure delegation: the work happens in Document_Index.es_reset() and
    # nothing is returned to the caller.
    # NOTE(review): if this function is registered as a CLI command
    # elsewhere, the docstring doubles as help text -- wording kept as-is.
    Document_Index.es_reset()

示例#2

显示文件

文件： corpus_index.py 项目： MichaelEdage/open-syllabus-project

def delete():
    """Delete the index."""
    # Pure delegation: the work happens in Document_Index.es_delete() and
    # nothing is returned to the caller.
    # NOTE(review): if this function is registered as a CLI command
    # elsewhere, the docstring doubles as help text -- wording kept as-is.
    Document_Index.es_delete()

示例#3

显示文件

文件： corpus_index.py 项目： MichaelEdage/open-syllabus-project

def create():
    """Create the index."""
    # Pure delegation: the work happens in Document_Index.es_create() and
    # nothing is returned to the caller.
    # NOTE(review): if this function is registered as a CLI command
    # elsewhere, the docstring doubles as help text -- wording kept as-is.
    Document_Index.es_create()

示例#4

显示文件

文件： test_text_to_docs.py 项目： MichaelEdage/open-syllabus-project

def test_matches(add_doc, add_text):

    """
    When documents match the query, write doc -> text rows.

    Three documents mention "War and Peace" and two mention "Anna
    Karenina". After indexing them and running text_to_docs() for a
    "War and Peace" text, exactly three Citation rows are expected, one
    for each "War and Peace" document.

    Args:
        add_doc: fixture called with ``content=...``; its return value is
            compared against ``Citation.document``.
        add_text: fixture called with ``title=...`` and ``surname=...``;
            the returned object's ``id`` and ``hash_tokens`` are read.
    """

    wp1 = add_doc(content='War and Peace, Leo Tolstoy 1')
    wp2 = add_doc(content='War and Peace, Leo Tolstoy 2')
    wp3 = add_doc(content='War and Peace, Leo Tolstoy 3')

    # Decoy documents: they only need to be present when indexing, so
    # their return values are intentionally not bound to names.
    add_doc(content='Anna Karenina, Leo Tolstoy 1')
    add_doc(content='Anna Karenina, Leo Tolstoy 2')

    Document_Index.es_insert()

    text = add_text(title='War and Peace', surname='Tolstoy')
    text_to_docs(text.id)

    # Should write 3 citation links.
    assert Citation.select().count() == 3

    # Should match "War and Peace," ignore "Anna Karenina".
    for doc in [wp1, wp2, wp3]:

        # NOTE(review): this asserts on the query object itself, i.e. it
        # relies on the query's truthiness -- presumably truthy only when
        # at least one row matches; confirm against the ORM in use.
        assert Citation.select().where(
            Citation.text==text,
            Citation.document==doc,
            Citation.tokens.contains(text.hash_tokens),
        )

示例#5

显示文件

文件： corpus_index.py 项目： MichaelEdage/open-syllabus-project

def insert():
    """Index documents."""
    # Pure delegation: the work happens in Document_Index.es_insert() and
    # nothing is returned to the caller.
    # NOTE(review): if this function is registered as a CLI command
    # elsewhere, the docstring doubles as help text -- wording kept as-is.
    Document_Index.es_insert()

示例#6

显示文件

文件： test_text_to_docs.py 项目： project-renard-survey/open-syllabus-project

def test_matches(add_doc, add_text):

    """
    When documents match the query, write doc -> text rows.

    Indexes three "War and Peace" documents alongside two "Anna Karenina"
    documents, runs text_to_docs() for a "War and Peace" text, and
    expects exactly three Citation rows -- one per "War and Peace"
    document.

    Args:
        add_doc: fixture called with ``content=...``; its return value is
            compared against ``Citation.document``.
        add_text: fixture called with ``title=...`` and ``surname=...``;
            the returned object's ``id`` and ``hash_tokens`` are read.
    """

    wp1 = add_doc(content='War and Peace, Leo Tolstoy 1')
    wp2 = add_doc(content='War and Peace, Leo Tolstoy 2')
    wp3 = add_doc(content='War and Peace, Leo Tolstoy 3')

    # These two documents must not be cited. Nothing below refers to them
    # individually, so the results of add_doc() are discarded.
    add_doc(content='Anna Karenina, Leo Tolstoy 1')
    add_doc(content='Anna Karenina, Leo Tolstoy 2')

    Document_Index.es_insert()

    text = add_text(title='War and Peace', surname='Tolstoy')
    text_to_docs(text.id)

    # Should write 3 citation links.
    assert Citation.select().count() == 3

    # Should match "War and Peace," ignore "Anna Karenina".
    for doc in [wp1, wp2, wp3]:

        # NOTE(review): the assertion depends on the truthiness of the
        # query object -- presumably false when no row matches; verify
        # against the ORM in use.
        assert Citation.select().where(
            Citation.text==text,
            Citation.document==doc,
            Citation.tokens.contains(text.hash_tokens),
        )

示例#7

显示文件

文件： test_text_to_docs.py 项目： MichaelEdage/open-syllabus-project

def test_no_matches(add_doc, add_text):
    """
    A text that no indexed document mentions must produce zero Citation
    rows.
    """
    # The only indexed document is about a different title.
    add_doc(content='War and Peace, Leo Tolstoy')
    Document_Index.es_insert()

    unmatched = add_text(title='Master and Man', surname='Tolstoy')
    text_to_docs(unmatched.id)

    # The citation table should still be empty.
    citation_total = Citation.select().count()
    assert citation_total == 0

示例#8

显示文件

文件： test_text_to_docs.py 项目： project-renard-survey/open-syllabus-project

def test_no_matches(add_doc, add_text):
    """
    With only a "War and Peace" document indexed, running text_to_docs()
    for "Master and Man" should leave the Citation table empty.
    """
    add_doc(content='War and Peace, Leo Tolstoy')
    Document_Index.es_insert()

    # Query for a title that the indexed document does not contain.
    other_text = add_text(title='Master and Man', surname='Tolstoy')
    text_to_docs(other_text.id)

    rows_written = Citation.select().count()
    assert rows_written == 0

示例#9

显示文件

文件： test_es_insert.py 项目： project-renard-survey/open-syllabus-project

def test_es_insert(add_doc):
    """
    After Document_Index.es_insert(), the document is retrievable from the
    'document' index by its id and the stored body equals its content.
    """
    doc = add_doc(content='text')
    Document_Index.es_insert()

    # Look the document up by id and inspect the stored source.
    hit = config.es.get(index='document', id=doc.id)
    stored = hit['_source']

    assert stored['body'] == 'text'

示例#10

显示文件

文件： test_es_insert.py 项目： MichaelEdage/open-syllabus-project

def test_es_insert(add_doc):
    """
    Document_Index.es_insert() should make a document fetchable by id from
    the 'document' index, with its content stored under 'body'.
    """
    inserted = add_doc(content='text')
    Document_Index.es_insert()

    # Fetch by the document's own id; the lookup keyword arguments are
    # assembled separately to keep the call itself short.
    lookup = {'index': 'document', 'id': inserted.id}
    es_doc = config.es.get(**lookup)

    body = es_doc['_source']['body']
    assert body == 'text'

示例#11

显示文件

文件： corpus_index.py 项目： MichaelEdage/open-syllabus-project

def count():
    """Count documents."""
    # Fetch the count first, then print it through click.
    # NOTE(review): if this function is registered as a click command
    # elsewhere, the docstring doubles as help text -- wording kept as-is.
    total = Document_Index.es_count()
    click.echo(total)

示例#12

显示文件

文件： test_text_to_docs.py 项目： project-renard-survey/open-syllabus-project

def test_citation_formats(title, surname, content, add_doc, add_text):
    """
    Check that a citation string buried in a long document is still linked
    to the text built from the given title and surname.

    The citation ``content`` is surrounded by 1000 filler tokens on each
    side before the document is indexed.
    """
    # Filler on both sides of the citation.
    leading = 'XXX ' * 1000
    trailing = ' XXX' * 1000
    padded = leading + content + trailing

    doc = add_doc(content=padded)
    Document_Index.es_insert()

    text = add_text(title=title, surname=surname)
    text_to_docs(text.id)

    # Asserts on the query object itself, exactly as the lookup is built.
    matching = Citation.select().where(
        Citation.text==text,
        Citation.document==doc,
        Citation.tokens.contains(text.hash_tokens),
    )
    assert matching

示例#13

显示文件