Beispiel #1
0
def test_constellation_add(germaparl, discoursemes):
    """Build a topic constellation, add one discourseme, check the sizes.

    ``germaparl`` is handed to ``get_corpus``; ``discoursemes`` supplies the
    item lists ('topic', 'disc1') and the query settings under 'parameters'.
    Both are presumably pytest fixtures -- confirm against the conftest.
    """
    corpus = get_corpus(germaparl)
    params = discoursemes['parameters']

    def dump_for(items):
        # Format the items as a CQP query, then run it without context,
        # passing the configured 's_context' value as context_break.
        query = format_cqp_query(
            items,
            p_query=params['p_query'],
            s_query=params['s_query'],
            flags=params['flags_query'],
            escape=params['escape_query'],
        )
        return corpus.query(
            query,
            context=None,
            context_break=params['s_context'],
        )

    # the constellation is initialised from the topic dump alone
    const = Constellation(dump_for(discoursemes['topic']))

    # attach the first discourseme (no explicit name is passed here)
    const.add_discourseme(dump_for(discoursemes['disc1']))

    assert len(const.df) == 1599
    assert 'topic' in const.discoursemes
    assert len(const.discoursemes) == 2
def test_constellation_add():
    """Smoke-run: create a topic constellation and add one discourseme.

    Nothing is asserted; the constellation's ``df`` and the keys of its
    ``discoursemes`` mapping are only printed for inspection.
    """
    def dump_for(items):
        # Format the items as a CQP query and run it on the module-level
        # CORPUS without context, using S_CONTEXT as context_break.
        query = format_cqp_query(
            items,
            p_query=P_QUERY,
            s_query=S_QUERY,
            flags="%cd",
            escape=False,
        )
        return CORPUS.query(query, context=None, context_break=S_CONTEXT)

    # the constellation is initialised from the topic dump
    const = Constellation(dump_for(TOPIC_ITEMS))

    # attach the first discourseme (no explicit name is passed here)
    const.add_discourseme(dump_for(DISC1_ITEMS))

    print(const.df)
    print(const.discoursemes.keys())
def test_constellation_init():
    """Smoke-run: initialise a constellation from the topic query dump.

    Nothing is asserted; the constellation's ``df`` is only printed.
    """
    # shared keyword settings for building the CQP query
    query_options = {
        'p_query': P_QUERY,
        's_query': S_QUERY,
        'flags': "%cd",
        'escape': False,
    }
    query = format_cqp_query(TOPIC_ITEMS, **query_options)

    # run the query without context, using S_CONTEXT as context_break
    dump = CORPUS.query(query, context=None, context_break=S_CONTEXT)

    constellation = Constellation(dump)
    print(constellation.df)
Beispiel #4
0
def test_constellation_coll(germaparl, discoursemes):
    """Collocates of a constellation holding a topic and two discoursemes.

    ``germaparl`` is handed to ``get_corpus``; ``discoursemes`` supplies the
    item lists ('topic', 'disc1', 'disc2') and the query settings under
    'parameters'. Both are presumably pytest fixtures -- confirm against
    the conftest.
    """
    corpus = get_corpus(germaparl)
    params = discoursemes['parameters']

    def dump_for(items):
        # Format the items as a CQP query, then run it without context,
        # passing the configured 's_context' value as context_break.
        query = format_cqp_query(
            items,
            p_query=params['p_query'],
            s_query=params['s_query'],
            flags=params['flags_query'],
            escape=params['escape_query'],
        )
        return corpus.query(
            query,
            context=None,
            context_break=params['s_context'],
        )

    # the constellation is initialised from the topic dump
    const = Constellation(dump_for(discoursemes['topic']))

    # add both discoursemes in order, each registered under its own key
    for name in ('disc1', 'disc2'):
        const.add_discourseme(dump_for(discoursemes[name]), name=name)

    # request collocates for window sizes 1 through 20
    window_sizes = list(range(1, 21))
    dfs = const.collocates(windows=window_sizes)

    assert len(dfs) == 20
    assert len(dfs[1]) == 2
    assert len(dfs[20]) == 5
Beispiel #5
0
def test_constellation_init(germaparl, discoursemes):
    """Initialise a constellation from the topic dump and check its frame.

    ``germaparl`` is handed to ``get_corpus``; ``discoursemes`` supplies the
    'topic' items and the query settings under 'parameters'. Both are
    presumably pytest fixtures -- confirm against the conftest.
    """
    corpus = get_corpus(germaparl)

    topic_items = discoursemes['topic']
    params = discoursemes['parameters']

    # build the CQP query for the topic items
    query = format_cqp_query(
        topic_items,
        p_query=params['p_query'],
        s_query=params['s_query'],
        flags=params['flags_query'],
        escape=params['escape_query'],
    )

    # run it without context, passing 's_context' as context_break
    dump = corpus.query(
        query,
        context=None,
        context_break=params['s_context'],
    )
    const = Constellation(dump)

    frame = const.df
    assert isinstance(frame, DataFrame)
    assert len(frame) == 2777
def test_constellation_conc():
    """Smoke-run: concordance of a constellation with two discoursemes.

    Nothing is asserted; the result of ``concordance`` is only printed.
    """
    def dump_for(items):
        # Format the items as a CQP query and run it on the module-level
        # CORPUS without context, using S_CONTEXT as context_break.
        query = format_cqp_query(
            items,
            p_query=P_QUERY,
            s_query=S_QUERY,
            flags="%cd",
            escape=False,
        )
        return CORPUS.query(query, context=None, context_break=S_CONTEXT)

    # the constellation is initialised from the topic dump
    const = Constellation(dump_for(TOPIC_ITEMS))

    # add both discoursemes in order, each under an explicit name
    named_items = (('disc1', DISC1_ITEMS), ('disc2', DISC2_ITEMS))
    for name, items in named_items:
        const.add_discourseme(dump_for(items), name=name)

    lines = const.concordance(s_show=['text_id'])
    print(lines)
def test_constellation_coll():
    """Smoke-run: collocates of a constellation with two discoursemes.

    Nothing is asserted; the result of ``collocates`` is only printed.
    """
    def dump_for(items):
        # Format the items as a CQP query and run it on the module-level
        # CORPUS without context, using S_CONTEXT as context_break.
        query = format_cqp_query(
            items,
            p_query=P_QUERY,
            s_query=S_QUERY,
            flags="%cd",
            escape=False,
        )
        return CORPUS.query(query, context=None, context_break=S_CONTEXT)

    # the constellation is initialised from the topic dump
    const = Constellation(dump_for(TOPIC_ITEMS))

    # add both discoursemes in order, each under an explicit name
    named_items = (('disc1', DISC1_ITEMS), ('disc2', DISC2_ITEMS))
    for name, items in named_items:
        const.add_discourseme(dump_for(items), name=name)

    # request collocates for window sizes 1 through 19
    window_sizes = list(range(1, 20))
    collocates = const.collocates(windows=window_sizes)
    print(collocates)