Пример #1
0
def test_arc_is_complete():
    arc1 = Arc(NonTerminal('DT', 'the'), 2, 3, 1, [10])
    arc2 = Arc(NonTerminal('NP', 'DT', 'N'), 2, 3, 1, [12])
    arc3 = Arc(NonTerminal('NP', 'DT', 'N'), 2, 3, 2, [14])
    assert arc1.is_complete()
    assert not arc2.is_complete()
    assert arc3.is_complete()
Пример #2
0
def test_grammar_import():
    grammar = Grammar()
    grammar.load(StringIO(test_gram))
    assert grammar['NP'] == {NonTerminal('S', 'NP', 'VP'), }
    assert grammar['V'] == {
        NonTerminal('VP', 'V'), NonTerminal('VP', 'V', 'NP')}
    with pytest.raises(ValueError):
        grammar.load(StringIO('S NP VP'))
Пример #3
0
def test_extend():
    agenda = Agenda(simple_tokens, simple_lexicon)
    current = agenda.choose_next()
    assert current == Arc(Terminal('PN', 'I'), 0, 1, 1)
    agenda.predict(simple_grammar, current)
    agenda.extend(current)
    my_agenda = [
        Arc(Terminal('V', 'SLEEP'), 1, 2, 1),
        Arc(NonTerminal('NP', 'PN'), 0, 0, 0),
        Arc(NonTerminal('NP', 'PN'), 0, 1, 1)]
    for arc in agenda:
        assert arc in my_agenda
    for arc in my_agenda:
        assert arc in agenda
Пример #4
0
def test_choose_next():
    agenda = Agenda(simple_tokens, simple_lexicon)
    assert agenda.choose_next() == Arc(Terminal('PN', 'I'), 0, 1, 1)
    assert agenda.choose_next() == Arc(Terminal('V', 'SLEEP'), 1, 2, 1)
    agenda.agenda.append(Arc(NonTerminal('NP', 'N'), 0, 1, 0))
    # no completed arcs to select
    with pytest.raises(ValueError):
        assert agenda.choose_next()
Пример #5
0
def test_grammar_add():
    grammar = Grammar()
    grammar.add(NonTerminal.from_string('np --> n'))
    assert grammar['N'] == {NonTerminal('NP', 'N')}
    grammar.add(NonTerminal('vp', 'v', 'np'))
    assert grammar['V'] == {NonTerminal('VP', 'V', 'NP')}
    grammar.add(NonTerminal('NP', 'N', 'Y'))
    assert grammar['N'] == {
        NonTerminal('NP', 'N'), NonTerminal('NP', 'N', 'Y')}
Пример #6
0
def test_arc_eq():
    rule = NonTerminal('NP', 'N')
    start = 1
    end = 2
    dot = 1
    assert (
        Arc(rule, start, end, dot) ==
        Arc(rule, start, end, dot))
    assert(
        Arc(rule, start, end, dot) !=
        Arc(rule, start + 1, end, dot))
Пример #7
0
def test_nonterminal_eq():
    nonterminal1 = 'NP --> DT N'
    nonterminal2 = 'NP --> N'
    assert NonTerminal.from_string(nonterminal1) == \
        NonTerminal.from_string(nonterminal1)
    assert NonTerminal.from_string(nonterminal1) != \
        NonTerminal.from_string(nonterminal2)
    assert NonTerminal.from_string(nonterminal1) < \
        NonTerminal.from_string(nonterminal2)
Пример #8
0
def test_chart():
    chart = Chart(['I', 'SLEEP'])
    chart.add(Arc(NonTerminal('PN', 'I'), 0, 1, 1))
    assert not chart.is_sentence
    chart.add(Arc(NonTerminal('V', 'SLEEP'), 1, 2, 1))
    chart.add(Arc(NonTerminal('NP', 'PN'), 0, 1, 1, [1]))
    chart.add(Arc(NonTerminal('VP', 'V'), 1, 2, 1, [2]))
    chart.add(Arc(NonTerminal('S', 'VP'), 1, 2, 1, [2]))
    assert not chart.is_sentence
    chart.add(Arc(NonTerminal('S', 'NP', 'VP'), 0, 2, 2, [3, 4]))
    assert chart.is_sentence
    answer = [
        '0    1    2',
        ' ----       PN --> I',
        '      ----  V --> SLEEP',
        ' ----       NP --> PN',
        '      ----  VP --> V',
        '      ----  S --> VP',
        ' ---------  S --> NP VP']
    assert str(chart) == '\n'.join(answer)
Пример #9
0
def test_arc_extend():
    key = Arc(NonTerminal('N', 'cat'), start=0, end=1, dot=1)
    arc = Arc(NonTerminal('NP', 'N'), start=0, end=0, dot=0)
    ext = arc.get_extended(key)
    assert ext.rule == NonTerminal('NP', 'N')
    assert ext.start == 0
    assert ext.end == 1
    assert ext.dot == 1
    assert ext.history == [key]

    # key parent does not match current node in arc children
    arc = Arc(NonTerminal('VP', 'V'), start=0, end=0, dot=0)
    with pytest.raises(ValueError):
        arc.get_extended(key)
    arc = Arc(NonTerminal('NP', 'N'), start=1, end=2, dot=0)
    with pytest.raises(ValueError):
        arc.get_extended(key)
    arc = Arc(NonTerminal('NP', 'DT', 'N'), start=0, end=2, dot=1)
    with pytest.raises(ValueError):
        arc.get_extended(key)
Пример #10
0
def test_rule_len():
    assert len(NonTerminal('VP', 'ADV', 'V')) == 3
Пример #11
0
def test_nonterminal_str():
    rules = [
        'VP --> V',
        'NP --> DT ADJ N']
    for nonterminal in rules:
        assert str(NonTerminal.from_string(nonterminal)) == nonterminal
Пример #12
0
def test_nonterminal_const():
    nonterminal = NonTerminal('NP', 'DT', 'N')
    assert nonterminal.parent == 'NP'
    assert nonterminal.children == ('DT', 'N')

    nonterminal = NonTerminal.from_string('NP --> DT N')
    assert nonterminal.parent == 'NP'
    assert nonterminal.children == ('DT', 'N')

    with pytest.raises(ValueError):
        NonTerminal.from_string('--> V')
    with pytest.raises(ValueError):
        NonTerminal.from_string('NP VP --> V')
    with pytest.raises(ValueError):
        NonTerminal.from_string('VP -->')
    with pytest.raises(ValueError):
        NonTerminal('VP')
    with pytest.raises(ValueError):
        NonTerminal('VP', 'AUX V')
    with pytest.raises(ValueError):
        NonTerminal('S VP', 'V')

    assert NonTerminal('S', 'V').is_sentence
    assert not NonTerminal('VP', 'V').is_sentence
    assert not NonTerminal('VP', 'V').is_terminal
Пример #13
0
def test_arc_string():
    arc1 = Arc(NonTerminal('NP', 'N'), 0, 0, 0, [None])
    assert str(arc1) == '<0> NP --> *0 N [None] <0> {}'.format(id(arc1))
    arc2 = Arc(NonTerminal('VP', 'AUX', 'V'), 2, 4, 2, [arc1, None])
    assert str(arc2) == \
        '<2> VP --> AUX V *2 [{}, None] <4> {}'.format(id(arc1), id(arc2))
Пример #14
0
def test_terminal_str():
    rules = [
        'VP --> V',
        'NP --> DT ADJ N']
    for rule in rules:
        assert str(NonTerminal.from_string(rule)) == rule
Пример #15
0
def test_terminal_eq():
    rule1 = 'NP --> DT N'
    rule2 = 'NP --> N'
    assert NonTerminal.from_string(rule1) == NonTerminal.from_string(rule1)
    assert NonTerminal.from_string(rule1) != NonTerminal.from_string(rule2)
    assert NonTerminal.from_string(rule1) < NonTerminal.from_string(rule2)
Пример #16
0
simple_grammar.load(StringIO("""
    S --> NP VP
    NP --> PN
    VP --> V
    """))
simple_lexicon = Lexicon()
simple_lexicon.load(StringIO("""
    I : PN
    sleep : V
    """))
simple_parser = Parser(simple_grammar, simple_lexicon)
simple_sentence = ' i   sleep '
simple_tokens = ['I', 'SLEEP']
simple_parse = '[.S [.NP [.PN I]][.VP [.V SLEEP]]]'
simple_chart = [
    Arc(NonTerminal('S', 'NP', 'VP'), 0, 2, 2),
    Arc(NonTerminal('NP', 'PN'), 0, 1, 1),
    Arc(NonTerminal('VP', 'V'), 1, 2, 1),
    Arc(Terminal('PN', 'I'), 0, 1, 1),
    Arc(Terminal('V', 'SLEEP'), 1, 2, 1)]

complex_grammar = Grammar()
complex_grammar.load(StringIO("""
    S --> NP VP
    NP --> DT N
    NP --> DT ADJ N
    NP --> PN
    VP --> V
    VP --> VP NP
    VP --> AUX VP
    """))