Beispiel #1
0
    def test_comment(self):
        self.run_parser('#helloworld', 'comment', peek='', pos=(0, 11), ast=[
                AstNode('comment_text', 'helloworld', (0, 1))
            ])

        self.run_parser('#helloworld\nfoo', 'comment', peek='f', pos=(1, 0), ast=[
                AstNode('comment_text', 'helloworld', (0, 1))
            ])
Beispiel #2
0
    def test_char_range(self):
        self.run_parser('z-', 'CHARNOBRACE', peek='-', pos=(0, 1), ast=[
                AstNode('CHAR', 'z', (0, 0))
            ])

        self.run_parser('a-z-', 'CHARRANGE', peek='-', pos=(0, 3), ast=[
                AstNode('CHARRANGE', 'a-z', (0, 0),
                    AstNode('CHAR', 'a', (0, 0)), AstNode('CHAR', 'z', (0, 2)))
            ])
Beispiel #3
0
    def test_hex(self):
        self.run_parser('1234', 'HEXDIGIT', peek='2', pos=(0, 1))

        self.run_parser('23', 'HEX_ESCAPED_CHAR',
            [AstNode('HEX_ESCAPED_CHAR', '23', (0, 0))])

        self.run_parser('4abc', 'UNICODE_ESCAPED_CHAR_16',
            [AstNode('UNICODE_ESCAPED_CHAR_16', '4abc', (0, 0))])

        self.run_parser('def01234', 'UNICODE_ESCAPED_CHAR_32',
            [AstNode('UNICODE_ESCAPED_CHAR_32', 'def01234', (0, 0))])
Beispiel #4
0
 def test_indicators(self):
     self.run_parser('-', 'neg_indicator', [
             AstNode('neg_indicator', '-', (0, 0))
         ])
     self.run_parser('?', 'lookahead_indicator', [
             AstNode('lookahead_indicator', '?', (0, 0))
         ])
     self.run_parser('+', 'occurrence_indicator', [
             AstNode('occurrence_indicator', '+', (0, 0))
         ])
     self.run_parser('*', 'occurrence_indicator', [
             AstNode('occurrence_indicator', '*', (0, 0))
         ])
     self.run_parser('?', 'occurrence_indicator', [
             AstNode('occurrence_indicator', '?', (0, 0))
         ])
Beispiel #5
0
    def test_range_special(self):
        self.run_parser('[]]', 'range', [
                AstNode('range', '[]]', (0, 0), AstNode('CHARBRACE', ']', (0, 1)))
            ])

        self.run_parser('[]-]', 'range', [
                AstNode('range', '[]-]', (0, 0),
                    AstNode('CHARBRACE', ']', (0, 1)),
                    AstNode('CHARDASH', '-', (0, 2)))
            ])

        self.run_parser('[]-X]', 'range', [
                AstNode('range', '[]-X]', (0, 0),
                    AstNode('CHARBRACE', ']', (0, 1)),
                    AstNode('CHARDASH', '-', (0, 2)),
                    AstNode('CHAR', 'X', (0, 3)))
            ])
Beispiel #6
0
    def test_names(self):
        self.run_parser('foobar', 'name', [AstNode('name', 'foobar', (0, 0))])
        self.run_parser('FOOBAR', 'name', [AstNode('name', 'FOOBAR', (0, 0))])
        self.run_parser('_fooBAR1234', 'name', [AstNode('name', '_fooBAR1234', (0, 0))])

        self.run_parser('>foobar<', 'expandedname', [
                AstNode('expandedname', '>foobar<', (0, 0),
                    AstNode('name', 'foobar', (0, 1)))
            ])

        self.run_parser('<foobar>', 'unreportedname', [
                AstNode('unreportedname', '<foobar>', (0, 0),
                    AstNode('name', 'foobar', (0, 1)))
            ])
Beispiel #7
0
    def test_error_on_fail(self):
        self.run_parser('!', 'error_on_fail', [AstNode('error_on_fail', '!', (0, 0))])

        self.run_parser('!"fail"', 'error_on_fail', [
                AstNode('error_on_fail', '!"fail"', (0, 0),
                        AstNode('literal', '"fail"', (0, 1),
                            AstNode('CHAR_NO_DBLQUOTE', 'fail', (0, 2)))
                    )
            ])

        self.run_parser('!   "fail"', 'error_on_fail', [
                AstNode('error_on_fail', '!   "fail"', (0, 0),
                        AstNode('literal', '"fail"', (0, 4),
                            AstNode('CHAR_NO_DBLQUOTE', 'fail', (0, 5)))
                    )
            ])
Beispiel #8
0
 def test_declaration_set(self):
     text = 'myrule := foobar\notherrule := baz #comments'
     self.run_parser(text, 'declaration_set', [
             AstNode('declaration_set', text, (0, 0),
                     AstNode('declaration', 'myrule := foobar\n', (0, 0),
                             AstNode('name', 'myrule', (0, 0)),
                             AstNode('seq_group', ' foobar\n', (0, 9),
                                     AstNode('element_token', 'foobar\n', (0, 10),
                                         AstNode('name', 'foobar', (0, 10)))
                                 )
                         ),
                     AstNode('declaration', 'otherrule := baz #comments', (1, 0),
                             AstNode('name', 'otherrule', (1, 0)),
                             AstNode('seq_group', ' baz #comments', (1, 12),
                                     AstNode('element_token', 'baz #comments', (1, 13),
                                         AstNode('name', 'baz', (1, 13)))
                                 )
                         )
                 )
         ])
Beispiel #9
0
    def test_declaration(self):
        self.run_parser('myrule ::= foobar', 'declaration', [
                AstNode('declaration', 'myrule ::= foobar', (0, 0),
                        AstNode('name', 'myrule', (0, 0)),
                        AstNode('seq_group', ' foobar', (0, 10),
                                AstNode('element_token', 'foobar', (0, 11),
                                    AstNode('name', 'foobar', (0, 11)))
                            )
                    )
            ])

        self.run_parser('myrule := foobar', 'declaration', [
                AstNode('declaration', 'myrule := foobar', (0, 0),
                        AstNode('name', 'myrule', (0, 0)),
                        AstNode('seq_group', ' foobar', (0, 9),
                                AstNode('element_token', 'foobar', (0, 10),
                                    AstNode('name', 'foobar', (0, 10)))
                            )
                    )
            ])

        self.run_parser(' <myrule> ::= foobar', 'declaration', [
                AstNode('declaration', ' <myrule> ::= foobar', (0, 0),
                        AstNode('unreportedname', '<myrule>', (0, 1),
                            AstNode('name', 'myrule', (0, 2))),
                        AstNode('seq_group', ' foobar', (0, 13),
                                AstNode('element_token', 'foobar', (0, 14),
                                    AstNode('name', 'foobar', (0, 14)))
                            )
                    )
            ])

        self.run_parser(' >myrule< ::= foobar    ', 'declaration', [
                AstNode('declaration', ' >myrule< ::= foobar    ', (0, 0),
                        AstNode('expandedname', '>myrule<', (0, 1),
                            AstNode('name', 'myrule', (0, 2))),
                        AstNode('seq_group', ' foobar    ', (0, 13),
                                AstNode('element_token', 'foobar    ', (0, 14),
                                    AstNode('name', 'foobar', (0, 14)))
                            )
                    )
            ])

        self.run_parser_fail('<foobar := foo', 'declaration',
                '(1, 8): Expected closing ">"')

        self.run_parser_fail('>foobar := foo', 'declaration',
                '(1, 8): Expected closing "<"')

        self.run_parser_fail('!foobar := foo', 'declaration',
                '(1, 1): Expected name, <unreported>, or >expanded< declaration')

        self.run_parser_fail('foobar << foo', 'declaration',
                '(1, 8): Expected := or ::= operator')
Beispiel #10
0
    def test_element_token(self):
        self.run_parser('foobar', 'element_token',[
                AstNode('element_token', 'foobar', (0, 0),
                    AstNode('name', 'foobar', (0, 0)))
            ])

        self.run_parser('?foobar', 'element_token',[
                AstNode('element_token', '?foobar', (0, 0),
                        AstNode('lookahead_indicator', '?', (0, 0)),
                        AstNode('name', 'foobar', (0, 1))
                    )
            ])

        self.run_parser('-foobar', 'element_token',[
                AstNode('element_token', '-foobar', (0, 0),
                        AstNode('neg_indicator', '-', (0, 0)),
                        AstNode('name', 'foobar', (0, 1))
                    )
            ])

        self.run_parser('foobar+', 'element_token',[
                AstNode('element_token', 'foobar+', (0, 0),
                        AstNode('name', 'foobar', (0, 0)),
                        AstNode('occurrence_indicator', '+', (0, 6))
                    )
            ])

        self.run_parser('foobar*', 'element_token',[
                AstNode('element_token', 'foobar*', (0, 0),
                        AstNode('name', 'foobar', (0, 0)),
                        AstNode('occurrence_indicator', '*', (0, 6))
                    )
            ])

        self.run_parser('foobar?', 'element_token',[
                AstNode('element_token', 'foobar?', (0, 0),
                        AstNode('name', 'foobar', (0, 0)),
                        AstNode('occurrence_indicator', '?', (0, 6))
                    )
            ])

        self.run_parser('? foobar + !"fail"', 'element_token',[
                AstNode('element_token', '? foobar + !"fail"', (0, 0),
                        AstNode('lookahead_indicator', '?', (0, 0)),
                        AstNode('name', 'foobar', (0, 2)),
                        AstNode('occurrence_indicator', '+', (0, 9)),
                        AstNode('error_on_fail', '!"fail"', (0, 11),
                                AstNode('literal', '"fail"', (0, 12),
                                    AstNode('CHAR_NO_DBLQUOTE', 'fail', (0, 13)))
                            )
                    )
            ])
Beispiel #11
0
    def test_escaped_char(self):
        self.run_parser('\\x42', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\x42', (0, 0),
                    AstNode('HEX_ESCAPED_CHAR', '42', (0, 2)))
            ])

        self.run_parser('\\u201d', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\u201d', (0, 0),
                    AstNode('UNICODE_ESCAPED_CHAR_16', '201d', (0, 2)))
            ])

        self.run_parser('\\Uabcdef01', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\Uabcdef01', (0, 0),
                    AstNode('UNICODE_ESCAPED_CHAR_32', 'abcdef01', (0, 2)))
            ])

        self.run_parser('\\777', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\777', (0, 0),
                    AstNode('OCTAL_ESCAPED_CHAR', '777', (0, 1)))
            ])

        self.run_parser('\\t', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\t', (0, 0),
                    AstNode('SPECIAL_ESCAPED_CHAR', 't', (0, 1)))
            ])

        self.run_parser('\\n', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\n', (0, 0),
                    AstNode('SPECIAL_ESCAPED_CHAR', 'n', (0, 1)))
            ])

        self.run_parser('\\"', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\"', (0, 0),
                    AstNode('SPECIAL_ESCAPED_CHAR', '"', (0, 1)))
            ])

        self.run_parser('\\\\', 'ESCAPED_CHAR', [
                AstNode('ESCAPED_CHAR', '\\\\', (0, 0),
                    AstNode('SPECIAL_ESCAPED_CHAR', '\\', (0, 1)))
            ])

        self.run_parser_fail('\\x', 'ESCAPED_CHAR',
                '(1, 3): Expected two hex digits following "\\x"')

        self.run_parser_fail('\\u', 'ESCAPED_CHAR',
                '(1, 3): Expected four hex digits following "\\u"')

        self.run_parser_fail('\\U', 'ESCAPED_CHAR',
                '(1, 3): Expected eight hex digits following "\\U"')

        self.run_parser_fail('\\', 'ESCAPED_CHAR',
                '(1, 2): Expected escape sequence following "\\"')
Beispiel #12
0
    def test_groups(self):
        self.run_parser('/', 'fo_indicator', peek='', pos=(0, 1))
        self.run_parser(',', 'seq_indicator', peek='', pos=(0, 1))

        # TODO: modify fo_group to discard 'ts' like seq_group
        self.run_parser(' hello /foobar / world', 'fo_group', [
                AstNode('fo_group', ' hello /foobar / world', (0, 0),
                        AstNode('element_token', 'hello ', (0, 1),
                            AstNode('name', 'hello', (0, 1))),
                        AstNode('element_token', 'foobar ', (0, 8),
                            AstNode('name', 'foobar', (0, 8))),
                        AstNode('element_token', 'world', (0, 17),
                            AstNode('name', 'world', (0, 17))),
                    )
            ])

        self.run_parser(' hello ,foobar , world', 'seq_group', [
                AstNode('seq_group', ' hello ,foobar , world', (0, 0),
                        AstNode('element_token', 'hello ', (0, 1),
                            AstNode('name', 'hello', (0, 1))),
                        AstNode('element_token', 'foobar ', (0, 8),
                            AstNode('name', 'foobar', (0, 8))),
                        AstNode('element_token', 'world', (0, 17),
                            AstNode('name', 'world', (0, 17))),
                    )
            ])

        self.run_parser('! "fail",  hello, foobar', 'seq_group', [
                AstNode('seq_group', '! "fail",  hello, foobar', (0, 0),
                        AstNode('error_on_fail', '! "fail"', (0, 0),
                                AstNode('literal', '"fail"', (0, 2),
                                    AstNode('CHAR_NO_DBLQUOTE', 'fail', (0, 3)))
                            ),
                        AstNode('element_token', 'hello', (0, 11),
                            AstNode('name', 'hello', (0, 11))),
                        AstNode('element_token', 'foobar', (0, 18),
                            AstNode('name', 'foobar', (0, 18))),
                    )
            ])

        self.run_parser(' hello , foobar/world, !"fail"', 'seq_group', [
                AstNode('seq_group', ' hello , foobar/world, !"fail"', (0, 0),
                        AstNode('element_token', 'hello ', (0, 1),
                            AstNode('name', 'hello', (0, 1))),
                        AstNode('fo_group', 'foobar/world', (0, 9),
                                AstNode('element_token', 'foobar', (0, 9),
                                    AstNode('name', 'foobar', (0, 9))),
                                AstNode('element_token', 'world', (0, 16),
                                    AstNode('name', 'world', (0, 16)))
                            ),
                        AstNode('error_on_fail', '!"fail"', (0, 23),
                                AstNode('literal', '"fail"', (0, 24),
                                    AstNode('CHAR_NO_DBLQUOTE', 'fail', (0, 25)))
                            )
                    )
            ])

        self.run_parser('( hello ,foobar , world)   ', 'group', [
                AstNode('seq_group', ' hello ,foobar , world', (0, 1),
                        AstNode('element_token', 'hello ', (0, 2),
                            AstNode('name', 'hello', (0, 2))),
                        AstNode('element_token', 'foobar ', (0, 9),
                            AstNode('name', 'foobar', (0, 9))),
                        AstNode('element_token', 'world', (0, 18),
                            AstNode('name', 'world', (0, 18))),
                    )
            ])

        self.run_parser_fail('12345', 'seq_group',
                '(1, 1): Expected one or more terms in sequence')

        self.run_parser_fail('(foobar', 'group',
                '(1, 8): Expected closing ")"')
Beispiel #13
0
 def test_octal(self):
     self.run_parser('01234567', 'OCTAL_ESCAPED_CHAR',
         [AstNode('OCTAL_ESCAPED_CHAR', '012', (0, 0))])
Beispiel #14
0
    def test_literal(self):
        self.run_parser('c"foo"', 'literal', pos=(0, 6), ast=[
                AstNode('literal', 'c"foo"', (0, 0),
                        AstNode('literalDecorator', 'c', (0, 0)),
                        AstNode('CHAR_NO_DBLQUOTE', 'foo', (0, 2))
                    )
            ])

        self.run_parser("c'foo'", 'literal', pos=(0, 6), ast=[
                AstNode('literal', "c'foo'", (0, 0),
                        AstNode('literalDecorator', 'c', (0, 0)),
                        AstNode('CHAR_NO_SNGLQUOTE', 'foo', (0, 2))
                    )
            ])

        self.run_parser('"foo"', 'literal', pos=(0, 5), ast=[
                AstNode('literal', '"foo"', (0, 0),
                        AstNode('CHAR_NO_DBLQUOTE', 'foo', (0, 1))
                    )
            ])

        self.run_parser("'foo'", 'literal', pos=(0, 5), ast=[
                AstNode('literal', "'foo'", (0, 0),
                        AstNode('CHAR_NO_SNGLQUOTE', 'foo', (0, 1))
                    )
            ])

        self.run_parser('"foo\\nbar\\n"', 'literal', [
                AstNode('literal', '"foo\\nbar\\n"', (0, 0),
                        AstNode('CHAR_NO_DBLQUOTE', 'foo', (0, 1)),
                        AstNode('ESCAPED_CHAR', '\\n', (0, 4),
                            AstNode('SPECIAL_ESCAPED_CHAR', 'n', (0, 5))),
                        AstNode('CHAR_NO_DBLQUOTE', 'bar', (0, 6)),
                        AstNode('ESCAPED_CHAR', '\\n', (0, 9),
                            AstNode('SPECIAL_ESCAPED_CHAR', 'n', (0, 10)))
                    )
            ])

        self.run_parser_fail('"foobar', 'literal',
                '(1, 2): Expected closing double-quote')

        self.run_parser_fail("'foobar", 'literal',
                '(1, 2): Expected closing single-quote')
Beispiel #15
0
    def test_range(self):
        self.run_parser('[a-z]', 'range', [
                AstNode('range', '[a-z]', (0, 0),
                        AstNode('CHARRANGE', 'a-z', (0, 1),
                                AstNode('CHAR', 'a', (0, 1)),
                                AstNode('CHAR', 'z', (0, 3))
                            )
                    )
            ])

        self.run_parser('[a-z-]', 'range', [
                AstNode('range', '[a-z-]', (0, 0),
                        AstNode('CHARRANGE', 'a-z', (0, 1),
                                AstNode('CHAR', 'a', (0, 1)),
                                AstNode('CHAR', 'z', (0, 3))),
                        AstNode('CHAR', '-', (0, 4))
                    )
            ])

        self.run_parser('[a-zA-Z0-9]', 'range', [
                AstNode('range', '[a-zA-Z0-9]', (0, 0),
                        AstNode('CHARRANGE', 'a-z', (0, 1),
                            AstNode('CHAR', 'a', (0, 1)), AstNode('CHAR', 'z', (0, 3))),
                        AstNode('CHARRANGE', 'A-Z', (0, 4),
                            AstNode('CHAR', 'A', (0, 4)), AstNode('CHAR', 'Z', (0, 6))),
                        AstNode('CHARRANGE', '0-9', (0, 7),
                            AstNode('CHAR', '0', (0, 7)), AstNode('CHAR', '9', (0, 9)))
                    )
            ])

        self.run_parser('[a]', 'range', [
                AstNode('range', '[a]', (0, 0), AstNode('CHAR', 'a', (0, 1)))
            ])

        self.run_parser('[qwerty]', 'range', [
                AstNode('range', '[qwerty]', (0, 0),
                        AstNode('CHAR', 'q', (0, 1)),
                        AstNode('CHAR', 'w', (0, 2)),
                        AstNode('CHAR', 'e', (0, 3)),
                        AstNode('CHAR', 'r', (0, 4)),
                        AstNode('CHAR', 't', (0, 5)),
                        AstNode('CHAR', 'y', (0, 6))
                    )
            ])

        self.run_parser('[a-]', 'range', [
                AstNode('range', '[a-]', (0, 0),
                    AstNode('CHAR', 'a', (0, 1)), AstNode('CHAR', '-', (0, 2)))
            ])

        self.run_parser('[]a-]', 'range', [
                AstNode('range', '[]a-]', (0, 0),
                        AstNode('CHARBRACE', ']', (0, 1)),
                        AstNode('CHAR', 'a', (0, 2)),
                        AstNode('CHAR', '-', (0, 3))
                    )
            ])

        self.run_parser('[]a]', 'range', [
                AstNode('range', '[]a]', (0, 0),
                        AstNode('CHARBRACE', ']', (0, 1)),
                        AstNode('CHAR', 'a', (0, 2))
                    )
            ])

        self.run_parser('[]--]', 'range', [
                AstNode('range', '[]--]', (0, 0),
                        AstNode('CHARBRACE', ']', (0, 1)),
                        AstNode('CHARDASH', '-', (0, 2)),
                        AstNode('CHAR', '-', (0, 3))
                    )
            ])

        self.run_parser('[\\v-\\t]', 'range', [
                AstNode('range', '[\\v-\\t]', (0, 0),
                        AstNode('CHARRANGE', '\\v-\\t', (0, 1),
                                AstNode('ESCAPED_CHAR', '\\v', (0, 1),
                                    AstNode('SPECIAL_ESCAPED_CHAR', 'v', (0, 2))),
                                AstNode('ESCAPED_CHAR', '\\t', (0, 4),
                                    AstNode('SPECIAL_ESCAPED_CHAR', 't', (0, 5)))
                            )
                    )
            ])

        self.run_parser_fail('[foo', 'range', '(1, 5): Expected closing "]"')