Python parse Examples, dxr.trigrammer.regex_grammar.parse Python Examples

Example #1

0

Show file

File: core.py Project: abbeyj/dxr

def _path_trigram_filter(path, is_case_sensitive):
    """Return an ES filter clause that returns docs whose paths match the
    given path all the way to their ends.

    If a given path starts with a /, the user is explicitly requesting a match
    starting at the root level.

    """
    if path.startswith('/'):
        path = path[1:]  # Leading slashes aren't stored in the index.
        regex = '^{0}$'  # Insist it start at the beginning.
    else:
        regex = '(/|^){0}$'  # Start at any path segment.

    return es_regex_filter(
        regex_grammar.parse(
            regex.format(
                re.escape(
                    path.encode('ascii', 'backslashreplace')
                )
            )
        ),
        'path',
        is_case_sensitive
    )

Example #2

0

Show file

File: test_trigrammer.py Project: Darshnik/dxr

def test_python_visitor():
    """Make sure we can render out Python regexes from parse trees.

    There's just one difference from JS so far.

    """
    eq_(PythonRegexVisitor().visit(regex_grammar.parse(r'\a')), r'\a')

Example #3

0

Show file

File: test_trigrammer.py Project: zz22zz222/dxr

def test_python_visitor():
    """Make sure we can render out Python regexes from parse trees.

    There's just one difference from JS so far.

    """
    eq_(PythonRegexVisitor().visit(regex_grammar.parse(r'\a')), r'\a')

Example #4

0

Show file

File: core.py Project: nbstar/dxr

 def filter(self):
     glob = self._term["arg"]
     try:
         return es_regex_filter(
             regex_grammar.parse(glob_to_regex(glob)), "path", is_case_sensitive=self._term["case_sensitive"]
         )
     except NoTrigrams:
         raise BadTerm("Path globs need at least 3 literal characters in a row " "for speed.")

Example #5

0

Show file

File: test_trigrammer.py Project: Darshnik/dxr

def js_eq(regex, expected):
    """Assert that taking a regex apart into an AST and then building a JS
    regex from it matches the expected result.

    :arg regex: A string representing a regex pattern
    :arg expected: What to compare the reconstructed regex against

    """
    eq_(JsRegexVisitor().visit(regex_grammar.parse(regex)), expected)

Example #6

0

Show file

File: test_trigrammer.py Project: zz22zz222/dxr

def js_eq(regex, expected):
    """Assert that taking a regex apart into an AST and then building a JS
    regex from it matches the expected result.

    :arg regex: A string representing a regex pattern
    :arg expected: What to compare the reconstructed regex against

    """
    eq_(JsRegexVisitor().visit(regex_grammar.parse(regex)), expected)

Example #7

0

Show file

File: core.py Project: bozzmob/dxr

 def filter(self):
     glob = self._term['arg']
     try:
         return es_regex_filter(
             regex_grammar.parse(glob_to_regex(glob)),
             'path',
             is_case_sensitive=self._term['case_sensitive'])
     except NoTrigrams:
         raise BadTerm('Path globs need at least 3 literal characters in a row '
                       'for speed.')

Example #8

0

Show file

 def filter(self):
     glob = self._term['arg']
     try:
         return es_regex_filter(
             regex_grammar.parse(glob_to_regex(glob)),
             'path',
             is_case_sensitive=self._term['case_sensitive'])
     except NoTrigrams:
         raise BadTerm('Path globs need at least 3 literal characters in a row '
                       'for speed.')

Example #9

0

Show file

File: core.py Project: na-g/dxr

    def _regex_filter(self, path_seg_property_name, no_trigrams_error_text):
        """Return an ES regex filter that matches this filter's glob against the
        path segment at path_seg_property_name.

        """
        glob = self._term['arg']
        try:
            return es_regex_filter(
                regex_grammar.parse(glob_to_regex(glob)),
                path_seg_property_name,
                is_case_sensitive=self._term['case_sensitive'])
        except NoTrigrams:
            raise BadTerm(no_trigrams_error_text)

Example #10

0

Show file

File: core.py Project: jbradberry/dxr

    def _regex_filter(self, path_seg_property_name, no_trigrams_error_text):
        """Return an ES regex filter that matches this filter's glob against the
        path segment at path_seg_property_name.

        """
        glob = self._term['arg']
        try:
            return es_regex_filter(
                regex_grammar.parse(glob_to_regex(glob)),
                path_seg_property_name,
                is_case_sensitive=self._term['case_sensitive'])
        except NoTrigrams:
            raise BadTerm(no_trigrams_error_text)

Example #11

0

Show file

File: core.py Project: modulexcite/dxr

def _path_trigram_filter(path, is_case_sensitive):
    """Return an ES filter clause that returns docs whose paths match the
    given path all the way to their ends.

    If a given path starts with a /, the user is explicitly requesting a match
    starting at the root level.

    """
    if path.startswith('/'):
        path = path[1:]  # Leading slashes aren't stored in the index.
        regex = '^{0}$'  # Insist it start at the beginning.
    else:
        regex = '(/|^){0}$'  # Start at any path segment.

    return es_regex_filter(regex_grammar.parse(regex.format(re.escape(path))),
                           'path', is_case_sensitive)

Example #12

0

Show file

    def __init__(self, term, enabled_plugins):
        """Compile the Python equivalent of the regex so we don't have to lean
        on the regex cache during highlighting.

        Python's regex cache is naive: after it hits 100, it just clears: no
        LRU.

        """
        super(RegexpFilter, self).__init__(term, enabled_plugins)
        try:
            self._parsed_regex = regex_grammar.parse(term['arg'])
        except ParseError:
            raise BadTerm('Invalid regex.')
        self._compiled_regex = (
                re.compile(PythonRegexVisitor().visit(self._parsed_regex),
                           flags=0 if self._term['case_sensitive'] else re.I))

Example #13

0

Show file

File: core.py Project: jbradberry/dxr

    def __init__(self, term, enabled_plugins):
        """Compile the Python equivalent of the regex so we don't have to lean
        on the regex cache during highlighting.

        Python's regex cache is naive: after it hits 100, it just clears: no
        LRU.

        """
        super(RegexpFilter, self).__init__(term, enabled_plugins)
        try:
            self._parsed_regex = regex_grammar.parse(term['arg'])
        except ParseError:
            raise BadTerm('Invalid regex.')
        self._compiled_regex = (
                re.compile(PythonRegexVisitor().visit(self._parsed_regex),
                           flags=0 if self._term['case_sensitive'] else re.I))

Example #14

0

Show file

File: test_trigrammer.py Project: Darshnik/dxr

def test_parse_regexp():
    regex_grammar.parse('hello+ dolly')
    regex_grammar.parse('hello+|hi')
    regex_grammar.parse(r'(hello|hi) dolly')
    regex_grammar.parse(r'(hello|hi|) dolly')
    regex_grammar.parse(r'(hello||hi) dolly')
    regex_grammar.parse(r'|hello|hi')
    regex_grammar.parse(ur'aböut \d{2}')
    assert_raises(ParseError, regex_grammar.parse, '[smoo')

    # This isn't supported yet, so it's better to throw an error than to
    # quietly misinterpret the user's intent:
    assert_raises(ParseError, regex_grammar.parse, '(?:hi)')

Example #15

0

Show file

File: test_trigrammer.py Project: Darshnik/dxr

def visit_regex(regex):
    return SubstringTreeVisitor().visit(regex_grammar.parse(regex))

Example #16

0

Show file

File: test_trigrammer.py Project: zz22zz222/dxr

def test_parse_regexp():
    regex_grammar.parse('hello+ dolly')
    regex_grammar.parse('hello+|hi')
    regex_grammar.parse(r'(hello|hi) dolly')
    regex_grammar.parse(r'(hello|hi|) dolly')
    regex_grammar.parse(r'(hello||hi) dolly')
    regex_grammar.parse(r'|hello|hi')
    regex_grammar.parse(ur'aböut \d{2}')
    assert_raises(ParseError, regex_grammar.parse, '[smoo')

    # This isn't supported yet, so it's better to throw an error than to
    # quietly misinterpret the user's intent:
    assert_raises(ParseError, regex_grammar.parse, '(?:hi)')

Example #17

0

Show file

File: test_trigrammer.py Project: zz22zz222/dxr

def visit_regex(regex):
    return SubstringTreeVisitor().visit(regex_grammar.parse(regex))