def __init__(self, lexer, parser, parent):
    """
    Parse one term at the lexer's current position.

    Depending on the current token, ``self.term`` becomes a Variable,
    FunctionCall, String, Number or Regex. Any other token type is
    reported through ``lexer.syntax_error``.

    :param lexer: token source, also used for error reporting.
    :param parser: passed through to Token and to the child tokens.
    :param parent: scope used to check that a variable is defined; also
        passed through to Token and to the child tokens.
    """
    Token.__init__(self, 'Term', lexer, parser, parent)
    self.term = None
    self.lft = None
    self.rgt = None
    self.op = None

    # Capture the current token up front: the literal branches below use
    # its text after next_if() has been called (next_if presumably
    # advances the lexer on a match -- confirm against the lexer).
    token_type, text = lexer.token()

    if lexer.current_is('varname'):
        # Variables must be known to the enclosing scope before use.
        if not parent.is_defined(text):
            lexer.error('Undeclared variable %s' % text, self, ValueError)
        self.term = Variable(lexer, parser, parent)
    elif lexer.current_is('open_function_call'):
        self.term = FunctionCall(lexer, parser, parent)
    elif lexer.current_is('string_delimiter'):
        self.term = String(lexer, parser, parent)
    elif lexer.next_if('number'):
        self.term = Number(text)
    elif lexer.next_if('keyword', 'false'):
        # Boolean keywords are represented as the numbers 0 and 1.
        self.term = Number(0)
    elif lexer.next_if('keyword', 'true'):
        self.term = Number(1)
    elif lexer.next_if('octal_number'):
        # Drop the first character of the literal, parse the rest base 8.
        self.term = Number(int(text[1:], 8))
    elif lexer.next_if('hex_number'):
        # Drop the first two characters of the literal, parse base 16.
        self.term = Number(int(text[2:], 16))
    elif lexer.current_is('regex_delimiter'):
        self.term = Regex(lexer, parser, parent)
    else:
        lexer.syntax_error('Expected term but got %s' % token_type, self)

    self.mark_end()
def __init__(self, lexer, parser, parent):
    """
    Parse an ``extract`` statement.

    Tokens are consumed in this order: the ``extract`` keyword,
    whitespace, a regular expression, whitespace, ``as`` or ``into``,
    then one or more variable names. Whitespace is expected before every
    name, including after a comma. An optional ``from <term>`` clause
    may follow.

    :param lexer: token source, also used for error reporting.
    :param parser: only its ``no_prompt`` flag is read here; otherwise it
        is passed through to Token and to the child tokens.
    :param parent: passed through to Token and to the child tokens.
    """
    Token.__init__(self, 'Extract', lexer, parser, parent)
    self.varnames = []     # variable names, in declaration order
    self.variables = {}    # variable name -> list of extracted values
    self.append = False    # True for "into", False for "as"
    self.source = None     # Term from the "from" clause, if present

    if parser.no_prompt:
        msg = "'extract' keyword does not work with --no-prompt"
        lexer.syntax_error(msg, self)

    # First expect a regular expression.
    lexer.expect(self, 'keyword', 'extract')
    lexer.expect(self, 'whitespace')
    self.regex = Regex(lexer, parser, parent)

    # Expect the "as" or "into" keyword.
    lexer.expect(self, 'whitespace')
    if lexer.next_if('keyword', 'as'):
        self.append = False
    elif lexer.next_if('keyword', 'into'):
        self.append = True
    else:
        _, token = lexer.token()
        msg = 'Expected "as" or "into" but got %s' % token
        lexer.syntax_error(msg, self)

    # Expect a comma-separated list of variable names.
    while True:
        lexer.expect(self, 'whitespace')
        # Read the token text before expect() is called on it.
        _, token = lexer.token()
        lexer.expect(self, 'varname')
        if token in self.variables:
            # Fixed: the name is now formatted into the message; it used
            # to be passed with a literal, unformatted "%s".
            lexer.syntax_error('Duplicate variable name %s' % token, self)
        self.varnames.append(token)
        self.variables[token] = []

        # A comma means another variable name follows.
        if not lexer.next_if('comma'):
            break

    # Register every variable (as an empty list) with the parent.
    self.parent.define(**self.variables)

    # There must be exactly one variable per regex group.
    if len(self.varnames) != self.regex.n_groups:
        count = (len(self.varnames), self.regex.n_groups)
        error = '%s variables, but regex has %s groups' % count
        lexer.syntax_error(error, self)

    # Handle the optional "from" keyword.
    lexer.skip('whitespace')
    if lexer.next_if('keyword', 'from'):
        lexer.expect(self, 'whitespace')
        self.source = Term(lexer, parser, parent)

    self.mark_end()
def __init__(self, lexer, parser, parent):
    """
    Parse an ``extract`` statement.

    Tokens are consumed in this order: the ``extract`` keyword,
    whitespace, a regular expression, whitespace, ``as`` or ``into``,
    then one or more variable names. Whitespace is expected before every
    name, including after a comma. An optional ``from <term>`` clause
    may follow.

    :param lexer: token source, also used for error reporting.
    :param parser: only its ``no_prompt`` flag is read here; otherwise it
        is passed through to Token and to the child tokens.
    :param parent: passed through to Token and to the child tokens.
    """
    Token.__init__(self, "Extract", lexer, parser, parent)
    self.varnames = []     # variable names, in declaration order
    self.variables = {}    # variable name -> list of extracted values
    self.append = False    # True for "into", False for "as"
    self.source = None     # Term from the "from" clause, if present

    if parser.no_prompt:
        msg = "'extract' keyword does not work with --no-prompt"
        lexer.syntax_error(msg, self)

    # First expect a regular expression.
    lexer.expect(self, "keyword", "extract")
    lexer.expect(self, "whitespace")
    self.regex = Regex(lexer, parser, parent)

    # Expect the "as" or "into" keyword.
    lexer.expect(self, "whitespace")
    if lexer.next_if("keyword", "as"):
        self.append = False
    elif lexer.next_if("keyword", "into"):
        self.append = True
    else:
        _, token = lexer.token()
        msg = 'Expected "as" or "into" but got %s' % token
        lexer.syntax_error(msg, self)

    # Expect a comma-separated list of variable names.
    while True:
        lexer.expect(self, "whitespace")
        # Read the token text before expect() is called on it.
        _, token = lexer.token()
        lexer.expect(self, "varname")
        if token in self.variables:
            # Fixed: the name is now formatted into the message; it used
            # to be passed with a literal, unformatted "%s".
            lexer.syntax_error("Duplicate variable name %s" % token, self)
        self.varnames.append(token)
        self.variables[token] = []

        # A comma means another variable name follows.
        if not lexer.next_if("comma"):
            break

    # Register every variable (as an empty list) with the parent.
    self.parent.define(**self.variables)

    # There must be exactly one variable per regex group.
    if len(self.varnames) != self.regex.n_groups:
        count = (len(self.varnames), self.regex.n_groups)
        error = "%s variables, but regex has %s groups" % count
        lexer.syntax_error(error, self)

    # Handle the optional "from" keyword.
    lexer.skip("whitespace")
    if lexer.next_if("keyword", "from"):
        lexer.expect(self, "whitespace")
        self.source = Term(lexer, parser, parent)

    self.mark_end()
class Extract(Token):
    """
    Token for the ``extract`` statement.

    Matches a regular expression against each line of a buffer and
    collects the captured groups into list variables, one list per
    declared variable name.
    """

    def __init__(self, lexer, parser, parent):
        """
        Parse an ``extract`` statement.

        Tokens are consumed in this order: the ``extract`` keyword,
        whitespace, a regular expression, whitespace, ``as`` or ``into``,
        then one or more variable names. Whitespace is expected before
        every name, including after a comma. An optional ``from <term>``
        clause may follow.

        :param lexer: token source, also used for error reporting.
        :param parser: only its ``no_prompt`` flag is read here; otherwise
            it is passed through to Token and to the child tokens.
        :param parent: passed through to Token and to the child tokens.
        """
        Token.__init__(self, 'Extract', lexer, parser, parent)
        self.varnames = []     # variable names, in declaration order
        self.variables = {}    # variable name -> list of extracted values
        self.append = False    # True for "into", False for "as"
        self.source = None     # Term from the "from" clause, if present

        if parser.no_prompt:
            msg = "'extract' keyword does not work with --no-prompt"
            lexer.syntax_error(msg, self)

        # First expect a regular expression.
        lexer.expect(self, 'keyword', 'extract')
        lexer.expect(self, 'whitespace')
        self.regex = Regex(lexer, parser, parent)

        # Expect the "as" or "into" keyword.
        lexer.expect(self, 'whitespace')
        if lexer.next_if('keyword', 'as'):
            self.append = False
        elif lexer.next_if('keyword', 'into'):
            self.append = True
        else:
            _, token = lexer.token()
            msg = 'Expected "as" or "into" but got %s' % token
            lexer.syntax_error(msg, self)

        # Expect a comma-separated list of variable names.
        while True:
            lexer.expect(self, 'whitespace')
            # Read the token text before expect() is called on it.
            _, token = lexer.token()
            lexer.expect(self, 'varname')
            if token in self.variables:
                # Fixed: the name is now formatted into the message; it
                # used to be passed with a literal, unformatted "%s".
                lexer.syntax_error('Duplicate variable name %s' % token,
                                   self)
            self.varnames.append(token)
            self.variables[token] = []

            # A comma means another variable name follows.
            if not lexer.next_if('comma'):
                break

        # Register every variable (as an empty list) with the parent.
        self.parent.define(**self.variables)

        # There must be exactly one variable per regex group.
        if len(self.varnames) != self.regex.n_groups:
            count = (len(self.varnames), self.regex.n_groups)
            error = '%s variables, but regex has %s groups' % count
            lexer.syntax_error(error, self)

        # Handle the optional "from" keyword.
        lexer.skip('whitespace')
        if lexer.next_if('keyword', 'from'):
            lexer.expect(self, 'whitespace')
            self.source = Term(lexer, parser, parent)

        self.mark_end()

    def extract(self, context):
        """
        Fill ``self.variables`` with the groups matched in the buffer.

        The buffer is the value of the ``from`` term if one was given,
        otherwise the parent's ``__response__`` variable. Lines that do
        not match the regular expression are skipped.

        :param context: passed to the ``value()`` calls of the regex and
            of the source term.
        """
        # Re-initialize the variable content, because this method
        # might be called multiple times.
        for varname in self.varnames:
            self.variables[varname] = []

        if self.source is None:
            buffer = self.parent.get('__response__')
        else:
            buffer = self.source.value(context)

        # Walk through all lines, matching each one against the regular
        # expression.
        for line in buffer:
            match = self.regex.value(context).search(line)
            if match is None:
                continue

            # If there was a match, store the extracted substrings in our
            # list variables. Group numbers start at 1.
            for i, varname in enumerate(self.varnames, 1):
                try:
                    value = match.group(i)
                except IndexError:
                    # This happens if the user provided a regex with less
                    # groups in it than the number of variables.
                    msg = 'Extract: %s variables, but regular expression' % i
                    msg += '\ncontains only %s groups.' % (i - 1)
                    self.lexer.runtime_error(msg, self)
                self.variables[varname].append(value)

    def value(self, context):
        """
        Run the extraction and publish the results to the parent.

        In "as" mode the variables are (re)defined with the fresh lists;
        in "into" mode the fresh lists are appended to the values the
        parent already holds.

        :param context: forwarded to :meth:`extract`.
        :return: always 1.
        """
        self.extract(context)
        if not self.append:
            self.parent.define(**self.variables)
        else:
            for key in self.variables:
                existing = self.parent.get(key)
                self.parent.define(**{key: existing + self.variables[key]})
        return 1

    def dump(self, indent=0):
        """
        Print a one-line description of this token.

        :param indent: number of spaces to print before the token name.
        """
        mode = 'into' if self.append else 'as'
        source = self.source if self.source is not None else 'buffer'
        # One parenthesised argument so that the statement prints the same
        # line on Python 2 and is also valid Python 3.
        print('%s%s %s %s %s from %s' % (
            ' ' * indent, self.name, self.regex.string,
            mode, self.varnames, source))
class Extract(Token):
    """
    Token for the ``extract`` statement.

    Matches a regular expression against each line of a buffer and
    collects the captured groups into list variables, one list per
    declared variable name.
    """

    def __init__(self, lexer, parser, parent):
        """
        Parse an ``extract`` statement.

        Tokens are consumed in this order: the ``extract`` keyword,
        whitespace, a regular expression, whitespace, ``as`` or ``into``,
        then one or more variable names. Whitespace is expected before
        every name, including after a comma. An optional ``from <term>``
        clause may follow.

        :param lexer: token source, also used for error reporting.
        :param parser: only its ``no_prompt`` flag is read here; otherwise
            it is passed through to Token and to the child tokens.
        :param parent: passed through to Token and to the child tokens.
        """
        Token.__init__(self, "Extract", lexer, parser, parent)
        self.varnames = []     # variable names, in declaration order
        self.variables = {}    # variable name -> list of extracted values
        self.append = False    # True for "into", False for "as"
        self.source = None     # Term from the "from" clause, if present

        if parser.no_prompt:
            msg = "'extract' keyword does not work with --no-prompt"
            lexer.syntax_error(msg, self)

        # First expect a regular expression.
        lexer.expect(self, "keyword", "extract")
        lexer.expect(self, "whitespace")
        self.regex = Regex(lexer, parser, parent)

        # Expect the "as" or "into" keyword.
        lexer.expect(self, "whitespace")
        if lexer.next_if("keyword", "as"):
            self.append = False
        elif lexer.next_if("keyword", "into"):
            self.append = True
        else:
            _, token = lexer.token()
            msg = 'Expected "as" or "into" but got %s' % token
            lexer.syntax_error(msg, self)

        # Expect a comma-separated list of variable names.
        while True:
            lexer.expect(self, "whitespace")
            # Read the token text before expect() is called on it.
            _, token = lexer.token()
            lexer.expect(self, "varname")
            if token in self.variables:
                # Fixed: the name is now formatted into the message; it
                # used to be passed with a literal, unformatted "%s".
                lexer.syntax_error("Duplicate variable name %s" % token,
                                   self)
            self.varnames.append(token)
            self.variables[token] = []

            # A comma means another variable name follows.
            if not lexer.next_if("comma"):
                break

        # Register every variable (as an empty list) with the parent.
        self.parent.define(**self.variables)

        # There must be exactly one variable per regex group.
        if len(self.varnames) != self.regex.n_groups:
            count = (len(self.varnames), self.regex.n_groups)
            error = "%s variables, but regex has %s groups" % count
            lexer.syntax_error(error, self)

        # Handle the optional "from" keyword.
        lexer.skip("whitespace")
        if lexer.next_if("keyword", "from"):
            lexer.expect(self, "whitespace")
            self.source = Term(lexer, parser, parent)

        self.mark_end()

    def extract(self, context):
        """
        Fill ``self.variables`` with the groups matched in the buffer.

        The buffer is the value of the ``from`` term if one was given,
        otherwise the parent's ``__response__`` variable. Lines that do
        not match the regular expression are skipped.

        :param context: passed to the ``value()`` calls of the regex and
            of the source term.
        """
        # Re-initialize the variable content, because this method
        # might be called multiple times.
        for varname in self.varnames:
            self.variables[varname] = []

        if self.source is None:
            buffer = self.parent.get("__response__")
        else:
            buffer = self.source.value(context)

        # Walk through all lines, matching each one against the regular
        # expression.
        for line in buffer:
            match = self.regex.value(context).search(line)
            if match is None:
                continue

            # If there was a match, store the extracted substrings in our
            # list variables. Group numbers start at 1.
            for i, varname in enumerate(self.varnames, 1):
                try:
                    value = match.group(i)
                except IndexError:
                    # This happens if the user provided a regex with less
                    # groups in it than the number of variables.
                    msg = "Extract: %s variables, but regular expression" % i
                    msg += "\ncontains only %s groups." % (i - 1)
                    self.lexer.runtime_error(msg, self)
                self.variables[varname].append(value)

    def value(self, context):
        """
        Run the extraction and publish the results to the parent.

        In "as" mode the variables are (re)defined with the fresh lists;
        in "into" mode the fresh lists are appended to the values the
        parent already holds.

        :param context: forwarded to :meth:`extract`.
        :return: always 1.
        """
        self.extract(context)
        if not self.append:
            self.parent.define(**self.variables)
        else:
            for key in self.variables:
                existing = self.parent.get(key)
                self.parent.define(**{key: existing + self.variables[key]})
        return 1

    def dump(self, indent=0):
        """
        Print a one-line description of this token.

        :param indent: number of spaces to print before the token name.
        """
        mode = "into" if self.append else "as"
        source = self.source if self.source is not None else "buffer"
        # One parenthesised argument so that the statement prints the same
        # line on Python 2 and is also valid Python 3.
        print("%s%s %s %s %s from %s" % (
            " " * indent, self.name, self.regex.string,
            mode, self.varnames, source))