def test_group_by(self):
    # A GROUP BY clause is expected to show up on the parsed Select as a
    # list of ColumnIds; every other optional clause stays None.
    query = 'SELECT foo FROM bar GROUP BY baz'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('foo'), None, None)]
    source_table = tq_ast.TableId('bar', None)
    grouping = [tq_ast.ColumnId('baz')]
    expected = tq_ast.Select(
        fields, source_table, None, grouping, None, None, None, None)
    self.assert_parsed_select(query, expected)
def p_column_id(p):
    """column_id : id_component_list | id_component_list DOT STAR"""
    # NOTE(review): the docstring above looks like a yacc-style grammar rule
    # that the parser generator presumably reads at runtime, so it is kept
    # verbatim -- confirm before rewording it.
    #
    # A two-slot production is the bare id_component_list alternative; the
    # longer alternative carries a trailing DOT STAR, recorded as '.*'.
    column_name = p[1] if len(p) == 2 else p[1] + '.*'
    p[0] = tq_ast.ColumnId(column_name)
def test_select_comparison(self):
    # An '=' between two columns in the select list is expected to parse
    # into a BinaryOperator over two ColumnIds.
    query = 'SELECT foo = bar FROM baz'
    comparison = tq_ast.BinaryOperator(
        '=', tq_ast.ColumnId('foo'), tq_ast.ColumnId('bar'))
    fields = [tq_ast.SelectField(comparison, None, None)]
    expected = tq_ast.Select(
        fields, tq_ast.TableId('baz', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_limit(self):
    # LIMIT is expected to land on the Select as the integer 10, next to
    # the GROUP BY column list; the function name is expected lowercased.
    query = 'SELECT SUM(foo) FROM bar GROUP BY baz LIMIT 10'
    sum_call = tq_ast.FunctionCall('sum', [tq_ast.ColumnId('foo')])
    fields = [tq_ast.SelectField(sum_call, None, None)]
    source_table = tq_ast.TableId('bar', None)
    grouping = [tq_ast.ColumnId('baz')]
    expected = tq_ast.Select(
        fields, source_table, None, grouping, None, None, 10, None)
    self.assert_parsed_select(query, expected)
def test_subquery(self):
    # A parenthesised SELECT in the FROM position is expected to become a
    # nested Select node used as the outer query's table expression.
    query = 'SELECT foo FROM (SELECT val AS foo FROM table)'
    outer_fields = [tq_ast.SelectField(tq_ast.ColumnId('foo'), None, None)]
    inner_fields = [tq_ast.SelectField(tq_ast.ColumnId('val'), 'foo', None)]
    inner_select = tq_ast.Select(
        inner_fields, tq_ast.TableId('table', None),
        None, None, None, None, None, None)
    expected = tq_ast.Select(
        outer_fields, inner_select, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_multiple_select(self):
    # Aliases given with 'AS' and aliases given by bare juxtaposition are
    # both expected to end up as the SelectField's alias.
    query = 'SELECT a AS foo, b bar, a + 1 baz FROM test_table'
    a_plus_one = tq_ast.BinaryOperator(
        '+', tq_ast.ColumnId('a'), tq_ast.Literal(1))
    fields = [
        tq_ast.SelectField(tq_ast.ColumnId('a'), 'foo', None),
        tq_ast.SelectField(tq_ast.ColumnId('b'), 'bar', None),
        tq_ast.SelectField(a_plus_one, 'baz', None),
    ]
    expected = tq_ast.Select(
        fields, tq_ast.TableId('test_table', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_having(self):
    # The HAVING predicate is expected to be stored on the Select as a
    # BinaryOperator, independent of the selected expression.
    query = 'SELECT foo + 2 FROM bar HAVING foo > 3'
    selected_expr = tq_ast.BinaryOperator(
        '+', tq_ast.ColumnId('foo'), tq_ast.Literal(2))
    fields = [tq_ast.SelectField(selected_expr, None, None)]
    source_table = tq_ast.TableId('bar', None)
    having = tq_ast.BinaryOperator(
        '>', tq_ast.ColumnId('foo'), tq_ast.Literal(3))
    expected = tq_ast.Select(
        fields, source_table, None, None, having, None, None, None)
    self.assert_parsed_select(query, expected)
def test_null_comparison_functions(self):
    # 'IS NULL' / 'IS NOT NULL' are expected to parse into UnaryOperator
    # nodes named 'is_null' and 'is_not_null' respectively.
    query = 'SELECT foo IS NULL, bar IS NOT NULL FROM table'
    foo_is_null = tq_ast.UnaryOperator('is_null', tq_ast.ColumnId('foo'))
    bar_is_not_null = tq_ast.UnaryOperator(
        'is_not_null', tq_ast.ColumnId('bar'))
    fields = [
        tq_ast.SelectField(foo_is_null, None, None),
        tq_ast.SelectField(bar_is_not_null, None, None),
    ]
    expected = tq_ast.Select(
        fields, tq_ast.TableId('table', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_within_clause(self):
    # 'WITHIN <record>' is expected to be captured as the third
    # SelectField argument ('citiesLived'), alongside the alias.
    query = (
        'SELECT fullname, COUNT(citiesLived.yearsLived) WITHIN '
        'citiesLived AS numberOfTimesInEachCity FROM table')
    fullname_field = tq_ast.SelectField(
        tq_ast.ColumnId('fullname'), None, None)
    count_call = tq_ast.FunctionCall(
        'count', [tq_ast.ColumnId('citiesLived.yearsLived')])
    count_field = tq_ast.SelectField(
        count_call, 'numberOfTimesInEachCity', 'citiesLived')
    expected = tq_ast.Select(
        [fullname_field, count_field], tq_ast.TableId('table', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_within_record(self):
    # 'WITHIN RECORD' is expected to be captured as the literal string
    # 'RECORD' in the SelectField's third argument.
    query = (
        'SELECT fullname, COUNT(children.name) WITHIN RECORD AS '
        'numberOfChildren FROM table')
    fullname_field = tq_ast.SelectField(
        tq_ast.ColumnId('fullname'), None, None)
    count_call = tq_ast.FunctionCall(
        'count', [tq_ast.ColumnId('children.name')])
    count_field = tq_ast.SelectField(
        count_call, 'numberOfChildren', 'RECORD')
    expected = tq_ast.Select(
        [fullname_field, count_field], tq_ast.TableId('table', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_join_each(self):
    # 'JOIN EACH' is expected to produce the same INNER PartialJoin shape
    # as a plain join: a base table plus a list of partial joins.
    query = 'SELECT 0 FROM table1 t1 JOIN EACH table2 t2 ON t1.foo = t2.bar'
    fields = [tq_ast.SelectField(tq_ast.Literal(0), None, None)]
    left_table = tq_ast.TableId('table1', 't1')
    on_condition = tq_ast.BinaryOperator(
        '=', tq_ast.ColumnId('t1.foo'), tq_ast.ColumnId('t2.bar'))
    right_side = tq_ast.PartialJoin(
        tq_ast.TableId('table2', 't2'),
        tq_ast.JoinType.INNER,
        on_condition,
    )
    join = tq_ast.Join(left_table, [right_side])
    expected = tq_ast.Select(
        fields, join, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_left_outer_join(self):
    # 'LEFT OUTER JOIN EACH' and the shorter 'LEFT JOIN' spelling are both
    # expected to parse to the same LEFT_OUTER join AST.
    queries = (
        'SELECT t1.foo, t2.bar '
        'FROM table1 t1 LEFT OUTER JOIN EACH table2 t2 ON t1.id = t2.id',
        'SELECT t1.foo, t2.bar '
        'FROM table1 t1 LEFT JOIN table2 t2 ON t1.id = t2.id',
    )
    for query in queries:
        # Build a fresh expected tree for each query so the two
        # assertions share no AST objects.
        fields = [
            tq_ast.SelectField(tq_ast.ColumnId('t1.foo'), None, None),
            tq_ast.SelectField(tq_ast.ColumnId('t2.bar'), None, None),
        ]
        left_table = tq_ast.TableId('table1', 't1')
        on_condition = tq_ast.BinaryOperator(
            '=', tq_ast.ColumnId('t1.id'), tq_ast.ColumnId('t2.id'))
        right_side = tq_ast.PartialJoin(
            tq_ast.TableId('table2', 't2'),
            tq_ast.JoinType.LEFT_OUTER,
            on_condition,
        )
        join = tq_ast.Join(left_table, [right_side])
        expected = tq_ast.Select(
            fields, join, None, None, None, None, None, None)
        self.assert_parsed_select(query, expected)
def test_multi_clause_case(self):
    # A CASE with two WHEN/THEN arms is expected to become a
    # CaseExpression holding one CaseClause per arm, in source order.
    # The query has no FROM, so the table argument is None as well.
    query = 'SELECT CASE WHEN x = 4 THEN 16 WHEN x = 5 THEN 25 END'
    first_clause = tq_ast.CaseClause(
        tq_ast.BinaryOperator(
            '=', tq_ast.ColumnId('x'), tq_ast.Literal(4)),
        tq_ast.Literal(16))
    second_clause = tq_ast.CaseClause(
        tq_ast.BinaryOperator(
            '=', tq_ast.ColumnId('x'), tq_ast.Literal(5)),
        tq_ast.Literal(25))
    case_expr = tq_ast.CaseExpression([first_clause, second_clause])
    fields = [tq_ast.SelectField(case_expr, None, None)]
    expected = tq_ast.Select(
        fields, None, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_select_from_table(self):
    # Simplest FROM case: one column selected from one unaliased table.
    query = 'SELECT foo FROM bar'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('foo'), None, None)]
    source_table = tq_ast.TableId('bar', None)
    expected = tq_ast.Select(
        fields, source_table, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_dot_separated_table_name(self):
    # A dotted table reference is expected to be kept as the single
    # TableId name 'dataset.table'.
    query = 'SELECT foo FROM dataset.table'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('foo'), None, None)]
    source_table = tq_ast.TableId('dataset.table', None)
    expected = tq_ast.Select(
        fields, source_table, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_record_star(self):
    # 'foo.*' is expected to parse into a ColumnId whose name keeps the
    # trailing '.*'.
    query = 'SELECT foo.* FROM table'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('foo.*'), None, None)]
    source_table = tq_ast.TableId('table', None)
    expected = tq_ast.Select(
        fields, source_table, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_fully_qualified_name(self):
    # A table-qualified column is expected to parse into one ColumnId
    # carrying the dotted name 'table.foo'.
    query = 'SELECT table.foo FROM table'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('table.foo'), None, None)]
    source_table = tq_ast.TableId('table', None)
    expected = tq_ast.Select(
        fields, source_table, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_aggregates(self):
    # MAX(foo) is expected to parse into a FunctionCall named 'max'
    # (lowercase) with the column as its only argument.
    query = 'SELECT MAX(foo) FROM bar'
    max_call = tq_ast.FunctionCall('max', [tq_ast.ColumnId('foo')])
    fields = [tq_ast.SelectField(max_call, None, None)]
    expected = tq_ast.Select(
        fields, tq_ast.TableId('bar', None),
        None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_multiple_table_select(self):
    # Comma-separated tables in FROM are expected to parse into a
    # TableUnion of the individual TableIds, in source order.
    query = 'SELECT foo FROM table1, table2'
    fields = [tq_ast.SelectField(tq_ast.ColumnId('foo'), None, None)]
    tables = tq_ast.TableUnion(
        [tq_ast.TableId(name, None) for name in ('table1', 'table2')])
    expected = tq_ast.Select(
        fields, tables, None, None, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_redundant_commas_allowed(self):
    # In most cases, a comma at the end of a comma-separated list is OK.
    # The query below has a trailing comma after the IN list, the select
    # list, the table list and the GROUP BY list; none of them is expected
    # to add an element to the parsed result.
    query = (
        'SELECT foo IN (1, 2, 3,), bar, FROM table1, table2, '
        'GROUP BY col1, col2,')
    in_call = tq_ast.FunctionCall('in', [
        tq_ast.ColumnId('foo'),
        tq_ast.Literal(1),
        tq_ast.Literal(2),
        tq_ast.Literal(3),
    ])
    fields = [
        tq_ast.SelectField(in_call, None, None),
        tq_ast.SelectField(tq_ast.ColumnId('bar'), None, None),
    ]
    tables = tq_ast.TableUnion([
        tq_ast.TableId('table1', None),
        tq_ast.TableId('table2', None),
    ])
    grouping = [tq_ast.ColumnId('col1'), tq_ast.ColumnId('col2')]
    expected = tq_ast.Select(
        fields, tables, None, grouping, None, None, None, None)
    self.assert_parsed_select(query, expected)
def test_order_by_multiple_fields(self):
    # Compiles a query with two ORDER BY keys and checks the typed Select.
    # The expected orderings are passed through as tq_ast.Ordering nodes:
    # 'value2' with flag True and 'value' (DESC) with flag False.
    query = 'SELECT value FROM table1 ORDER BY value2, value DESC'

    select_fields = [
        typed_ast.SelectField(
            typed_ast.ColumnRef('table1', 'value', tq_types.INT),
            'value', None),
    ]
    table = typed_ast.Table('table1', self.table1_type_ctx)
    always_true_where = typed_ast.Literal(True, tq_types.BOOL)
    always_true_having = typed_ast.Literal(True, tq_types.BOOL)
    orderings = [
        tq_ast.Ordering(tq_ast.ColumnId('value2'), True),
        tq_ast.Ordering(tq_ast.ColumnId('value'), False),
    ]
    # Second make_type_context argument is a context built from the
    # table-qualified column; the first lists the unqualified output column.
    type_ctx = self.make_type_context(
        [(None, 'value', tq_types.INT)],
        self.make_type_context([('table1', 'value', tq_types.INT)]))

    expected = typed_ast.Select(
        select_fields=select_fields,
        table=table,
        where_expr=always_true_where,
        group_set=None,
        having_expr=always_true_having,
        orderings=orderings,
        limit=None,
        type_ctx=type_ctx)
    self.assert_compiled_select(query, expected)
def test_order_by(self):
    # ORDER BY with an explicit DESC, an implicit direction, an explicit
    # ASC and a trailing comma. The expected Ordering flag is False only
    # for the DESC key and True for the other two.
    query = 'SELECT foo, bar, baz FROM table ORDER BY foo DESC, bar, baz ASC,'
    fields = [
        tq_ast.SelectField(tq_ast.ColumnId(name), None, None)
        for name in ('foo', 'bar', 'baz')
    ]
    source_table = tq_ast.TableId('table', None)
    orderings = [
        tq_ast.Ordering(tq_ast.ColumnId(name), flag)
        for name, flag in (('foo', False), ('bar', True), ('baz', True))
    ]
    expected = tq_ast.Select(
        fields, source_table, None, None, None, orderings, None, None)
    self.assert_parsed_select(query, expected)
def expand_select_fields(self, select_fields, table_expr):
    """Expand any stars into a list of all context columns.

    Arguments:
        select_fields: A list of uncompiled select fields, some of which
            can be tq_ast.Star.
        table_expr: The compiled table expression to reference, if
            necessary.

    Returns:
        A new list of select fields. Each tq_ast.Star is replaced by one
        SelectField per column in table_expr.type_ctx.columns. Each
        ColumnId whose name ends in '.*' is replaced by the star fields
        whose alias starts with '<name>.'. All other fields are passed
        through unchanged, in their original order.
    """
    # Joins are special: the aliases default to a fully-qualified name.
    # The check does not depend on the column, so do it once up front.
    is_join = isinstance(table_expr, typed_ast.Join)

    star_select_fields = []
    for table_name, col_name in table_expr.type_ctx.columns:
        if table_name is not None:
            col_ref = table_name + '.' + col_name
        else:
            col_ref = col_name
        # For a join the alias is the qualified reference. Reusing col_ref
        # (rather than re-concatenating) means a column without a table
        # name falls back to the bare column name instead of raising
        # TypeError on None + '.'.
        alias = col_ref if is_join else col_name
        star_select_fields.append(
            tq_ast.SelectField(tq_ast.ColumnId(col_ref), alias, None))

    result_fields = []
    for field in select_fields:
        if isinstance(field, tq_ast.Star):
            result_fields.extend(star_select_fields)
        elif (field.expr and isinstance(field.expr, tq_ast.ColumnId) and
              field.expr.name.endswith('.*')):
            # Strip only the '*' so the prefix keeps its trailing dot.
            # Matching on 'foo.' rather than 'foo' stops 'foo.*' from also
            # pulling in unrelated columns such as 'foobar.x'.
            prefix = field.expr.name[:-len('*')]
            result_fields.extend(
                f for f in star_select_fields
                if f.alias.startswith(prefix))
        else:
            result_fields.append(field)
    return result_fields
def test_group_each_by(self):
    # 'GROUP EACH BY' is expected to yield the same grouping list that a
    # plain GROUP BY would: a list holding the grouped ColumnId.
    query = 'SELECT 0 FROM table GROUP EACH BY foo'
    fields = [tq_ast.SelectField(tq_ast.Literal(0), None, None)]
    source_table = tq_ast.TableId('table', None)
    grouping = [tq_ast.ColumnId('foo')]
    expected = tq_ast.Select(
        fields, source_table, None, grouping, None, None, None, None)
    self.assert_parsed_select(query, expected)