Example #1
0
    def test_ctas(self):
        expression = parse_one("SELECT * FROM y")

        self.assertEqual(
            Rewriter(expression).ctas("x").expression.sql(),
            "CREATE TABLE x AS SELECT * FROM y",
        )

        self.assertEqual(
            Rewriter(expression).ctas(
                "x", db="foo", file_format="parquet").expression.sql("hive"),
            "CREATE TABLE foo.x STORED AS parquet AS SELECT * FROM y",
        )

        self.assertEqual(expression.sql(), "SELECT * FROM y")

        rewriter = Rewriter(expression).ctas("x")
        self.assertEqual(rewriter.expression.sql(),
                         "CREATE TABLE x AS SELECT * FROM y")
        self.assertEqual(
            rewriter.ctas("y").expression.sql(),
            "CREATE TABLE y AS SELECT * FROM y",
        )

        expression = parse_one("CREATE TABLE x AS SELECT * FROM y")
        rewriter = Rewriter(expression, copy=False).ctas("x",
                                                         file_format="ORC")
        self.assertEqual(expression.sql("hive"),
                         "CREATE TABLE x STORED AS ORC AS SELECT * FROM y")
Example #2
0
 def test_text(self):
     column = parse_one("a.b.c")
     self.assertEqual(column.text("this"), "c")
     self.assertEqual(column.text("y"), "")
     self.assertEqual(
         parse_one("select * from x.y").find(exp.Table).text("db"), "x")
     self.assertEqual(parse_one("select *").text("this"), "")
     self.assertEqual(parse_one("1 + 1").text("this"), "1")
     self.assertEqual(parse_one("'a'").text("this"), "a")
Example #3
0
    def test_pretty(self):
        with open(os.path.join(self.fixtures_dir, "pretty.sql"),
                  encoding="utf-8") as f:
            lines = f.read().split(";")
            size = len(lines)

            for i in range(0, size, 2):
                if i + 1 < size:
                    sql = lines[i]
                    pretty = lines[i + 1].strip()
                    generated = transpile(sql, pretty=True)[0]
                    self.assertEqual(generated, pretty)
                    self.assertEqual(parse_one(sql), parse_one(pretty))
Example #4
0
    def test_find_all(self):
        expression = parse_one("""
            SELECT *
            FROM (
                SELECT b.*
                FROM a.b b
            ) x
            JOIN (
              SELECT c.foo
              FROM a.c c
              WHERE foo = 1
            ) y
              ON x.c = y.foo
            CROSS JOIN (
              SELECT *
              FROM (
                SELECT d.bar
                FROM d
              ) nested
            ) z
              ON x.c = y.foo
            """)

        self.assertEqual(
            [
                table.args["this"].args["this"]
                for table in expression.find_all(exp.Table)
            ],
            ["d", "c", "b"],
        )
Example #5
0
    def test_column(self):
        column = parse_one("a.b.c")
        self.assertEqual(column.args["this"].args["this"], "c")
        self.assertEqual(column.args["table"].args["this"], "b")
        self.assertEqual(column.args["db"].args["this"], "a")

        column = parse_one("a")
        self.assertEqual(column.args["this"].args["this"], "a")
        self.assertIsNone(column.args.get("table"))
        self.assertIsNone(column.args.get("db"))

        column = parse_one("a.b.c.d")
        self.assertIsNone(column.args.get("this"))
        self.assertIsNone(column.args.get("table"))
        self.assertIsNone(column.args.get("db"))
        self.assertEqual(
            [f.args["this"] for f in column.args["fields"]],
            ["a", "b", "c", "d"],
        )
Example #6
0
    def test_add_selects(self):
        expression = parse_one("SELECT * FROM (SELECT * FROM x) y")

        self.assertEqual(
            Rewriter(expression).add_selects(
                "a",
                "sum(b) as c",
            ).expression.sql("hive"),
            "SELECT *, a, SUM(b) AS c FROM (SELECT * FROM x) AS y",
        )
Example #7
0
    def test_transform_no_infinite_recursion(self):
        expression = parse_one("a")

        def fun(node):
            if isinstance(
                    node,
                    exp.Column) and node.args["this"].args["this"] == "a":
                return parse_one("FUN(a)")
            return node

        self.assertEqual(expression.transform(fun).sql(), "FUN(a)")
Example #8
0
 def test_find(self):
     expression = parse_one(
         "CREATE TABLE x STORED AS PARQUET AS SELECT * FROM y")
     self.assertTrue(expression.find(exp.Create))
     self.assertFalse(expression.find(exp.Group))
     self.assertEqual(
         [
             table.args["this"].args["this"]
             for table in expression.find_all(exp.Table)
         ],
         ["y", "x"],
     )
Example #9
0
    def test_transform_simple(self):
        expression = parse_one("IF(a > 0, a, b)")

        def fun(node):
            if isinstance(
                    node,
                    exp.Column) and node.args["this"].args["this"] == "a":
                return parse_one("c - 2")
            return node

        actual_expression_1 = expression.transform(fun)
        self.assertEqual(actual_expression_1.sql(dialect="presto"),
                         "IF(c - 2 > 0, c - 2, b)")
        self.assertIsNot(actual_expression_1, expression)

        actual_expression_2 = expression.transform(fun, copy=False)
        self.assertEqual(actual_expression_2.sql(dialect="presto"),
                         "IF(c - 2 > 0, c - 2, b)")
        self.assertIs(actual_expression_2, expression)

        with self.assertRaises(ValueError):
            parse_one("a").transform(lambda n: None)
Example #10
0
 def test_hash(self):
     self.assertEqual(
         {
             parse_one("select a.b"),
             parse_one("1+2"),
             parse_one('"a".b'),
             parse_one("a.b.c.d"),
         },
         {
             parse_one("select a.b"),
             parse_one("1+2"),
             parse_one('"a"."b"'),
             parse_one("a.b.c.d"),
         },
     )
Example #11
0
    def test_identify(self):
        expression = parse_one("""
            SELECT a, "b", c AS c, d AS "D", e AS "y|z'"
            FROM y."z"
        """)

        assert expression.args["expressions"][0].args["this"].args[
            "this"] == "a"
        assert expression.args["expressions"][1].args["this"].args[
            "this"] == "b"
        assert expression.args["expressions"][2].args["alias"].args[
            "this"] == "c"
        assert expression.args["expressions"][3].args["alias"].args[
            "this"] == "D"
        assert expression.args["expressions"][4].args["alias"].args[
            "this"] == "y|z'"
        table = expression.args["from"].args["expressions"][0]
        assert table.args["this"].args["this"] == "z"
        assert table.args["db"].args["this"] == "y"
Example #12
0
 def test_sql(self):
     assert parse_one("x + y * 2").sql() == "x + y * 2"
     assert (parse_one('select "x"').sql(dialect="hive",
                                         pretty=True) == "SELECT\n  `x`")
Example #13
0
 def test_depth(self):
     self.assertEqual(parse_one("x(1)").find(exp.Literal).depth, 1)
Example #14
0
 def test_eq(self):
     self.assertEqual(parse_one("`a`", read="hive"), parse_one('"a"'))
     self.assertEqual(parse_one("`a`", read="hive"), parse_one('"a"  '))
     self.assertEqual(parse_one("`a`.b", read="hive"), parse_one('"a"."b"'))
     self.assertEqual(parse_one("select a, b+1"),
                      parse_one("SELECT a, b + 1"))
     self.assertEqual(parse_one("`a`.`b`.`c`", read="hive"),
                      parse_one("a.b.c"))
     self.assertNotEqual(parse_one("a.b.c.d", read="hive"),
                         parse_one("a.b.c"))
     self.assertEqual(parse_one("a.b.c.d", read="hive"),
                      parse_one("a.b.c.d"))
     self.assertEqual(parse_one("a + b * c - 1.0"), parse_one("a+b*c-1.0"))
     self.assertNotEqual(parse_one("a + b * c - 1.0"),
                         parse_one("a + b * c + 1.0"))
     self.assertEqual(parse_one("a as b"), parse_one("a AS b"))
     self.assertNotEqual(parse_one("a as b"), parse_one("a"))
     self.assertEqual(
         parse_one("ROW() OVER(Partition by y)"),
         parse_one("ROW() OVER (partition BY y)"),
     )
     self.assertEqual(parse_one("TO_DATE(x)", read="hive"),
                      parse_one("ts_or_ds_to_date_str(x)"))
Example #15
0
    def test_function_arguments_validation(self):
        with self.assertRaises(ParseError):
            parse_one("IF(a > 0, a, b, c)")

        with self.assertRaises(ParseError):
            parse_one("IF(a > 0)")
Example #16
0
 def test_functions(self):
     # pylint: disable=too-many-statements
     self.assertIsInstance(parse_one("ABS(a)"), exp.Abs)
     self.assertIsInstance(parse_one("APPROX_DISTINCT(a)"),
                           exp.ApproxDistinct)
     self.assertIsInstance(parse_one("ARRAY(a)"), exp.Array)
     self.assertIsInstance(parse_one("ARRAY_AGG(a)"), exp.ArrayAgg)
     self.assertIsInstance(parse_one("ARRAY_CONTAINS(a, 'a')"),
                           exp.ArrayContains)
     self.assertIsInstance(parse_one("ARRAY_SIZE(a)"), exp.ArraySize)
     self.assertIsInstance(parse_one("AVG(a)"), exp.Avg)
     self.assertIsInstance(parse_one("CEIL(a)"), exp.Ceil)
     self.assertIsInstance(parse_one("CEILING(a)"), exp.Ceil)
     self.assertIsInstance(parse_one("COALESCE(a, b)"), exp.Coalesce)
     self.assertIsInstance(parse_one("COUNT(a)"), exp.Count)
     self.assertIsInstance(parse_one("DATE_ADD(a, 1)"), exp.DateAdd)
     self.assertIsInstance(parse_one("DATE_DIFF(a, 2)"), exp.DateDiff)
     self.assertIsInstance(parse_one("DATE_STR_TO_DATE(a)"),
                           exp.DateStrToDate)
     self.assertIsInstance(parse_one("DAY(a)"), exp.Day)
     self.assertIsInstance(parse_one("EXP(a)"), exp.Exp)
     self.assertIsInstance(parse_one("FLOOR(a)"), exp.Floor)
     self.assertIsInstance(parse_one("GREATEST(a, b)"), exp.Greatest)
     self.assertIsInstance(parse_one("IF(a, b, c)"), exp.If)
     self.assertIsInstance(parse_one("INITCAP(a)"), exp.Initcap)
     self.assertIsInstance(parse_one("JSON_PATH(a, '$.name')"),
                           exp.JSONPath)
     self.assertIsInstance(parse_one("LEAST(a, b)"), exp.Least)
     self.assertIsInstance(parse_one("LN(a)"), exp.Ln)
     self.assertIsInstance(parse_one("LOG10(a)"), exp.Log10)
     self.assertIsInstance(parse_one("MAX(a)"), exp.Max)
     self.assertIsInstance(parse_one("MIN(a)"), exp.Min)
     self.assertIsInstance(parse_one("MONTH(a)"), exp.Month)
     self.assertIsInstance(parse_one("POW(a, 2)"), exp.Pow)
     self.assertIsInstance(parse_one("POWER(a, 2)"), exp.Pow)
     self.assertIsInstance(parse_one("QUANTILE(a, 0.90)"), exp.Quantile)
     self.assertIsInstance(parse_one("REGEX_LIKE(a, 'test')"),
                           exp.RegexLike)
     self.assertIsInstance(parse_one("ROUND(a)"), exp.Round)
     self.assertIsInstance(parse_one("ROUND(a, 2)"), exp.Round)
     self.assertIsInstance(parse_one("STR_POSITION(a, 'test')"),
                           exp.StrPosition)
     self.assertIsInstance(parse_one("STR_TO_UNIX(a, 'format')"),
                           exp.StrToUnix)
     self.assertIsInstance(parse_one("STRUCT_EXTRACT(a, 'test')"),
                           exp.StructExtract)
     self.assertIsInstance(parse_one("SUM(a)"), exp.Sum)
     self.assertIsInstance(parse_one("SQRT(a)"), exp.Sqrt)
     self.assertIsInstance(parse_one("STDDEV(a)"), exp.Stddev)
     self.assertIsInstance(parse_one("STDDEV_POP(a)"), exp.StddevPop)
     self.assertIsInstance(parse_one("STDDEV_SAMP(a)"), exp.StddevSamp)
     self.assertIsInstance(parse_one("TIME_TO_STR(a, 'format')"),
                           exp.TimeToStr)
     self.assertIsInstance(parse_one("TIME_TO_TIME_STR(a)"),
                           exp.TimeToTimeStr)
     self.assertIsInstance(parse_one("TIME_TO_UNIX(a)"), exp.TimeToUnix)
     self.assertIsInstance(parse_one("TIME_STR_TO_DATE(a)"),
                           exp.TimeStrToDate)
     self.assertIsInstance(parse_one("TIME_STR_TO_TIME(a)"),
                           exp.TimeStrToTime)
     self.assertIsInstance(parse_one("TIME_STR_TO_UNIX(a)"),
                           exp.TimeStrToUnix)
     self.assertIsInstance(parse_one("TS_OR_DS_ADD(a, 1, 'day')"),
                           exp.TsOrDsAdd)
     self.assertIsInstance(parse_one("TS_OR_DS_TO_DATE(a)"),
                           exp.TsOrDsToDate)
     self.assertIsInstance(parse_one("TS_OR_DS_TO_DATE_STR(a)"),
                           exp.TsOrDsToDateStr)
     self.assertIsInstance(parse_one("UNIX_TO_STR(a, 'format')"),
                           exp.UnixToStr)
     self.assertIsInstance(parse_one("UNIX_TO_TIME(a)"), exp.UnixToTime)
     self.assertIsInstance(parse_one("UNIX_TO_TIME_STR(a)"),
                           exp.UnixToTimeStr)
     self.assertIsInstance(parse_one("VARIANCE(a)"), exp.Variance)
     self.assertIsInstance(parse_one("VARIANCE_POP(a)"), exp.VariancePop)
     self.assertIsInstance(parse_one("VARIANCE_SAMP(a)"), exp.VarianceSamp)
Example #17
0
 def fun(node):
     if isinstance(
             node,
             exp.Column) and node.args["this"].args["this"] == "a":
         return parse_one("FUN(a)")
     return node
Example #18
0
 def test_column(self):
     columns = parse_one(
         "select a, ARRAY[1] b, case when 1 then 1 end").find_all(
             exp.Column)
     assert len(list(columns)) == 1
Example #19
0
 def add_selects(self, *selects, read=None):
     select = self.expression.find(exp.Select)
     for sql in selects:
         select.args["expressions"].append(parse_one(sql, read=read))
     return self.expression