def testWhereRewriteWithRelated(self):
        """Test WHERE when pseudonym value exists in two different tables."""
        schema = test_util.GetCarsSchema()

        # add 'related' field just for this test
        for field in schema:
            if field['name'] == 'Make':
                field['related'] = 'cars_name'
                break

        # this value determined by running the test, not by manual calc
        ciphertext = 'sspWKAH/NKuUyX8ji1mmSw=='

        # test 1, use table_id
        table_id = _TABLE_ID
        master_key = test_util.GetMasterKey()
        as_clause = query_lib._AsClause({})
        stack = [
            util.FieldToken('Make'),
            util.StringLiteralToken('"Hello"'),
            util.OperatorToken('==', 2)
        ]
        where_clause_1 = query_lib._WhereClause(stack,
                                                as_clause=as_clause,
                                                schema=schema,
                                                nsquare=_TEST_NSQUARE,
                                                master_key=master_key,
                                                table_id=table_id)
        rewritten_sql_1 = where_clause_1.Rewrite()
        self.assertEqual(
            rewritten_sql_1,
            'WHERE (%sMake == "%s")' % (util.PSEUDONYM_PREFIX, ciphertext))

        # test 2, change table_id, query should be same as test #1
        table_id = _TABLE_ID + '_other'
        master_key = test_util.GetMasterKey()
        as_clause = query_lib._AsClause({})
        stack = [
            util.FieldToken('Make'),
            util.StringLiteralToken('"Hello"'),
            util.OperatorToken('==', 2)
        ]
        where_clause_2 = query_lib._WhereClause(stack,
                                                as_clause=as_clause,
                                                schema=schema,
                                                nsquare=_TEST_NSQUARE,
                                                master_key=master_key,
                                                table_id=table_id)
        rewritten_sql_2 = where_clause_2.Rewrite()
        self.assertEqual(
            rewritten_sql_2,
            'WHERE (%sMake == "%s")' % (util.PSEUDONYM_PREFIX, ciphertext))

        # verify different tables were used
        self.assertNotEqual(where_clause_1.table_id, where_clause_2.table_id)
        # and verify that same WHERE query="literal" was generated
        self.assertEqual(rewritten_sql_1, rewritten_sql_2)
 def testExtractUnencryptedQueries(self):
     stacks = [
         [util.FieldToken('Year')], [1],
         [util.FieldToken('Year'), 1,
          util.OperatorToken('+', 2)], [util.ProbabilisticToken('Price')],
         [util.FieldToken('GROUP_CONCAT(%sModel)' % util.PSEUDONYM_PREFIX)],
         [util.FieldToken('SUM(Year + 1)')]
     ]
     unencrypted_expression_list = [
         'Year AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '0_',
         '1 AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '1_',
         '(Year + 1) AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '2_',
         'SUM(Year + 1) AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '3_'
     ]
     self.assertEqual(query_lib._ExtractUnencryptedQueries(stacks, {}),
                      unencrypted_expression_list)
     stacks = [
         [util.FieldToken('Year')], [1],
         [util.FieldToken('Year'), 1,
          util.OperatorToken('+', 2)], [util.ProbabilisticToken('Price')],
         [util.FieldToken('GROUP_CONCAT(%sModel)' % util.PSEUDONYM_PREFIX)],
         [util.FieldToken('SUM(Year + 1)')]
     ]
     within = {4: 'w1', 5: 'w2'}
     unencrypted_expression_list = [
         'Year AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '0_',
         '1 AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '1_',
         '(Year + 1) AS ' + util.UNENCRYPTED_ALIAS_PREFIX + '2_',
         'SUM(Year + 1) WITHIN w2 AS ' + util.UNENCRYPTED_ALIAS_PREFIX +
         '3_'
     ]
     self.assertEqual(query_lib._ExtractUnencryptedQueries(stacks, within),
                      unencrypted_expression_list)
 def testHavingRewrite(self):
     schema = test_util.GetCarsSchema()
     master_key = test_util.GetMasterKey()
     as_clause = query_lib._AsClause({})
     stack = [util.FieldToken('SUM(Year)'), 1, util.OperatorToken('<', 2)]
     having_clause = query_lib._HavingClause(stack,
                                             as_clause=as_clause,
                                             schema=schema,
                                             nsquare=_TEST_NSQUARE,
                                             master_key=master_key,
                                             table_id=_TABLE_ID)
     self.assertEqual(having_clause.Rewrite(), 'HAVING (SUM(Year) < 1)')
     stack = [
         1000,
         util.AggregationQueryToken(
             'TO_BASE64(BYTES(PAILLIER_SUM(FROM_BASE64(' +
             util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price), \'0\')))'),
         util.OperatorToken('==', 2)
     ]
     having_clause = query_lib._HavingClause(stack,
                                             as_clause=as_clause,
                                             schema=schema,
                                             nsquare=_TEST_NSQUARE,
                                             master_key=master_key,
                                             table_id=_TABLE_ID)
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       having_clause.Rewrite)
     stack = [
         util.FieldToken('GROUP_CONCAT(' + util.PSEUDONYM_PREFIX +
                         'Model)'),
         util.BuiltInFunctionToken('len'), 5,
         util.OperatorToken('>', 2)
     ]
     having_clause = query_lib._HavingClause(stack,
                                             as_clause=as_clause,
                                             schema=schema,
                                             nsquare=_TEST_NSQUARE,
                                             master_key=master_key,
                                             table_id=_TABLE_ID)
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       having_clause.Rewrite)
     stack = []
     having_clause = query_lib._HavingClause(stack,
                                             as_clause=as_clause,
                                             schema=schema,
                                             nsquare=_TEST_NSQUARE,
                                             master_key=master_key,
                                             table_id=_TABLE_ID)
     self.assertEqual(having_clause.Rewrite(), '')
 def testRewrittenAggregation(self):
     stack = [
         util.FieldToken('Year'),
         util.AggregationFunctionToken('DISTINCTCOUNT', 1)
     ]
     self.assertEqual(interpreter.ToInfix(list(stack)),
                      'COUNT(DISTINCT Year)')
예제 #5
0
 def testComputeRowsEvaluate2(self):
     # Query is 'SELECT 1 + a, 1 * b, "hello"'
     # There are two rows of values for a and b (shown in query).
     # Result becomes as below:
     # 1 + a | 1 * b | "hello"
     #   2       3     "hello"
     #   4       5     "hello"
     stack = [[1, util.FieldToken('a'),
               util.OperatorToken('+', 2)],
              [1, util.FieldToken('b'),
               util.OperatorToken('*', 2)],
              [util.StringLiteralToken('"hello"')]]
     query = {'a': [1, 3], 'b': [3, 5]}
     real_result = [['2', '3', 'hello'], ['4', '5', 'hello']]
     result = encrypted_bigquery_client._ComputeRows(stack, query)
     self.assertEqual(result, real_result)
 def testReplaceAliasWhenNested(self):
     # Query is 'SELECT a + b as a, a + b as b'
     stacks = [[
         util.FieldToken('a'),
         util.FieldToken('b'),
         util.OperatorToken('+', 2)
     ],
               [
                   util.FieldToken('a'),
                   util.FieldToken('b'),
                   util.OperatorToken('+', 2)
               ]]
     alias = {0: 'a', 1: 'b'}
     new_stack = query_lib._ReplaceAlias(stacks, alias)
     real_stack = [['a', 'b', '+'], ['a', 'b', '+', 'b', '+']]
     self.assertEqual(new_stack, real_stack)
 def testGroupByRewrite(self):
     test_schema = test_util.GetCarsSchema()
     as_clause = query_lib._AsClause({})
     within_clause = query_lib._WithinClause({})
     select_clause = query_lib._SelectClause([['1']],
                                             as_clause=as_clause,
                                             within_clause=within_clause,
                                             schema=test_schema,
                                             nsquare=_TEST_NSQUARE)
     select_clause.Rewrite()
     fields = [util.FieldToken('Price')]
     clause = query_lib._GroupByClause(fields,
                                       schema=test_schema,
                                       nsquare=_TEST_NSQUARE,
                                       select_clause=select_clause)
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       clause.Rewrite)
     fields = [util.FieldToken('Invoice_Price'), util.FieldToken('Make')]
     clause = query_lib._GroupByClause(fields,
                                       schema=test_schema,
                                       nsquare=_TEST_NSQUARE,
                                       select_clause=select_clause)
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       clause.Rewrite)
     fields = [util.FieldToken('Make')]
     clause = query_lib._GroupByClause(fields,
                                       schema=test_schema,
                                       nsquare=_TEST_NSQUARE,
                                       select_clause=select_clause)
     self.assertEqual(clause.Rewrite(),
                      'GROUP BY %sMake' % util.PSEUDONYM_PREFIX)
     fields = [util.FieldToken('Year')]
     clause = query_lib._GroupByClause(fields,
                                       schema=test_schema,
                                       nsquare=_TEST_NSQUARE,
                                       select_clause=select_clause)
     self.assertEqual(clause.Rewrite(), 'GROUP BY Year')
     fields = []
     clause = query_lib._GroupByClause(fields,
                                       schema=test_schema,
                                       nsquare=_TEST_NSQUARE,
                                       select_clause=select_clause)
     self.assertEqual(clause.Rewrite(), '')
 def testWhereRewrite(self):
     schema = test_util.GetCarsSchema()
     master_key = test_util.GetMasterKey()
     as_clause = query_lib._AsClause({})
     stack = [
         util.FieldToken('Make'),
         util.StringLiteralToken('"Hello"'),
         util.OperatorToken('==', 2)
     ]
     where_clause = query_lib._WhereClause(stack,
                                           as_clause=as_clause,
                                           schema=schema,
                                           nsquare=_TEST_NSQUARE,
                                           master_key=master_key,
                                           table_id=_TABLE_ID)
     self.assertEqual(
         where_clause.Rewrite(),
         'WHERE (%sMake == "HS57DHbh2KlkqNJREmu1wQ==")' %
         util.PSEUDONYM_PREFIX)
     stack = [
         util.FieldToken('Model'),
         util.StringLiteralToken('"A"'),
         util.OperatorToken('contains', 2)
     ]
     where_clause = query_lib._WhereClause(stack,
                                           as_clause=as_clause,
                                           schema=schema,
                                           nsquare=_TEST_NSQUARE,
                                           master_key=master_key,
                                           table_id=_TABLE_ID)
     self.assertEqual(
         where_clause.Rewrite(),
         'WHERE (%sModel contains to_base64(left(bytes(sha1(concat(left('
         '%sModel, 24), \'yB9HY2qv+DI=\'))), 8)))' %
         (util.SEARCHWORDS_PREFIX, util.SEARCHWORDS_PREFIX))
     stack = []
     where_clause = query_lib._WhereClause(stack,
                                           as_clause=as_clause,
                                           schema=schema,
                                           nsquare=_TEST_NSQUARE,
                                           master_key=master_key,
                                           table_id=_TABLE_ID)
     self.assertEqual(where_clause.Rewrite(), '')
 def testAsConstructColumnNames(self):
     alias = {0: 'a'}
     columns = [[util.FieldToken('b')], [1, 2, util.OperatorToken('+', 2)]]
     as_clause = query_lib._AsClause(alias)
     self.assertEqual(as_clause.ConstructColumnNames(columns),
                      [{
                          'name': 'a'
                      }, {
                          'name': '(1 + 2)'
                      }])
 def testSimpleWhere(self):
     schema = test_util.GetCarsSchema()
     key = test_util.GetMasterKey()
     stack = [1, 2, util.OperatorToken('>', 2)]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(1 > 2)')
     stack = [1, 2, util.OperatorToken('=', 2)]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(1 = 2)')
     stack = [util.FieldToken('PI()'), 1, util.OperatorToken('>', 2)]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(PI() > 1)')
     stack = [1, util.OperatorToken('>', 2)]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [util.FieldToken('Year'), 2000, util.OperatorToken('<', 2)]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(Year < 2000)')
 def testExtractEncryptedQueries(self):
     # Original query is 'SELECT (111 + a_1) * a, TRUE OR False, null, PI(),
     # FUNC_PI, a1'
     # Query sent to server becomes 'SELECT a, a_1, FUNC_PI, a1'
     stacks = [[
         util.FieldToken('a'), 111,
         util.FieldToken('a_1'),
         util.OperatorToken('+', 2),
         util.OperatorToken('*', 2)
     ], ['TRUE', 'False', util.OperatorToken('OR', 2)], ['null'],
               [util.BuiltInFunctionToken('PI')],
               [util.FieldToken('FUNC_PI')], [util.FieldToken('a1')],
               [util.FieldToken('a.b')],
               [
                   util.UnencryptedQueryToken('%s0_' %
                                              util.UNENCRYPTED_ALIAS_PREFIX)
               ]]
     query_list = query_lib._ExtractFieldQueries(stacks, strize=True)
     expect_query_list = set([
         'a', 'a_1', 'FUNC_PI', 'a1',
         'a.b AS a' + util.PERIOD_REPLACEMENT + 'b'
     ])
     self.assertEqual(expect_query_list, query_list)
예제 #12
0
 def PushSingleToken(tokens):
   """Push the topmost token onto the stack."""
   if util.IsFloat(tokens[0]):
     try:
       token = int(tokens[0])
     except ValueError:
       token = float(tokens[0])
   elif tokens[0].startswith('\'') or tokens[0].startswith('"'):
     token = util.StringLiteralToken(tokens[0])
   elif tokens[0].lower() in util.BIGQUERY_CONSTANTS:
     token = util.LiteralToken(tokens[0].lower(),
                               util.BIGQUERY_CONSTANTS[tokens[0].lower()])
   else:
     token = util.FieldToken(tokens[0])
   math_stack.append(token)
 def testCheckValidSumAverageArgument(self):
     stack = [
         util.FieldToken('Year'),
         util.FieldToken('Year'),
         util.OperatorToken('*', 2),
         util.HomomorphicIntToken('Invoice_Price'),
         util.OperatorToken('+', 2)
     ]
     expected_stack = [[['Year', 'Year', '*'],
                        [util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price']],
                       True, True]
     self.assertEqual(interpreter.CheckValidSumAverageArgument(stack),
                      expected_stack)
     stack = [
         2,
         util.FieldToken('Year'),
         util.FieldToken('Year'),
         util.OperatorToken('*', 2),
         util.HomomorphicIntToken('Invoice_Price'),
         util.OperatorToken('+', 2),
         util.OperatorToken('*', 2)
     ]
     expected_stack = [[
         [2, 'Year', 'Year', '*', '*'],
         [2, util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price', '*']
     ], True, True]
     self.assertEqual(interpreter.CheckValidSumAverageArgument(stack),
                      expected_stack)
     stack = [util.ProbabilisticToken('Price')]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.CheckValidSumAverageArgument, stack)
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.HomomorphicFloatToken('Holdback_Percentage'),
         util.OperatorToken('*', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.CheckValidSumAverageArgument, stack)
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.FieldToken('Year'),
         util.OperatorToken('*', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.CheckValidSumAverageArgument, stack)
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.FieldToken('Year'),
         util.OperatorToken('/', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.CheckValidSumAverageArgument, stack)
예제 #14
0
def _CollapseFunctions(stack):
    """Collapses functions by evaluating them for actual values.

  Replaces a function's postfix expression with a single token. If the function
  can be evaluated (no fields included as arguments), the single token is
  the value of function's evaluation. Otherwise, the function is collapsed
  into a single token without evaluation.

  Arguments:
    stack: The stack whose functions are to be collapsed and resolved.

  Raises:
    bigquery_client.BigqueryInvalidQueryError: If a field exists inside
    the arguments of a function.

  Returns:
    True iff a function is found and collapsed. In other words, another
    potential function can still exist.
  """
    for i in xrange(len(stack)):
        if isinstance(stack[i], util.BuiltInFunctionToken):
            start_idx, postfix_expr = interpreter.GetSingleValue(stack[:i + 1])
            if util.IsEncryptedExpression(postfix_expr):
                raise bigquery_client.BigqueryInvalidQueryError(
                    'Invalid aggregation function argument: Cannot put an encrypted '
                    'field as an argument to a built-in function.', None, None,
                    None)
            # If the expression has no fields, we want to get the actual value.
            # But, if the field has a field, we have to get the infix string instead.
            try:
                result = interpreter.Evaluate(list(postfix_expr))
                if isinstance(result, basestring):
                    result = util.StringLiteralToken('"%s"' % result)
                elif result is None:
                    result = util.LiteralToken('NULL', None)
                elif str(result).lower() in ['true', 'false']:
                    result = util.LiteralToken(str(result).lower(), result)
                stack[start_idx:i + 1] = [result]
            except bigquery_client.BigqueryInvalidQueryError:
                result = interpreter.ToInfix(list(postfix_expr))
                stack[start_idx:i + 1] = [util.FieldToken(result)]
            return True
    return False
 def testRewriteEncryptedFields(self):
     queries = [
         util.FieldToken('Year'),
         util.FieldToken('Model'),
         util.FieldToken('Make'),
         util.FieldToken('Invoice_Price'),
         util.FieldToken('Price'),
         util.FieldToken('Website'),
         util.FieldToken('Description')
     ]
     rewritten_queries = [
         util.FieldToken('Year'),
         util.ProbabilisticToken('Model'),
         util.PseudonymToken('Make'),
         util.HomomorphicIntToken('Invoice_Price'),
         util.ProbabilisticToken('Price'),
         util.SearchwordsToken('Website'),
         util.SearchwordsToken('Description')
     ]
     test_schema = test_util.GetCarsSchema()
     new_queries = query_lib._RewriteEncryptedFields([queries], test_schema)
     self.assertEqual(new_queries, [rewritten_queries])
 def testExpandExpression(self):
     stack = [
         util.FieldToken('x'),
         util.FieldToken('y'),
         util.OperatorToken('+', 2),
         util.FieldToken('x'),
         util.OperatorToken('+', 2), 2,
         util.FieldToken('z'),
         util.OperatorToken('*', 2),
         util.OperatorToken('-', 2), 5,
         util.OperatorToken('-', 2), 3,
         util.OperatorToken('+', 2)
     ]
     list_fields, constant = interpreter._ExpandExpression(stack)
     self.assertEqual(
         list_fields,
         [[2.0, util.FieldToken('x')], [1.0, util.FieldToken('y')],
          [-2.0, util.FieldToken('z')]])
     self.assertEqual(constant, -2.0)
     stack = [
         util.FieldToken('x'), 4,
         util.OperatorToken('+', 2), 6,
         util.OperatorToken('*', 2), 2,
         util.OperatorToken('/', 2)
     ]
     list_fields, constant = interpreter._ExpandExpression(stack)
     self.assertEqual(list_fields, [[3.0, util.FieldToken('x')]])
     self.assertEqual(constant, 12.0)
     stack = [
         util.FieldToken('x'), 1,
         util.OperatorToken('+', 2),
         util.FieldToken('y'),
         util.OperatorToken('*', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter._ExpandExpression, stack)
     stack = [
         util.FieldToken('x'),
         util.FieldToken('y'),
         util.OperatorToken('/', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter._ExpandExpression, stack)
 def testEncryptedContains(self):
     schema = test_util.GetCarsSchema()
     key = test_util.GetMasterKey()
     stack = [
         util.FieldToken('Year'),
         util.BuiltInFunctionToken('string'),
         util.StringLiteralToken('"1"'),
         util.OperatorToken('CONTAINS', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '(string(Year) contains "1")')
     stack = [
         util.SearchwordsToken('Model'),
         util.StringLiteralToken('"A"'),
         util.OperatorToken('contains', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '(' + util.SEARCHWORDS_PREFIX + 'Model contains '
         'to_base64(left(bytes(sha1(concat(left(' +
         util.SEARCHWORDS_PREFIX + 'Model, 24), \'yB9HY2qv+DI=\'))), 8)))')
     stack = [
         util.SearchwordsToken('Model'),
         util.FieldToken('Year'),
         util.OperatorToken('contains', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [
         util.PseudonymToken('Make'), 'A',
         util.OperatorToken('contains', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [
         util.SearchwordsToken('Model'),
         util.SearchwordsToken('Model'),
         util.OperatorToken('contains', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [
         'Hello',
         util.SearchwordsToken('Model'),
         util.OperatorToken('contains', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [
         util.SearchwordsToken('Model'),
         util.StringLiteralToken('"A"'),
         util.OperatorToken('contains', 2),
         util.OperatorToken('not', 1)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         'not (' + util.SEARCHWORDS_PREFIX + 'Model contains '
         'to_base64(left(bytes(sha1(concat(left(' +
         util.SEARCHWORDS_PREFIX + 'Model, 24), \'yB9HY2qv+DI=\'))), 8)))')
     schema = test_util.GetPlacesSchema()
     stack = [
         util.SearchwordsToken('citiesLived.place'),
         util.StringLiteralToken('"A"'),
         util.OperatorToken('contains', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '(citiesLived.' + util.SEARCHWORDS_PREFIX + 'place contains '
         'to_base64(left(bytes(sha1(concat(left(citiesLived.' +
         util.SEARCHWORDS_PREFIX + 'place, 24), \'cBKPKGiY2cg=\'))), 8)))')
 def testEncryptedEquality(self):
     schema = test_util.GetCarsSchema()
     key = test_util.GetMasterKey()
     stack = [
         util.FieldToken('Year'), 1,
         util.OperatorToken('+', 2), 2000,
         util.OperatorToken('=', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '((Year + 1) = 2000)')
     stack = [
         util.FieldToken('Year'),
         util.PseudonymToken('Make'),
         util.OperatorToken('=', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '(Year = ' + util.PSEUDONYM_PREFIX + 'Make)')
     stack = [
         util.PseudonymToken('Make'),
         util.StringLiteralToken('"Hello"'),
         util.OperatorToken('==', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(' +
         util.PSEUDONYM_PREFIX + 'Make == "HS57DHbh2KlkqNJREmu1wQ==")')
     stack = [
         util.StringLiteralToken('"Hello"'),
         util.PseudonymToken('Make'),
         util.OperatorToken('==', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '("HS57DHbh2KlkqNJREmu1wQ==" == ' + util.PSEUDONYM_PREFIX +
         'Make)')
     stack = [
         util.StringLiteralToken('"Hello"'),
         util.PseudonymToken('Make'),
         util.OperatorToken('!=', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '("HS57DHbh2KlkqNJREmu1wQ==" != ' + util.PSEUDONYM_PREFIX +
         'Make)')
     stack = [
         util.PseudonymToken('Make'),
         util.PseudonymToken('Make2'),
         util.OperatorToken('==', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID),
         '(' + util.PSEUDONYM_PREFIX + 'Make == ' + util.PSEUDONYM_PREFIX +
         'Make2)')
     stack = [
         util.HomomorphicIntToken('Invoice_Price'), 2,
         util.OperatorToken('==', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     stack = [
         util.PseudonymToken('Make'),
         util.ProbabilisticToken('Price'),
         util.OperatorToken('=', 2)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       interpreter.RewriteSelectionCriteria, stack, schema,
                       key, _TABLE_ID)
     schema = test_util.GetPlacesSchema()
     stack = [
         util.PseudonymToken('spouse.spouseName'),
         util.StringLiteralToken('"Hello"'),
         util.OperatorToken('=', 2)
     ]
     self.assertEqual(
         interpreter.RewriteSelectionCriteria(stack, schema, key,
                                              _TABLE_ID), '(spouse.' +
         util.PSEUDONYM_PREFIX + 'spouseName = "HS57DHbh2KlkqNJREmu1wQ==")')
 def testRewriteAggregations(self):
     stack = [
         util.CountStarToken(),
         util.AggregationFunctionToken('COUNT', 1)
     ]
     rewritten_stack = ['COUNT(*)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.ProbabilisticToken('Price'),
         util.AggregationFunctionToken('COUNT', 1)
     ]
     rewritten_stack = ['COUNT(' + util.PROBABILISTIC_PREFIX + 'Price)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.ProbabilisticToken('Price'), 4,
         util.AggregationFunctionToken('COUNT', 2)
     ]
     rewritten_stack = ['COUNT(' + util.PROBABILISTIC_PREFIX + 'Price, 4)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.FieldToken('Year'), 5,
         util.AggregationFunctionToken('DISTINCTCOUNT', 2),
         util.FieldToken('Year'),
         util.AggregationFunctionToken('COUNT', 1),
         util.OperatorToken('+', 2)
     ]
     rewritten_stack = ['COUNT(DISTINCT Year, 5)', 'COUNT(Year)', '+']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         0,
         util.BuiltInFunctionToken('cos'),
         util.AggregationFunctionToken('COUNT', 1)
     ]
     rewritten_stack = ['COUNT(1.0)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.StringLiteralToken('"Hello"'), 2,
         util.BuiltInFunctionToken('left'),
         util.StringLiteralToken('"y"'),
         util.BuiltInFunctionToken('concat'),
         util.AggregationFunctionToken('GROUP_CONCAT', 1)
     ]
     rewritten_stack = ['GROUP_CONCAT("Hey")']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.FieldToken('Year'),
         util.FieldToken('Year'),
         util.OperatorToken('*', 2),
         util.AggregationFunctionToken('SUM', 1)
     ]
     rewritten_stack = ['SUM((Year * Year))']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.AggregationFunctionToken('SUM', 1)
     ]
     rewritten_stack = [
         0.0, 'COUNT(' + util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price)',
         '*', 1.0, 'TO_BASE64(BYTES(PAILLIER_SUM(FROM_BASE64(' +
         util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price), \'0\')))', '*', '+'
     ]
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.HomomorphicFloatToken('Holdback_Percentage'),
         util.AggregationFunctionToken('AVG', 1)
     ]
     rewritten_stack = [
         0.0,
         'COUNT(' + util.HOMOMORPHIC_FLOAT_PREFIX + 'Holdback_Percentage)',
         '*', 1.0, 'TO_BASE64(BYTES(PAILLIER_SUM(FROM_BASE64(' +
         util.HOMOMORPHIC_FLOAT_PREFIX + 'Holdback_Percentage), \'0\')))',
         '*', '+',
         'COUNT(' + util.HOMOMORPHIC_FLOAT_PREFIX + 'Holdback_Percentage)',
         '/'
     ]
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.HomomorphicIntToken('Invoice_Price'), 2,
         util.OperatorToken('+', 2), 5,
         util.OperatorToken('*', 2),
         util.AggregationFunctionToken('SUM', 1)
     ]
     rewritten_stack = [
         0.0, 'COUNT(' + util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price)',
         '*', 5.0, 'TO_BASE64(BYTES(PAILLIER_SUM(FROM_BASE64(' +
         util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price), \'0\')))', '*', '+',
         0.0, 'COUNT(' + util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price)',
         '*', 1.0, 'SUM((2 * 5))', '*', '+', '+'
     ]
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.PseudonymToken('Make'), 2,
         util.AggregationFunctionToken('DISTINCTCOUNT', 2)
     ]
     rewritten_stack = [
         'COUNT(DISTINCT ' + util.PSEUDONYM_PREFIX + 'Make, 2)'
     ]
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.FieldToken('Year'),
         util.AggregationFunctionToken('TOP', 1)
     ]
     rewritten_stack = ['TOP(Year)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.PseudonymToken('Make'), 5, 1,
         util.AggregationFunctionToken('TOP', 3)
     ]
     rewritten_stack = ['TOP(' + util.PSEUDONYM_PREFIX + 'Make, 5, 1)']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.FieldToken('Year'),
         util.BuiltInFunctionToken('cos'),
         util.HomomorphicIntToken('Invoice_Price'),
         util.OperatorToken('+', 2),
         util.AggregationFunctionToken('SUM', 1)
     ]
     rewritten_stack = [
         0.0, 'COUNT(' + util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price)',
         '*', 1.0, 'SUM(cos(Year))', '*', '+', 0.0,
         'COUNT(' + util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price)', '*',
         1.0, 'TO_BASE64(BYTES(PAILLIER_SUM(FROM_BASE64(' +
         util.HOMOMORPHIC_INT_PREFIX + 'Invoice_Price),'
         ' \'0\')))', '*', '+', '+'
     ]
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.ProbabilisticToken('Model'),
         util.AggregationFunctionToken('DISTINCTCOUNT', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.ProbabilisticToken('Price'),
         util.AggregationFunctionToken('SUM', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.HomomorphicFloatToken('Holdback_Percentage'),
         util.OperatorToken('*', 2),
         util.AggregationFunctionToken('SUM', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.HomomorphicFloatToken('Holdback_Percentage'),
         util.BuiltInFunctionToken('cos'),
         util.AggregationFunctionToken('SUM', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.AggregationFunctionToken('TOP', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.FieldToken('Year'),
         util.AggregationFunctionToken('SUM', 1),
         util.AggregationFunctionToken('SUM', 1)
     ]
     rewritten_stack = ['SUM(SUM(Year))']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.HomomorphicIntToken('Invoice_Price'),
         util.AggregationFunctionToken('SUM', 1),
         util.AggregationFunctionToken('SUM', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
     stack = [
         util.FieldToken('Year'),
         util.AggregationFunctionToken('GROUP_CONCAT', 1),
         util.AggregationFunctionToken('GROUP_CONCAT', 1)
     ]
     rewritten_stack = ['GROUP_CONCAT(GROUP_CONCAT(Year))']
     self.assertEqual(
         query_lib._RewriteAggregations([stack], _TEST_NSQUARE),
         [rewritten_stack])
     stack = [
         util.PseudonymToken('Make'),
         util.AggregationFunctionToken('GROUP_CONCAT', 1),
         util.AggregationFunctionToken('GROUP_CONCAT', 1)
     ]
     self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                       query_lib._RewriteAggregations, [stack],
                       _TEST_NSQUARE)
 def testInit(self):
     """Test __init__()."""
     f = util.FieldToken('foo')
     self.assertEqual(f, 'foo')
 def testSetAlias(self):
     """Test property alias SetAlias()."""
     f = util.FieldToken('foo')
     ret = f.SetAlias('bar')
     self.assertEqual(f._alias, 'bar')
     self.assertEqual(ret, f)
예제 #22
0
    def testEncryptedEquality(self):
        schema = test_util.GetCarsSchema()
        key = test_util.GetMasterKey()
        stack = [
            util.FieldToken('Year'), 1,
            util.OperatorToken('+', 2), 2000,
            util.OperatorToken('=', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID),
            '((Year + 1) = 2000)')
        stack = [
            util.FieldToken('Year'),
            util.PseudonymToken('Make'),
            util.OperatorToken('=', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID),
            '(Year = ' + util.PSEUDONYM_PREFIX + 'Make)')
        stack = [
            util.PseudonymToken('Make'),
            util.StringLiteralToken('"Hello"'),
            util.OperatorToken('==', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID), '(' +
            util.PSEUDONYM_PREFIX + 'Make == "HS57DHbh2KlkqNJREmu1wQ==")')

        # begin: tests about 'related' schema option

        schema2 = test_util.GetCarsSchema()
        for field in schema2:
            if field['name'] == 'Make':
                field['related'] = 'cars_name'

        # value is deterministic calc with related instead of _TABLE_ID
        stack = [
            util.PseudonymToken('Make', related=_RELATED),
            util.StringLiteralToken('"Hello"'),
            util.OperatorToken('==', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema2, key,
                                                 _TABLE_ID), '(' +
            util.PSEUDONYM_PREFIX + 'Make == "sspWKAH/NKuUyX8ji1mmSw==")')

        # token with related attribute makes no sense if schema doesn't have it
        stack = [
            util.StringLiteralToken('"Hello"'),
            util.PseudonymToken('Make', related=_RELATED),
            util.OperatorToken('==', 2)
        ]
        self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                          interpreter.RewriteSelectionCriteria, stack, schema,
                          key, _TABLE_ID)

        # end: tests about 'related' schema option

        stack = [
            util.StringLiteralToken('"Hello"'),
            util.PseudonymToken('Make'),
            util.OperatorToken('==', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID),
            '("HS57DHbh2KlkqNJREmu1wQ==" == ' + util.PSEUDONYM_PREFIX +
            'Make)')

        stack = [
            util.StringLiteralToken('"Hello"'),
            util.PseudonymToken('Make'),
            util.OperatorToken('!=', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID),
            '("HS57DHbh2KlkqNJREmu1wQ==" != ' + util.PSEUDONYM_PREFIX +
            'Make)')

        stack = [
            util.PseudonymToken('Make'),
            util.PseudonymToken('Make2'),
            util.OperatorToken('==', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID),
            '(' + util.PSEUDONYM_PREFIX + 'Make == ' + util.PSEUDONYM_PREFIX +
            'Make2)')
        stack = [
            util.HomomorphicIntToken('Invoice_Price'), 2,
            util.OperatorToken('==', 2)
        ]
        self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                          interpreter.RewriteSelectionCriteria, stack, schema,
                          key, _TABLE_ID)
        stack = [
            util.PseudonymToken('Make'),
            util.ProbabilisticToken('Price'),
            util.OperatorToken('=', 2)
        ]
        self.assertRaises(bigquery_client.BigqueryInvalidQueryError,
                          interpreter.RewriteSelectionCriteria, stack, schema,
                          key, _TABLE_ID)
        schema = test_util.GetPlacesSchema()
        stack = [
            util.PseudonymToken('spouse.spouseName'),
            util.StringLiteralToken('"Hello"'),
            util.OperatorToken('=', 2)
        ]
        self.assertEqual(
            interpreter.RewriteSelectionCriteria(stack, schema, key,
                                                 _TABLE_ID), '(spouse.' +
            util.PSEUDONYM_PREFIX + 'spouseName = "HS57DHbh2KlkqNJREmu1wQ==")')