tail = Function('tail', fgsort, fgsort) # rec defs append = RecFunction('append', fgsort, fgsort, fgsort) length = RecFunction('length', fgsort, intsort) AddRecDefinition(append, (x, y), If(x == nil, y, cons(head(x), append(tail(x), y)))) AddRecDefinition(length, x, If(x == nil, 0, length(tail(x)) + 1)) # axioms AddAxiom(x, head(cons(hx, x)) == hx) AddAxiom(x, tail(cons(hx, x)) == x) AddAxiom(x, cons(hx, x) != nil) # len(append(x, y)) = len(x) + len(y) goal = length(append(x, y)) == length(x) + length(y) # adt pfp of goal base_case = length(append(nil, y)) == length(nil) + length(y) induction_hypothesis = length(append(tx, y)) == length(tx) + length(y) induction_step = length(append(cons(hx, tx), y)) == length(cons(hx, tx)) + length(y) pfp_goal = And(base_case, Implies(induction_hypothesis, induction_step)) np_solver = NPSolver() solution = np_solver.solve(pfp_goal) if not solution.if_sat: print('goal is valid')
AddRecDefinition( htree, x, If(x == nil, fgsetsort.lattice_bottom, SetAdd(SetUnion(htree(lft(x)), htree(rght(x))), x))) AddRecDefinition( reach_lr, (x, y), If(x == y, True, Or(reach_lr(lft(x), y), reach_lr(rght(x), y)))) AddAxiom((), lft(nil) == nil) AddAxiom((), rght(nil) == nil) # vc goal = Implies(tree(x), Implies(reach_lr(x, y), tree(y))) # check validity with natural proof solver and no hardcoded lemmas np_solver = NPSolver() solution = np_solver.solve(make_pfp_formula(goal)) if not solution.if_sat: print('goal (no lemmas) is valid') else: print('goal (no lemmas) is invalid') # hardcoded lemmas lemma_params = (x, y) lemma_body = Implies(reach_lr(x, y), Implies(tree(x), tree(y))) lemmas = {(lemma_params, lemma_body)} # check validity of lemmas solution = np_solver.solve(make_pfp_formula(lemma_body)) if not solution.if_sat: print('lemma is valid') else:
def solveProblem(lemma_grammar_args, lemma_grammar_terms, goal, name, grammar_string, config_params=None, annctx=default_annctx): # Extract relevant parameters for running the verification-synthesis engine from config_params if config_params is None: config_params = {} lemma_grammar_terms = get_all_subterms(lemma_grammar_terms) valid_lemmas = set() invalid_lemmas = [] cex_models = [] true_cex_models = [] # Determine proof mode for goal goal_instantiation_mode = config_params.get('goal_instantiation_mode', None) supported_goal_instantiation_modes = { proveroptions.manual_instantiation, proveroptions.depth_one_stratified_instantiation, proveroptions.fixed_depth, proveroptions.lean_instantiation, proveroptions.lean_instantiation_with_lemmas } if goal_instantiation_mode is None: # stratified instantiation by default goal_instantiation_mode = proveroptions.depth_one_stratified_instantiation elif goal_instantiation_mode not in supported_goal_instantiation_modes: # The set of instantiation terms must stay constant # TODO: check for unsoundness of algorithm if instantiation mode has automatic adaptive depth. # If the check passes there is no need for this branch of the condition. raise ValueError( 'Unsupported or unknown proof (instantiation) mode for goal.') # Create properly configured solver object that checks the goal in the presence of 0 or more lemmas # IMPORTANT: this is the solver object that will always be used to attempt proving the goal. Doing this # standardises the configuration used to prove the goal and ensures that the changes made to the # solver object are reflected everywhere in the pipeline. goal_fo_solver = NPSolver() goal_fo_solver.options.instantiation_mode = goal_instantiation_mode if goal_instantiation_mode == proveroptions.manual_instantiation: goal_manual_instantiation_terms = config_params.get( 'goal_instantiation_terms', None) if goal_manual_instantiation_terms is None: raise ValueError( 'Instantiation terms must be specified for goal in manual mode.' ) goal_fo_solver.options.terms_to_instantiate = goal_manual_instantiation_terms elif goal_instantiation_mode == proveroptions.fixed_depth: # Default depth is 1 goal_instantiation_depth = config_params.get( 'goal_instantiation_depth', 1) goal_fo_solver.options.depth = goal_instantiation_depth config_params['goal_solver'] = goal_fo_solver # check if goal is fo provable goal_fo_npsolution = goal_fo_solver.solve(goal) if goal_fo_npsolution.if_sat: print('goal is not first-order provable.') else: print('goal is first-order provable.') exit(0) # check if goal is fo provable using its own pfp pfp_of_goal = make_pfp_formula(goal) goal_pfp_solver = NPSolver() goal_pfp_solver.options.instantiation_mode = goal_instantiation_mode if goal_instantiation_mode == proveroptions.manual_instantiation: warnings.warn( 'Manual instantiation mode: PFP of goal will be proved using the same terms the goal itself.' ) goal_pfp_npsolution = goal_pfp_solver.solve(pfp_of_goal) if goal_pfp_npsolution.if_sat: print('goal cannot be proved using induction.') else: print('goal is provable using induction.') exit(0) # goal_npsolution_instantiation_terms = goal_fo_npsolution.extraction_terms # config_params['goal_npsolution_instantiation_terms'] = goal_npsolution_instantiation_terms # Temporarily disabling expanding the set of extraction terms depending on the grammar. # goal_extraction_terms = grammar.goal_extraction_terms(goal_npsolution_instantiation_terms, # lemma_grammar_args, lemma_grammar_terms, annctx) # config_params['goal_extraction_terms'] = goal_extraction_terms # Extract relevant instantiation/extraction terms for lemmas given the grammar # This set is constant lemma_instantiation_terms = grammar.lemma_instantiation_terms( lemma_grammar_args, lemma_grammar_terms, annctx) # Initial timeout (in seconds) for streaming config_params['streaming_timeout'] = 15 * 60 if config_params['streaming_timeout'] < 20: raise ValueError( 'Cannot time streams with small timeouts. Use >= 20 seconds.') # Dictionary for logging pipeline analytics if options.analytics: config_params['analytics'] = {'total_lemmas': 0, 'time_charged': 0} # Some fixed utility functions for interpreting synthesis outputs # Values used to convert CVC4 versions of membership, insertion to z3py versions SetIntSort = SetSort(IntSort()) membership = Function('membership', IntSort(), SetIntSort, BoolSort()) insertion = Function('insertion', IntSort(), SetIntSort, SetIntSort) addl_decls = {'member': membership, 'insert': insertion} swap_fcts = {insertion: SetAdd} replace_fcts = {membership: IsMember} # List of recursive boolean-valued rec defs that can appear on the left hand side of a lemma recs = get_boolean_recursive_definitions() # continuously get valid lemmas until goal has been proven while True: sygus_results = getSygusOutput(valid_lemmas, lemma_grammar_args, goal, name, grammar_string, config_params, annctx) if sygus_results is None or sygus_results == []: exit('No lemmas proposed. Instance failed.') for rhs_pre, lhs_pre in sygus_results: rhs_pre = rhs_pre.strip() lhs_pre = lhs_pre.strip() if options.analytics: config_params['analytics']['total_lemmas'] += 1 # Casting the lemma into a Z3Py expression if options.analytics: curr_time = time.time() config_params['analytics']['lemma_time'] = int( curr_time - config_params['analytics']['proposal_start_time']) pre_validation = time.time() rhs_lemma = translateLemma(rhs_pre, lemma_grammar_args, addl_decls, swap_fcts, replace_fcts, annctx) index = int(lhs_pre[:-1].split(' ')[-1]) lhs_func = recs[index] lhs_arity = lhs_func.arity() lhs_lemma_args = tuple(lemma_grammar_args[:lhs_arity]) lhs_lemma = lhs_func(lhs_lemma_args) z3py_lemma_body = Implies(lhs_lemma, rhs_lemma) z3py_lemma_params = tuple( [arg for arg in lemma_grammar_args if is_var_decl(arg)]) z3py_lemma = (z3py_lemma_params, z3py_lemma_body) if options.verbose > 0: print('proposed lemma: {}'.format(str(z3py_lemma_body))) if options.verbose >= 10 and options.analytics: print('total lemmas so far: ' + str(config_params['analytics']['total_lemmas'])) if z3py_lemma in invalid_lemmas or z3py_lemma in valid_lemmas: if options.use_cex_models or options.use_cex_true_models: print('lemma has already been proposed') if z3py_lemma in invalid_lemmas: print( 'Something is wrong. Lemma was re-proposed in the presence of countermodels. ' 'Exiting.') # TODO: remove after replacing this with a check for terms in the grammar if z3py_lemma in valid_lemmas: print( 'This is a currently known limitation of the tool. Consider restricting your grammar to ' 'have terms of lesser height.') exit('Instance failed.') else: # No countermodels. Check if streaming mode for synthesis is enabled. if not options.streaming_synthesis_swtich: raise RuntimeError( 'Lemmas reproposed with countermodels and streaming disabled. Unsupported.' ) if options.verbose >= 7: print( 'Countermodels not enabled. Retrying lemma synthesis.' ) if options.analytics: post_validation = time.time() validation_time = post_validation - pre_validation config_params['analytics'][ 'time_charged'] += validation_time if options.verbose >= 10: print('Current lemma handled in: ' + str(validation_time) + 's') print('Time charged so far: ' + str( config_params['analytics']['time_charged']) + 's') continue pfp_lemma = make_pfp_formula(z3py_lemma_body) lemmaprover = NPSolver() lemmaprover.options.instantiation_mode = proveroptions.manual_instantiation lemmaprover.options.terms_to_instantiate = lemma_instantiation_terms lemma_npsolution = lemmaprover.solve(pfp_lemma, valid_lemmas) if options.analytics and options.streaming_synthesis_swtich: post_validation = time.time() validation_time = post_validation - pre_validation config_params['analytics']['time_charged'] += validation_time if options.verbose >= 10: print('Current lemma handled in: ' + str(validation_time) + 's') print('Time charged so far: ' + str(config_params['analytics']['time_charged']) + 's') if lemma_npsolution.if_sat: if options.verbose >= 4: print('proposed lemma cannot be proved.') if options.debug: # Check that the terms needed from the pfp of the proposed # lemma do not exceed lemma_grammar_terms. # Otherwise finite model extraction will not work. needed_instantiation_terms = get_foreground_terms( pfp_lemma, annctx=annctx) remaining_terms = needed_instantiation_terms - lemma_instantiation_terms if remaining_terms != set(): raise ValueError( 'lemma_terms is too small.\n' 'Lemma: {}\n' 'Terms needed after pfp computation: {}' ''.format(str(z3py_lemma_body), remaining_terms)) invalid_lemmas = invalid_lemmas + [z3py_lemma] use_cex_models_fallback = False if options.use_cex_true_models: if options.verbose >= 4: print('using true counterexample models') true_model_size = 5 true_cex_model, true_model_terms = gen_lfp_model( true_model_size, annctx, invalid_formula=z3py_lemma) if true_cex_model is not None: # Use after gen_lfp_model fixes values on elements not in the lfp (as sort.lattice_bottom) # true_model_terms = {z3.IntVal(elem) for elem in true_cex_model.fg_universe} const = [ arg for arg in lemma_grammar_args if not is_var_decl(arg, annctx) ] lemma_arity = len(lemma_grammar_args) - len(const) args = itertools.product(true_model_terms, repeat=lemma_arity) instantiations = [ arg for arg in args if z3.is_false( true_cex_model.smtmodel. eval(z3.substitute( z3py_lemma[1], list( zip(lemma_grammar_args[:lemma_arity], arg))), model_completion=True)) ] true_cex_models = true_cex_models + [ (true_cex_model, {instantiations[0]}) ] config_params['true_cex_models'] = true_cex_models else: # No LFP countermodel found. Supplant with PFP countermodel. use_cex_models_fallback = True if options.verbose >= 4: print( 'No true countermodel obtained. Using pfp countermodel instead.' ) if options.use_cex_models or use_cex_models_fallback: extraction_terms = lemma_npsolution.extraction_terms cex_model = FiniteModel(lemma_npsolution.model, extraction_terms, annctx=annctx) cex_models = cex_models + [cex_model] else: if options.verbose >= 3: print('proposed lemma was proven.') valid_lemmas.add(z3py_lemma) if options.streaming_synthesis_swtich: # Check if lemma helps prove goal using originally configured goal solver object # TODO: introduce warning or extend streaming algorithm to multiple lemma case goal_npsolution = goal_fo_solver.solve(goal, {z3py_lemma}) if not goal_npsolution.if_sat: # Lemma is useful. Wrap up processes and exit. print( 'Goal has been proven. Lemmas used to prove goal:') for lem in valid_lemmas: print(lem[1]) if options.analytics: # Update analytics entries for the current lemma before exiting. total_time = config_params['analytics'][ 'time_charged'] + config_params['analytics'][ 'lemma_time'] if options.verbose >= 0: print('Total lemmas proposed: ' + str(config_params['analytics'] ['total_lemmas'])) if options.verbose >= 0: print('Total time charged: ' + str(total_time) + 's') # Close the stream try: sygus_results.throw(StopProposal) except StopIteration: pass exit(0) else: # Lemma does not help prove goal. Try the next lemma in the stream. continue else: # Not streaming mode: reset countermodels and invalid lemmas to [] and try synthesis again. # We have additional information to retry the proofs. cex_models = [] invalid_lemmas = [] break # Update countermodels before next round of synthesis config_params['cex_models'] = cex_models # reset everything and increase streaming timeout if streaming mode is on if options.streaming_synthesis_swtich: # Compute the timeout of the next streaming call config_params['streaming_timeout'] *= 2 # Make each streaming call 15 minutes flat if config_params['streaming_timeout'] >= 15 * 60: # The following round of streaming will be too expensive. Exit. exit('Timeout reached. Exiting') if options.analytics: config_params['analytics']['time_charged'] = 0 config_params['analytics']['total_lemmas'] = 0 valid_lemmas = set() invalid_lemmas = []
from naturalproofs.prover import NPSolver import naturalproofs.proveroptions as proveroptions # Declarations a, zero = Consts('a zero', fgsort) suc = Function('suc', fgsort, fgsort) pred = Function('pred', fgsort, fgsort) AddAxiom(a, pred(suc(a)) == a) nat = RecFunction('nat', fgsort, boolsort) even = RecFunction('even', fgsort, boolsort) odd = RecFunction('odd', fgsort, boolsort) AddRecDefinition(nat, a, If(a == zero, True, nat(pred(a)))) AddRecDefinition(even, a, If(a == zero, True, odd(pred(a)))) AddRecDefinition(odd, a, If(a == zero, False, If(a == suc(zero), True, even(pred(a))))) # Problem parameters goal = Implies(nat(a), Or(even(a), odd(a))) pfp_of_goal = make_pfp_formula(goal) # Call a natural proofs solver npsolver = NPSolver() # Ask for proof npsolution = npsolver.solve(pfp_of_goal) class EvenOddTest(unittest.TestCase): def test1(self): self.assertFalse(npsolution.if_sat) if __name__ == '__main__': unittest.main()
AddRecDefinition(plus, (x, y), If(x == zero, y, succ(plus(pred(x), y)))) # axioms AddAxiom(x, pred(succ(x)) == x) AddAxiom(x, succ(x) != zero) goal = plus(x, y) == plus(y, x) # adt pfp of goal base_case = plus(zero, y) == plus(y, zero) induction_hypothesis = plus(nx, y) == plus(y, nx) induction_step = plus(succ(nx), y) == plus(y, succ(nx)) pfp_goal = Implies(induction_hypothesis, induction_step) orig_np_solver = NPSolver() orig_solution = orig_np_solver.solve(pfp_goal) print('Commutativity of addition: no lemma') if not orig_solution.if_sat: print(' -- goal is valid') else: print(' -- goal is invalid') # adt pfp of inductive case lemma: zero + x = x base_case = plus(zero, zero) == plus(zero, zero) induction_hypothesis = plus(zero, ny) == plus(ny, zero) induction_step = plus(zero, succ(ny)) == plus(succ(ny), zero) pfp_goal = And(base_case, Implies(induction_hypothesis, induction_step)) base_np_solver = NPSolver() base_solution = base_np_solver.solve(pfp_goal) print('Lemma for base case: zero + x = x')
import naturalproofs.proveroptions as proveroptions # Declarations x, y, nil = Consts('x y nil', fgsort) nxt = Function('nxt', fgsort, fgsort) lst = RecFunction('lst', fgsort, boolsort) ls = RecFunction('ls', fgsort, fgsort, boolsort) AddRecDefinition(lst, x, If(x == nil, True, lst(nxt(x)))) AddRecDefinition(ls, (x, y), If(x == nil, True, ls(nxt(x), y))) # Problem parameters goal = Implies(ls(x, nil), lst(x)) lemma1_params = (x, y) lemma1_body = Implies(And(ls(x, y), lst(y)), lst(x)) lemmas = {(lemma1_params, lemma1_body)} # Call a natural proofs solver npsolver = NPSolver() # Configure the solver npsolver.options.instantiation_mode = proveroptions.manual_instantiation npsolver.options.terms_to_instantiate = {x, y, nil} # Ask for proof npsolution = npsolver.solve(goal, lemmas) class LsListTest(unittest.TestCase): def test1(self): self.assertFalse(npsolution.if_sat) if __name__ == '__main__': unittest.main()