(s, worse), (s, better) = question arp_bb_question_list.append((s, better)) mdp_plot.plot_test_questions(arp_bb_question_list, world.features, walls=True, show=False, arrow_color='k', feature_colors=lava_colors, filename=os.path.join(project_path, 'figs/lava/arb-bb.png')) ###arp-pref tester = vav.TrajectoryRankingBasedTester(world, precision, rollout_length, debug, use_suboptimal_rankings=True) size_verification_test = tester.get_size_verification_test() print("number of questions", size_verification_test) print("arp-pref test questions") for question in tester.test: print(question) pref_halfspaces = np.array(tester.halfspaces) for i, question in enumerate(tester.test): mdp_plot.plot_preference_query(question.traj_better, question.traj_worse, world.features,
# NOTE(review): this excerpt opens with the closing keyword arguments of a
# call whose beginning is not visible here, and it ends on an `else:` whose
# body is not visible either. Only the branches in between are documented.
precision=precision, epsilon_gap=eps_gap)
# Each remaining branch binds `tester` to the vav tester selected by
# verifier_name. Every one is built from true_world and precision, with
# debug forwarded as a keyword.
elif verifier_name == "state-optimal-action_ranker":
    tester = vav.RankingBasedTester(true_world, precision, debug=debug)
elif verifier_name == "optimal_action":
    tester = vav.OptimalRankingBasedTester(true_world, precision, debug=debug)
elif verifier_name == "trajectory_aec":
    # Additionally takes rollout_length; use_suboptimal_rankings is not
    # passed here, so the class's own default applies.
    tester = vav.TrajectoryRankingBasedTester(true_world, precision, rollout_length, debug=debug)
elif verifier_name == "optimal_action_allquestions":
    tester = vav.OptimalRankingBasedTesterAll(true_world, precision, debug=debug)
elif verifier_name == "scot":
    # The only visible branch that takes both num_rollouts and rollout_length.
    tester = vav.SCOTVerificationTester(true_world, precision, num_rollouts, rollout_length, debug=debug)
else:
# Tail of the verifier_name dispatch (the opening `if` lies above this
# excerpt). Each branch binds `tester` to one vav tester; all of them receive
# true_world, Qopt, opt_policy and precision, with debug as a keyword.
elif verifier_name == "arp-bb":
    # The only visible branch that forwards teacher, tests and halfspaces.
    tester = vav.ARPBlackBoxTester(true_world, Qopt, opt_policy, precision, debug=debug, teacher=teacher, tests=tests, halfspaces=halfspaces)
elif verifier_name == "arp-pref":
    # Same tester class as a plain trajectory ranking test, but explicitly
    # switched to use_suboptimal_rankings=True.
    tester = vav.TrajectoryRankingBasedTester(
        true_world, Qopt, opt_policy, precision, rollout_length, debug=debug, use_suboptimal_rankings=True)
elif verifier_name == "scot":
    # Additionally takes num_rollouts and rollout_length.
    tester = vav.SCOTVerificationTester(true_world, Qopt, opt_policy, precision, num_rollouts, rollout_length, debug=debug)
else:
    # NOTE(review): an unrecognised name is only reported on stdout; this
    # branch binds no `tester`, so confirm that later code does not rely on
    # one being set here.
    print("invalid verifier name")