コード例 #1
0
    (s, worse), (s, better) = question
    arp_bb_question_list.append((s, better))

# Draw the collected ARP black-box test questions over the world's features.
# show=False is passed together with a filename, so the figure is presumably
# written to disk instead of being displayed -- TODO confirm in mdp_plot.
# NOTE(review): the output file is spelled 'arb-bb' while the list is named
# 'arp_bb' -- confirm which spelling is intended before renaming anything.
mdp_plot.plot_test_questions(
    arp_bb_question_list,
    world.features,
    walls=True,
    show=False,
    arrow_color='k',
    feature_colors=lava_colors,
    filename=os.path.join(project_path, 'figs/lava/arb-bb.png'),
)

# --- arp-pref ---
# Build a trajectory-ranking-based tester on the same world, with
# suboptimal rankings switched on.
tester = vav.TrajectoryRankingBasedTester(
    world,
    precision,
    rollout_length,
    debug,
    use_suboptimal_rankings=True,
)

# Print the value returned by get_size_verification_test(), labelled as the
# number of questions.
size_verification_test = tester.get_size_verification_test()
print("number of questions", size_verification_test)

# List every entry of tester.test, one per line.
print("arp-pref test questions")
for question in tester.test:
    print(question)

# Convert the tester's halfspaces to a NumPy array.
pref_halfspaces = np.array(tester.halfspaces)

for i, question in enumerate(tester.test):
    mdp_plot.plot_preference_query(question.traj_better,
                                   question.traj_worse,
                                   world.features,
コード例 #2
0
                        precision=precision,
                        epsilon_gap=eps_gap)

                elif verifier_name == "state-optimal-action_ranker":
                    tester = vav.RankingBasedTester(true_world,
                                                    precision,
                                                    debug=debug)

                elif verifier_name == "optimal_action":
                    tester = vav.OptimalRankingBasedTester(true_world,
                                                           precision,
                                                           debug=debug)

                elif verifier_name == "trajectory_aec":
                    tester = vav.TrajectoryRankingBasedTester(true_world,
                                                              precision,
                                                              rollout_length,
                                                              debug=debug)

                elif verifier_name == "optimal_action_allquestions":
                    tester = vav.OptimalRankingBasedTesterAll(true_world,
                                                              precision,
                                                              debug=debug)

                elif verifier_name == "scot":
                    tester = vav.SCOTVerificationTester(true_world,
                                                        precision,
                                                        num_rollouts,
                                                        rollout_length,
                                                        debug=debug)

                else:
コード例 #3
0
                elif verifier_name == "arp-bb":
                    tester = vav.ARPBlackBoxTester(true_world,
                                                   Qopt,
                                                   opt_policy,
                                                   precision,
                                                   debug=debug,
                                                   teacher=teacher,
                                                   tests=tests,
                                                   halfspaces=halfspaces)

                elif verifier_name == "arp-pref":
                    tester = vav.TrajectoryRankingBasedTester(
                        true_world,
                        Qopt,
                        opt_policy,
                        precision,
                        rollout_length,
                        debug=debug,
                        use_suboptimal_rankings=True)

                elif verifier_name == "scot":
                    tester = vav.SCOTVerificationTester(true_world,
                                                        Qopt,
                                                        opt_policy,
                                                        precision,
                                                        num_rollouts,
                                                        rollout_length,
                                                        debug=debug)

                else:
                    print("invalid verifier name")