def main(argv) -> None:
    """Run ``Dagger.test`` for the policy and environment selected by ``argv``.

    The parsed arguments are used three ways: ``env_args`` derives the
    environment settings from them, ``args.policy_source`` names the module
    that provides ``DaggerPolicy``, and the full argument namespace is
    forwarded as keyword arguments to both the policy and ``Dagger``.

    The environment is closed even when a later step raises.

    Args:
        argv: Command-line arguments, handed unchanged to ``get_args``.
    """
    args = get_args(argv)

    env_settings = env_args(args)
    print(env_settings)
    env = make(**vars(env_settings))
    try:
        # The policy implementation is chosen at run time: the module named
        # by ``args.policy_source`` must expose a ``DaggerPolicy`` class.
        policy_module = import_module(args.policy_source)
        policy = policy_module.DaggerPolicy(**vars(args))

        dagger = Dagger(env, policy, **vars(args))
        # Fixed probe count for this entry point, assigned after construction
        # (what a "probe" means is defined by ``Dagger``).
        dagger.num_probes = 10
        dagger.test(args.save_file_name)
    finally:
        # Release the environment on both the success and the failure path.
        env.close()
def main(argv) -> None:
    """Run ``Dagger.explore_only`` with a fixed rollout configuration.

    The policy is built from the ``DaggerPolicy`` class of the module named by
    ``args.policy_source``; the environment is built from the settings that
    ``env_args`` derives from the parsed arguments. Before ``Dagger`` is
    constructed, ``args.iterations`` is forced to 0 and ``args.num_rollouts``
    to 250, overriding any values parsed from ``argv``.

    The environment is closed even when a later step raises.

    Args:
        argv: Command-line arguments, handed unchanged to ``get_args``.
    """
    args = get_args(argv)

    # The policy is constructed before the overrides below, so it sees the
    # arguments exactly as parsed.
    policy_module = import_module(args.policy_source)
    policy = policy_module.DaggerPolicy(**vars(args))

    env_settings = env_args(args)
    env = make(**vars(env_settings))
    try:
        # Hard-coded run configuration for this entry point.
        args.iterations = 0
        args.num_rollouts = 250
        print(args.num_rollouts)

        dagger = Dagger(env, policy, **vars(args))
        # Assigned after construction (what a "probe" means is defined by
        # ``Dagger``).
        dagger.num_probes = 0
        dagger.explore_only()
    finally:
        # Release the environment on both the success and the failure path.
        env.close()