コード例 #1
0
    parser.add_argument('--net_size', type=int, default=None)
    parser.add_argument('--exp_name', type=str, default=None)
    # parser.add_argument('--exp_name', type=str, default=timestamp())
    # parser.add_argument('--mode', type=str, default='local')
    # parser.add_argument('--log_dir', type=str, default=None)
    args = parser.parse_args()

    return args


if __name__ == "__main__":
    args = parse_args()

    if args.env is None:
        variant = ENV_PARAMS[DEFAULT_ENV]
    else:
        variant = ENV_PARAMS[args.env]

    # Net size
    if args.net_size is not None:
        variant['net_size'] = args.net_size

    # Experiment name
    if args.exp_name is None:
        exp_name = variant['env_name']
    else:
        exp_name = args.exp_name

    setup_logger(exp_name, variant=variant)
    experiment(variant)
コード例 #2
0
        expt_variant['env_params']['subtask'] = args.subtask

    expt_variant['log_dir'] = args.log_dir
    expt_variant['load_dir'] = args.load_dir

    # Net size
    if args.net_size is not None:
        expt_variant['net_size'] = args.net_size

    expt_variant['gpu'] = args.gpu

    expt_variant['seed'] = args.seed

    expt_variant['render_q'] = args.render_q

    # Algo params
    expt_variant['algo_params']['render'] = args.render

    log_dir = setup_logger(expt_name,
                           variant=expt_variant,
                           snapshot_mode=args.snap_mode,
                           snapshot_gap=args.snap_gap,
                           log_dir=args.log_dir)
    dir_filename = os.path.realpath(__file__)
    filename = os.path.split(dir_filename)[1]
    copyfile(dir_filename, os.path.join(log_dir, filename))

    algo = experiment(expt_variant)

    # input('Press a key to close the script...')
コード例 #3
0
ファイル: sac_ant.py プロジェクト: domingoesteban/robolearn
    )
    algorithm = SoftActorCritic(env=env,
                                policy=policy,
                                qf=qf,
                                vf=vf,
                                **variant['algo_params'])
    if ptu.gpu_enabled():
        algorithm.cuda()
    algorithm.train()


if __name__ == "__main__":
    # noinspection PyTypeChecker
    variant = dict(
        algo_params=dict(
            num_epochs=1000,
            num_steps_per_epoch=1000,
            num_steps_per_eval=1000,
            batch_size=128,
            max_path_length=999,
            discount=0.99,
            soft_target_tau=0.001,
            policy_lr=3E-4,
            qf_lr=3E-4,
            vf_lr=3E-4,
        ),
        net_size=300,
    )
    setup_logger('name-of-experiment', variant=variant)
    experiment(variant)