def auto_td3_benchmarks():
    """Launch the TD3 benchmark runs.

    Every environment id in ``MuJoCo1M_ENV_SET`` except ``'Reacher-v2'`` is
    collected, in the set's iteration order, and handed together with
    ``td3_metarl_tf`` to ``iterate_experiments``.
    """
    skipped_env = 'Reacher-v2'

    selected_env_ids = []
    for candidate in MuJoCo1M_ENV_SET:
        if candidate != skipped_env:
            selected_env_ids.append(candidate)

    iterate_experiments(td3_metarl_tf, selected_env_ids)
def auto_vpg_benchmarks():
    """Launch the VPG benchmark runs.

    ``iterate_experiments`` is invoked once per VPG experiment -- the
    PyTorch one first, then the TensorFlow one -- each time with
    ``MuJoCo1M_ENV_SET``.
    """
    # Order matters: PyTorch is run before TensorFlow.
    for experiment in (vpg_metarl_pytorch, vpg_metarl_tf):
        iterate_experiments(experiment, MuJoCo1M_ENV_SET)
def auto_trpo_benchmarks():
    """Launch the TRPO benchmark runs.

    ``iterate_experiments`` is invoked once per TRPO experiment -- the
    PyTorch one first, then the TensorFlow one -- each time with
    ``MuJoCo1M_ENV_SET``.
    """
    # Order matters: PyTorch is run before TensorFlow.
    for experiment in (trpo_metarl_pytorch, trpo_metarl_tf):
        iterate_experiments(experiment, MuJoCo1M_ENV_SET)
def auto_ddpg_benchmarks():
    """Launch the DDPG benchmark runs.

    Hands ``ddpg_metarl_tf`` and ``MuJoCo1M_ENV_SET`` to
    ``iterate_experiments``.
    """
    experiment = ddpg_metarl_tf
    env_ids = MuJoCo1M_ENV_SET
    iterate_experiments(experiment, env_ids)
# Example no. 5
# 0
def continuous_mlp_q_function_tf_ddpg_benchmarks():
    """Launch the Continuous MLP QFunction benchmark runs on TF-DDPG.

    Hands ``continuous_mlp_q_function`` and ``MuJoCo1M_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = continuous_mlp_q_function
    env_ids = MuJoCo1M_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
def her_benchmarks():
    """Launch the HER benchmark runs.

    Hands ``her_metarl_tf`` and ``Fetch1M_ENV_SET`` to
    ``iterate_experiments``.
    """
    experiment, env_ids = her_metarl_tf, Fetch1M_ENV_SET
    iterate_experiments(experiment, env_ids)
def gaussian_cnn_baseline_tf_ppo_benchmarks():
    """Launch the Gaussian CNN Baseline benchmark runs on TF-PPO.

    Hands ``gaussian_cnn_baseline`` and ``PIXEL_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = gaussian_cnn_baseline
    env_ids = PIXEL_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
def gaussian_mlp_baseline_tf_ppo_benchmarks():
    """Launch the Gaussian MLP Baseline benchmark runs on TF-PPO.

    Hands ``gaussian_mlp_baseline`` and ``MuJoCo1M_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = gaussian_mlp_baseline
    env_ids = MuJoCo1M_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
def continuous_mlp_baseline_tf_ppo_benchmarks():
    """Launch the Continuous MLP Baseline benchmark runs on TF-PPO.

    Hands ``continuous_mlp_baseline`` and ``MuJoCo1M_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = continuous_mlp_baseline
    env_ids = MuJoCo1M_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
# Example no. 10
# 0
def gaussian_mlp_policy_tf_ppo_benchmarks():
    """Launch the Gaussian MLP Policy benchmark runs on TF-PPO.

    Hands ``gaussian_mlp_policy`` and ``MuJoCo1M_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = gaussian_mlp_policy
    env_ids = MuJoCo1M_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
# Example no. 11
# 0
def continuous_mlp_policy_tf_ddpg_benchmarks():
    """Launch the Continuous MLP Policy benchmark runs on TF-DDPG.

    Five distinct seeds are drawn at random from ``range(100)`` on every
    call and passed, with ``continuous_mlp_policy`` and
    ``MuJoCo1M_ENV_SET``, to ``iterate_experiments``.

    NOTE(review): sibling benchmark launchers pass a shared ``_seeds``
    value instead of sampling fresh seeds -- confirm whether this
    difference is intentional.
    """
    seed_pool = range(100)
    sampled_seeds = random.sample(seed_pool, 5)
    iterate_experiments(continuous_mlp_policy,
                        MuJoCo1M_ENV_SET,
                        seeds=sampled_seeds)
# Example no. 12
# 0
def categorical_mlp_policy_tf_ppo_benchmarks():
    """Launch the Categorical MLP Policy benchmark runs on TF-PPO.

    Hands ``categorical_mlp_policy`` and ``STATE_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = categorical_mlp_policy
    env_ids = STATE_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)
# Example no. 13
# 0
def categorical_cnn_policy_tf_ppo_benchmarks():
    """Launch the Categorical CNN Policy benchmark runs on TF-PPO.

    Hands ``categorical_cnn_policy`` and ``PIXEL_ENV_SET`` to
    ``iterate_experiments``, using the module-level ``_seeds``.
    """
    experiment = categorical_cnn_policy
    env_ids = PIXEL_ENV_SET
    iterate_experiments(experiment, env_ids, seeds=_seeds)