Exemple #1
0
        cost=dict(
            cost_type='nn',
            network=(
                nn.Relu(ds, 200) >> nn.Relu(200) >> nn.Gaussian(1)
            ),
        ),

    ),
    train=dict(
        num_epochs=1000,
        learning_rate=1e-3,
        model_learning_rate=1e-3 * horizon,
        beta_start=1e-4,
        beta_end=10.0,
        beta_rate=5e-5,
        beta_increase=0,
        batch_size=2,
        dump_every=100,
        summary_every=50,
    ),
    data=dict(
        num_rollouts=100,
        init_std=0.5,
        smooth_noise=True,
    ),
    dump_data=True,
    seed=0,
    out_dir='out/vae/reacher',
)
run(experiment, remote=False, gpu=False, num_threads=1, instance_type='m5.4xlarge')
Exemple #2
0
from parasol.experiment import run, sweep

experiment = dict(
    experiment_type='solar',
    experiment_name='reacher-mpc',
    env={
        "environment_name": "Reacher",
    },
    control={
        'control_type': 'mpc',
        'horizon': 20,
    },
    # model='s3://parasol-experiments/vae/reacher-image/reacher-image_model{prior{prior_type}}-blds/weights/model-1700.pkl',
    model='out/reacher_mpc/nnds/weights/model-final.pkl',
    horizon=50,
    seed=0,
    rollouts_per_iter=2,
    num_iters=20,
    num_videos=2,
    out_dir='out/solar/reacher_mpc',
    model_train={'num_epochs': 100})
run(experiment, remote=False)
Exemple #3
0
        'random_target': False,
        'pd_cost': True,
        'easy_cost': False,
    },
    control=dict(
        control_type='lqrflm',
        data_strength=50,
        prior_type='model',
        horizon=50,
        init_std=0.5,
        kl_step=2.0,
    ),
    model='data/vae/reacher-image/weights/model-final.pkl',
    horizon=50,
    seed=0,
    rollouts_per_iter=40,
    num_iters=10,
    buffer_size=None,
    smooth_noise=False,
    num_videos=2,
    out_dir='data/solar/reacher-image/',
    model_train={
        'num_epochs': 0
    }
)
run(
    experiment,
    remote=False,
    num_threads=1,
)