예제 #1
0
파일: pointmass.py 프로젝트: jcoreyes/erl
                batch_size=128,
                lr=1e-3,
                # weight_decay=0.01,
            ),
            save_period=5,
        ),
        renderer_kwargs=dict(
            # create_image_format='HWC',
            # output_image_format='CWH',
            output_image_format='CHW',
            flatten_image=True,
            # normalize_image=False,
        ),
        evaluation_goal_sampling_mode="reset_of_env",
        exploration_goal_sampling_mode="vae_prior",
        launcher_config=dict(unpack_variant=True, ))

    search_space = {
        "seed": range(5),
    }
    sweeper = hyp.DeterministicHyperparameterSweeper(
        search_space,
        default_parameters=variant,
    )

    variants = []
    for variant in sweeper.iterate_hyperparameters():
        variants.append(variant)

    run_variants(rig_experiment, variants, process_args)
예제 #2
0
            dict(m=0, b=0),
        ],
        'qf_kwargs.output_activation': [Clamp(max=0)],
    }
    sweeper = hyp.DeterministicHyperparameterSweeper(
        search_space,
        default_parameters=variant,
    )

    variants = []
    for variant in sweeper.iterate_hyperparameters():
        env_type = variant['env_type']
        eval_goals = 'sasha/presampled_goals/affordances/combined/{0}_goals.pkl'.format(
            env_type)
        variant['presampled_goal_kwargs']['eval_goals'] = eval_goals

        if env_type in ['top_drawer', 'bottom_drawer']:
            variant['env_class'] = SawyerRigAffordancesV0
            variant['env_kwargs']['env_type'] = env_type
        if env_type == 'tray':
            variant['env_class'] = SawyerRigMultiobjTrayV0
        if env_type == 'pnp':
            variant['env_class'] = SawyerRigMultiobjV0

        variants.append(variant)

    run_variants(awac_rig_experiment,
                 variants,
                 run_id=0,
                 process_args_fn=process_args)  #HERE
예제 #3
0
        # 'num_pybullet_objects':[None],
        'policy_kwargs.min_log_std': [-6],
        'trainer_kwargs.awr_weight': [1.0],
        'trainer_kwargs.awr_use_mle_for_vf': [True, ],
        'trainer_kwargs.awr_sample_actions': [False, ],
        'trainer_kwargs.clip_score': [2, ],
        'trainer_kwargs.awr_min_q': [True, ],
        'trainer_kwargs.reward_transform_kwargs': [None, ],
        'trainer_kwargs.terminal_transform_kwargs': [dict(m=0, b=0),],
        'qf_kwargs.output_activation': [Clamp(max=0)],
    }
    sweeper = hyp.DeterministicHyperparameterSweeper(
        search_space, default_parameters=variant,
    )

    variants = []
    for variant in sweeper.iterate_hyperparameters():
        env_type = variant['env_type']
        obj = variant['env_kwargs']['object_subset'][0]
        eval_goals = 'sasha/presampled_goals/affordances/combined/{0}_{1}_goals.pkl'.format(env_type, obj)
        variant['presampled_goal_kwargs']['eval_goals'] = eval_goals

        if env_type == 'tray':
            variant['env_class'] = SawyerRigMultiobjTrayV0
        if env_type == 'pnp':
            variant['env_class'] = SawyerRigMultiobjV0

        variants.append(variant)

    run_variants(awac_rig_experiment, variants, run_id=50) #HERE