Exemple #1
0
            actor = Actor.Actor(sess, state_dim, action_dim, actor_lr, tau,
                                batch_size)
        elif actor_type == "rnn":
            actor = RNNActor.Actor(sess, state_dim, action_dim, actor_lr, tau,
                                   batch_size, num_of_action)

        # Build the critic with the same session and state/action dimensions
        # the actor above was given; it also receives the actor's
        # trainable-variable count from actor.get_num_trainable_vars().
        critic = Critic.Critic(sess, state_dim, action_dim, critic_lr, tau,
                               gamma, actor.get_num_trainable_vars(),
                               critic_reg_weight)

        # Pick the noise object according to noise_type. There is no else
        # branch, so any value other than "gaussian" / "ou" leaves
        # actor_noise unassigned by this if/elif.
        if noise_type == "gaussian":
            actor_noise = Noise.GaussianNoise(action_dim=action_dim,
                                              sigma=sigma)
        elif noise_type == "ou":
            # mu is a zero vector with int(action_dim / num_of_action) entries
            # (true division followed by truncation to int).
            actor_noise = Noise.OrnsteinUhlenbeckActionNoise(mu=np.zeros(
                [int(action_dim / num_of_action)]),
                                                             sigma=sigma)

        # Hand the run's names and hyper-parameters to
        # utils.experiment_detail_saver and keep whatever it returns.
        exp_detail = utils.experiment_detail_saver(domain_name, task_name,
                                                   step_size, actor_lr,
                                                   critic_lr, tau, gamma,
                                                   sigma, batch_size,
                                                   critic_reg_weight)

        print(exp_detail)
        # Record num_of_action via utils.append_file_writer, called with
        # video_dir and "experiment_detail.txt" (presumably appends the text
        # to that file under video_dir -- confirm against utils), then echo
        # the same value to stdout.
        utils.append_file_writer(video_dir, "experiment_detail.txt", "num of action : " \
                        + str(num_of_action) + "\n")
        print("num of action : " + str(num_of_action))

        # actor_type is concatenated without str(), so it must already be a
        # string here.
        utils.append_file_writer(video_dir, "experiment_detail.txt", "actor type : " \
                         + actor_type + "\n")
Exemple #2
0
    # Fixed settings consumed further down: gamma and critic_reg_weight are
    # passed to Critic.Critic, sigma to whichever noise class is selected.
    gamma = 0.99
    sigma = 0.2
    critic_reg_weight = 0.0
    # Selects the noise class in the if/elif below.
    noise_type = "ou"

    # Guard: only the two values handled by the if/elif below are accepted.
    # NOTE(review): assert statements are removed when Python runs with -O,
    # so this check disappears in optimized mode.
    assert noise_type in ["ou","gaussian"]

    # Everything below runs inside a tf.Session created from tf_config and
    # bound to sess.
    with tf.Session(config=tf_config) as sess:
        # Original author's note: state_dim is 1-D, action_spec is scalar.
        # NOTE(review): the code below indexes env.action_spec().shape[0] and
        # uses it as the action dimension -- confirm what "scalar" refers to.
        actor = Actor.Actor(sess, state_dim, env.action_spec().shape[0], actor_lr, tau, batch_size)
        # The critic is built with the same dimensions and additionally
        # receives the actor's trainable-variable count.
        critic = Critic.Critic(sess, state_dim, env.action_spec().shape[0], critic_lr, tau, gamma, actor.get_num_trainable_vars(),critic_reg_weight)

        # Pick the noise object according to noise_type; both variants are
        # sized from env.action_spec().shape[0].
        if noise_type == "gaussian":
            actor_noise = Noise.GaussianNoise(action_dim=env.action_spec().shape[0],sigma=sigma)
        elif noise_type == "ou":
            # mu is a zero vector with one entry per action dimension.
            actor_noise = Noise.OrnsteinUhlenbeckActionNoise(mu=np.zeros([env.action_spec().shape[0]]), sigma=sigma)

        # Hand the run's names and hyper-parameters to
        # utils.experiment_detail_saver and keep whatever it returns.
        exp_detail = utils.experiment_detail_saver(
                            domain_name, task_name, step_size,
                            actor_lr, critic_lr, tau,
                            gamma, sigma, batch_size,
                            critic_reg_weight)

        print(exp_detail)
        # Each utils.append_file_writer call below is given video_dir,
        # "experiment_detail.txt" and a text payload (presumably appended to
        # that file under video_dir -- confirm against utils).
        # critic.critic_origin_type is concatenated without str(), so it must
        # already be a string.
        utils.append_file_writer(video_dir, "experiment_detail.txt", "Critic origin type : "\
                                 +critic.critic_origin_type+"\n")
        utils.append_file_writer(video_dir, "experiment_detail.txt", "Noise type : " \
                                 + noise_type + "\n")

        # Finally pass exp_detail itself (the value printed above) as the
        # payload.
        utils.append_file_writer(video_dir, "experiment_detail.txt",exp_detail)