def main():
    """Entry point: parse CLI args, load a JSON config, and run a training or
    evaluation session of the Extended Q-Learning agent in a Unity environment.

    Expects ``-c/--config`` naming a .json file under ``./configs``.
    """
    parser = argparse.ArgumentParser(description="Run Extended Q-Learning with given config")
    parser.add_argument("-c", "--config", type=str, metavar="", required=True,
                        help="Config file name - file must be available as .json in ./configs")
    args = parser.parse_args()

    # load config files
    with open(os.path.join(".", "configs", args.config), "r") as read_file:
        config = json.load(read_file)

    # env_path is stored as a list of path segments in the config; join it
    # into a platform-appropriate path for the Unity binary.
    env = UnityEnvironment(file_name=os.path.join(*config["general"]["env_path"]))
    agent = Agent(config=config)

    # Ensure the Unity environment is shut down even if train/test raises,
    # otherwise the external simulator process can be left orphaned.
    try:
        if config["train"]["run_training"]:
            scores = sessions.train(agent, env, config)
            helper.plot_scores(scores)
            agent.save()
        else:
            # Evaluation mode: restore previously saved weights first.
            agent.load()
            sessions.test(agent, env)
    finally:
        env.close()
# Store the transition and, at episode end, log/checkpoint progress.
# NOTE(review): this is the interior of an episode loop; names such as
# o_t, a_t, r_tp1, c, agent, dqn_env, tsp_computer, max_reward, best_tsp,
# global_step, save_dir, log and the per-episode stat lists come from the
# enclosing scope (not visible in this chunk).
# Observations are reshaped to (x_dim, y_dim, 2) — presumably a 2-channel
# grid encoding; confirm against the environment definition.
o_t_reshaped = np.reshape(o_t, (x_dim, y_dim, 2))
o_tp1_reshaped = np.reshape(o_tp1, (x_dim, y_dim, 2))
agent.update_replay_memory(o_t_reshaped, a_t, r_tp1, o_tp1_reshaped, episode_done)
ep_reward += r_tp1

if not c.test and episode_done:
    # Cost of the route the agent actually walked this episode.
    tsp_cost = tsp_computer.rl_cost(dqn_env.steps)

    # New best episode reward -> checkpoint the model.
    if max_reward < ep_reward:
        str_out = 'max_reward={} < ep_reward={}'.format(max_reward, ep_reward)
        max_reward = ep_reward
        agent.save(global_step=global_step)
        log.debug(
            'saving graph {} -> steps: \n{}, \nstep_length: {}, rl_cost: {}, reward: {}, str_out={}'
            .format(global_step, dqn_env.steps, len(dqn_env.steps),
                    tsp_cost, ep_reward, str_out))

    # A complete tour (visited every coordinate) with a new best cost is
    # appended to the path log for later inspection.
    if len(dqn_env.steps) == len(tsp_computer.coords.keys()) and best_tsp > tsp_cost:
        best_tsp = tsp_cost
        with open(os.path.join(save_dir, "path.txt"), "a") as myfile:
            myfile.write('iteration {}, rl_cost {}: {}\n'.format(
                global_step, tsp_cost, dqn_env.steps))

    # Per-episode statistics. Reuse tsp_cost instead of recomputing
    # rl_cost(dqn_env.steps): steps has not changed since it was computed.
    completed_episodes += 1
    episode_reward.append(ep_reward)
    episode_length.append(t)
    rl_cost.append(tsp_cost)