Python DQN.load_state_dict示例

编程语言: Python

命名空间/包名称: dqnClass

类/类型: DQN

方法/功能: load_state_dict

hotexamples.com的示例: 2

Python DQN.load_state_dict - 共找到2个示例。以下是从开源项目中提取的、评价最高的 dqnClass.DQN.load_state_dict 真实 Python 用法示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

DQN(5)

eval(2)

load_state_dict(2)

chooseAction(1)

parameters(1)

state_dict(1)

storePastResults(1)

train(1)

示例#1

显示文件

文件： DQN_smaller.py 项目： sagau59/TetrisRepo

# Only the last two entries of init_screen.shape (height, width) are used
# to size the networks; the two leading entries are discarded.
_, _, screen_height, screen_width = init_screen.shape

# Number of discrete actions (hard-coded rather than read from an
# environment's action space).
n_actions = 4

# Two networks with the same architecture. policy_net is the one handed to
# the optimizer; target_net is initialised below from the same weights.
policy_net = DQN(screen_height, screen_width, n_actions, layers=20).to(device)
target_net = DQN(screen_height, screen_width, n_actions, layers=20).to(device)
PATH = 'C:/Users/sagau/Google Drive/smaller1.pth'
optimizer = optim.Adam(policy_net.parameters(), lr=1e-4)

# Set to True to resume from the checkpoint stored at PATH instead of
# starting a fresh run.
load_mode = False
if load_mode:
    # Deserialise onto the CPU so the checkpoint loads regardless of the
    # device it was saved from; load_state_dict copies the values into the
    # already-placed parameters.
    model_dict = torch.load(PATH, map_location=torch.device('cpu'))
    i_episode = model_dict['epoch']
    optimizer.load_state_dict(model_dict['optimizer'])
    # The checkpoint holds a single set of weights; both networks start
    # from it.
    policy_net.load_state_dict(model_dict['state_dict'])
    target_net.load_state_dict(model_dict['state_dict'])
    episode_durations = model_dict['episode_durations']
    total_reward_list = model_dict['total_reward_list']
    point_list = model_dict['point_list']
    plot_durations()
else:
    i_episode = 0
    target_net.load_state_dict(policy_net.state_dict())
    episode_durations = []
    total_reward_list = []
    point_list = []

# Put the target network in evaluation mode on BOTH paths. Previously this
# was done only for a fresh start, so a resumed run left target_net in
# training mode.
target_net.eval()

memory = ReplayMemory(10000000)
steps_done = 0

示例#2

显示文件

######################################################################

init_screen = get_screen()
# Only the last two entries of init_screen.shape (height, width) are used
# to size the network; the two leading entries are discarded.
_, _, screen_height, screen_width = init_screen.shape

# Number of discrete actions (hard-coded rather than read from an
# environment's action space).
n_actions = 4

# Alternative checkpoint path, left disabled:
#PATH = 'C:/Users/sagau/Desktop/Kaggle/TetrisRepo/models/model1_2.pth'
PATH = 'C:/Users/sagau/Google Drive/transfersmaller.pth'

# Build the network once, load the trained weights, and only then switch to
# evaluation mode. The earlier version called eval() on an instance that
# was immediately replaced, so the network actually used for play stayed in
# training mode.
policy_net = DQN(screen_height, screen_width, n_actions, layers=20).to(device)
# Deserialise onto the CPU so the checkpoint loads regardless of the device
# it was saved from; load_state_dict copies the values into the
# already-placed parameters.
model_dict = torch.load(PATH, map_location=torch.device('cpu'))
policy_net.load_state_dict(model_dict['state_dict'])
policy_net.eval()

######################################################################
# Play with model !
sleep_time = 0.2
game = Tetris(nb_rows=8, nb_cols=6)
# Generate the first block; the choice index is drawn uniformly from 0..3.
done = game.generate_block(choice=random.randint(0, 3))
# Running total of the values returned by game.clear_rows().
rows = 0
for t in count():
#    for t in range(200):
    state = get_screen()
    action = select_action(state,0)
#    print(action.item())
    game.play_active_block(action.item())
    if game.block_reached_end():
        rows = rows + game.clear_rows()