def main(): lake_env = gym.make('FrozenLake-v0', is_slippery=False) coffee_env = coffeegame.CoffeeEnv() taxi_env = gym.make('Taxi-v3').env lake_agent = QLearningAgent(lake_env, 100, 20000, decay_rate=0.001, alpha=0.1, gamma=0.6, epsilon=1, rendering_enabled=False) coffee_agent = QLearningAgent(coffee_env, 100, 20000, decay_rate=0.01, alpha=0.1, gamma=0.6, epsilon=1, rendering_enabled=False) taxi_agent = QLearningAgent(taxi_env, 150, 100000, decay_rate=0.01, alpha=0.1, gamma=0.6, epsilon=1, rendering_enabled=False) lake_agent.learn("FrozenLake-v0 (non-slippery)")
outstr+=' {:6.2f}'.format(val) print(outstr) LEFT = 0 DOWN = 1 RIGHT = 2 UP = 3 import coffeegame import numpy as np # import getch learning_rate = 0.1 discount_rate = 0.6 env = coffeegame.CoffeeEnv() action_space_size = env.action_space.n state_space_size = env.observation_space.n #create the qtable q_table = np.zeros((state_space_size, action_space_size)) #reset environment state = env.reset() while(True): #print some stuff env.render() printQTable(q_table) print('0: LEFT, 1: DOWN, 2: RIGHT, 3:UP') # get next action from user