def get_actions(): possibleTorques = np.array([-1.0, 0.0, 1.0]) possibleActions = np.array( list( possibleIterations(possibleTorques, possibleTorques, possibleTorques, possibleTorques))) return possibleActions
def __init__(self): self.env = gym.make("BipedalWalker-v2") self.obs = self.env.reset() self.bestScore = 0 possibleTorques = np.array([-1.0, 0.0, 1.0]) self.possibleActions = np.array(list(possibleIterations(possibleTorques, possibleTorques, possibleTorques, possibleTorques))) print(self.possibleActions.shape) tf.reset_default_graph() self.initNetworkGraph()