Python negativeGrid示例

编程语言: Python

命名空间/包名称: gridWorld

方法/功能: negativeGrid

hotexamples.com的示例: 2

Python negativeGrid - 共找到 2 个示例。以下是从开源项目中提取的、评分最高的 gridWorld.negativeGrid 真实 Python 代码示例。您可以为示例评分，以帮助我们提高示例质量。

示例#1

显示文件

"""

import numpy as np
import matplotlib.pyplot as plt
from gridWorld import standardGrid, negativeGrid
from iterativePolicyEvaluation import printPolicy, printValues
from monteCarloControl import argMax
from td0Prediction import randomAction


# Numeric settings for this script. Neither value is read in the visible
# excerpt; presumably the discount factor and learning rate -- TODO confirm.
GAMMA = 0.9
ALPHA = 0.1
# The four action labels, stored as an (unordered) set.
ACTIONS = {'U', 'D', 'L', 'R'}

if __name__ == '__main__':
    # Build the grid with stepCost=-0.1 and print its reward table.
    grid = negativeGrid(stepCost=-0.1)

    print("Rewards:")
    printValues(grid.rewards, grid)

    # Q[state][action] starts at 0 for every state returned by the grid
    # and every label in ACTIONS.
    states = grid.allStates()
    Q = {state: dict.fromkeys(ACTIONS, 0) for state in states}

    # Starts out empty; nothing in the visible excerpt writes to it.
    updateCountsSarsa = {}

示例#2

显示文件

文件： valueIteration.py 项目： AidinFerdowsi/DynamicProgramming

Created on Mon Jan  7 11:37:45 2019

@author: user
"""

import numpy as np
from gridWorld import standardGrid, negativeGrid
from iterativePolicyEvaluation import printValues, printPolicy

# Small threshold constant; it is not read in the visible excerpt
# (presumably the convergence tolerance for value iteration -- TODO confirm).
# NOTE(review): the literal 10e-4 evaluates to 0.001 (i.e. 1e-3), not 1e-4;
# confirm which value was intended.
EPSILON = 10e-4
# Not read in the visible excerpt; presumably the discount factor -- verify.
GAMMA = 0.9
# Action labels; the script samples from this tuple with np.random.choice
# when it assigns an initial action to each state.
ACTIONS = ('U', 'D', 'L', 'R')

if __name__ == '__main__':

    grid = negativeGrid()

    policy = {}
    for s in grid.actions.keys():
        policy[s] = np.random.choice(ACTIONS)

    print("Rewards:")
    printValues(grid.rewards, grid)

    print("Initial Policy:")
    printPolicy(policy, grid)

    V = {}
    states = grid.allStates()

    for s in states: