Python GridWorldMDP.__init__示例

编程语言: Python

命名空间/包名称: simple_rl.tasks.grid_world.GridWorldMDPClass

类/类型: GridWorldMDP

方法/功能: __init__

hotexamples.com的示例: 10

Python GridWorldMDP.__init__ - 已找到10个示例。这些是从开源项目中提取的、评价最高的simple_rl.tasks.grid_world.GridWorldMDPClass.GridWorldMDP.__init__真实Python示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示隐藏

__init__(8)

GridWorldMDP(2)

_transition_func(1)

execute_agent_action(1)

get_actions(1)

get_init_state(1)

reset(1)

reward_func(1)

transition_func(1)

示例#1

显示文件

 def __init__(self,
              gamma=0.99,
              slip_prob=0.00,
              name="puddle",
              puddle_rects=[(0.1, 0.8, 0.5, 0.7), (0.4, 0.7, 0.5, 0.4)],
              goal_locs=[[1.0, 1.0]],
              is_goal_terminal=True,
              rand_init=False,
              step_cost=0.0):
     '''
     Initialize a 1.0 x 1.0 grid world with puddles, starting at [0.25, 0.6].

     Args:
         gamma (float)
         slip_prob (float): forwarded to GridWorldMDP.__init__.
         name (str)
         puddle_rects (list): one 4-tuple per puddle; presumably
             (top_left_x, top_left_y, bot_right_x, bot_right_y) -- TODO
             confirm against the code that reads self.puddle_rects.
         goal_locs (list): list of [x, y] goal locations.
         is_goal_terminal (bool)
         rand_init (bool)
         step_cost (float)
     '''
     self.delta = 0.05
     # Copy so the instance never aliases the shared default list (or the
     # caller's list); mutating self.puddle_rects stays local to this MDP.
     self.puddle_rects = list(puddle_rects)
     GridWorldMDP.__init__(self,
                           width=1.0,
                           height=1.0,
                           init_loc=[0.25, 0.6],
                           goal_locs=goal_locs,
                           gamma=gamma,
                           # Previously accepted by this constructor but
                           # never handed to the parent.
                           slip_prob=slip_prob,
                           name=name,
                           is_goal_terminal=is_goal_terminal,
                           rand_init=rand_init,
                           step_cost=step_cost)

示例#2

显示文件

 def __init__(self, width=9, height=9, init_loc=(1, 1), goal_locs=[(9, 9)],
              gamma=0.99, slip_prob=0.00, name="four_room",
              is_goal_terminal=True, rand_init=False, step_cost=0.0):
     '''
     Initialize the grid world with walls from self._compute_walls.

     Args:
         width (int)
         height (int)
         init_loc (tuple: (int, int))
         goal_locs (list of tuples: [(int, int)...])
         gamma (float)
         slip_prob (float)
         name (str)
         is_goal_terminal (bool)
         rand_init (bool)
         step_cost (float)
     '''
     # Walls depend only on the grid dimensions.
     room_walls = self._compute_walls(width, height)
     # Everything except the three positional arguments goes by keyword.
     parent_kwargs = dict(
         goal_locs=goal_locs,
         walls=room_walls,
         gamma=gamma,
         slip_prob=slip_prob,
         name=name,
         is_goal_terminal=is_goal_terminal,
         rand_init=rand_init,
         step_cost=step_cost,
     )
     GridWorldMDP.__init__(self, width, height, init_loc, **parent_kwargs)

示例#3

显示文件

 def __init__(self, gamma=0.99, slip_prob=0.00, name="puddle", is_goal_terminal=True, rand_init=False):
     '''
     Initialize a 1.0 x 1.0 grid world starting at [0.0, 0.0].

     Args:
         gamma (float)
         slip_prob (float): forwarded to GridWorldMDP.__init__.
         name (str)
         is_goal_terminal (bool)
         rand_init (bool)
     '''
     # NOTE(review): goal_locs is passed as a flat [x, y] pair; if
     # GridWorldMDP expects a list of locations this should be
     # [[1.0, 1.0]] -- confirm before changing.
     GridWorldMDP.__init__(self,
                           width=1.0,
                           height=1.0,
                           init_loc=[0.0,0.0],
                           goal_locs=[1.0,1.0],
                           gamma=gamma,
                           # Previously accepted by this constructor but
                           # never handed to the parent.
                           slip_prob=slip_prob,
                           name=name,
                           is_goal_terminal=is_goal_terminal,
                           rand_init=rand_init)

示例#4

显示文件

 def __init__(self, width=9, height=9, init_loc=(1,1), goal_locs=[(9,9)], gamma=0.99):
     '''
     Initialize the grid world with walls from self._compute_walls.

     Args:
         width (int)
         height (int)
         init_loc (tuple: (int, int))
         goal_locs (list of tuples: [(int, int)...])
         gamma (float)
     '''
     # Walls depend only on the grid dimensions.
     computed_walls = self._compute_walls(width, height)
     GridWorldMDP.__init__(
         self,
         width,
         height,
         init_loc,
         goal_locs,
         walls=computed_walls,
         gamma=gamma,
     )

示例#5

显示文件

文件： PuddleMDPClass.py 项目： david-abel/simple_rl

 def __init__(self, gamma=0.99, slip_prob=0.00, name="puddle", puddle_rects=[(0.1, 0.8, 0.5, 0.7), (0.4, 0.7, 0.5, 0.4)], goal_locs=[[1.0, 1.0]], is_goal_terminal=True, rand_init=False, step_cost=0.0):
     '''
     Initialize a 1.0 x 1.0 grid world with puddles, starting at [0.25, 0.6].

     Args:
         gamma (float)
         slip_prob (float): forwarded to GridWorldMDP.__init__.
         name (str)
         puddle_rects (list): one 4-tuple per puddle; presumably
             (top_left_x, top_left_y, bot_right_x, bot_right_y) -- TODO
             confirm against the code that reads self.puddle_rects.
         goal_locs (list): list of [x, y] goal locations.
         is_goal_terminal (bool)
         rand_init (bool)
         step_cost (float)
     '''
     self.delta = 0.05
     # Copy so the instance never aliases the shared default list (or the
     # caller's list); mutating self.puddle_rects stays local to this MDP.
     self.puddle_rects = list(puddle_rects)
     # slip_prob was previously accepted by this constructor but never
     # handed to the parent.
     GridWorldMDP.__init__(self, width=1.0, height=1.0, init_loc=[0.25, 0.6], goal_locs=goal_locs, gamma=gamma, slip_prob=slip_prob, name=name, is_goal_terminal=is_goal_terminal, rand_init=rand_init, step_cost=step_cost)

示例#6

显示文件

文件： ColorMDPClass.py 项目： seansegal/simple_rl

 def __init__(self, width=9, height=9, rand_init=False, is_four_room=False, num_colors=5, init_loc=(1,1), goal_locs=[(9,9)], gamma=0.99, slip_prob=0.00, name="color"):
     '''
     Initialize a grid world whose initial state carries a random color.

     Args:
         width (int)
         height (int)
         rand_init (bool)
         is_four_room (bool): when true, walls come from self._compute_walls;
             otherwise the grid has no walls.
         num_colors (int): upper bound (inclusive) of the random color drawn
             for the initial state; also prefixed to the MDP name.
         init_loc (tuple: (int, int))
         goal_locs (list of tuples: [(int, int)...])
         gamma (float)
         slip_prob (float)
         name (str)
     '''
     self.num_colors = num_colors
     walls = self._compute_walls(width, height) if is_four_room else []

     # Color is drawn uniformly from 1..num_colors.
     start_color = random.randint(1, self.num_colors)
     init_state = ColorState(init_loc[0], init_loc[1], color=start_color)

     # The MDP name is the color count followed by the supplied name.
     full_name = str(self.num_colors) + name
     GridWorldMDP.__init__(
         self,
         width,
         height,
         init_loc,
         rand_init=rand_init,
         init_state=init_state,
         goal_locs=goal_locs,
         walls=walls,
         gamma=gamma,
         slip_prob=slip_prob,
         name=full_name,
     )

示例#7

显示文件

 def __init__(self, gamma=0.99, slip_prob=0.00, name="puddle", puddle_rects=[], goal_locs=[[1.0, 1.0]], is_goal_terminal=True, rand_init=False, step_cost=0.0):
     '''
     Initialize a 1.0 x 1.0 grid world starting at [0.6, 0.0] and open a
     720x720 pygame display.

     Args:
         gamma (float): forwarded to GridWorldMDP.__init__, but self.gamma is
             overwritten with 0.9 afterwards (see note below).
         slip_prob (float): forwarded to GridWorldMDP.__init__.
         name (str)
         puddle_rects (list): stored as self.puddle_rects; presumably one
             (top_left_x, top_left_y, bot_right_x, bot_right_y) tuple per
             puddle -- TODO confirm against the code that reads it.
         goal_locs (list): list of [x, y] goal locations.
         is_goal_terminal (bool)
         rand_init (bool)
         step_cost (float)
     '''
     self.delta = 0.2
     # Copy so the instance never aliases the shared default list (or the
     # caller's list); mutating self.puddle_rects stays local to this MDP.
     self.puddle_rects = list(puddle_rects)
     # slip_prob was previously accepted by this constructor but never
     # handed to the parent.
     GridWorldMDP.__init__(self, width=1.0, height=1.0, init_loc=[0.6, 0.0], goal_locs=goal_locs, gamma=gamma, slip_prob=slip_prob, name=name, is_goal_terminal=is_goal_terminal, rand_init=rand_init, step_cost=step_cost)
     self.screen = pygame.display.set_mode((720,720))
     # NOTE(review): this unconditionally replaces whatever gamma the caller
     # passed; kept as-is because existing behavior may depend on it.
     self.gamma = 0.9

示例#8

显示文件

文件： FourRoomMDPClass.py 项目： david-abel/simple_rl

 def __init__(self, width=9, height=9, init_loc=(1,1), goal_locs=[(9,9)], lava_locs=[()], gamma=0.99, slip_prob=0.00, name="four_room", is_goal_terminal=True, rand_init=False, lava_cost=0.01, step_cost=0.0):
     '''
     Initialize the grid world with walls from self._compute_walls.

     Args:
         width (int)
         height (int)
         init_loc (tuple: (int, int))
         goal_locs (list of tuples: [(int, int)...])
         lava_locs (list of tuples)
         gamma (float)
         slip_prob (float)
         name (str)
         is_goal_terminal (bool)
         rand_init (bool)
         lava_cost (float)
         step_cost (float)
     '''
     # Walls depend only on the grid dimensions.
     room_walls = self._compute_walls(width, height)
     # Everything except the three positional arguments goes by keyword.
     parent_kwargs = dict(
         goal_locs=goal_locs,
         lava_locs=lava_locs,
         walls=room_walls,
         gamma=gamma,
         slip_prob=slip_prob,
         name=name,
         is_goal_terminal=is_goal_terminal,
         rand_init=rand_init,
         lava_cost=lava_cost,
         step_cost=step_cost,
     )
     GridWorldMDP.__init__(self, width, height, init_loc, **parent_kwargs)

示例#9

显示文件

文件： LTLGridWorldMDPClass.py 项目： roma-patel/ltl-amdp

    def __init__(self,
                 ltltask='F a',
                 ap_map={'a': (1, 1)},
                 width=5,
                 height=3,
                 init_loc=(1, 1),
                 rand_init=False,
                 goal_locs=[(5, 3)],
                 lava_locs=[()],
                 walls=[],
                 is_goal_terminal=True,
                 gamma=0.99,
                 init_state=None,
                 slip_prob=0.0,
                 step_cost=0.0,
                 lava_cost=0.01,
                 name="gridworld"):
        '''
        Initialize the grid world, build the LTL automaton, then re-run
        MDP.__init__ with an initial state that includes the automaton state.

        Args:
            ltltask (str): passed to LTLautomata.
            ap_map (dict): stored as self.ap_map; presumably maps atomic
                proposition names to grid locations -- TODO confirm.
            width, height, init_loc, rand_init, goal_locs, lava_locs, walls,
            is_goal_terminal, gamma, init_state, slip_prob, step_cost,
            lava_cost, name: passed positionally, in that order, to
                GridWorldMDP.__init__.
        '''
        # These arguments are positional, so their order here is significant.
        GridWorldMDP.__init__(
            self, width, height, init_loc, rand_init, goal_locs, lava_locs,
            walls, is_goal_terminal, gamma, init_state, slip_prob, step_cost,
            lava_cost, name)

        self.ap_map = ap_map
        self.automata = LTLautomata(ltltask)
        self.init_q = self.automata.init_state

        # Build a fresh start state when none was supplied or random
        # initialization is on; otherwise reuse the one the parent stored.
        if init_state is None or self.rand_init:
            start_state = LTLGridWorldState(
                self.init_loc[0], self.init_loc[1], self.init_q)
        else:
            start_state = self.init_state

        MDP.__init__(
            self,
            LTLGridWorldMDP.ACTIONS,
            self._transition_func,
            self._reward_func,
            init_state=start_state,
            gamma=gamma,
        )
        self.cur_state = start_state

示例#10

显示文件

 def __init__(self,
              gamma=0.99,
              slip_prob=0.00,
              name="puddle",
              is_goal_terminal=True,
              rand_init=False):
     '''
     Initialize a 1.0 x 1.0 grid world with two fixed puddles, starting at
     [0.25, 0.6] with a single goal at [1.0, 1.0].

     Args:
         gamma (float)
         slip_prob (float): forwarded to GridWorldMDP.__init__.
         name (str)
         is_goal_terminal (bool)
         rand_init (bool)
     '''
     self.delta = 0.01
     # One 4-tuple per puddle; presumably
     # (top_left_x, top_left_y, bot_right_x, bot_right_y) -- TODO confirm.
     self.puddle_rects = [(0.1, 0.8, 0.5, 0.7), (0.4, 0.7, 0.5, 0.4)]
     GridWorldMDP.__init__(self,
                           width=1.0,
                           height=1.0,
                           init_loc=[0.25, 0.6],
                           goal_locs=[[1.0, 1.0]],
                           gamma=gamma,
                           # Previously accepted by this constructor but
                           # never handed to the parent.
                           slip_prob=slip_prob,
                           name=name,
                           is_goal_terminal=is_goal_terminal,
                           rand_init=rand_init)

Python GridWorldMDP.__init__示例

Python GridWorldMDP.__init__示例