class ArrowConstructionTransformTrainer(ArrowConstructionTransform):
    """Trains a Q-learning policy for the arrow-construction transform.

    A minimal 1x1 training World is enough here: the reduced state space
    only tracks a resource flag and the arrow-construction progress.
    """

    def __init__(self):
        # Parent defines state_space / actions / reduce_state.
        ArrowConstructionTransform.__init__(self)
        # Single-cell world used purely as a training sandbox.
        self.training_world = World(1, 1)
        self.reset_training_world()

    def learn_policy(self):
        """Run Q-learning over the reduced state space and return the policy."""
        qlearner = QLearner(
            self.state_space,
            self.actions,
            self.handle_action,
            self.reset_training_world
        )
        # Reward reaching Arrows_Complete for either value of state
        # component 0 (the resource dimension).
        arrows_done = self.state_space[1].index(World.ArrowState.Arrows_Complete)
        goal_states = [(0, arrows_done), (1, arrows_done)]
        for goal_state in goal_states:
            qlearner.set_r_value(goal_state, 100)
        # 300 episodes of at most 30 steps each.
        qlearner.execute(goal_states, 300, 30)
        return qlearner.get_policy()

    def expand_training_state(self, reduced_state):
        """Expand a reduced state tuple into a full World.State for training."""
        expanded_state = World.State.from_state(self.training_world.agent_state)
        expanded_state.arrows = self.state_space[1][reduced_state[1]]
        # Component 0 is treated as a truthy "has resources" flag: grant
        # either all needed minerals/bamboo or none at all.
        has_resources = self.state_space[0][reduced_state[0]]
        expanded_state.minerals = expanded_state._world.needed_minerals if has_resources else 0
        expanded_state.bamboo = expanded_state._world.needed_bamboo if has_resources else 0
        return expanded_state

    def reset_training_world(self):
        """Reset the single training site back to Useless."""
        self.training_world.world_state[0][0] = World.SiteState.Useless

    def handle_action(self, reduced_state, action_index):
        """Apply one action in the training world; return the new reduced state."""
        action = self.actions[action_index]
        expanded_state = self.expand_training_state(reduced_state)
        expanded_state = self.training_world.perform_action(expanded_state, action)
        return self.reduce_state(expanded_state)
class BambooTransformTrainer(BambooTransform):
    """Trains a Q-learning policy for the bamboo-planting transform.

    Uses a 1x1 training World whose only varying state is the single
    site's SiteState.
    """

    def __init__(self):
        # Parent defines state_space / actions / reduce_state.
        BambooTransform.__init__(self)
        self.training_world = World(1, 1)
        self.reset_training_world()

    def learn_policy(self):
        """Run Q-learning over the site-state space and return the policy."""
        qlearner = QLearner(
            self.state_space,
            self.actions,
            self.handle_action,
            self.reset_training_world
        )
        # NOTE(review): Useless is also the reset state, yet it is rewarded
        # as a goal alongside Bamboo_Planted. Presumably a terminal
        # "nothing to do here" state -- confirm against the transform's
        # intended semantics.
        goal_states = [
            (self.state_space[0].index(World.SiteState.Useless),),
            (self.state_space[0].index(World.SiteState.Bamboo_Planted),)
        ]
        for goal_state in goal_states:
            qlearner.set_r_value(goal_state, 100)
        # 250 episodes of at most 15 steps each.
        qlearner.execute(goal_states, 250, 15)
        return qlearner.get_policy()

    def expand_training_state(self, reduced_state):
        """Expand a reduced state, writing the site state into the world."""
        expanded_state = World.State.from_state(self.training_world.agent_state)
        # The reduced state indexes the SiteState of the lone cell.
        self.training_world.world_state[0][0] = self.state_space[0][reduced_state[0]]
        return expanded_state

    def reset_training_world(self):
        """Reset the single training site back to Useless."""
        self.training_world.world_state[0][0] = World.SiteState.Useless

    def handle_action(self, reduced_state, action_index):
        """Apply one action in the training world; return the new reduced state."""
        action = self.actions[action_index]
        expanded_state = self.expand_training_state(reduced_state)
        expanded_state = self.training_world.perform_action(expanded_state, action)
        return self.reduce_state(expanded_state)
class PositionTransformTrainer(PositionTransform):
    """Trains a Q-learning policy for the agent-position transform.

    Uses a 3x3 training World with a mineral deposit at the centre cell
    so the (At, At) relative-position state has a concrete target.
    """

    def __init__(self):
        # Parent defines state_space / actions / reduce_state.
        PositionTransform.__init__(self)
        self.training_world = World(3, 3)
        # world_state is indexed [row][col]; place the deposit at the cell
        # corresponding to the (At, At) relative-position state.
        row = PositionTransform.VerticleState.At + 1
        col = PositionTransform.HorizontalState.At + 1
        self.training_world.world_state[row][col] = World.SiteState.Mineral_Deposit

    def learn_policy(self):
        """Run Q-learning over the position state space and return the policy."""
        qlearner = QLearner(
            self.state_space,
            self.actions,
            self.handle_action,
            self.reset_training_world
        )
        # Single goal: standing on the deposit, (x, y) == (At, At).
        goal_states = [
            (PositionTransform.HorizontalState.At + 1,
             PositionTransform.VerticleState.At + 1)
        ]
        for goal_state in goal_states:
            qlearner.set_r_value(goal_state, 100)
        # 300 episodes of at most 50 steps each.
        qlearner.execute(goal_states, 300, 50)
        return qlearner.get_policy()

    def expand_training_state(self, reduced_state):
        """Expand a reduced (x, y) position into a full World.State."""
        expanded_state = World.State.from_state(self.training_world.agent_state)
        expanded_state.x = reduced_state[0]
        expanded_state.y = reduced_state[1]
        return expanded_state

    def reset_training_world(self):
        """No-op: the 3x3 training world is static for this transform."""
        pass

    def handle_action(self, reduced_state, action_index):
        """Apply one action in the training world; return the new reduced state."""
        action = self.actions[action_index]
        expanded_state = self.expand_training_state(reduced_state)
        expanded_state = self.training_world.perform_action(expanded_state, action)
        return self.reduce_state(expanded_state)
class FullTransformTrainer(FullTransform): def __init__(self, cell_width, cell_height): # Initialize super. FullTransform.__init__(self, cell_width, cell_height) # Define training world. self.training_world = World(cell_width, cell_height) self.reset_training_world() # Learn the Q-table. def learn_policy(self): # Initialize Q-learner. qlearner = QLearner( \ self.state_space, self.actions, self.handle_action, self.reset_training_world ) # Initialize goal states. goal_states = [] print "Enumerating goal states..." print self.state_space_dim for state_index in xrange(qlearner.r_table.size): state = numpy.unravel_index(state_index, qlearner.r_table.shape) if state[FullTransform.StateOffset.Arrows] == World.ArrowState.Arrows_Complete: goal_states.append(tuple(state)) print "Goal states: %d" % len(goal_states) for goal_state in goal_states: qlearner.set_r_value( goal_state, 100 ) #print qlearner.r_table # Run Q-learner. print "Total states: %d" % (qlearner.r_table.size) qlearner.execute(goal_states, 500000, 50) # Return policy. return qlearner.get_policy() # Expands the reduced state into the training world. def expand_training_state(self, reduced_state): # Set world state based on reduced state. expanded_state = World.State.from_state(self.training_world.agent_state) world = expanded_state._world # Set world state. for index in xrange(self.world_size): (x, y) = numpy.unravel_index(index, self.world_shape) world.world_state[y][x] # Set other elements. expanded_state.x = reduced_state[FullTransform.StateOffset.X] expanded_state.y = reduced_state[FullTransform.StateOffset.Y] expanded_state.minerals = 50 * reduced_state[FullTransform.StateOffset.Minerals] expanded_state.bamboo = 50 * reduced_state[FullTransform.StateOffset.Bamboo] expanded_state.arrows = reduced_state[FullTransform.StateOffset.Arrows] return expanded_state # Resets the training world. def reset_training_world(self): pass # Handles an action. 
def handle_action(self, reduced_state, action_index): action = self.actions[action_index] expanded_state = self.expand_training_state(reduced_state) expanded_state = self.training_world.perform_action(expanded_state, action) new_reduced_state = self.reduce_state(expanded_state) return new_reduced_state