Example #1
import numpy as np
from typing import List

def play_move(self, game: Game, moves: List[Move]):
    available_actions = [move.move_id for move in moves]
    start_state = game.get_nn_features(self)
    # Sample an action from the policy distribution over the available moves.
    action = np.random.choice(game.total_num_actions,
                              p=self.policy(
                                  start_state,
                                  available_actions=available_actions))
    move = self.action_to_move(action, moves)
    # Perform the action -> get the reward and observe the next state.
    new_state, reward = self.env.step(move)
    # A SARSA-style (on-policy) update would sample the next action here:
    # new_action = np.random.choice(
    #     game.total_num_actions,
    #     p=self.policy(new_state, available_actions=available_actions)
    # )
    q_values_new_state = self.estimator.predict(
        state_features=new_state, available_actions=available_actions)

    # The value we should have obtained: the Q-learning target policy is
    # greedy, hence the max over the next state's action values.
    td_target = reward + self.discount_factor * np.nanmax(
        q_values_new_state)
    self.estimator.update(action, start_state, td_target)
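
Example #1 is a semi-gradient Q-learning update: the estimator is queried for the next state's action values, the greedy target reward + discount_factor * max Q(new_state, a) is formed, and the estimate for the taken action is moved toward it. Below is a minimal sketch of an estimator compatible with the predict()/update() calls above; the class name and internals are assumptions, only the call signatures come from the example.

import numpy as np

class LinearQEstimator:
    """One weight vector per action: Q(s, a) = w_a . s (assumed structure)."""

    def __init__(self, num_actions: int, num_features: int, lr: float = 0.01):
        self.weights = np.zeros((num_actions, num_features))
        self.lr = lr

    def predict(self, state_features, available_actions):
        # Unavailable actions are left as NaN so the caller's np.nanmax()
        # only considers legal moves.
        q_values = np.full(len(self.weights), np.nan)
        for a in available_actions:
            q_values[a] = self.weights[a] @ state_features
        return q_values

    def update(self, action, state_features, td_target):
        # Semi-gradient step: move Q(s, a) toward the TD target for the
        # action that was actually taken.
        td_error = td_target - self.weights[action] @ state_features
        self.weights[action] += self.lr * td_error * np.asarray(state_features)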
Example #2
from typing import List

def play_move(self, game: Game, moves: List[Move]):
    available_actions = [move.move_id for move in moves]
    self.state = game.get_nn_features(self)
    if len(available_actions) == 1:
        # Only one legal move: no need to query the policy.
        self.action = available_actions[0]
    else:
        self.action = self._get_policy_action(game, available_actions)
    move = self._action_to_move(self.action, moves)
    # Perform the action -> get the reward and observe the next state.
    new_state, reward = self.env.step(move)
    if self.train:
        # Only update the estimator when training is enabled.
        td_target = self.get_td_target(new_state, reward, available_actions)
        self.estimator.update(self.state, td_target)
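
Example #2 moves the target computation into get_td_target(). A hedged sketch of what that method could compute, mirroring the greedy Q-learning target from Example #1 (the method name appears in the example; this body is an assumption, and numpy is assumed imported as np):

def get_td_target(self, new_state, reward, available_actions):
    # Greedy (Q-learning) target: reward plus the discounted value of the
    # best action the estimator sees in the next state.
    q_values_new_state = self.estimator.predict(
        state_features=new_state, available_actions=available_actions)
    return reward + self.discount_factor * np.nanmax(q_values_new_state)

One subtlety visible in the caller: it passes the actions that were legal in the old state. For games where the set of legal moves changes between turns, the next state's own legal moves would be the more accurate choice.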
Example #3
def _set_estimator(self, game: Game):
    if not self.estimator:
        # Linear function approximation over hand-crafted features.
        self.estimator = LinearEstimator(game.total_num_actions,
                                         game.get_linear_features(self))

Example #4

def _set_estimator(self, game: Game):
    if not self.estimator:
        # TensorFlow neural-network estimator over NN features.
        self.estimator = TensorflowNNEstimator(game.total_num_actions,
                                               game.get_nn_features(self))

Example #5

def _set_estimator(self, game: Game):
    if not self.estimator:
        # PyTorch estimator; optionally restores a saved model by name.
        self.estimator = TorchEstimator(game.total_num_actions,
                                        game.get_nn_features(self),
                                        load_model=self.load_model,
                                        name=self.name)
Example #6
def _set_estimator(self, game: Game):
    if not self.estimator:
        # Generic neural-network estimator over NN features.
        self.estimator = NeuralNetworkEstimator(game.total_num_actions,
                                                game.get_nn_features(self))
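
All four variants follow the same lazy-initialization pattern: the estimator is built on first use because its input width depends on the game's feature vector, which is only known once a concrete Game instance is in hand, and the `if not self.estimator` guard makes repeated calls no-ops. A minimal sketch of a call site, assuming _set_estimator is invoked at the top of play_move (the call site is not shown in these examples):

def play_move(self, game: Game, moves: List[Move]):
    # Lazily build the estimator on the first move of the first game.
    self._set_estimator(game)
    available_actions = [move.move_id for move in moves]
    ...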