Python Network.set_weightsの例

プログラミング言語: Python

名前空間/パッケージ名: models.network

クラス/型: Network

メソッド/関数: set_weights

hotexamples.comのコード掲載数: 2

Python Network.set_weights - 2件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのmodels.network.Network.set_weightsの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Network(30)

load_state_dict(8)

parameters(4)

cuda(4)

inference(4)

generate_share_alphas(4)

get_by_id(3)

eval(3)

state_dict(3)

get_sub_net(3)

set_weights(2)

get_weights(2)

training_steps(2)

train_step(1)

save(1)

optional_label(1)

recurrent_inference(1)

symbols(1)

to(1)

reactions(1)

train(1)

species(1)

initial_inference(1)

named_parameters(1)

loss_function(1)

load_from_file(1)

SaveModelReport(1)

get_variables(1)

get_channel_frequency(1)

get_by_owner(1)

getInstances(1)

getInstance(1)

forward(1)

feedForward(1)

computeLoss(1)

backwardPropagate(1)

SetReportingOn(1)

update_training_steps(1)

コード例 #1

ファイルを表示

ファイル: __init__.py プロジェクト: ipsec/muzero

class SharedStorage(object):
    """Wrap a ``Network`` and record whether its weights were ever replaced.

    The ``started`` flag is ``False`` on construction and becomes ``True``
    after the first call to ``update_network``.
    """

    def __init__(self, config: MuZeroConfig):
        """Build a fresh ``Network`` from *config* with the flag cleared."""
        self._started = False
        self.config = config
        self.network = Network(config)

    def get_network_weights(self):
        """Return whatever ``Network.get_weights()`` reports right now."""
        current_weights = self.network.get_weights()
        return current_weights

    def update_network(self, weights):
        """Load *weights* into the wrapped network and mark storage started."""
        self.network.set_weights(weights)
        if self._started:
            # Already flagged by an earlier update; nothing more to do.
            return
        self._started = True

    def started(self):
        """Return the started flag."""
        return self._started

コード例 #2

ファイルを表示

ファイル: actor.py プロジェクト: ipsec/muzero

class Actor:
    """Self-play worker that plays games with its own ``Network`` copy.

    Every finished game is handed to the replay buffer. Once the storage
    reports that it has started, the local network weights are refreshed
    from it whenever ``games_played`` is a multiple of
    ``config.checkpoint_interval``.
    """

    def __init__(self,
                 config: MuZeroConfig,
                 storage: SharedStorage,
                 replay_buffer: ReplayBuffer,
                 temperature: float = 1.0):
        """Create the local network, the summary writer and the metrics.

        Args:
            config: Run configuration read throughout the class.
            storage: Handle whose ``started`` and ``get_network_weights``
                methods are invoked through ``.remote()``.
            replay_buffer: Handle whose ``save_game`` method is invoked
                through ``.remote()``.
            temperature: Starting temperature; ``play_game`` decays it and
                it is also embedded in the actor's name.
        """
        # Plain state first.
        self.config = config
        self.storage = storage
        self.replay_buffer = replay_buffer
        self.temperature = temperature
        self.games_played = 0
        self.started = False

        # Objects built from the state above (construction order kept).
        self.network = Network(config)
        self.name = f"games-{temperature}"
        self.summary = create_summary(name=self.name)
        self.metrics_games = Sum(self.name, dtype=tf.int32)
        self.metrics_temperature = Sum(self.name, dtype=tf.float32)
        self.metrics_rewards = Mean(self.name, dtype=tf.float32)

    def update_metrics(self):
        """Write the three scalars at step ``games_played``, then reset two.

        Only the temperature and reward metrics are reset; the games metric
        keeps accumulating across calls.
        """
        step = self.games_played
        scalars = (
            ('games-played', self.metrics_games),
            ('games-temperature', self.metrics_temperature),
            ('games-rewards', self.metrics_rewards),
        )
        with self.summary.as_default():
            for tag, metric in scalars:
                tf.summary.scalar(tag, metric.result(), step)

        self.metrics_temperature.reset_states()
        self.metrics_rewards.reset_states()

    def start(self):
        """Play games until ``games_played`` reaches ``config.training_steps``."""
        while self.games_played < self.config.training_steps:
            finished_game = self.play_game()
            self.games_played += 1
            self.metrics_games(1)
            self.metrics_rewards(sum(finished_game.rewards))
            self.update_metrics()

            self.replay_buffer.save_game.remote(finished_game)

            if self.started:
                at_checkpoint = (
                    self.games_played % self.config.checkpoint_interval == 0)
                if at_checkpoint:
                    pending = self.storage.get_network_weights.remote()
                    self.network.set_weights(ray.get(pending))
            else:
                # Storage was not started when last checked: ask again and
                # skip the weight refresh for this iteration.
                self.started = ray.get(self.storage.started.remote())

        print(f"Actor: {self.name} finished.")

    def play_game(self) -> Game:
        """Play one game to the end (or to ``config.max_moves``) and return it."""
        game = Game(self.config.discount)
        min_max_stats = MinMaxStats(self.config.known_bounds)

        # Exponential decay of the temperature over the network's training
        # steps, never going below the configured minimum.
        decay_base = 1 - self.config.temperature_decay_factor
        decayed = self.temperature * decay_base ** self.network.training_steps()
        temperature = max(decayed, self.config.temperature_min)
        self.metrics_temperature(temperature)

        while True:
            if game.terminal() or len(game.history) >= self.config.max_moves:
                break

            root = self._search_from_current_position(game, min_max_stats)
            chosen_action = select_action(root, temperature)
            game.apply(chosen_action)
            game.store_search_statistics(root)

        return game

    def _search_from_current_position(self, game, min_max_stats):
        """Build a root node for the latest observation and run MCTS on it."""
        # The root is expanded from the network's initial inference on the
        # most recent observation.
        root = Node(0)
        latest_observation = game.get_observation_from_index(-1)
        initial_output = self.network.initial_inference(latest_observation)
        expand_node(root, game.to_play(), game.legal_actions(),
                    initial_output)
        backpropagate([root], initial_output.value, game.to_play(),
                      self.config.discount, min_max_stats)
        add_exploration_noise(self.config, root)

        # The tree search itself relies only on the action history and the
        # network.
        run_mcts(self.config, root, game.action_history(), self.network,
                 min_max_stats)
        return root