Python TrainingBatch._replace Examples

Programming Language: Python

Namespace/Package Name: ml.rl.types

Class/Type: TrainingBatch

Method/Function: _replace

Examples at hotexamples.com: 3

Python TrainingBatch._replace - 3 examples found. These are the top-rated real-world Python examples of ml.rl.types.TrainingBatch._replace extracted from open source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

TrainingBatch(4)

_replace(3)

as_parametric_sarsa_training_batch(1)

Example #1

Show file

File: batch_preprocessor.py Project: Fengdan92/Horizon

    def __call__(self, batch: TrainingBatch) -> TrainingBatch:
        """Return a copy of ``batch`` with state features preprocessed.

        ``self.state_preprocessor`` is called with the ``value`` and
        ``presence`` of the ``float_features`` of ``state`` and then of
        ``next_state``; each result replaces the corresponding
        ``float_features`` via ``_replace``.

        Args:
            batch: Batch whose ``training_input`` carries ``state`` and
                ``next_state``.

        Returns:
            The batch rebuilt through ``_replace`` with the updated
            ``training_input``.
        """
        inputs = cast(
            Union[DiscreteDqnInput, ParametricDqnInput], batch.training_input
        )

        # Current state first, then next state (same call order as always).
        state = inputs.state
        state_features = self.state_preprocessor(
            state.float_features.value, state.float_features.presence
        )
        next_state = inputs.next_state
        next_state_features = self.state_preprocessor(
            next_state.float_features.value, next_state.float_features.presence
        )

        updated_inputs = inputs._replace(
            state=state._replace(float_features=state_features),
            next_state=next_state._replace(float_features=next_state_features),
        )
        return batch._replace(training_input=updated_inputs)

Example #2

Show file

File: batch_preprocessor.py Project: Fengdan92/Horizon

    def __call__(self, batch: TrainingBatch) -> TrainingBatch:
        """Return a copy of ``batch`` with action features preprocessed.

        The parent ``__call__`` runs first. Then ``self.action_preprocessor``
        is called with the ``value`` and ``presence`` of the
        ``float_features`` of ``action`` and of ``next_action``; each result
        replaces the corresponding ``float_features`` via ``_replace``.

        Args:
            batch: Batch whose ``training_input`` is treated as a
                ``PolicyNetworkInput``.

        Returns:
            The parent's result rebuilt through ``_replace`` with the updated
            ``training_input``.
        """
        batch = super().__call__(batch)
        policy_input = cast(PolicyNetworkInput, batch.training_input)

        # The casts only inform the type checker; they do nothing at runtime.
        action = cast(FeatureVector, policy_input.action)
        action_features = self.action_preprocessor(
            action.float_features.value, action.float_features.presence
        )

        next_action = cast(FeatureVector, policy_input.next_action)
        next_action_features = self.action_preprocessor(
            next_action.float_features.value,
            next_action.float_features.presence,
        )

        updated_input = policy_input._replace(
            action=action._replace(float_features=action_features),
            next_action=next_action._replace(
                float_features=next_action_features
            ),
        )
        return batch._replace(training_input=updated_input)

Example #3

Show file

File: batch_preprocessor.py Project: Fengdan92/Horizon

    def __call__(self, batch: TrainingBatch) -> TrainingBatch:
        """Preprocess the extra feature vectors of a parametric DQN/SARSA batch.

        The parent ``__call__`` runs first. Afterwards each feature vector
        listed below has its ``float_features`` replaced by the output of the
        matching preprocessor, which is called with the vector's
        ``float_features.value`` and ``float_features.presence``:

        * ``ParametricDqnInput``: ``tiled_next_state`` (state preprocessor);
          ``action``, ``next_action``, ``possible_actions`` and
          ``possible_next_actions`` (action preprocessor).
        * ``SARSAInput``: ``tiled_next_state`` (state preprocessor);
          ``action`` and ``next_action`` (action preprocessor).

        Args:
            batch: Batch whose ``training_input`` is one of the types above.

        Returns:
            The parent's result rebuilt through ``_replace`` with the updated
            ``training_input``.

        Raises:
            AssertionError: If ``training_input`` is neither supported type.
                It is raised explicitly instead of via ``assert`` so the
                check still fires under ``python -O`` rather than letting the
                method fall through and return ``None``.
        """

        def apply(preprocessor, feature_vector):
            # Swap float_features for the preprocessor's (value, presence) output.
            float_features = feature_vector.float_features
            return feature_vector._replace(
                float_features=preprocessor(
                    float_features.value, float_features.presence
                )
            )

        batch = super().__call__(batch)
        training_input = batch.training_input

        # Within each branch the preprocessors are invoked in the same order
        # as before: tiled_next_state first, then the action-side vectors.
        if isinstance(training_input, ParametricDqnInput):
            tiled_next_state = apply(
                self.state_preprocessor, training_input.tiled_next_state
            )
            action = apply(self.action_preprocessor, training_input.action)
            next_action = apply(
                self.action_preprocessor, training_input.next_action
            )
            possible_actions = apply(
                self.action_preprocessor, training_input.possible_actions
            )
            possible_next_actions = apply(
                self.action_preprocessor, training_input.possible_next_actions
            )
            return batch._replace(
                training_input=training_input._replace(
                    action=action,
                    next_action=next_action,
                    possible_actions=possible_actions,
                    possible_next_actions=possible_next_actions,
                    tiled_next_state=tiled_next_state,
                )
            )

        if isinstance(training_input, SARSAInput):
            tiled_next_state = apply(
                self.state_preprocessor, training_input.tiled_next_state
            )
            action = apply(self.action_preprocessor, training_input.action)
            next_action = apply(
                self.action_preprocessor, training_input.next_action
            )
            return batch._replace(
                training_input=training_input._replace(
                    action=action,
                    next_action=next_action,
                    tiled_next_state=tiled_next_state,
                )
            )

        # Same exception type and message as the former `assert False`, but
        # not removed when Python runs with optimizations enabled.
        raise AssertionError(
            "Invalid training_input type: " + str(type(training_input))
        )