def RL_start():
    """Start an episode over the network connection.

    Issues the ``Network.kRLStart`` command with no parameters, waits for
    the matching standard reply, and then reads the observation followed
    by the action from ``network``.

    Returns:
        An ``Observation_action`` whose ``o`` attribute holds the received
        observation and whose ``a`` attribute holds the received action.
    """
    doCallWithNoParams(Network.kRLStart)
    doStandardRecv(Network.kRLStart)

    first_step = Observation_action()
    # Read order matters: the observation is fetched before the action.
    first_step.o = network.getObservation()
    first_step.a = network.getAction()
    return first_step
def RL_start(self):
    """Begin a new episode and return its first observation/action pair.

    Resets the per-episode bookkeeping (``reward_return``, ``step_count``,
    ``prevact``, ``exitStatus``), increments ``episode_count``, asks the
    environment for its starting observation, and asks the agent for its
    first action given that observation.

    Returns:
        An ``Observation_action`` with ``o`` set to the environment's
        starting observation and ``a`` set to the agent's first action.
    """
    # Reset the episode state before touching the environment or agent.
    self.reward_return = 0.0
    self.step_count = 1
    self.episode_count += 1
    self.prevact = None
    self.exitStatus = 0

    start_observation = self.env.env_start()
    first_action = self.agent.agent_start(start_observation)

    first_step = Observation_action()
    first_step.o = start_observation
    first_step.a = first_action

    # Record the action only after both start calls have returned.
    self.prevact = first_action
    return first_step