Esempio n. 1
0
def RL_start():
	"""Send the RL-start command and return the resulting observation/action pair.

	Issues ``Network.kRLStart`` through ``doCallWithNoParams``, then calls
	``doStandardRecv`` for the same command, and finally reads the
	observation and the action from the ``network`` object.

	Returns:
		An ``Observation_action`` whose ``o`` attribute holds
		``network.getObservation()`` and whose ``a`` attribute holds
		``network.getAction()``.
	"""
	command = Network.kRLStart
	doCallWithNoParams(command)
	doStandardRecv(command)

	# The observation is read before the action, matching the original order.
	first_pair = Observation_action()
	first_pair.o = network.getObservation()
	first_pair.a = network.getAction()
	return first_pair
Esempio n. 2
0
def RL_start():
	"""Issue the ``kRLStart`` command and package the reply.

	Calls ``doCallWithNoParams`` followed by ``doStandardRecv``, both with
	``Network.kRLStart``, then pulls the observation and action out of the
	``network`` object.

	Returns:
		A new ``Observation_action`` with ``o`` set from
		``network.getObservation()`` and ``a`` set from
		``network.getAction()``.
	"""
	doCallWithNoParams(Network.kRLStart)
	doStandardRecv(Network.kRLStart)

	reply = Observation_action()
	# Tuple targets are assigned left to right: observation first, then action.
	reply.o, reply.a = network.getObservation(), network.getAction()
	return reply
Esempio n. 3
0
 def RL_start(self):
     """Reset the per-episode counters and perform the starting step.

     Sets ``reward_return`` to 0.0, ``step_count`` to 1, increments
     ``episode_count``, and clears ``prevact`` and ``exitStatus``. It then
     calls ``self.env.env_start()`` to obtain an observation and passes it
     to ``self.agent.agent_start()`` to obtain an action. The action is
     also stored in ``self.prevact``.

     Returns:
         An ``Observation_action`` with ``o`` set to the observation and
         ``a`` set to the action.
     """
     # Bookkeeping is reset before touching env/agent, so a failure in
     # either call leaves prevact as None rather than a stale action.
     self.reward_return = 0.0
     self.step_count = 1
     self.episode_count += 1
     self.prevact = None
     self.exitStatus = 0

     first_obs = self.env.env_start()
     first_action = self.agent.agent_start(first_obs)

     result = Observation_action()
     result.o = first_obs
     result.a = first_action
     self.prevact = first_action
     return result
Esempio n. 4
0
	def RL_start(self):
		"""Begin a run: reset bookkeeping, then query environment and agent.

		Bookkeeping written on ``self``: ``reward_return`` becomes 0.0,
		``step_count`` becomes 1, ``episode_count`` is incremented by one,
		``prevact`` is set to ``None`` and ``exitStatus`` to 0. Afterwards
		``self.env.env_start()`` supplies an observation, which is passed
		to ``self.agent.agent_start()`` to get an action; that action is
		recorded in ``self.prevact``.

		Returns:
			An ``Observation_action`` carrying the observation in ``o``
			and the action in ``a``.
		"""
		self.reward_return = 0.0
		self.step_count = 1
		self.episode_count += 1
		self.prevact = None
		self.exitStatus = 0

		start_obs = self.env.env_start()
		start_act = self.agent.agent_start(start_obs)

		pair = Observation_action()
		# Left-to-right tuple assignment: ``o`` is set before ``a``.
		pair.o, pair.a = start_obs, start_act
		self.prevact = start_act
		return pair