def predict(self, state, deterministic_=True, evaluation_=False, p=None, sim_index=None, bootstrapping=False):
    """
    Compute the policy action for a single raw state.

    The state is normalized into ``self._state_bounds``, cast to the
    configured float type, and run through the actor network; the first
    ``self._action_length`` network outputs are then scaled back into
    ``self._action_bounds``.

    Parameters
    ----------
    state : array-like
        Raw (unnormalized) environment state.
    deterministic_, evaluation_, p, sim_index, bootstrapping :
        Accepted for interface compatibility with other agents; unused
        in this implementation.

    Returns
    -------
    Action array scaled into ``self._action_bounds``.
    """
    state = norm_state(state, self._state_bounds)
    state = np.array(state, dtype=self._settings['float_type'])
    self._model.setStates(state)
    # The actor network may emit more than _action_length outputs
    # (presumably extra distribution parameters — TODO confirm); only the
    # leading _action_length columns are treated as the action.
    action_ = scale_action(
        self._model.getActorNetwork().predict(
            state, batch_size=1)[:, :self._action_length],
        self._action_bounds)
    return action_
def predict(self, state, deterministic_=True, evaluation_=False, p=None, sim_index=None, bootstrapping=False):
    """
    Produce the policy's action for one raw state.

    The state is normalized into ``self._state_bounds``, cast to the
    configured float type, and pushed into the model; the action is
    obtained from ``self._q_action()`` and — unless parameter scaling is
    disabled in the settings — scaled back into ``self._action_bounds``.

    The extra keyword arguments exist for interface compatibility with
    other agents and are not used here.
    """
    normalized = norm_state(state, self._state_bounds)
    normalized = np.array(normalized, dtype=self._settings['float_type'])
    self._model.setStates(normalized)
    scaling_disabled = (('disable_parameter_scaling' in self._settings)
                        and (self._settings['disable_parameter_scaling']))
    if scaling_disabled:
        # Network output is taken as-is, already in environment units.
        action_ = self._q_action()
    else:
        action_ = scale_action(self._q_action(), self._action_bounds)
    return action_
def predictWithDropout(self, state, deterministic_=True):
    """
    Compute an action via the actor network for a single raw state.

    Mirrors ``predict``: the state is cast to the configured float type,
    normalized into ``self._state_bounds``, run through the actor
    network, and the first ``self._action_length`` outputs are scaled
    back into ``self._action_bounds``.

    Parameters
    ----------
    state : array-like
        Raw (unnormalized) environment state.
    deterministic_ : bool
        Accepted for interface compatibility; unused here.

    Returns
    -------
    Action array scaled into ``self._action_bounds``.
    """
    state = np.array(state, dtype=self._settings['float_type'])
    state = norm_state(state, self._state_bounds)
    # BUG FIX: the original passed the undefined name `states` to
    # predict(), which raises NameError at runtime; the prepared `state`
    # is the intended network input.
    action_ = scale_action(
        self._model.getActorNetwork().predict(
            state, batch_size=1)[:, :self._action_length],
        self._action_bounds)
    return action_
def predict(self, state, deterministic_=True, evaluation_=False, p=None, sim_index=None, bootstrapping=False):
    """
    Return the actor network's action for ``state``.

    The state is normalized into ``self._state_bounds`` and cast to the
    configured float type before the forward pass; the first
    ``self._action_length`` network outputs are scaled back into
    ``self._action_bounds``. The extra keyword arguments exist only for
    interface compatibility and are unused.
    """
    net_input = np.array(norm_state(state, self._state_bounds),
                         dtype=self._settings['float_type'])
    raw_output = self._model.getActorNetwork().predict(net_input, batch_size=1)
    # Keep only the leading _action_length columns and map them back
    # into the environment's action range.
    return scale_action(raw_output[:, :self._action_length],
                        self._action_bounds)
def predict(self, state, deterministic_=True, evaluation_=False, p=None, sim_index=None, bootstrapping=False):
    """
    Compute the policy action for one raw state.

    Normalizes the state into ``self._state_bounds``, loads it into the
    model, and takes the first row of ``self._q_action()``. Unless
    parameter scaling is disabled in the settings, the result is scaled
    back into ``self._action_bounds``. Extra keyword arguments exist
    only for interface compatibility and are unused.
    """
    net_input = norm_state(state, self._state_bounds)
    net_input = np.array(net_input, dtype=self._settings['float_type'])
    self._model.setStates(net_input)
    raw_action = self._q_action()[0]
    if (('disable_parameter_scaling' in self._settings)
            and (self._settings['disable_parameter_scaling'])):
        return raw_action
    # Transform the action value back into the environment's range.
    return scale_action(raw_action, self._action_bounds)
def predictWithDropout(self, state, deterministic_=True):
    """
    Produce an action using the dropout-enabled actor forward pass.

    The state is cast to the configured float type, normalized into
    ``self._state_bounds``, loaded into the model, and the output of
    ``self._q_action_drop()`` is scaled back into
    ``self._action_bounds``. ``deterministic_`` exists only for
    interface compatibility and is unused.
    """
    net_input = np.array(state, dtype=self._settings['float_type'])
    net_input = norm_state(net_input, self._state_bounds)
    self._model.setStates(net_input)
    # _q_action_drop is the dropout variant of the action function —
    # presumably a stochastic forward pass; verify against its definition.
    return scale_action(self._q_action_drop(), self._action_bounds)
def predictWithDropout(self, state, deterministic_=True):
    """
    Produce an action using the dropout-enabled actor forward pass.

    The state is cast to the configured float type and normalized into
    ``self._state_bounds``; the first row of ``self._q_action_drop()``
    is scaled back into ``self._action_bounds``. ``deterministic_``
    exists only for interface compatibility and is unused.
    """
    net_input = norm_state(
        np.array(state, dtype=self._settings['float_type']),
        self._state_bounds)
    self._model.setStates(net_input)
    return scale_action(self._q_action_drop()[0], self._action_bounds)