Example #1
 def get_action(self, obs):
     """ Samples an action from a softmax distribution over the estimated arm means. """
     act_dist = softmax(self.means / self.softmax_temp)
     act = np.random.choice(range(self.env.nA), p=act_dist)
     return act
Example #2
 def likelihood(self, state, obs, act):
     """ Computes the likelihood of taking the action given the state. """
     act_dist = softmax(state['means'] / state['temp'])
     return act_dist[act]
Example #3
 def act_probs_from_counts(self, counts, **kwargs):
     """ Returns the softmax action distribution over the arms' mean estimates. """
     means = np.array([arm.mean() for arm in self.env.arms])
     act_dist = softmax(means / self.softmax_temp)
     return act_dist
Example #4
 def likelihood(self, state, obs, act):
     """ Computes the likelihood of taking the action given the state (means plus UCL bonus). """
     arm_vals = state['means'] + state['ucl_bonus']
     act_dist = softmax(arm_vals / state['softmax_temp'])
     return act_dist[act]
Example #5
 def get_action_from_state(self, state, obs):
     """ Samples an action from a softmax distribution over the state's arm means. """
     act_dist = softmax(state['means'] / state['temp'])
     act = np.random.choice(range(self.env.nA), p=act_dist)
     return act
Example #6
 def get_action_from_state(self, state, obs):
     """ Samples an action from a softmax distribution over the state's means plus UCL bonus. """
     arm_vals = state['means'] + state['ucl_bonus']
     act_dist = softmax(arm_vals / state['softmax_temp'])
     act = self.np_random.choice(range(self.env.nA), p=act_dist)
     return act
Example #7
 def get_action(self, obs):
     """ Samples an action from a softmax distribution over the means plus UCL bonus. """
     self.arm_vals = self.means + self.ucl_bonus
     act_dist = softmax(self.arm_vals / self.softmax_temp)
     act = self.np_random.choice(range(self.env.nA), p=act_dist)
     return act
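
Examples #4, #6, and #7 add a ucl_bonus term to the arm means before applying the softmax. The listing does not show how that bonus is computed; the sketch below is only an assumption, using the standard upper-confidence-bound form (the helper name ucb_bonus and the constant c are hypothetical, not taken from these agents).

import numpy as np

def ucb_bonus(counts, t, c=2.0):
    # Hypothetical UCB-style exploration bonus per arm, for illustration only.
    # counts: pulls per arm; t: total pulls so far; c: exploration constant.
    counts = np.maximum(np.asarray(counts, dtype=float), 1.0)  # avoid division by zero
    return np.sqrt(c * np.log(max(t, 1)) / counts)

An agent would then sample with softmax((means + bonus) / softmax_temp), exactly as in Example #7.
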
Example #8
 def likelihood(self, state, obs, act):
     """ Computes the likelihood of taking the action given the state. """
     return softmax(state['Q_human'][obs] / self.softmax_temp)[act]
Example #9
 def get_action_from_state(self, state, obs):
     """ Samples an action from a softmax distribution over the state's Q-values for this observation. """
     act_dist = softmax(state['Q_human'][obs] / self.softmax_temp)
     act = np.random.choice(range(self.env.nA), p=act_dist)
     return act
Example #10
 def get_action(self, obs):
     """ Samples an action from a softmax distribution over the Q-values for this observation. """
     act_dist = softmax(self.Q_human[obs] / self.softmax_temp)
     act = self.np_random.choice(range(self.env.nA), p=act_dist)
     return act
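
Every example above relies on a module-level softmax helper (and np, i.e. NumPy) that the listing does not include. Below is a minimal, numerically stable sketch of such a helper, assuming the caller divides by the temperature first, as in softmax(values / temp); scipy.special.softmax behaves the same way for 1-D input.

import numpy as np

def softmax(x):
    # Numerically stable softmax over a 1-D array of preferences.
    # The examples above pass in values already divided by the temperature.
    x = np.asarray(x, dtype=float)
    z = x - np.max(x)        # subtract the max so np.exp cannot overflow
    exp_z = np.exp(z)
    return exp_z / exp_z.sum()

The result sums to 1, so it can be passed directly as p to np.random.choice, as each get_action method does.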