Python NaiveProbabilityMatchingAgent 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: ml_gym.agents.allocation_agents

클래스: NaiveProbabilityMatchingAgent

hotexamples.com에서의 예제들: 5

Python NaiveProbabilityMatchingAgent - 5개의 예제를 찾았습니다. 아래 예제들은 오픈소스 프로젝트에서 추출한 Python ml_gym.agents.allocation_agents.NaiveProbabilityMatchingAgent의 실제 사용 예제 가운데 평가가 가장 높은 것들입니다. 각 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

 def test_episode_done_raises_error(self):
     """Check that ``act`` raises ``core.EpisodeDoneError`` when ``done=True``."""
     environment = attention_allocation.LocationAllocationEnv()
     matching_agent = allocation_agents.NaiveProbabilityMatchingAgent(
         action_space=environment.action_space,
         observation_space=environment.observation_space,
         reward_fn=None,
     )
     first_observation = environment.reset()
     # Callable form of assertRaises: the agent is invoked with the initial
     # observation while being told the episode has already finished.
     self.assertRaises(
         core.EpisodeDoneError, matching_agent.act, first_observation, done=True
     )

예제 #2

파일 보기

 def test__allocate_by_counts(self):
     """Check allocation proportions match probabilities from counts.

     Draws ``n_samples`` allocations of ``n_resource`` units for fixed counts,
     then compares each position's share of everything allocated with that
     position's share of the counts (``np.isclose`` with ``atol=0.05``).
     """
     environment = attention_allocation.LocationAllocationEnv()
     matching_agent = allocation_agents.NaiveProbabilityMatchingAgent(
         action_space=environment.action_space,
         observation_space=environment.observation_space,
         reward_fn=None,
     )
     counts = [3, 6, 8]
     n_resource = 20
     n_samples = 100

     draws = []
     for _ in range(n_samples):
         draws.append(matching_agent._allocate(n_resource, counts))

     # Expected fractions: each count divided by the sum of all counts.
     count_total = float(np.sum(counts))
     expected_fractions = [count / count_total for count in counts]

     # Observed fractions: per-position totals (summed over draws) divided by
     # the grand total of everything that was allocated.
     allocated_total = float(np.sum(draws))
     observed_fractions = [
         position_total / allocated_total for position_total in np.sum(draws, axis=0)
     ]

     fractions_match = np.isclose(expected_fractions, observed_fractions, atol=0.05)
     self.assertTrue(np.all(fractions_match))

예제 #3

파일 보기

 def test_allocate_by_counts_zero(self):
     """Check allocations are even when counts are zero.

     With all-zero counts, the mean allocation at each position over
     ``n_samples`` draws must lie within one standard deviation (taken over
     every sampled value) of ``n_resource / len(counts)``.
     """
     environment = attention_allocation.LocationAllocationEnv()
     matching_agent = allocation_agents.NaiveProbabilityMatchingAgent(
         action_space=environment.action_space,
         observation_space=environment.observation_space,
         reward_fn=None,
     )
     counts = [0, 0, 0]
     n_resource = 15
     n_samples = 100

     draws = []
     for _ in range(n_samples):
         draws.append(matching_agent._allocate(n_resource, counts))

     per_position_mean = np.sum(draws, axis=0) / float(n_samples)
     even_share = n_resource / float(len(counts))
     # Tolerance is the spread of all sampled values, not a per-position spread.
     tolerance = np.std(draws)

     within_tolerance = []
     for position_mean in per_position_mean:
         within_tolerance.append(np.abs(position_mean - even_share) < tolerance)
     self.assertTrue(np.all(within_tolerance))

예제 #4

파일 보기

 def test_update_counts(self):
     """Check that counts are updated correctly given an observation.

     With ``decay_prob`` set to 0, updating counts ``[3, 6, 8]`` with the
     observation ``[1, 2, 0]`` is expected to yield ``[4, 8, 8]``.
     """
     environment = attention_allocation.LocationAllocationEnv()
     params = allocation_agents.NaiveProbabilityMatchingAgentParams()
     params.decay_prob = 0
     matching_agent = allocation_agents.NaiveProbabilityMatchingAgent(
         action_space=environment.action_space,
         observation_space=environment.observation_space,
         reward_fn=None,
         params=params,
     )
     prior_counts = [3, 6, 8]
     observed = np.array([1, 2, 0])
     posterior_counts = matching_agent._update_beliefs(observed, prior_counts)
     elementwise_match = np.equal(posterior_counts, [4, 8, 8])
     self.assertTrue(np.all(elementwise_match))

예제 #5

파일 보기

 def test_can_interact_with_attention_env(self):
     """Run the shared test simulation with this agent on a LocationAllocationEnv."""
     environment = attention_allocation.LocationAllocationEnv()
     matching_agent = allocation_agents.NaiveProbabilityMatchingAgent(
         action_space=environment.action_space,
         observation_space=environment.observation_space,
         reward_fn=None,
     )
     test_util.run_test_simulation(env=environment, agent=matching_agent)