def test_next_policy_action(self):
     """Check the policy action returned right after Q-state initialisation.

     Builds a ``BotSimpleRL`` from the fixture's ``env`` and ``player``,
     calls ``init_q_state(0)``, and expects ``next_policy_action`` to return
     ``-1`` for the value produced by ``dehasher(0)``.
     """
     agent = BotSimpleRL(self.env, self.player)
     agent.init_q_state(0)
     decoded = agent.dehasher(0)
     # NOTE(review): -1 presumably means "no learned action yet" -- confirm
     # against BotSimpleRL.next_policy_action.
     chosen = agent.next_policy_action(decoded, 0)
     assert chosen == -1
 def test_next_random_action(self):
     """Check the random action returned for the value of ``dehasher(0)``.

     Builds a ``BotSimpleRL`` from the fixture's ``env`` and ``player`` and
     expects ``next_random_action`` to return ``0``.

     The former trailing ``assert 0`` made this test fail unconditionally,
     hiding the result of the real check; it has been removed.
     """
     bot = BotSimpleRL(self.env, self.player)
     # NOTE(review): expecting a fixed value from a "random" action presumably
     # relies on action 0 being the only choice for this input -- confirm.
     assert bot.next_random_action(bot.dehasher(0), 0) == 0