def _generate_covering_classifier(self, state, match_set):
    """Build a new classifier whose action is not yet present in ``match_set``.

    The covering counter ``self.covering_occur_num`` is incremented on every
    call. The new classifier is constructed from ``self.parameters``,
    ``self.env`` and ``state``; its action is drawn uniformly at random (via
    ``numpy.random.choice``) from the actions in
    ``range(self.env.num_actions)`` that no classifier in ``match_set``
    already uses, and its ``time_stamp`` is set to ``self.time_stamp``.

    Args:
        state: Passed through unchanged to the ``Classifier`` constructor.
        match_set: Iterable of classifiers; only each element's ``action``
            attribute is read.

    Returns:
        The newly created classifier.

    Raises:
        ValueError: If every action in ``range(self.env.num_actions)`` is
            already used by ``match_set``, so there is nothing to cover.
    """
    self.covering_occur_num += 1

    # Determine the uncovered actions before constructing the classifier so
    # an impossible request fails fast with a clear message instead of the
    # opaque error numpy.random.choice raises on an empty sequence.
    used_actions = {classifier.action for classifier in match_set}
    available_actions = list(set(range(self.env.num_actions)) - used_actions)
    if not available_actions:
        raise ValueError(
            "cannot generate a covering classifier: every action is "
            "already present in the match set"
        )

    clas = Classifier(self.parameters, self.env, state)
    clas.action = numpy.random.choice(available_actions)
    clas.time_stamp = self.time_stamp
    return clas