def giveReward(self, r):
    """Pass the reward on to the base agent, then optionally redraw weights.

    The reward ``r`` is first handed unchanged to
    ``PolicyGradientAgent.giveReward``. Afterwards, if ``self.actaspg`` is
    truthy, ``drawRandomWeights()`` is called on ``self.explorationlayer``.

    NOTE(review): ``actaspg`` presumably means "act as a plain policy
    gradient agent", i.e. redraw the exploration weights after every
    reward -- confirm against the class constructor.
    """
    # The base class handles the reward first; the redraw must come after.
    PolicyGradientAgent.giveReward(self, r)

    if not self.actaspg:
        return

    self.explorationlayer.drawRandomWeights()
def getAction(self):
    """Return the base agent's action after updating the exploration layer.

    ``self.lastobs`` is handed to ``self.explorationlayer.setState`` first,
    and only then is ``PolicyGradientAgent.getAction`` invoked; its result
    is returned unchanged.
    """
    # Order matters: the layer receives the latest observation before the
    # base class computes the action.
    self.explorationlayer.setState(self.lastobs)
    return PolicyGradientAgent.getAction(self)