def __init__(self, environment): ''' Constructor ''' EpisodicTask.__init__(self, environment) self.prev_time = 0 self.current_time = 0 self.reward = 0
def __init__(self, env, episodeLength): EpisodicTask.__init__(self, env) #self.inDim = 1 #self.outDim = 1 self.counter = 0 self.history = [] self.total = [] self.episodeLength = episodeLength
def __init__(self, size, opponent = None, **args): EpisodicTask.__init__(self, PenteGame((size, size))) self.setArgs(**args) if opponent == None: opponent = RandomGomokuPlayer(self.env) elif isclass(opponent): # assume the agent can be initialized without arguments then. opponent = opponent(self.env) if not self.opponentStart: opponent.color = PenteGame.WHITE self.opponent = opponent self.minmoves = 9 self.maxmoves = self.env.size[0] * self.env.size[1] self.reset()
def __init__(self, size, opponent=None, **args): EpisodicTask.__init__(self, PenteGame((size, size))) self.setArgs(**args) if opponent == None: opponent = RandomGomokuPlayer(self.env) elif isclass(opponent): # assume the agent can be initialized without arguments then. opponent = opponent(self.env) if not self.opponentStart: opponent.color = PenteGame.WHITE self.opponent = opponent self.minmoves = 9 self.maxmoves = self.env.size[0] * self.env.size[1] self.reset()
def __init__(self, size, opponent=None, **args): EpisodicTask.__init__(self, GoGame(size)) self.setArgs(**args) if opponent == None: opponent = RandomGoPlayer(self.env) elif isclass(opponent): # assume the agent can be initialized without arguments then. opponent = opponent(self.env) else: opponent.game = self.env if not self.opponentStart: opponent.colour = GoGame.WHITE self.opponent = opponent self.reset()
def __init__(self, size, opponent = None, **args): EpisodicTask.__init__(self, CaptureGame(size)) self.setArgs(**args) if opponent == None: opponent = RandomCapturePlayer(self.env) elif isclass(opponent): # assume the agent can be initialized without arguments then. opponent = opponent(self.env) else: opponent.game = self.env if not self.opponentStart: opponent.color = CaptureGame.WHITE self.opponent = opponent self.maxmoves = self.env.size * self.env.size self.minmoves = 3 self.reset()
def __init__(self, environment, deltaP, deltaF, deltaS, discount, backtest=False): """ Standard constructor for the asset allocation task. Args: environment (Environment): market environment object deltaP (double): proportional transaction costs rate deltaF (double): fixed transaction cost rate deltaS (double): short selling borrowing cost rate discount (double): discount factor backtest (bool): flag for training mode or test mode """ # Initialize episodic task EpisodicTask.__init__(self, environment) # Transaction costs self.deltaP = deltaP self.deltaF = deltaF self.deltaS = deltaS # Discount factor self.discount = discount # Backtesting self.backtest = backtest # Report stores allocations and portfolio log-returns for backtesting self.report = pd.DataFrame(columns=list(self.env.data.columns) + ['ptfLogReturn']) # Initialize allocation self.initializeAllocation()