Exemplo n.º 1
0
 def __init__(self, use_rbf=False, n_features=None):
     """Create the ``CartPole-v0`` environment and record its dimensions.

     Args:
         use_rbf: When exactly ``True``, an ``rbf.Fourier`` object is
             built and stored as ``self.rbf`` and ``obs_dim`` is set to
             ``n_features``; any other value keeps ``obs_dim`` at 4.
         n_features: Value stored as ``obs_dim`` and forwarded to
             ``rbf.Fourier`` when ``use_rbf`` is ``True``.
             NOTE(review): the default ``None`` is forwarded unchanged --
             confirm ``rbf.Fourier`` accepts it, or always pass a value.
     """
     self.env = gym.make("CartPole-v0")
     # Overwrites the step cap stored on the object returned by gym.make;
     # presumably this keeps gym from cutting episodes short -- TODO confirm.
     self.env._max_episode_steps = 10 ** 10

     self.name = "SparseCartPole"
     self.action_type = "discrete"
     self.action_dim = 2
     self.use_rbf = use_rbf

     # Identity check on purpose: only the literal True enables the features.
     if use_rbf is not True:
         self.obs_dim = 4
         return

     self.obs_dim = n_features
     # First argument equals the raw observation size used in the other branch.
     self.rbf = rbf.Fourier(4, n_features, dtype="numpy")
Exemplo n.º 2
0
 def __init__(self, use_rbf=False, n_features=None):
     """Create the ``Acrobot-v1`` environment and record its dimensions.

     Args:
         use_rbf: When exactly ``True``, an ``rbf.Fourier`` object is
             built and stored as ``self.rbf`` and ``obs_dim`` is set to
             ``n_features``; any other value keeps ``obs_dim`` at 6.
         n_features: Value stored as ``obs_dim`` and forwarded to
             ``rbf.Fourier`` when ``use_rbf`` is ``True``.
             NOTE(review): the default ``None`` is forwarded unchanged --
             confirm ``rbf.Fourier`` accepts it, or always pass a value.
     """
     self.env = gym.make("Acrobot-v1")
     # Overwrites the step cap stored on the object returned by gym.make;
     # presumably this keeps gym from cutting episodes short -- TODO confirm.
     self.env._max_episode_steps = 10 ** 10

     self.name = "Acrobot"
     self.action_type = "discrete"
     self.action_dim = 3
     self.use_rbf = use_rbf

     raw_obs_dim = 6
     # Identity check on purpose: only the literal True enables the features.
     if use_rbf is not True:
         self.obs_dim = raw_obs_dim
         return

     self.obs_dim = n_features
     self.rbf = rbf.Fourier(raw_obs_dim, n_features, dtype="numpy")
Exemplo n.º 3
0
    def __init__(self, use_rbf=False, n_features=256):
        """Create the ``LunarLander-v2`` environment and record its dimensions.

        Args:
            use_rbf: When exactly ``True``, an ``rbf.Fourier`` object is
                built and stored as ``self.rbf`` and ``obs_dim`` is set to
                ``n_features``; any other value keeps ``obs_dim`` at 8.
            n_features: Value stored as ``obs_dim`` and forwarded to
                ``rbf.Fourier`` when ``use_rbf`` is ``True``.
        """
        self.env = gym.make("LunarLander-v2")
        # Overwrites the step cap stored on the object returned by gym.make;
        # presumably this keeps gym from cutting episodes short -- TODO confirm.
        self.env._max_episode_steps = 10 ** 10

        self.name = "LunarLander"
        self.action_type = "discrete"
        self.action_dim = 4
        self.use_rbf = use_rbf

        raw_obs_dim = 8
        # Identity check on purpose: only the literal True enables the features.
        if use_rbf is not True:
            self.obs_dim = raw_obs_dim
            return

        self.obs_dim = n_features
        self.rbf = rbf.Fourier(raw_obs_dim, n_features, dtype="numpy")
Exemplo n.º 4
0
 def __init__(self, use_rbf=False, n_features=128):
     """Create the ``Pendulum-v0`` environment and record its dimensions.

     Args:
         use_rbf: When exactly ``True``, an ``rbf.Fourier`` object is
             built and stored as ``self.rbf`` and ``obs_dim`` is set to
             ``n_features``; any other value keeps ``obs_dim`` at 3.
         n_features: Value stored as ``obs_dim`` and forwarded to
             ``rbf.Fourier`` when ``use_rbf`` is ``True``. Defaults to
             128, the value that used to be hard-coded here.
     """
     self.env = gym.make("Pendulum-v0")
     self.action_dim = 1
     # Assigned once; the original set this same value a second time at
     # the end of the constructor.
     self.action_type = "continuous"
     self.name = "Pendulum"
     # Overwrites the step cap stored on the object returned by gym.make;
     # presumably this keeps gym from cutting episodes short -- TODO confirm.
     self.env._max_episode_steps = int(1e10)
     self.use_rbf = use_rbf
     # Identity check kept as-is: only the literal True enables the features.
     if self.use_rbf is True:
         self.obs_dim = n_features
         # First argument equals the raw observation size used below.
         self.rbf = rbf.Fourier(3, self.obs_dim, dtype="numpy")
     else:
         self.obs_dim = 3
Exemplo n.º 5
0
 def __init__(self, use_rbf=False, n_features=512):
     """Create the ``InvertedDoublePendulumMuJoCoEnv-v0`` environment.

     Args:
         use_rbf: When exactly ``True``, an ``rbf.Fourier`` object is
             built and stored as ``self.rbf`` and ``obs_dim`` is set to
             ``n_features``; any other value keeps ``obs_dim`` at 11.
         n_features: Value stored as ``obs_dim`` and forwarded to
             ``rbf.Fourier`` when ``use_rbf`` is ``True``. Defaults to
             512, the value that used to be hard-coded here.
     """
     self.env = gym.make("InvertedDoublePendulumMuJoCoEnv-v0")
     self.name = "InvertedDoublePendulum"
     # Overwrites the step cap stored on the object returned by gym.make;
     # presumably this keeps gym from cutting episodes short -- TODO confirm.
     self.env._max_episode_steps = int(1e10)
     self.use_rbf = use_rbf
     self.action_dim = 1
     # Identity check kept as-is: only the literal True enables the features.
     if self.use_rbf is True:
         self.obs_dim = n_features
         # First argument equals the raw observation size used below.
         self.rbf = rbf.Fourier(11, self.obs_dim, dtype="numpy")
     else:
         self.obs_dim = 11
     self.action_type = "continuous"