コード例 #1
0
def test_gym():
    """Check a seeded ``Acrobot-v1`` rollout against recorded values.

    Seeds NumPy's global generator and the environment, resets the
    environment, performs ten steps with actions drawn from
    ``np.random.randint``, and compares the first element returned by the
    last ``step`` call with a hard-coded reference array.
    """
    expected_state = np.array([
        0.9996687, -0.02573896, 0.9839331, -0.17853762, -0.17821608, 0.5534913
    ])

    np.random.seed(1)
    mdp = Gym('Acrobot-v1', 1000, .99)
    mdp.seed(1)
    mdp.reset()

    # Only the result of the final step is checked; earlier results are
    # overwritten on each iteration.
    for _ in range(10):
        action = [np.random.randint(mdp.info.action_space.n)]
        next_state, _reward, _absorbing, _info = mdp.step(action)

    assert np.allclose(next_state, expected_state)
コード例 #2
0
def test_gym():
    """Check a seeded ``Acrobot-v1`` rollout against recorded values.

    Seeds NumPy's global generator and the environment, resets the
    environment, performs ten steps with actions drawn from
    ``np.random.randint``, and compares the first element returned by the
    last ``step`` call with a hard-coded reference array.
    """
    expected_state = np.array([
        0.99989477, 0.01450661, 0.97517825, -0.22142128, -0.02323116,
        0.40630765
    ])

    np.random.seed(1)
    mdp = Gym('Acrobot-v1', 1000, .99)
    mdp.seed(1)
    mdp.reset()

    # Only the result of the final step is checked; earlier results are
    # overwritten on each iteration.
    for _ in range(10):
        action = [np.random.randint(mdp.info.action_space.n)]
        next_state, _reward, _absorbing, _info = mdp.step(action)

    assert np.allclose(next_state, expected_state)