Exemplo n.º 1
0
    def check(s):
        """Round-trip ``s`` through the feature encoding and log any mismatch.

        ``s`` is passed to ``features.transform``; the two values it returns
        are fed back into ``features.reverse``. When the result is not
        element-wise close to ``s`` (``np.allclose`` with its default
        tolerances), both states and their difference are logged at INFO
        level. Nothing is returned and nothing is raised on a mismatch.
        """
        idx, vals = features.transform(s)
        restored = features.reverse(idx, vals)

        # Nothing to report when the round trip reproduces the input.
        if np.allclose(s, restored):
            return

        # Compute the difference before logging so that a failing subtraction
        # surfaces before any message is emitted.
        diff = s - restored
        log.info("State %s reversed into %s", s, restored)
        log.info("Delta %s", diff)
Exemplo n.º 2
0
def load_replays(file_names):
    """Load replay files and pack them into a single ``xgb.DMatrix``.

    Each file is read with ``np.load`` and iterated row by row. For every
    row, ``row[0]`` is unpacked as the positional arguments of
    ``features.reverse`` to obtain the state, and ``max(row[1])`` is used
    as that state's label.

    NOTE(review): presumably ``row[0]`` is the ``(index, values)`` pair
    produced by ``features.transform`` and ``row[1]`` holds per-action
    rewards -- confirm against the code that writes these files.

    :param file_names: iterable of paths accepted by ``np.load``.
    :return: ``xgb.DMatrix`` built from the stacked states, labelled with
        the per-row maximum of ``row[1]``.
    """
    l_states = []
    l_rewards = []

    for file_name in file_names:
        # Parenthesised single-argument form prints identically on
        # Python 2 and is valid syntax on Python 3.
        print("Load file %s" % file_name)

        for row in np.load(file_name):
            l_states.append(features.reverse(*row[0]))
            l_rewards.append(max(row[1]))

    states = np.array(l_states)
    rewards = np.array(l_rewards)

    return xgb.DMatrix(states, label=rewards)