def check(s):
    """Round-trip ``s`` through ``features`` and log any mismatch.

    The state is passed to ``features.transform``, whose two results are fed
    back into ``features.reverse``.  When the reconstructed state is not
    element-wise close to ``s`` (per ``np.allclose``), both states and their
    difference are written to the log at INFO level.  Nothing is returned.
    """
    idx, vals = features.transform(s)
    restored = features.reverse(idx, vals)

    # Nothing to report when the round trip reproduces the input.
    if np.allclose(s, restored):
        return

    # Compute the difference up front so a failing subtraction surfaces
    # before anything is logged.
    diff = s - restored
    log.info("State %s reversed into %s", s, restored)
    log.info("Delta %s", diff)
def load_replays(file_names):
    """Load replay files and pack them into an ``xgb.DMatrix``.

    Every file is read with ``np.load`` and iterated row by row.  For each
    row, ``row[0]`` is unpacked as the positional arguments of
    ``features.reverse`` to rebuild the state, and ``max(row[1])`` becomes
    that state's label.

    Args:
        file_names: Iterable of paths (or anything ``np.load`` accepts).

    Returns:
        An ``xgb.DMatrix`` whose data is the array of rebuilt states and
        whose ``label`` is the array of per-row maximum rewards, in the
        order the rows were read.
    """
    states = []
    rewards = []
    for file_name in file_names:
        # Parenthesised single-argument form: prints the same text under
        # Python 2 (print statement) and Python 3 (print function).
        print("Load file %s" % file_name)
        for row in np.load(file_name):
            # NOTE: an earlier variant used features.to_dense(row[0]) here.
            states.append(features.reverse(*row[0]))
            rewards.append(max(row[1]))
    return xgb.DMatrix(np.array(states), label=np.array(rewards))