def log_return(r: []):
    """Record ``r`` through ``layers.summarize_tensor`` with the label 'Return'.

    NOTE(review): the ``[]`` annotation looks like a shape specification
    (presumably a scalar) consumed by a decorator or framework outside this
    view -- confirm against the caller.
    """
    summary_label = 'Return'
    layers.summarize_tensor(r, summary_label)
def act(x: [so]):
    """Evaluate ``q_network`` on ``x`` and pick the arg-max along axis 1.

    The statements were previously fused onto a single physical line, which
    is not valid Python and let the inline comment swallow the summary call
    and the ``return``; they are restored here one statement per line.

    Args:
        x: Input forwarded unchanged to ``q_network``.
            NOTE(review): the ``[so]`` annotation presumably declares the
            per-example shape for a framework decorator outside this view --
            confirm.

    Returns:
        A tuple ``(a, qs)`` where ``qs`` is the output of ``q_network(x)``
        and ``a`` is ``tf.argmax(qs, axis=1)``.
    """
    qs = q_network(x)
    # Index of the largest entry along axis 1 of the network output.
    a = tf.argmax(qs, axis=1)
    # qm = tf.reduce_max(qs, axis=1)
    layers.summarize_tensor(a)
    return a, qs