"right-hurr-kick": [["down", "right", "z"], 0.025, 0.025, 1.75],
    "low-heavy-kick": [["down", "ctrl"], 0.025, 0.025, 1],
    "low-medium-kick": [["down", "z"], 0.025, 0.025, 0.75],
    "low-light-kick": [["down", "x"], 0.025, 0.025, 0.75],
    "low-heavy-punch": [["down", "shift"], 0.025, 0.025, 1],
    "low-medium-punch": [["down", "v"], 0.025, 0.025, 1],
    "low-light-punch": [["down", "c"], 0.025, 0.025, 1]
}

names_mov = list(movements.keys())

coord = (8, 95, 512, 475)  #coordinates are different for every user...
env = Env.Enviroment(coord)
state = env.start_game(Open=True)
env.set_gamma(0.95)
Net = net.ActorCritic(state.shape, len(movements))
env.set_policy_net(Net)
file = r"\training_1\cp.ckpt"


def make_batches(env, batch=32, steps=1, gamma=0.95):
    """ 
    Make batches of n_steps(bootstrapping)

    Network expects float and Gray images, so we convert them

    Returns: Initial_state,rewards,next_state,index of finished episodes,actions
    """
    states = []
    rewards = []
    next_states = []