"""Random-move demo for the snake environment.

Builds a map with three agents and three candies on a 40-cell grid, then
loops forever: render the board, draw a random integer move for agent 0,
advance the map by one step, and pause for half a second.
"""
import numpy as np
from pygame.locals import *
import pygame
import random as rd
from snake_env import Render, Map
import time

nagents = 3

M = Map(nagents=nagents, ncandies=3, gridsize=40)
e = Render(M, spacing=20)

# Only this agent is handed an action; the other agents are never given one
# by this script.
index = 0

step = 0
while True:
    print(step)
    e.render()

    # randint is inclusive on both ends, so the move is one of 0, 1, 2, 3.
    # NOTE(review): the meaning of each integer is defined by snake_env and
    # is not visible here.
    action = rd.randint(0, 3)
    print(action)
    M.agents[index].nextAction(action)

    step += 1

    # The step result is unpacked but not acted upon: the loop keeps running
    # regardless of `done`.
    r, done = M.step()

    # Throttle the loop so each frame stays on screen for half a second.
    time.sleep(0.5)

    # Reset-on-termination is currently disabled:
    # if done:
    #     e.reset()
from snake_env import Render, Map from IA import IA_rl, IA_random, IA_minimax n_agents = 2 n_candies = 10 gridsize = 30 n_total_iter = 2000 sliding_window = 100 step = 10 IA_learning = IA_rl.IA(0) adversary = IA_random.IA(1) #adversary = IA_minimax.IA(1) M = Map(nagents=n_agents, ncandies=n_candies, gridsize=gridsize) e = Render(M, spacing=20) q = None current_result = 0 all_results = [] result = [] for match in range(1, n_total_iter + 1): while True: #e.render() if len(M.activeAgents) < n_agents: if 0 in M.activeAgents: current_result += 1