# Experiment script: build the state-alias map, obtain a gridworld trace
# (cached on disk when possible), assign a colour to every aliased member,
# run LSPI on the trace and save the resulting weights.

# NOTE(review): this assignment looks like the body of a loop over clusters
# whose header lies above the visible chunk -- re-indent it under that header
# if so.  Each cluster is stored under its smallest member.
aliases[min(c)] = set(c)
# Single-argument print(...) behaves the same on Python 2 and Python 3.
print(aliases)

#gw = AliasGridworldGui(nrows=32,ncols=64,endstates=endstates,walls=[],aliases=aliases)
gw = GridworldGui(nrows=32, ncols=64, endstates=endstates, walls=[])

# Reuse the cached trace when it can be read; otherwise generate a new one
# with gw.trace(100000) and cache it.  Pickle data is binary, so the files are
# opened in "rb"/"wb" mode, and `with` closes them deterministically.
# NOTE: pickle.load can execute arbitrary code -- only load cache files that
# this script produced itself.
try:
    with open("pca_trace.pck", "rb") as trace_file:
        t = pickle.load(trace_file)
except Exception:
    # Best-effort cache: any read/unpickle failure falls back to regenerating
    # the trace.  (Exception, unlike a bare except, lets Ctrl-C through.)
    t = gw.trace(100000)
    with open("pca_trace.pck", "wb") as trace_file:
        pickle.dump(t, trace_file, pickle.HIGHEST_PROTOCOL)

# Initial policy vector: all zeros, one entry per feature reported by gw.
policy0 = np.zeros(gw.nfeatures())

nclusters = len(aliases)
colors = create_cluster_colors_rgb(nclusters, False)
print(colors)

# Every member of the i-th alias set gets the i-th colour.
colormap = {}
for i, cc in enumerate(aliases.values()):
    for s in cc:
        colormap[s] = colors[i]

w0, weights0 = LSPI(t, 0.005, gw, policy0, maxiter=10, method="sparse",
                    debug=False, timer=True, show=True, ncpus=6)
# Alternative runs kept for reference:
#w0, weights0 = LSPIRmax(t, 0.003, gw, policy0, maxiter = 100000, show = True, resample_epsilon = 0.1, rmax = 1000)
# w0, weights0 = LSPIRmax(t, 0.003, gw, policy0, maxiter=100)
# w0, weights0 = LSPI(t, 0.005, gw, policy0, maxiter=10, method="parallel", debug = False, timer = True, show=True, format="csr",ncpus=6)

# Saving the weights is best-effort: report a failure instead of aborting.
try:
    with open("weights.pck", "wb") as weights_file:
        pickle.dump(w0, weights_file, pickle.HIGHEST_PROTOCOL)
except Exception:
    print("Save failed!")
# Script fragment whose line breaks have been lost: the statements below sit on
# one physical line and the text stops inside an unfinished LSPI(...) call.
# In order, the statements:
#   1. build `aliases`, mapping min(c) -> set(c) for every c in `cc`, and print it;
#   2. create `gw` as a 32x64 GridworldGui with the given endstates and no walls
#      (the AliasGridworldGui variant is commented out);
#   3. try to unpickle a trace from "pca_trace.pck"; on any failure call
#      gw.trace(100000) and pickle the result to that file;
#   4. set `policy0` to a zero vector of length gw.nfeatures();
#   5. request len(aliases) colours from create_cluster_colors_rgb, print them,
#      and fill `colormap` so each member of the i-th alias set maps to colors[i];
#   6. begin the LSPI(...) call on the trace (arguments cut off after timer=True).
# NOTE(review): the pickle files are opened in text mode (default / "w") although
# pickle.HIGHEST_PROTOCOL is a binary protocol -- "rb"/"wb" looks intended; confirm.
# NOTE(review): the bare `except:` also catches KeyboardInterrupt/SystemExit.
# NOTE(review): the colour loop reuses the name `cc`, rebinding the iterable
# consumed by the first loop.
aliases = {} for c in cc: aliases[min(c)] = set(c) print(aliases) #gw = AliasGridworldGui(nrows=32,ncols=64,endstates=endstates,walls=[],aliases=aliases) gw = GridworldGui(nrows=32, ncols=64, endstates=endstates, walls=[]) try: t = pickle.load(open("pca_trace.pck")) except: t = gw.trace(100000) pickle.dump(t, open("pca_trace.pck", "w"), pickle.HIGHEST_PROTOCOL) policy0 = np.zeros(gw.nfeatures()) nclusters = len(aliases) colors = create_cluster_colors_rgb(nclusters, False) print(colors) colormap = {} for i, cc in enumerate(aliases.values()): for s in cc: colormap[s] = colors[i] w0, weights0 = LSPI(t, 0.005, gw, policy0, maxiter=10, method="sparse", debug=False, timer=True,
def gen_colors(lbls):
    """Return one colour per entry of *lbls*, equal labels sharing a colour.

    The distinct labels are paired, in set-iteration order, with the entries
    returned by ``create_cluster_colors_rgb(<number of distinct labels>)``;
    which label receives which entry is therefore arbitrary.

    *lbls* is traversed twice (once to collect the distinct labels, once to
    build the result), so it should be a re-iterable collection of hashable
    values.
    """
    distinct = set(lbls)
    palette = create_cluster_colors_rgb(len(distinct))

    # Pair every distinct label with one palette entry.
    color_of = {}
    for label, color in zip(distinct, palette):
        color_of[label] = color

    # Look each label up again, preserving the order of the input.
    return list(map(color_of.__getitem__, lbls))