Beispiel #1
0
        aliases[min(c)] = set(c)
    print aliases


    #gw = AliasGridworldGui(nrows=32,ncols=64,endstates=endstates,walls=[],aliases=aliases)
    gw = GridworldGui(nrows=32,ncols=64,endstates=endstates,walls=[])
    try:
        t = pickle.load(open("pca_trace.pck"))
    except:
        t = gw.trace(100000)
        pickle.dump(t,open("pca_trace.pck","w"), pickle.HIGHEST_PROTOCOL)


    policy0 = np.zeros(gw.nfeatures())
    nclusters = len(aliases)
    colors = create_cluster_colors_rgb(nclusters,False)
    print colors

    colormap = {}
    for i,cc in enumerate(aliases.values()):
        for s in cc:
            colormap[s] = colors[i]

    w0, weights0 = LSPI(t, 0.005, gw, policy0, maxiter=10, method="sparse", debug = False, timer = True, show=True, ncpus=6)
    #w0, weights0 = LSPIRmax(t, 0.003, gw, policy0, maxiter = 100000, show = True, resample_epsilon = 0.1, rmax = 1000)
    # w0, weights0 = LSPIRmax(t, 0.003, gw, policy0, maxiter=100)
    # w0, weights0 = LSPI(t, 0.005, gw, policy0, maxiter=10, method="parallel", debug = False, timer = True, show=True, format="csr",ncpus=6)
    try:
        pickle.dump(w0,open("weights.pck","w"),pickle.HIGHEST_PROTOCOL)
    except:
        print "Save failed!"
Beispiel #2
0
    aliases = {}
    for c in cc:
        aliases[min(c)] = set(c)
    print(aliases)

    #gw = AliasGridworldGui(nrows=32,ncols=64,endstates=endstates,walls=[],aliases=aliases)
    gw = GridworldGui(nrows=32, ncols=64, endstates=endstates, walls=[])
    try:
        t = pickle.load(open("pca_trace.pck"))
    except:
        t = gw.trace(100000)
        pickle.dump(t, open("pca_trace.pck", "w"), pickle.HIGHEST_PROTOCOL)

    policy0 = np.zeros(gw.nfeatures())
    nclusters = len(aliases)
    colors = create_cluster_colors_rgb(nclusters, False)
    print(colors)

    colormap = {}
    for i, cc in enumerate(aliases.values()):
        for s in cc:
            colormap[s] = colors[i]

    w0, weights0 = LSPI(t,
                        0.005,
                        gw,
                        policy0,
                        maxiter=10,
                        method="sparse",
                        debug=False,
                        timer=True,
Beispiel #3
0
def gen_colors(lbls):
    """Return one color per entry of ``lbls``, with equal labels sharing a color.

    The distinct labels are collected into a set and
    ``create_cluster_colors_rgb`` is asked for that many colors. Distinct
    labels are paired with the returned colors in the set's iteration
    order, so which color goes to which label is not tied to the order in
    which labels appear in ``lbls``.

    Args:
        lbls: Iterable of hashable labels. It is traversed twice (once to
            collect distinct values, once to build the result), so a
            one-shot iterator would yield an empty result.

    Returns:
        A list with one entry per element of ``lbls``, where entry ``k`` is
        the color assigned to the ``k``-th label.

    Raises:
        KeyError: If ``create_cluster_colors_rgb`` yields fewer colors than
            there are distinct labels, because the pairing stops at the
            shorter sequence and some labels are left without a color.
    """
    distinct_labels = set(lbls)
    palette = create_cluster_colors_rgb(len(distinct_labels))

    # Pair each distinct label with one palette entry.
    color_of = {}
    for label, color in zip(distinct_labels, palette):
        color_of[label] = color

    # Expand back to one color per input label, preserving input order.
    assigned = []
    for label in lbls:
        assigned.append(color_of[label])
    return assigned