Python RBFObserverGridworldGui 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: gridworld.gridworldgui

hotexamples.com에서의 예제들: 3

Python RBFObserverGridworldGui 예제 3개를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python gridworld.gridworldgui.RBFObserverGridworldGui의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가하면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

RBFObserverGridworldGui(1)

complete_trace(1)

evaluate_func_policy(1)

linear_policy(1)

mainloop(1)

nfeatures(1)

set_arrows(1)

set_heatmap(1)

test(1)

예제 #1

파일 보기

파일: test_lspi.py 프로젝트: stober/lspi

    pi = [gw.linear_policy(w0,s) for s in range(gw.nstates)]
    gw.set_arrows(pi)    
    gw.background()
    gw.mainloop()

if test_realpca:
    # Runs only when the `test_realpca` flag is truthy: builds an
    # RBFObserverGridworldGui from the 20comp.npy / states.npy files and then
    # makes a best-effort attempt to load a previously pickled trace into `t`.
    import pdb
    #pdb.set_trace()
    # Earlier end-state candidates, kept for reference:
    #endstates = [32, 2016, 1024, 1040, 1056, 1072]
    #endstates = [16,256,264,272,280,496]
    endstates = [272] # [16]
    #endstates = [0] # TODO find proper endstates
    # ogw = ObserverGridworldGui("/Users/stober/wrk/lspi/bin/16/5comp.npy", "/Users/stober/wrk/lspi/bin/16/states.npy", endstates = endstates, walls=None)
    # Author notes: just isn't working for state 16
    # Author notes: nrbf 40 works best
    ogw = RBFObserverGridworldGui("/Users/stober/wrk/lspi/bin/16/20comp.npy", "/Users/stober/wrk/lspi/bin/16/states.npy", endstates = endstates, walls=None, nrbf=80)
    # ogw.load_features('rbf_obs_features.pck')
    # ogw = ObserverGridworldGui("/Users/stober/wrk/lspi/bin/32/observations4.npy", "/Users/stober/wrk/lspi/bin/32/states.npy", endstates = endstates, walls=None)
    # ogw = GridworldGui(nrows=16,ncols=32,endstates = endstates, walls=[])
    trace_path = workspace + "/traces/complete_trace.pck"
    try:
        #raise Exception # force a trace regeneration
        # Pickle streams are binary, so open with "rb" (required on Python 3
        # and on Windows); the `with` block closes the handle even on error.
        # NOTE(review): pickle.load executes arbitrary code from the file --
        # only point this at trace files you produced yourself.
        with open(trace_path, "rb") as trace_file:
            t = pickle.load(trace_file)
    except Exception as err:
        # Still best-effort, but no longer silent, and Ctrl-C / SystemExit now
        # propagate. `t` is left unbound on failure, exactly as before.
        print("could not load trace %s: %r" % (trace_path, err))
        #t = ogw.trace(100000)
        #pickle.dump(t, open(workspace + "/traces/real_pca_trace.pck","w"), pickle.HIGHEST_PROTOCOL)

    #pdb.set_trace()
    #print ogw.phi(0,0)
    #raise Exception

예제 #2

파일 보기

파일: test_lspi.py 프로젝트: QueensGambit/lspi

    gw.background()
    gw.mainloop()

if test_realpca:
    # Runs only when the `test_realpca` flag is truthy: builds an
    # RBFObserverGridworldGui from the 20comp.npy / states.npy files and then
    # makes a best-effort attempt to load a previously pickled trace into `t`.
    import pdb
    #pdb.set_trace()
    # Earlier end-state candidates, kept for reference:
    #endstates = [32, 2016, 1024, 1040, 1056, 1072]
    #endstates = [16,256,264,272,280,496]
    endstates = [272]  # [16]
    #endstates = [0] # TODO find proper endstates
    # ogw = ObserverGridworldGui("/Users/stober/wrk/lspi/bin/16/5comp.npy", "/Users/stober/wrk/lspi/bin/16/states.npy", endstates = endstates, walls=None)
    # Author notes: just isn't working for state 16
    # Author notes: nrbf 40 works best
    ogw = RBFObserverGridworldGui("/Users/stober/wrk/lspi/bin/16/20comp.npy",
                                  "/Users/stober/wrk/lspi/bin/16/states.npy",
                                  endstates=endstates,
                                  walls=None,
                                  nrbf=80)
    # ogw.load_features('rbf_obs_features.pck')
    # ogw = ObserverGridworldGui("/Users/stober/wrk/lspi/bin/32/observations4.npy", "/Users/stober/wrk/lspi/bin/32/states.npy", endstates = endstates, walls=None)
    # ogw = GridworldGui(nrows=16,ncols=32,endstates = endstates, walls=[])
    trace_path = workspace + "/traces/complete_trace.pck"
    try:
        #raise Exception # force a trace regeneration
        # Pickle streams are binary, so open with "rb" (required on Python 3
        # and on Windows); the `with` block closes the handle even on error.
        # NOTE(review): pickle.load executes arbitrary code from the file --
        # only point this at trace files you produced yourself.
        with open(trace_path, "rb") as trace_file:
            t = pickle.load(trace_file)
    except Exception as err:
        # Still best-effort, but no longer silent, and Ctrl-C / SystemExit now
        # propagate. `t` is left unbound on failure, exactly as before.
        print("could not load trace %s: %r" % (trace_path, err))
        #t = ogw.trace(100000)
        #pickle.dump(t, open(workspace + "/traces/real_pca_trace.pck","w"), pickle.HIGHEST_PROTOCOL)

    #pdb.set_trace()
    #print ogw.phi(0,0)

예제 #3

파일 보기

파일: 2d_rotation.py 프로젝트: DaomingLyu/lspi

if __name__ == '__main__':

    workspace = "{0}/wrk/lspi/bin".format(os.environ['HOME'])

    if False:
        # fix isomap issue on bad matches
        ematrix = pickle.load(open('ematrix0.pck'))
        y, s, adj = isomap(ematrix)

    if True:

        endstates = [272]  # [16]

        ogw = RBFObserverGridworldGui(
            "/Users/stober/wrk/lspi/bin/16/20comp.npy",
            "/Users/stober/wrk/lspi/bin/16/states.npy",
            endstates=endstates,
            walls=None,
            nrbf=80)

        # ogw = RBFObserverGridworld("/Users/stober/wrk/lspi/bin/16/20comp.npy", "/Users/stober/wrk/lspi/bin/16/states.npy", endstates = endstates, walls=None, nrbf=80)

        t = pickle.load(open(workspace + "/traces/complete_trace.pck"))

        old_endstates = [16, 256, 264, 272, 280, 496]
        t = modify_endstates(t, old_endstates, endstates, action_costs=True)

        policy0 = np.zeros(ogw.nfeatures())
        w0, weights0 = LSPI(t,
                            0.005,
                            ogw,
                            policy0,