Python BrainDQN.getAction Examples

Programming Language: Python

Namespace/Package Name: DQN

Class/Type: BrainDQN

Method/Function: getAction

Examples at hotexamples.com: 3

Python BrainDQN.getAction - 3 examples found. These are the top rated real world Python examples of DQN.BrainDQN.getAction extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

BrainDQN(5)

getAction(3)

getAction_1(2)

setInitState(2)

setPerception(2)

getAction_test(1)

getLoss(1)

Example #1

Show file

def playWeChatJump():
    """Drive the WeChat Jump game with a BrainDQN agent in an endless loop.

    Builds a ``BrainDQN`` with 10 actions, seeds it with the game's initial
    state, then repeatedly asks the brain for an action, steps the game with
    it, and feeds the resulting observation, reward and terminal flag back to
    the brain. The loop has no exit condition.
    """
    num_actions = 10
    agent = BrainDQN(num_actions)  # actions are one-hot encoded
    agent.setInitState(game.init_state())
    while True:
        chosen = agent.getAction()
        frame, reward, terminal = game.frame_step(chosen)
        # The observation is reshaped to (80, 80, 1) before it is handed
        # back to the brain.
        agent.setPerception(
            np.reshape(frame, (80, 80, 1)), chosen, reward, terminal
        )

Example #2

Show file

# Training script: builds the agent and the environment, then alternates
# training steps with a periodic evaluation pass.
brain = BrainDQN(actions, num_sensor)
com = GameState(P_1, P_2, noise, num_sensor)
terminal = True  # starts True so the first pass runs the initialization
recording = 100000

while recording > 0:
    # initialization: reset the environment and seed the brain with the
    # observation returned by an all-zero action
    if terminal == True:
        com.ini()
        observation0, reward0, terminal = com.frame_step(
            np.zeros(actions), policy, False)
        brain.setInitState(observation0)

    # train: getAction() also returns the updated `recording` counter that
    # drives this loop
    action, recording = brain.getAction()
    nextObservation, reward, terminal = com.frame_step(action, policy, True)
    loss = brain.setPerception(nextObservation, action, reward)

    # test: runs whenever recording + 1 is a multiple of 500
    if (recording + 1) % 500 == 0:

        Loss.append(loss)
        # Parenthesised single-argument form prints the same text on
        # Python 2 and is valid syntax on Python 3.
        print("iteration : %d , loss : %f ." % (100000 - recording, loss))

        success = 0.0
        fre = 0
        num = 1000.0
        for ind in range(1000):
            T = 0
            com.ini_test()

Example #3

Show file

File: main.py Project: ziping0509X/SensorModel

        print("iterations:%d" % Time)
        actionIput = Qnetwork.getAction_1(actionNum=ACTION_NUM, stateInput=stateInput,Time= Time)
        reward,actionshow = Env.getReward(stateInput=stateInput, actionInput=actionIput)
        ActionShow.append(actionshow)
        nextState = Env.creatSensor(Power=sig[Time + 1])
        loss = Qnetwork.getLoss(currentState=stateInput, nextState=nextState, action=actionIput, reward=reward)
        Time = Time + 1
        R_total += reward
        Reward.append(R_total)

    else:

        # get state/action/reward/next state
        stateInput = Env.creatSensor(Power=sig[Time])
        print("iterations:%d" %Time)
        actionIput = Qnetwork.getAction(actionNum= ACTION_NUM,stateInput= stateInput)
        reward,actionshow = Env.getReward(stateInput= stateInput,actionInput= actionIput)
        ActionShow.append(actionshow)
        nextState = Env.creatSensor(Power= sig[Time+1])

        #get loss and train Qnetwork
        loss = Qnetwork.getLoss(currentState= stateInput,nextState= nextState,action=actionIput,reward= reward)

        R_total += reward
        Reward.append(R_total)

        if not loss == 0:
            Loss.append(loss)

        Time = Time + 1