Python Agent.ACPGAg Examples

Programming Language: Python

Class/Type: Agent

Method/Function: ACPGAg

Examples at hotexamples.com: 2

Python Agent.ACPGAg - 2 examples found. These are the top-rated real-world Python examples of Agent.ACPGAg from the cleanrl package, extracted from open source projects. You can rate examples to help us improve their quality.

Frequently Used Methods

Show Hide

Agent(30)

AlphaBetaAgent(6)

AgentFactory(4)

ACPGAg(2)

Chooser(2)

Brain(2)

CFAgent(2)

Agent_PG(1)

consumption_value_low(1)

runAwayBehaviour(1)

production_value(1)

placeall(1)

make(1)

deserializeAgent(1)

createAgentList(1)

consumption_value_high(1)

AgentTool(1)

CopyToTargetNetwork(1)

ActionValue(1)

AbsorbSample(1)

AgentQLearn(1)

BS_Agent(1)

AlphabetaAgent(1)

scriptedBehaviour(1)

Example #1

Show file

import gym
import Agent
import random
import numpy as np


def RandomActionDiscrete(ActionProp):
    """Draw one action index at random and return it with its one-hot vector.

    Args:
        ActionProp: Per-action probabilities, passed as ``p`` to
            ``np.random.choice``.

    Returns:
        A tuple ``(index, one_hot)`` where ``index`` is the sampled action
        and ``one_hot`` is a float array of ``len(ActionProp)`` entries that
        is 1 at ``index`` and 0 elsewhere.
    """
    candidates = np.arange(len(ActionProp))
    chosen = np.random.choice(candidates, p=ActionProp)
    # Mark the sampled position; the cast gives the same float dtype as np.zeros.
    one_hot = (candidates == chosen).astype(float)
    return chosen, one_hot


# Build the CartPole-v1 environment and the agent that will act in it.
# NOTE(review): the arguments (2, 4) presumably are the action count and the
# observation size for CartPole — confirm against Agent.ACPGAg's signature.
env = gym.make("CartPole-v1")
Ag = Agent.ACPGAg(2, 4)

# Upper bound on the number of steps iterated per episode by the loop below.
EpisodeTime = 200
# Number of episodes started so far; incremented at the top of each episode.
CurrentEpisode = 0
# Counter that the loop below prints and resets to zero every 50 episodes.
DoneTimes = 0
while True:
    Observation = env.reset()
    O_array = []
    R_array = []
    A_array = []
    AccReward = 0
    CurrentEpisode += 1
    if CurrentEpisode % 50 == 0:
        print(DoneTimes)
        DoneTimes = 0
    for t in range(EpisodeTime):

Example #2

Show file

import random
import numpy as np

def RandomActionDiscrete(ActionProp):
    """Sample an action index from a discrete probability vector.

    Draws a single uniform number and walks the cumulative distribution of
    ``ActionProp``, picking the first action whose cumulative probability
    exceeds the draw. This makes action ``i`` come up with probability
    ``ActionProp[i]``.

    Args:
        ActionProp: Sequence of per-action probabilities, expected to sum
            to 1.

    Returns:
        A tuple ``(ActionIndex, ActionOut)``: the chosen index and a one-hot
        float array with the same length as ``ActionProp``.
    """
    ActionSize = len(ActionProp)
    ActionOut = np.zeros(ActionSize)
    rand = random.uniform(0, 1)
    # The draw must be compared with the running total, not with each
    # probability on its own; otherwise later actions are over-selected and
    # a zero-probability action can still be returned.
    Cumulative = 0.0
    for ActionIndex, Prop in enumerate(ActionProp):
        Cumulative += Prop
        if rand < Cumulative:
            ActionOut[ActionIndex] = 1
            return ActionIndex, ActionOut
    # Rounding can leave the total marginally below the draw; fall back to
    # the last action in that case.
    ActionOut[ActionSize - 1] = 1
    return ActionSize - 1, ActionOut

# Build the Acrobot-v1 environment and the agent that will act in it.
# NOTE(review): `gym` and `Agent` are not imported in the visible part of
# this example — confirm the full file imports them.
# NOTE(review): the arguments (3, 6) presumably are the action count and the
# observation size for Acrobot — confirm against Agent.ACPGAg's signature.
env = gym.make("Acrobot-v1")
Ag = Agent.ACPGAg(3, 6)

# Number of episodes started so far; incremented at the top of each episode.
CurrentEpisode = 0
while True:
    Observation = env.reset()
    O_array = []
    R_array = []
    A_array = []
    CurrentEpisode += 1
    rememberTimeStep = 0
    StepTime = 0
    score = 0
    while True:
        StepTime += 1
        if CurrentEpisode%100 == 0:
            env.render()