def objective(args):
    """Hyperparameter-search objective for a distributional DQN on LunarLander-v2.

    Trains one agent per noise-reduction run at the given learning rate,
    scores each run as the mean of its 4 best test results, and returns
    the NEGATED total so that a minimizer (e.g. hyperopt's fmin) maximizes
    performance.

    Args:
        args: the learning rate to evaluate (a single float).

    Returns:
        float: negated sum of per-run performance scores.
    """
    NUM_TESTS_FOR_NOISE = 1  # repeated runs to average out training noise
    env = gym.make('LunarLander-v2')
    learningRate = args
    totalResult = 0
    for _ in range(NUM_TESTS_FOR_NOISE):
        # Fresh session per run so each agent trains from scratch. The
        # context manager closes the session and releases its TF resources
        # when the run ends (the original leaked one session per run).
        with tf.Session() as sess:
            a = Agent(
                sess=sess,
                env=env,
                numAvailableActions=4,
                numObservations=8,
                rewardsMovingAverageSampleLength=20,
                gamma=1,
                nStepUpdate=1,
                includeIntermediatePairs=False,
                maxRunningMinutes=30,

                # test parameters
                episodesPerTest=1,
                numTestPeriods=40000,
                numTestsPerTestPeriod=30,
                episodeStepLimit=1024,
                intermediateTests=False,
                render=False,
                showGraph=False,

                # hyperparameters
                valueMin=-400.0,
                valueMax=300.0,
                numAtoms=14,
                maxMemoryLength=100000,
                batchSize=256,
                networkSize=[128, 128, 256],
                learningRate=learningRate,
                priorityExponent=0,
                epsilonInitial=2,
                epsilonDecay=.9987,
                minFramesForTraining=2048,
                noisyLayers=False,
                maxGradientNorm=4,
                minExploration=.15,
            )
            testResults = np.array(a.execute())
            # Performance = mean of the 4 best test scores; robust to a few
            # bad evaluation episodes. Equivalent to (but clearer than) the
            # original argpartition-based top-4 selection.
            performance = np.mean(np.sort(testResults)[-4:])
        totalResult = totalResult + performance
        print(str(learningRate) + "," + str(performance))
    return -totalResult
# agentName="agent_842763505", # hyperparameters rewardScaling=rewardScaling, nStepReturns=1, maxMemoryLength=int(1e6), batchSize=64, learningRate=6.25e-4, priorityExponent=0, epsilonInitial=1, epsilonDecay=.999975, minExploration=.01, maxExploration=1.0, minFramesForTraining=2048, maxGradientNorm=5, preNetworkSize=[128, 128], postNetworkSize=[256], numQuantiles=8, embeddingDimension=16, kappa=1.0, trainingIterations=3, tau=0.001) performance = a.execute()[0] cur = db.cursor() cur.execute( "insert into experiments (label, x1, x2, x3, x4, y) values ('{0}', '{1}', '{2}', '{3}', '{4}', '{5}')" .format(experimentName, rewardScaling, 0, 0, 0, performance)) db.commit() cur.close() db.close()
intermediateTests=False, render=False, showGraph=True, saveModel=True, loadModel=False, disableRandomActions=False, disableTraining=False, # agentName="agent_223120799", # hyperparameters rewardScaling=pow(10, -.75), nStepReturns=1, maxMemoryLength=int(1e6), batchSize=64, learningRate=6.25e-4, priorityExponent=0, epsilonInitial=1, epsilonDecay=.999, minExploration=.01, maxExploration=1.0, minFramesForTraining=2048, maxGradientNorm=5, preNetworkSize=[256, 256], postNetworkSize=[512], numQuantiles=32, embeddingDimension=64, kappa=1.0, trainingIterations=3, tau=0.001) testResults = a.execute()