def trainQValueNetwork(loopNum=10000, startTurn=0, history_filename='train_winners_nn', inputNum=192, type=1):
    '''
    Train a Q-value network by letting three agents play the game against
    each other.

    Each agent's network is persisted under its player name together with the
    number of training episodes completed so far; win/loss counts are
    persisted (pickled) to ``history_filename``.

    :param loopNum: number of training episodes to run in this call
    :param startTurn: episode index to resume from (overridden by the
        history file's totals when that file exists)
    :param history_filename: path of the pickled ``{winner: count}`` history
    :param inputNum: input-layer size (also used for the hidden layer)
    :param type: experiment type forwarded to ``Experiment`` (name kept for
        backward compatibility even though it shadows the builtin)
    '''
    agents = []
    winners = {}
    # Resume from a previous run: the total number of recorded wins equals
    # the number of episodes already played.
    # NOTE: pickle data must be read in binary mode ('rb'); text mode breaks
    # on Windows and on Python 3.
    if os.path.isfile(history_filename):
        with open(history_filename, 'rb') as f:
            winners = pickle.load(f)
            startTurn = sum(winners.values())
    # Build the three agents, each restoring its network checkpoint.
    for i in range(0, 3):
        playerName = PLAYER_LIST[i]
        nw = RunFastNetwork(playerName, inputNum=inputNum, hiddenNum=inputNum, outNum=1)
        nw.loadNet(playerName, startTurn)
        rfa = RunFastAgent(playerName, nw)
        agents.append(rfa)
    env = RunFastEnvironment()
    exp = Experiment(env, agents, type=type)
    for i in range(startTurn, startTurn + loopNum):
        # Periodic checkpoint: save every agent's network and the win history.
        if i % 200 == 0:
            for agent in agents:
                agent.saveNet()
            with open(history_filename, 'wb') as f:
                pickle.dump(winners, f)
        winner = exp.doEpisode()
        # dict.has_key() is gone in Python 3; `in` works everywhere.
        if winner in winners:
            winners[winner] += 1
        else:
            winners[winner] = 1
    # Final checkpoint (the original dumped the history twice here; once is
    # sufficient).
    for agent in agents:
        agent.saveNet()
    with open(history_filename, 'wb') as f:
        pickle.dump(winners, f)
    print(winners)
def trainDeepNetwork(loopNum=10000, startTurn=0, history_filename='train_winners_dn', type=1, inputNum=192):
    '''
    Train Q-values with a deep (three-hidden-layer) network by letting three
    agents play the game against each other.

    Each agent's network is persisted under its player name together with the
    number of training episodes completed so far; win/loss counts are
    persisted (pickled) to ``history_filename``.

    :param loopNum: number of training episodes to run in this call
    :param startTurn: episode index to resume from (overridden by the
        history file's totals when that file exists)
    :param history_filename: path of the pickled ``{winner: count}`` history
    :param type: experiment type forwarded to ``Experiment`` (name kept for
        backward compatibility even though it shadows the builtin)
    :param inputNum: input-layer size (also used for all hidden layers)
    '''
    agents = []
    winners = {}
    # Resume from a previous run: the total number of recorded wins equals
    # the number of episodes already played.
    # NOTE: pickle data must be read in binary mode ('rb'); text mode breaks
    # on Windows and on Python 3.
    if os.path.isfile(history_filename):
        with open(history_filename, 'rb') as f:
            winners = pickle.load(f)
            startTurn = sum(winners.values())
    # Build the three agents, each restoring its deep-network checkpoint.
    for i in range(0, 3):
        playerName = PLAYER_LIST[i]
        nw = RunFastDeepNetwork(playerName, inputNum=inputNum, hidden1Num=inputNum, hidden2Num=inputNum, hidden3Num=inputNum, outNum=1)
        nw.loadNet(playerName, startTurn)
        rfa = RunFastAgent(playerName, nw)
        agents.append(rfa)
    env = RunFastEnvironment()
    exp = Experiment(env, agents, type=type)
    for i in range(startTurn, startTurn + loopNum):
        # Periodic checkpoint: save every agent's network and the win history.
        if i % 200 == 0:
            for agent in agents:
                agent.saveNet()
            with open(history_filename, 'wb') as f:
                pickle.dump(winners, f)
        winner = exp.doEpisode()
        # dict.has_key() is gone in Python 3; `in` works everywhere.
        if winner in winners:
            winners[winner] += 1
        else:
            winners[winner] = 1
    # Final checkpoint (the original dumped the history twice here; once is
    # sufficient).
    for agent in agents:
        agent.saveNet()
    with open(history_filename, 'wb') as f:
        pickle.dump(winners, f)
    print(winners)