Python LoopModel.perform_action_aの例

プログラミング言語: Python

クラス/型: LoopModel

メソッド/関数: perform_action_a

hotexamples.comのコード掲載数: 6

Python LoopModel.perform_action_a - 6件のコード例が見つかりました。これらはすべて、オープンソースプロジェクトから抽出された Python の LoopModel.perform_action_a（Sypy パッケージ）の実例で、最も評価が高いものを厳選しています。コード例を評価していただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

LoopModel(6)

get_states_by_id(3)

perform_action_a(3)

perform_action_b(1)

set_current_state_by_state_id(1)

コード例 #1

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: huiwq1990/ReinforcementLearning

def test_transition_6_0():
    """Check that action a taken from state 6 lands on state 0 with reward 0."""
    loop = LoopModel()
    # Both states are fetched in one call; only the state for id 0 is compared.
    origin, _state_six = loop.get_states_by_id([0, 6])
    loop.set_current_state_by_state_id(6)
    payoff = loop.perform_action_a()
    assert loop.current_state == origin
    assert payoff == 0

コード例 #2

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: avain/6.804-bayesianRL

def test_transition_6_0():
    """Verify the 6 -> 0 transition: action a from state 6 pays reward 0."""
    env = LoopModel()
    fetched = env.get_states_by_id([0, 6])
    # Exactly two states are expected back; the second one is not used below.
    (target_state, _source_state) = fetched
    env.set_current_state_by_state_id(6)
    observed_reward = env.perform_action_a()
    assert env.current_state == target_state
    assert observed_reward == 0

コード例 #3

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: avain/6.804-bayesianRL

def test_loop_a():
    """Walk loop a: five consecutive a-actions visit states 1-4, then state 0.

    The model is expected to start in state 0. Only the final step, which
    lands back on state 0, must pay a reward of 1; every earlier step pays 0.
    """
    loop = LoopModel()
    (s0, s1, s2, s3, s4) = loop.get_states_by_id([0, 1, 2, 3, 4])
    assert loop.current_state == s0
    # Each entry: (state expected after the step, reward expected from it).
    expectations = [(s1, 0), (s2, 0), (s3, 0), (s4, 0), (s0, 1)]
    for expected_state, expected_reward in expectations:
        reward = loop.perform_action_a()
        assert loop.current_state == expected_state
        assert reward == expected_reward

コード例 #4

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: huiwq1990/ReinforcementLearning

def test_loop_a():
    """Repeatedly apply action a and check the 0 -> 1 -> 2 -> 3 -> 4 -> 0 cycle.

    Rewards are asserted to be 0 for the first four steps and 1 for the
    step that returns to state 0.
    """
    env = LoopModel()
    ring = env.get_states_by_id([0, 1, 2, 3, 4])
    (start, first, second, third, fourth) = ring
    assert env.current_state == start

    visited_in_order = (first, second, third, fourth, start)
    rewards_in_order = (0, 0, 0, 0, 1)
    for want_state, want_reward in zip(visited_in_order, rewards_in_order):
        got_reward = env.perform_action_a()
        assert env.current_state == want_state
        assert got_reward == want_reward

コード例 #5

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: avain/6.804-bayesianRL

def test_loop_b():
    """Walk loop b: four b-actions visit states 5-8, then action a returns to 0.

    The model is expected to start in state 0. Each b-step must pay 0; the
    closing a-step from state 8 must land on state 0 and pay 2.
    """
    loop = LoopModel()
    (s0, s5, s6, s7, s8) = loop.get_states_by_id([0, 5, 6, 7, 8])
    assert loop.current_state == s0
    for expected_state in (s5, s6, s7, s8):
        reward = loop.perform_action_b()
        assert loop.current_state == expected_state
        assert reward == 0
    # The last hop deliberately uses action a, not b.
    reward = loop.perform_action_a()
    assert loop.current_state == s0
    assert reward == 2

コード例 #6

ファイルを表示

ファイル: LoopModelTest.py プロジェクト: huiwq1990/ReinforcementLearning

def test_loop_b():
    """Check the 0 -> 5 -> 6 -> 7 -> 8 -> 0 cycle and its rewards.

    States 5 through 8 are reached with action b (reward 0 each); the
    return to state 0 is made with action a and must pay a reward of 2.
    """
    env = LoopModel()
    ring = env.get_states_by_id([0, 5, 6, 7, 8])
    (start, fifth, sixth, seventh, eighth) = ring
    assert env.current_state == start

    b_path = [fifth, sixth, seventh, eighth]
    for want_state in b_path:
        got_reward = env.perform_action_b()
        assert env.current_state == want_state
        assert got_reward == 0

    # Closing step: action a is performed once the walk has reached state 8.
    got_reward = env.perform_action_a()
    assert env.current_state == start
    assert got_reward == 2