def run_trial(planning_horizon, world_size=None, episodes=None):
    """Run one Monte-Carlo learning trial and collect per-episode returns.

    Parameters
    ----------
    planning_horizon : int
        Horizon handed to the ``Planner`` used by this trial.
    world_size : int, optional
        Number of blocks in the generated blocks world. Defaults to the
        module-level ``blocks_world_size`` (keeps existing call sites
        working unchanged).
    episodes : int, optional
        Number of learning episodes. Defaults to the module-level
        ``number_of_episodes``.

    Returns
    -------
    pandas.DataFrame
        Columns ``episode`` (0..n-1) and ``observed_returns`` (the
        per-episode returns recorded by ``MonteCarlo``).
    """
    # Fall back to the module-level experiment configuration when the
    # caller does not override it — backward compatible with the original
    # global-reading behavior.
    if world_size is None:
        world_size = blocks_world_size
    if episodes is None:
        episodes = number_of_episodes

    builder = BlocksWorldBuilder(world_size)
    control = SimpleMonteCarloControl()
    trial_planner = Planner(planning_horizon)
    mc = MonteCarlo(
        builder,
        trial_planner,
        control=control,
        # Episode cap scales with world size (original heuristic: 2x).
        max_episode_length=world_size * 2,
        planning_factor=0,
        plan_on_empty_policy=True,
        exploring_starts=True,
        exploring_factor=0,
    )
    mc.learn_policy(
        number_episodes=episodes,
        show_progress_bar=True,
        evaluate_return_ratio=False,
    )

    return pd.DataFrame({
        'episode': range(len(mc.returns)),
        'observed_returns': mc.returns,
    })
import os
import sys

# Make sure the path of the framework is included in the import path.
sys.path.insert(
    0, os.path.abspath(os.path.join(os.path.dirname(__file__), '../..')))

from tests import test_policy
from MonteCarlo import MonteCarlo
from mdp import BlocksWorldBuilder
from control import SimpleMonteCarloControl, SgdMonteCarloControl
from planner import Planner
from matplotlib import pyplot as plt

# Experiment setup: a 7-block world with a planning horizon of 5, driven
# by plain (non-SGD) Monte-Carlo control.
mdp_builder = BlocksWorldBuilder(blocks_world_size=7)
planner = Planner(planning_horizon=5)
ctrl = SimpleMonteCarloControl()

# Pure model-free learning (planning_factor=0) with exploring starts;
# episodes are capped at 14 steps (twice the world size).
mc = MonteCarlo(mdp_builder, planner,
                control=ctrl,
                max_episode_length=14,
                planning_factor=0,
                plan_on_empty_policy=True,
                exploring_starts=True,
                exploring_factor=0.0)

# Train for 150 episodes and keep the resulting greedy policy.
learned_policy = mc.learn_policy(number_episodes=150, show_progress_bar=True)