def init(point_dict):
    """Build one Agent per node in *point_dict* (node 0 excluded).

    All nodes share a single pretrained PolicyGradient brain, while each
    node gets its own independent PID controller and its own environment
    instance. Populates the module-level ``Agent_dict``, keyed by node id.

    Args:
        point_dict: mapping of node id -> node data passed to ``env(...)``.
            NOTE(review): exact value schema not visible here — confirm
            against the caller.
    """
    rl_brain = PolicyGradient(
        n_actions=env.action_space_num,
        n_features=env.obs_num,
        learning_rate=0.02,
        reward_decay=0.99,
        # output_graph=True,
    )
    rl_brain.load_model(
        path='ReinforceLearning/saved_model/PG - 1/policy_gradient.ckpt')
    # All nodes share one RL brain; the PID controllers are independent.
    for node_id in point_dict:  # renamed from `id` to avoid shadowing the builtin
        if node_id != 0:  # node 0 gets no agent — presumably a root/reference node; confirm
            pid_brain = PID(100, 0.1, 1, 100)
            e = env(point_dict[node_id])
            Agent_dict[node_id] = Agent(rl_brain, pid_brain, e)
The cart pole example View more on my tutorial page: https://morvanzhou.github.io/tutorials/ Using: Tensorflow: 1.0 gym: 0.8.0 """ import gym from ReinforceLearning.brain.Policy_Gradient import PolicyGradient import matplotlib.pyplot as plt from ReinforceLearning.environment.env import env from simulation.output_generator import output_generator RENDER = False # rendering wastes time MAX_REWARD = 0 Myenv = env(max_energy=500) output = output_generator(scale=20, bias=20, period=200, phase=0, max_iter=20000) # output.load("imagedata.npy") Myenv.output_need = output.output # print(env.action_space) # print(env.observation_space) # print(env.observation_space.high) # print(env.observation_space.low) RL = PolicyGradient( n_actions=Myenv.action_space_num, n_features=Myenv.obs_num,
Using: Tensorflow: 1.0 gym: 0.8.0 """ import numpy as np from ReinforceLearning.brain.Policy_Gradient import PolicyGradient import matplotlib.pyplot as plt from ReinforceLearning.environment.env import env from simulation.output_generator import output_generator from method.myfunc import smooth DISPLAY_REWARD_THRESHOLD = 400 # renders environment if total episode reward is greater then this threshold RENDER = False # rendering wastes time Myenv = env() output = output_generator(scale=20, bias=20, period=200, phase=0, max_iter=20000) output.load("imagedata.npy") Myenv.output_need = output.output # print(env.action_space) # print(env.observation_space) # print(env.observation_space.high) # print(env.observation_space.low) RL = PolicyGradient( n_actions=Myenv.action_space_num, n_features=Myenv.obs_num,
def set_env(self):
    """Create an environment bound to this object and store it on ``self.env``.

    NOTE(review): relies on a project-level ``env`` class being in scope
    at the module level — confirm the import in the enclosing file.
    """
    self.env = env(self)