Code Example #1
print "Seed = %d" %  RANDOM_SEED
np .random.seed     (RANDOM_SEED)
random.seed         (RANDOM_SEED)

#env                 = Pendulum(2,withDisplay=True)       # Continuous pendulum
env                 = Pendulum(2,length=.5,mass=3.0,armature=.2,withDisplay=False)
env.withSinCos      = False             # If True, each angle q is encoded as (cos q, sin q) in the observation.
NX                  = env.nobs          # Observation dimension (training also converges on raw q,qdot, with ~2x more neurons).
NU                  = env.nu            # Control dimension: one torque per joint.

env.vmax            = 100.
env.Kf              = np.diagflat([ 0.2, 2. ])
env.modulo          = False

env.DT              = 0.15
env.NDT             = 1
#env.umax            = 15.
#env.umax            = (15.,15.)
env.umax            = np.matrix([5.,10.]).T
NSTEPS              = 32

env.qlow[1] = -np.pi
env.qup [1] = np.pi
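
# Illustrative sketch (not part of the original script): env.umax above sets a
# per-joint torque bound (5 N.m and 10 N.m). The Pendulum class presumably clips
# the requested control to these limits; such a clipping looks like this:
u         = np.matrix([7., -12.]).T                           # requested torques
u_clipped = np.maximum(-env.umax, np.minimum(env.umax, u))    # -> matrix([[5.], [-10.]])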


# Shortcut to convert an SE3 placement to the viewer's 7-component (xyz + quaternion) configuration.
M2gv      = lambda M: XYZQUATToViewerConfiguration(se3ToXYZQUAT(M))
def place(objectId, M):
    robot.viewer.gui.applyConfiguration(objectId, M2gv(M))
    robot.viewer.gui.refresh()  # Refresh the window.
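
# Illustrative usage sketch (assumptions: pinocchio importable as pin, and an object
# named 'world/target' already added to the viewer; older pinocchio builds expect
# np.matrix arguments, newer ones plain numpy arrays):
import pinocchio as pin
M = pin.SE3(np.matrix(np.eye(3)), np.matrix([0., 0., 1.]).T)   # identity rotation, 1 m along z
place('world/target', M)                                       # convert to xyz+quat and refresh the GUI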
Code Example #2
import tensorflow as tf   # TF1-style API (tf.trainable_variables, etc.)
import tflearn
# Pendulum is the project's own environment class (import not shown in this excerpt).

DECAY_RATE = 0.99  # Discount factor
UPDATE_RATE = 0.01  # Homotopy rate to update the networks
REPLAY_SIZE = 10000  # Size of replay buffer
BATCH_SIZE = 64  # Number of points to be fed in stochastic gradient
NH1 = NH2 = 250  # Hidden layer size
RESTORE = "netvalues/actorcritic"  # Previously optimized net weights
# (set to an empty string if none)
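
# Illustrative sketch (not from the original script): the "homotopy rate" above is,
# in DDPG-style actor-critic code, typically the soft-update (Polyak averaging)
# coefficient with which the target networks track the learned ones:
def soft_update(target_params, learned_params, rate=UPDATE_RATE):
    """Move each target parameter a small step toward its learned counterpart."""
    return [(1. - rate) * pt + rate * p for pt, p in zip(target_params, learned_params)]
# With rate = 0.01 the targets lag the learned networks by roughly 100 updates,
# which keeps the bootstrapped Q-targets stable.
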
### --- Environment
env = Pendulum(1)  # Continuous pendulum
env.withSinCos = True  # State is dim-3: (cosq,sinq,qdot) ...
NX = env.nobs  # ... training converges with q,qdot with 2x more neurones.
NU = env.nu  # Control is dim-1: joint torque

env.vmax = 100.
env.DT = .15
env.NDT = 2
env.Kf = 0.2
NSTEPS = 30
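
# Illustrative rollout sketch (assumption: Pendulum exposes a gym-like reset()/step(u)
# interface returning the observation, with step() also returning a reward; the real
# interface is not shown in this excerpt):
import numpy as np
x = env.reset()                 # initial observation
for t in range(NSTEPS):
    u = np.zeros(NU)            # placeholder policy: zero torque
    x, reward = env.step(u)     # one control step of DT seconds (NDT internal sub-steps)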

### --- Q-value and policy networks


class QValueNetwork:
    def __init__(self):
        nvars = len(tf.trainable_variables())

        x = tflearn.input_data(shape=[None, NX])
        u = tflearn.input_data(shape=[None, NU])

        netx1 = tflearn.fully_connected(x,
                                        NH1,
Code Example #3
BATCH_SIZE              = 64            # Number of points to be fed in stochastic gradient
NH1 = NH2               = 250           # Hidden layer size
RESTORE                 = ""            #"netvalues/actorcritic.15.kf2"   # Previously optimized net weights
                                        # (set to an empty string if none)
RENDERRATE              = 20            # Render rate (rollout and plot) during training (0 = disabled)
#RENDERACTION            = [ 'saveweights',  'draw', 'rollout' ]
REGULAR                 = True          # Render on a regular grid (True) or a random grid (False)

### --- Environment
env                     = Pendulum(1)       # Continuous pendulum
env.withSinCos          = True              # State is dim-3: (cosq,sinq,qdot) ...
NX                      = env.nobs          # ... training converges with q,qdot with 2x more neurones.
NU                      = env.nu            # Control is dim-1: joint torque

env.DT                  = .15
env.NDT                 = 2
env.Kf                  = 0.2
env.vmax                = 100

RENDERACTION            = [ 'draw', ]
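
# Illustrative gating helper (not from the original script): how RENDERRATE and
# RENDERACTION are meant to be consumed during training; the actual draw/rollout/
# save code is not part of this excerpt:
def maybe_render(episode):
    if not RENDERRATE or episode % RENDERRATE:
        return                                   # render only every RENDERRATE episodes (0 = never)
    if 'draw' in RENDERACTION:
        print("episode %d: plot value/policy on a %s grid" % (episode, 'regular' if REGULAR else 'random'))
    if 'rollout' in RENDERACTION:
        print("episode %d: roll out the current policy in the viewer" % episode)
    if 'saveweights' in RENDERACTION:
        print("episode %d: save the network weights" % episode)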

# Alternative 2-dof pendulum configuration, disabled by wrapping it in a string literal:
'''

env = Pendulum(2,length=.5,mass=3.0,armature=10.)
env.withSinCos      = True              # State is dim-3: (cosq,sinq,qdot) ...
NX                  = env.nobs          # ... training converges with q,qdot with 2x more neurones.
NU                  = env.nu            # Control is dim-1: joint torque

env.DT              = 0.2
env.NDT             = 1
env.Kf              = 10.0 # 1.0
Code Example #4
import tensorflow as tf   # TF1-style API (tf.trainable_variables, etc.)
import tflearn
# Pendulum is the project's own environment class (import not shown in this excerpt).

BATCH_SIZE = 64  # Number of points to be fed in stochastic gradient
NH1 = NH2 = 250  # Hidden layer size
RESTORE = "netvalues/actorcritic.dt015.kf02.ep1300"  # Previously optimized net weights
# (set to an empty string if none)
### --- Environment
env = Pendulum(1)  # Continuous pendulum
env.withSinCos = True  # State is dim-3: (cosq,sinq,qdot) ...
NX = env.nobs  # ... training converges with q,qdot with 2x more neurones.
NU = env.nu  # Control is dim-1: joint torque

env.vmax = 100.
env.Kf = 0.2
env.modulo = False

env.DT = 0.15
env.NDT = 1
NSTEPS = 32  # Number of integration steps in horizon
NNODES = 8  # Number of shooting nodes
FNODES = NSTEPS // NNODES  # Number of integration steps per shooting interval ...
assert not NSTEPS % NNODES  # ... which must be an integer
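# Note: with these values each shooting interval covers FNODES = 32 // 8 = 4 integration
# steps of DT = 0.15 s, so the full horizon is 32 * 0.15 = 4.8 s split over 8 shooting nodes.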

### --- Q-value and policy networks


class QValueNetwork:
    def __init__(self):
        nvars = len(tf.trainable_variables())

        x = tflearn.input_data(shape=[None, NX])
        u = tflearn.input_data(shape=[None, NU])