Python get_actions示例

编程语言: Python

命名空间/包名称: framework

方法/功能: get_actions

hotexamples.com的示例: 2

Python get_actions - 共找到 2 个示例。以下是从开源项目中提取的、最受好评的 framework.get_actions 真实 Python 代码示例。您可以为示例评分，以帮助我们提高示例质量。

示例#1

显示文件

from tqdm import tqdm
import framework
import utils

# Debug switch; how it is consumed is not visible in this excerpt.
DEBUG = False

# Hyperparameters (meanings taken from the original inline comments).
GAMMA = 0.5  # discount factor
TRAINING_EP = 0.5  # epsilon-greedy parameter for training
TESTING_EP = 0.05  # epsilon-greedy parameter for testing
NUM_RUNS = 10  # presumably the number of independent runs -- TODO confirm
NUM_EPOCHS = 600  # presumably the number of epochs per run -- TODO confirm
NUM_EPIS_TRAIN = 25  # number of episodes for training at each epoch
NUM_EPIS_TEST = 50  # number of episodes for testing
ALPHA = 0.001  # learning rate for training

# Action and object collections supplied by the `framework` module; this
# excerpt only uses their lengths.
ACTIONS = framework.get_actions()
OBJECTS = framework.get_objects()
NUM_ACTIONS = len(ACTIONS)
NUM_OBJECTS = len(OBJECTS)


def tuple2index(action_index, object_index):
    """Flatten an (action, object) index pair into a single index.

    The pair is laid out row-major with ``NUM_OBJECTS`` entries per
    action, i.e. the result is
    ``action_index * NUM_OBJECTS + object_index``.
    """
    row_start = action_index * NUM_OBJECTS
    return row_start + object_index


def index2tuple(index):
    """Split a flat index into its (action_index, object_index) pair.

    Returns the quotient and remainder of ``index`` divided by
    ``NUM_OBJECTS``, in that order.
    """
    action_index, object_index = divmod(index, NUM_OBJECTS)
    return action_index, object_index

示例#2

显示文件

文件： agent_linear_pytorch.py 项目： Sumit-ai/MIT-course-solutions

import numpy as np
import matplotlib.pyplot as plt
from tqdm import tqdm

# Debug switch; how it is consumed is not visible in this excerpt.
DEBUG = False

# Hyperparameters (meanings taken from the original inline comments).
GAMMA = 0.5 # discount factor
TRAINING_EP = 0.5 # epsilon-greedy parameter for training
TESTING_EP = 0.05 # epsilon-greedy parameter for testing
NUM_RUNS = 10 # presumably the number of independent runs -- TODO confirm
NUM_EPOCHS = 600 # presumably the number of epochs per run -- TODO confirm
NUM_EPIS_TRAIN = 25 # number of episodes for training at each epoch
NUM_EPIS_TEST = 50 # number of episodes for testing
ALPHA = 0.001 # learning rate for training

# NOTE(review): `framework` is not imported in the visible part of this
# excerpt -- confirm that the full file imports it before these lines run.
# Only the lengths of the returned collections are used here.
actions = framework.get_actions()
objects = framework.get_objects()
NUM_ACTIONS = len(actions)
NUM_OBJECTS = len(objects)

# Module-level placeholders, initialised to None; presumably assigned
# later in the file (not visible here) -- TODO confirm.
model = None
optimizer = None

def tuple2index(action_index, object_index):
    """Map an (action_index, object_index) pair to one flat index.

    Computed as ``action_index * NUM_OBJECTS + object_index``.
    """
    flat_index = action_index * NUM_OBJECTS + object_index
    return flat_index

def index2tuple(index):
    """Map a flat index back to an (action_index, object_index) pair.

    The first element is ``index // NUM_OBJECTS`` and the second is
    ``index % NUM_OBJECTS``.
    """
    action_index = index // NUM_OBJECTS
    object_index = index % NUM_OBJECTS
    return action_index, object_index


# bag-of-words embedding