def main():
    """Collect random-policy transitions from BreakoutDeterministic-v4.

    Plays ``num_games`` episodes with uniformly random actions, stacking
    preprocessed frames in a 5-slot RingBuffer so that consecutive
    4-frame states (prev/next) can be sliced out, then converts the
    accumulated transition lists to numpy arrays and builds the Q-model.

    Side effects: renders the environment each step; no return value.
    """
    env = gym.make('BreakoutDeterministic-v4')
    frame = env.reset()
    env.render()

    frames_per_action = 4          # env steps taken per sampled action
    num_actions = 4                # Breakout action-space size, fed to atari_model
    ATARI_SHAPE_PLUSONE = (105, 80, 5)  # NOTE(review): unused here — presumably the stacked-state shape; confirm
    num_games = 10

    # 5 frames -> one overlapping (prev, next) pair of 4-frame states.
    this_states = RingBuffer(5)
    this_rewards = RingBuffer(4)

    all_prev_states = []
    all_next_states = []
    all_actions = []
    all_rewards = []
    all_isterminal = []

    prev_frame = preprocess(frame)
    for this_game in range(num_games):
        iter_count = 0
        is_done = False
        while not is_done:
            this_action = env.action_space.sample()
            this_action_onehot = action_to_onehot(this_action)  # NOTE(review): currently unused
            this_states.append(prev_frame)
            for action_count in range(frames_per_action):
                frame, reward, is_done, _ = env.step(this_action)
                this_states.append(preprocess(frame))
                this_rewards.append(transform_reward(reward))
                if not is_done:
                    env.render()
                else:
                    frame = env.reset()
                    env.render()
                    break
            # BUG FIX: was `prev_frame = frame`, which stored the RAW frame
            # while every other entry in this_states is preprocessed.
            # Keep the buffer homogeneous by preprocessing here too.
            prev_frame = preprocess(frame)
            if iter_count > 0:
                all_prev_states.append(this_states.clip_from_end(1))
                all_next_states.append(this_states.clip_from_start(1))
                # NOTE(review): this appends the same mutable RingBuffer
                # object every iteration — all entries alias one buffer
                # that keeps changing. Likely needs a snapshot/copy here;
                # RingBuffer's copy API isn't visible, so left as-is.
                all_rewards.append(this_rewards)
                all_actions.append(this_action)
                all_isterminal.append(int(is_done))
            iter_count += 1

    # Convert collected transitions to arrays for training.
    np_prev_states = np.asarray(all_prev_states)
    np_next_states = np.asarray(all_next_states)
    np_rewards = np.asarray(all_rewards)
    np_actions = np.asarray(all_actions)
    np_isterminal = np.asarray(all_isterminal)
    np_num_objects = np.size(np_isterminal)

    t_model = atari_model(num_actions)