class UsableEncoder:
    """Wraps a trained skip-thought model so that sentences can be turned
    into thought vectors via :meth:`encode`."""

    def __init__(self, loc, WORD_DICT):
        """Load the word dictionary and restore the saved encoder weights.

        loc       -- path to the saved model state-dict file.
        WORD_DICT -- path to the pickled word dictionary.
        """
        print("Preparing the DataLoader. Loading the word dictionary")
        self.d = DataLoader(sentences=[''],
                            word_dict=load_dictionary(WORD_DICT))

        print("Loading encoder from the saved model at {}".format(loc))
        model = UniSkip()
        # map_location keeps every tensor on CPU at load time; the second
        # lambda argument is named `location` (not `loc`) so it does not
        # shadow the checkpoint path parameter above.  CUDA placement, if
        # enabled, happens explicitly below.
        model.load_state_dict(
            torch.load(loc, map_location=lambda storage, location: storage))
        self.encoder = model.encoder
        if USE_CUDA:
            self.encoder.cuda(CUDA_DEVICE)
            print('using cuda')

    def encode(self, text):
        """Encode an iterable of sentences, 100 at a time, into a
        (len(text), thought_size) numpy array of thought vectors."""
        def chunks(l, n):
            """Yield successive n-sized chunks from l."""
            for i in range(0, len(l), n):
                yield l[i:i + n]

        ret = []
        for chunk in chunks(text, 100):
            indices = [
                self.d.convert_sentence_to_indices(sentence)
                for sentence in chunk
            ]
            indices = torch.stack(indices)
            indices, _ = self.encoder(indices)
            indices = indices.view(-1, self.encoder.thought_size)
            indices = indices.data.cpu().numpy()
            ret.extend(indices)
        return np.array(ret)
# NOTE(review): this is a second definition of UsableEncoder in the same
# module; at import time it shadows the earlier one.  Consider keeping only
# one variant — TODO confirm which one callers actually use.
class UsableEncoder:
    """Loads the best previously trained skip-thought model and exposes
    :meth:`encode` to turn sentences into thought vectors."""

    def __init__(self, loc="./saved_models/skip-best",
                 word_dict="./data/dummy_corpus.txt.pkl"):
        """Build the DataLoader and restore the encoder weights.

        loc       -- path to the best saved model checkpoint.
        word_dict -- path to the pickled word dictionary (new keyword
                     parameter; defaults to the previously hard-coded path,
                     so existing callers are unaffected).
        """
        print("Preparing the DataLoader. Loading the word dictionary")
        self.d = DataLoader(
            sentences=[''],
            word_dict=load_dictionary(word_dict))
        self.encoder = None

        print("Loading encoder from the saved model at {}".format(loc))
        model = UniSkip()  # instantiate the model architecture
        # map_location keeps tensors on CPU; the lambda's second argument is
        # named `location` so it no longer shadows the `loc` parameter above.
        model.load_state_dict(
            torch.load(loc, map_location=lambda storage, location: storage))
        self.encoder = model.encoder
        if USE_CUDA:
            self.encoder.cuda(CUDA_DEVICE)  # move the encoder to the GPU

    def encode(self, text):
        """Encode the sentences in `text`, in batches of 100, into a
        (len(text), thought_size) numpy array of thought vectors."""
        def chunks(l, n):
            """Yield successive n-sized chunks from l."""
            for i in range(0, len(l), n):
                yield l[i:i + n]

        ret = []
        for chunk in chunks(text, 100):  # process sentences in batches of 100
            print("encoding chunk of size {}".format(len(chunk)))
            indices = [
                self.d.convert_sentence_to_indices(sentence)
                for sentence in chunk
            ]
            indices = torch.stack(indices)
            indices, _ = self.encoder(indices)  # run the encoder forward pass
            indices = indices.view(-1, self.encoder.thought_size)
            indices = indices.data.cpu().numpy()
            ret.extend(indices)
        return np.array(ret)