示例#1
0
class UsableEncoder:
    """Wraps a trained skip-thought encoder so sentences can be turned
    into fixed-size thought vectors."""

    def __init__(self, loc, WORD_DICT):
        """Build the DataLoader from the pickled dictionary at WORD_DICT
        and load trained encoder weights from the checkpoint at loc."""
        print("Preparing the DataLoader. Loading the word dictionary")
        vocabulary = load_dictionary(WORD_DICT)
        self.d = DataLoader(sentences=[''], word_dict=vocabulary)
        self.encoder = None  # set once the checkpoint has been loaded

        print("Loading encoder from the saved model at {}".format(loc))
        model = UniSkip()
        # map_location keeps tensors on the CPU while loading; the encoder
        # is moved to the GPU afterwards when USE_CUDA is set.
        state = torch.load(loc, map_location=lambda storage, _location: storage)
        model.load_state_dict(state)
        self.encoder = model.encoder
        if USE_CUDA:
            self.encoder.cuda(CUDA_DEVICE)
            print('using cuda')

    def encode(self, text):
        """Encode an indexable collection of sentences in batches of 100
        and return the thought vectors as a 2-D numpy array."""

        def batches(seq, size):
            """Yield successive size-sized slices of seq."""
            for start in range(0, len(seq), size):
                yield seq[start:start + size]

        vectors = []
        for batch in batches(text, 100):
            index_tensors = [
                self.d.convert_sentence_to_indices(sentence)
                for sentence in batch
            ]
            stacked = torch.stack(index_tensors)
            encoded, _ = self.encoder(stacked)
            flattened = encoded.view(-1, self.encoder.thought_size)
            vectors.extend(flattened.data.cpu().numpy())
        return np.array(vectors)
示例#2
0
class UsableEncoder:
    """Wraps a trained skip-thought encoder so sentences can be turned
    into fixed-size thought vectors."""

    def __init__(self, loc="./saved_models/skip-best",
                 word_dict="./data/dummy_corpus.txt.pkl"):
        """Load the word dictionary and the best saved model.

        Args:
            loc: path to the saved model checkpoint (best model from training).
            word_dict: path to the pickled word dictionary. New optional
                parameter; the default preserves the previously hard-coded
                path, so existing callers are unaffected.
        """
        print("Preparing the DataLoader. Loading the word dictionary")
        self.d = DataLoader(
            sentences=[''],
            word_dict=load_dictionary(word_dict))
        self.encoder = None  # replaced below once the checkpoint is loaded

        print("Loading encoder from the saved model at {}".format(loc))
        model = UniSkip()
        # map_location keeps tensors on the CPU while loading; the lambda
        # parameter is renamed so it no longer shadows `loc`.
        model.load_state_dict(
            torch.load(loc, map_location=lambda storage, _location: storage))
        self.encoder = model.encoder
        if USE_CUDA:
            self.encoder.cuda(CUDA_DEVICE)  # move the encoder to the GPU

    def encode(self, text):
        """Encode sentences in chunks of 100 and return an
        (N, thought_size) numpy array of thought vectors."""

        def chunks(l, n):
            """Yield successive n-sized chunks from l."""
            for i in range(0, len(l), n):
                yield l[i:i + n]

        ret = []
        for chunk in chunks(text, 100):
            print("encoding chunk of size {}".format(len(chunk)))
            indices = torch.stack([
                self.d.convert_sentence_to_indices(sentence)
                for sentence in chunk
            ])
            encoded, _ = self.encoder(indices)
            encoded = encoded.view(-1, self.encoder.thought_size)
            ret.extend(encoded.data.cpu().numpy())
        return np.array(ret)