Python Tool.build_vocab Examples

Programming Language: Python

Namespace/Package Name: tool

Class/Type: Tool

Method/Function: build_vocab

Examples at hotexamples.com: 2

Python Tool.build_vocab - 2 examples found. These are the top-rated real-world Python examples of tool.Tool.build_vocab extracted from open source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

Tool(30)

check_type(10)

check_isKeyword(7)

replaceNonASCII(7)

removeNonAscii(7)

_is_array(5)

get_md5(4)

get_PAD_ID(4)

get_B_ID(4)

__init__(4)

get_vocab_size(4)

check_isKeyword_picAssets(3)

get_vocab(2)

items(2)

idxes2line(2)

conv_encoding(2)

get_win_height(2)

build_vocab(2)

check_pic_type(2)

get_win_width(2)

line2idxes(2)

get_E_ID(2)

_invert_dol(2)

get_UNK_ID(2)

NeedTime(2)

get_ivocab(2)

get_yaml(2)

get_project_dir(1)

get_tag_vocab(1)

get_text_vocab(1)

get_view_state(1)

keys2tensor(1)

hexs_to_int(1)

indices2sent(1)

io(1)

isAttributeValid(1)

get_host_by_name(1)

keywords2tensor(1)

lengths2tensor(1)

line2tensor(1)

load_data(1)

populate_components_listbox(1)

populate_components_listbox_wo_select(1)

routes_by_controllers(1)

get_iterator(1)

AES_Decrypt(1)

get_hidden_tag_vocab(1)

fill(1)

FZ(1)

SetPrintDisable(1)

Example #1

Show file

File: train.py Project: shadowkiller33/StyIns

def main():
    """Build the vocabulary, finalize the hyper-parameters, and run training.

    Picks the hyper-parameter set from ``args.task`` (``yelp_hps`` for
    ``'yelp'``, ``gyafc_hps`` for anything else), fills in the fields that
    depend on the vocabulary, waits for the user to confirm the settings, and
    then runs ``pretrain`` followed by ``train``.
    """
    args = parse_args()

    hps = yelp_hps if args.task == 'yelp' else gyafc_hps

    tool = Tool(vocab_file=hps.vocab_path, n_ins=hps.n_ins,
        batch_size=hps.batch_size, max_len=hps.max_len, r_superv=hps.r_superv,
        corrupt_ratio=hps.corrupt_ratio)

    tool.build_vocab([hps.unpaired_train_data, hps.paired_train_data])

    # These values are only read after build_vocab() has been called.
    vocab_size = tool.vocabulary_size
    pad_idx = tool.pad_idx
    bos_idx = tool.bos_idx
    assert vocab_size > 0 and pad_idx >= 0 and bos_idx >= 0
    hps = hps._replace(vocab_size=vocab_size, pad_idx=pad_idx, bos_idx=bos_idx)

    print("hyper-parameters:")
    print(hps)
    # input() only returns once the user hits Enter, so say so in the prompt.
    input("please check the hyper-parameters, and then press Enter to continue >")

    generator = Seq2Seq(hps, device)
    generator = generator.to(device)

    discriminator = Discriminator(hps, device)
    discriminator = discriminator.to(device)

    pretrain_method = hps.pretrain_method

    pretrain(generator, tool, hps, device, pretrain_method)
    train(generator, discriminator, tool, hps, device, pretrain_method)

Example #2

Show file

class Generator(object):
    """Inference wrapper around a restored ``Seq2Seq`` model.

    Holds the model, the ``Tool`` used to convert between text and tensors,
    and the finalized hyper-parameters, and exposes greedy decoding for a
    single source sentence.
    """

    def __init__(self, hps, device, epoch=None):
        """Build the vocabulary, restore the model, and load validation data.

        Args:
            hps: hyper-parameter record; it must support ``_replace`` and
                provide the fields read below (``vocab_path``, ``ckpt_path``,
                ``unpaired_valid_data``, ...).
            device: device the model and all inference tensors are moved to.
            epoch: forwarded to ``utils.restore_checkpoint_generator`` as
                ``specified_epoch``.
        """
        self.device = device

        # corrupt_ratio is fixed to 0.0 here instead of being read from hps.
        self.tool = Tool(vocab_file=hps.vocab_path,
                         n_ins=hps.n_ins,
                         batch_size=hps.batch_size,
                         max_len=hps.max_len,
                         r_superv=hps.r_superv,
                         corrupt_ratio=0.0)

        self.tool.build_vocab([hps.unpaired_train_data, hps.paired_train_data])

        # Fill in the hyper-parameters that depend on the built vocabulary.
        vocab_size = self.tool.vocabulary_size
        pad_idx = self.tool.pad_idx
        bos_idx = self.tool.bos_idx
        assert vocab_size > 0 and pad_idx >= 0 and bos_idx >= 0
        self.hps = hps._replace(vocab_size=vocab_size,
                                pad_idx=pad_idx,
                                bos_idx=bos_idx)

        # Create the model and restore its weights from the checkpoint.
        model = Seq2Seq(self.hps, device)
        utils.restore_checkpoint_generator(hps.ckpt_path,
                                           device,
                                           model,
                                           optimizer=None,
                                           specified_epoch=epoch,
                                           prefix="")

        model.eval()

        self.model = model.to(device)

        self.tool.close_corruption()
        # we use unpaired validation data to build stylistic instances for generation
        self.tool.build_valid_data(self.hps.unpaired_valid_data, None)

    def reload_checkpoint(self, epoch):
        """Restore the weights of ``epoch`` into the existing model.

        The model is moved back to ``self.device`` and put in eval mode
        afterwards.
        """
        utils.restore_checkpoint_generator(self.hps.ckpt_path,
                                           self.device,
                                           self.model,
                                           optimizer=None,
                                           specified_epoch=epoch,
                                           prefix="")

        self.model = self.model.to(self.device)
        self.model.eval()

    def greedy_search(self, src, ins):
        """Greedily decode one sentence.

        Runs at most ``2 * src.size(1)`` decoder steps, feeding the
        highest-probability token of each step back in as the next input,
        and stops right after ``self.tool.eos_idx`` has been produced.

        Args:
            src: source tensor passed to ``inference_init_encoder``; its
                second dimension bounds the number of decoding steps.
            ins: style instances passed to ``inference_init_encoder``.

        Returns:
            ``(trans, costs)``: the list of chosen token ids (including the
            final EOS id when one was produced) and the accumulated negative
            log-probability of those tokens.
        """
        # Only Python ints/floats leave this method, so skip autograd tracking.
        with torch.no_grad():
            enc_outs, states, style_feature, attn_mask = (
                self.model.inference_init_encoder(src, ins))

            inps = torch.tensor(self.tool.bos_idx,
                                dtype=torch.long,
                                device=self.device).view(1, 1)
            max_steps = src.size(1) * 2

            trans = []
            costs = 0.0
            for _step in range(max_steps):
                _, probs, states = self.model.dec_step(inps, states, enc_outs,
                                                       attn_mask, style_feature)
                top1 = probs.max(1)[1]
                inps = top1.unsqueeze(1)

                # .item() requires a single-element tensor, i.e. one sentence
                # is decoded at a time.
                token = top1.item()
                trans.append(token)
                # The epsilon keeps log() finite for a zero probability.
                costs -= np.log(probs[0, token].item() + 1e-12)

                if token == self.tool.eos_idx:
                    break

        return trans, costs

    def generate_one(self, src_sent, style_id):
        """Generate an output sentence for ``src_sent`` using ``style_id``.

        Returns:
            ``(sentence, "ok")`` on success, or ``("", "generation failed!")``
            when decoding produced no tokens.
        """
        sent = src_sent.strip()

        src = self.tool.build_inference_src(sent)
        src = src.to(self.device)  # (1, T)

        # (K, 1, L)
        ins = self.tool.build_inference_instances(style_id, sent)
        ins = ins.to(self.device)

        trans, _costs = self.greedy_search(src, ins)

        if not trans:
            return "", "generation failed!"

        return self.tool.indices2sent(trans), "ok"