import os
import time

import numpy as np
import tensorflow as tf

# NOTE: TextLoader and Seq2SeqNMT are this project's own data-loading and
# model classes; the module paths below are assumptions -- adjust them to
# match the repo layout.
from textloader import TextLoader
from seq2seq_nmt import Seq2SeqNMT


def translate():
    # batch_size=1: decode one test sentence at a time
    textloader = TextLoader(ORIGINAL_DATA_DIR, SOURCE_VOCAB_SIZE,
                            TARGET_VOCAB_SIZE, SOURCE_LANG, TARGET_LANG,
                            _buckets, batch_size=1)
    s_vocab_path = os.path.join(
        ORIGINAL_DATA_DIR, "vocab%d.%s" % (SOURCE_VOCAB_SIZE, SOURCE_LANG))
    t_vocab_path = os.path.join(
        ORIGINAL_DATA_DIR, "vocab%d.%s" % (TARGET_VOCAB_SIZE, TARGET_LANG))
    s_vocab, _ = textloader.init_vocabulary(s_vocab_path)     # word -> id
    _, t_id2vocab = textloader.init_vocabulary(t_vocab_path)  # id -> word

    # create seq2seq model
    model = Seq2SeqNMT(SOURCE_VOCAB_SIZE, TARGET_VOCAB_SIZE, _buckets,
                       HIDDEN_UNITS, N_LAYERS, batch_size=1, learning_rate=LR)
    model.build_graph(train=False)

    chpt = tf.train.get_checkpoint_state(TRAIN_DIR)
    if chpt:
        print("restore model parameters from %s" % chpt.model_checkpoint_path)
        model.restore(chpt.model_checkpoint_path)
    else:
        print("init a new model.")
        model.init_sess()

    TEST_SENTENCE_PATH = os.path.join(ORIGINAL_DATA_DIR,
                                      "test.%s" % SOURCE_LANG)
    step = 0
    with open(TEST_SENTENCE_PATH, 'r') as f_s:
        for sentence in f_s:
            step += 1
            word_ids = textloader.sentence_to_token_id(
                tf.compat.as_bytes(sentence), s_vocab)
            # pick the smallest bucket whose source length fits the sentence;
            # fall back to the last (largest) bucket otherwise
            bid = len(_buckets) - 1
            for i, bucket in enumerate(_buckets):
                if bucket[0] >= len(word_ids):
                    bid = i
                    break
            encoder_inputs, decoder_inputs, target_weights = textloader.get_batch(
                {bid: [(word_ids, [])]}, bid)
            _, output_logits = model.predict(encoder_inputs, decoder_inputs,
                                             target_weights, bid)
            # greedy decoder: take the highest-scoring token at each step
            outputs = [int(np.argmax(logit, axis=1)) for logit in output_logits]
            # truncate at the first end-of-sentence token
            if TextLoader.EOS_ID in outputs:
                outputs = outputs[:outputs.index(TextLoader.EOS_ID)]
            result = [tf.compat.as_str(t_id2vocab[output]) for output in outputs]
            print("source(%d): %s" % (step, sentence))
            print("inference(%d): %s" % (step, result))
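
# A quick illustration of the bucket selection used in translate() above.
# This is a standalone sketch, not part of the pipeline: pick_bucket_for is
# a hypothetical helper and the bucket sizes are made-up values. With
# _buckets = [(5, 10), (10, 15), (20, 25)], a 7-token source sentence lands
# in bucket 1, since 10 is the smallest source size that still fits it;
# anything longer than 20 tokens falls back to the last bucket.
def pick_bucket_for(word_ids, buckets):
    for i, (source_size, _) in enumerate(buckets):
        if source_size >= len(word_ids):
            return i
    return len(buckets) - 1

# e.g. pick_bucket_for(list(range(7)), [(5, 10), (10, 15), (20, 25)]) -> 1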
def train():
    textloader = TextLoader(ORIGINAL_DATA_DIR, SOURCE_VOCAB_SIZE,
                            TARGET_VOCAB_SIZE, SOURCE_LANG, TARGET_LANG,
                            _buckets, BATCH_SIZE)
    (source_train, target_train,
     source_dev, target_dev, _, _) = textloader.prepare_data()
    train_data = textloader.read_data(source_train, target_train)
    # dev_data is loaded here but not consumed in the training loop below
    dev_data = textloader.read_data(source_dev, target_dev)
    textloader.init_train_bucket(train_data)

    # create seq2seq model
    model = Seq2SeqNMT(SOURCE_VOCAB_SIZE, TARGET_VOCAB_SIZE, _buckets,
                       HIDDEN_UNITS, N_LAYERS, BATCH_SIZE, LR)
    model.build_graph()

    chpt = tf.train.get_checkpoint_state(TRAIN_DIR)
    if chpt:
        print("restore model parameters from %s" % chpt.model_checkpoint_path)
        model.restore(chpt.model_checkpoint_path)
    else:
        print("init a new model.")
        model.init_sess()

    current_step = 0
    avg_time = 0.0
    avg_loss = 0.0
    for _ in range(ITERATION):
        # sample a bucket, then draw a batch of that bucket's size
        bid = textloader.pick_bucket()
        encoder_inputs, decoder_inputs, target_weights = textloader.get_batch(
            train_data, bid)
        begin_time = time.time()
        gradient_norm, loss = model.train_batch(encoder_inputs, decoder_inputs,
                                                target_weights, bid)
        # running averages over one checkpoint interval
        avg_time += (time.time() - begin_time) / STEP_PER_CKP
        avg_loss += loss / STEP_PER_CKP
        current_step += 1
        if current_step % STEP_PER_CKP == 0:
            print("total step %d learning rate %.4f avg-time %.2f avg-loss: %6f"
                  % (model.global_step.eval(session=model.sess),
                     model.learning_rate.eval(session=model.sess),
                     avg_time, avg_loss))
            chk_path = os.path.join(TRAIN_DIR, "nmt.ckpt." + str(current_step))
            model.save(chk_path)
            avg_time = 0.0
            avg_loss = 0.0
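
# A minimal command-line entry point so the two functions above can be run
# from the shell. This is a sketch under assumptions: the original repo may
# wire this up differently, and the --mode flag name is invented here.
if __name__ == "__main__":
    import argparse

    parser = argparse.ArgumentParser(description="seq2seq NMT")
    parser.add_argument("--mode", choices=["train", "translate"],
                        default="train",
                        help="train a model or decode the test set")
    args = parser.parse_args()

    if args.mode == "train":
        train()
    else:
        translate()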