# Standard-library and third-party imports this snippet needs; project-local
# modules (create_model, model_population_based_tunning, utils, DatasetManager,
# FLAGS) are assumed to come from the surrounding repository.
import json
import logging

import numpy as np
import tensorflow as tf


def run(experiment_name):
    BEST_THRES = 3  # top models left untouched during exploration
    WORST_THRES = 3  # worst models overwritten by the best each step
    POPULATION_STEPS = 500
    ITERATIONS = 100  # training batches per population step
    POPULATION_SIZE = 10
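    # History buffers: per-model accuracy / L1-scale traces plus the
    # best-of-population trace recorded at every population step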
    accuracy_hist = np.zeros((POPULATION_SIZE, POPULATION_STEPS))
    l1_scale_hist = np.zeros((POPULATION_SIZE, POPULATION_STEPS))
    best_accuracy_hist = np.zeros((POPULATION_STEPS, ))
    best_l1_scale_hist = np.zeros((POPULATION_STEPS, ))

    with tf.Graph().as_default() as gr:

        with tf.variable_scope('input'):
            tf_input = tf.placeholder(
                dtype=tf.int32,
                shape=[
                    None, model_population_based_tunning.SENTENCE_LENGTH_MAX
                ],
                name='tf_input')
            tf_labels = tf.placeholder(dtype=tf.int32,
                                       shape=[None],
                                       name='tf_labels')

        models = [
            create_model(
                i, is_included_regularization=FLAGS.IS_INCLUDED_REGULARIZATION)
            for i in range(POPULATION_SIZE)
        ]
        # Give each model its own variable scope so their variables don't collide
        for index, model in enumerate(models):
            with tf.variable_scope(str(index)):
                model.boot(tf_input, tf_labels)

        logging.info('Graph size: %s', utils.count_trainable_variables())

        gpu_options = tf.GPUOptions(per_process_gpu_memory_fraction=FLAGS.GPU)
        with tf.Session(config=tf.ConfigProto(
                gpu_options=gpu_options,
                allow_soft_placement=True,
                log_device_placement=FLAGS.LOG_DEVICE_PLACEMENT)).as_default(
                ) as sess:
            sess.run(tf.global_variables_initializer())
            sess.run(tf.local_variables_initializer())

            dataset_manager = DatasetManager()
            dataset_manager.boot()

            dataset_generator = dataset_manager.get_batch(
                batch_size=FLAGS.BATCH_SIZE,
                number_epochs=10 * FLAGS.NUMBER_EPOCHS)
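            # Population-based training loop: each step exploits (copy the
            # best model's weights into the worst models), explores (perturb
            # the L1 scale outside the top performers), trains every model
            # for ITERATIONS batches, then re-ranks the population.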
            for i in range(POPULATION_STEPS):

                # Exploit: copy the best model's weights into the worst
                # WORST_THRES models
                sess.run([
                    m.get_copy_from_op(models[0])
                    for m in models[-WORST_THRES:]
                ])
                # Explore: perturb the L1 scale of every model outside the
                # top BEST_THRES
                sess.run([m.l1_scale_perturb_op for m in models[BEST_THRES:]])
                # Training
                for _ in range(ITERATIONS):
                    docs, labels = next(dataset_generator)
                    sess.run([m.tf_optimizer for m in models],
                             feed_dict={
                                 tf_input: docs,
                                 tf_labels: labels
                             })
                docs, labels = next(dataset_generator)
                # Evaluate
                l1_scales = sess.run({m: m.l1_scale for m in models})
                accuracies = sess.run({m: m.tf_acc
                                       for m in models},
                                      feed_dict={
                                          tf_input: docs,
                                          tf_labels: labels
                                      })
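                # Rank the population by accuracy on the fresh batch, best first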
                models.sort(key=lambda m: accuracies[m], reverse=True)
                # Logging
                best_accuracy_hist[i] = accuracies[models[0]]
                best_l1_scale_hist[i] = l1_scales[models[0]]
                for m in models:
                    l1_scale_hist[m.model_id, i] = l1_scales[m]
                    accuracy_hist[m.model_id, i] = accuracies[m]
            # NumPy arrays are not JSON-serializable, so convert to lists first
            with open('temp', 'w') as output_f:
                json.dump(
                    {
                        'accuracy_hist': accuracy_hist.tolist(),
                        'l1_scale_hist': l1_scale_hist.tolist(),
                        'best_accuracy_hist': best_accuracy_hist.tolist(),
                        'best_l1_scale_hist': best_l1_scale_hist.tolist()
                    }, output_f)
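

# A minimal invocation sketch, assuming FLAGS and the project-local modules
# above are configured elsewhere in the repository; the experiment name here
# is purely hypothetical.
if __name__ == '__main__':
    logging.basicConfig(level=logging.DEBUG)
    run('population_based_l1_search')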
Example #2
# Imports this snippet needs; project-local modules (model, utils,
# DatasetManager, FLAGS, CURRENT_DIR) are assumed to come from the
# surrounding repository.
import logging
import os

import tensorflow as tf
from tensorflow.contrib.tensorboard.plugins import projector


def run(experiment_name):
    with tf.Graph().as_default() as gr:
        with tf.variable_scope('input'):
            tf_input = tf.placeholder(dtype=tf.int32,
                                      shape=[None, model.SENTENCE_LENGTH_MAX],
                                      name='tf_input')
            tf_labels = tf.placeholder(dtype=tf.int32,
                                       shape=[None],
                                       name='tf_labels')

        tf_logits = model.inference(tf_input)
        tf_loss = model.loss(tf_logits, tf_labels)

        tf_optimizer, tf_global_step = model.optimize(tf_loss)
        model.measure_acc(tf_logits, tf_labels)

        tf_all_summary = tf.summary.merge_all()

        # Separate writers so train and test summaries show up as distinct
        # runs in TensorBoard
        tf_train_writer = tf.summary.FileWriter(logdir=os.path.join(
            CURRENT_DIR, '..', 'summary', 'train_' + experiment_name),
                                                graph=gr)
        tf_test_writer = tf.summary.FileWriter(logdir=os.path.join(
            CURRENT_DIR, '..', 'summary', 'test_' + experiment_name),
                                               graph=gr)

        tf_embedding_writer = tf.summary.FileWriter(logdir=os.path.join(
            CURRENT_DIR, '..', 'checkpoint', experiment_name))

        # Configure TensorBoard's projector to visualize the word embeddings
        config = projector.ProjectorConfig()
        embedding = config.embeddings.add()
        embedding.tensor_name = 'embedding/word_embeddings'  # Must match the variable name in model_v6.py
        embedding.metadata_path = os.path.join(CURRENT_DIR, 'data',
                                               DatasetManager.VOCAB_FILE)
        projector.visualize_embeddings(tf_embedding_writer, config)

        # Keep up to 5 rolling checkpoints and retain one permanently roughly
        # every 0.03 hours (~2 minutes)
        saver = tf.train.Saver(max_to_keep=5,
                               keep_checkpoint_every_n_hours=0.03)

        logging.info('Graph size: %s', utils.count_trainable_variables())

        gpu_options = tf.GPUOptions(per_process_gpu_memory_fraction=FLAGS.GPU)
        with tf.Session(config=tf.ConfigProto(
                gpu_options=gpu_options,
                allow_soft_placement=True,
                log_device_placement=FLAGS.LOG_DEVICE_PLACEMENT)).as_default(
                ) as sess:
            sess.run(tf.global_variables_initializer())
            sess.run(tf.local_variables_initializer())

            dataset_manager = DatasetManager()
            dataset_manager.boot()

            for docs, labels in dataset_manager.get_batch(
                    batch_size=FLAGS.BATCH_SIZE,
                    number_epochs=FLAGS.NUMBER_EPOCHS):
                _, global_step = sess.run([tf_optimizer, tf_global_step],
                                          feed_dict={
                                              tf_input: docs,
                                              tf_labels: labels
                                          })
                # Write train and test summaries every 10 steps
                summary_interval_step = 10
                if global_step % summary_interval_step == 0:
                    logging.debug('Global step: %s', global_step)
                    train_summary_data = sess.run(tf_all_summary,
                                                  feed_dict={
                                                      tf_input: docs,
                                                      tf_labels: labels
                                                  })
                    tf_train_writer.add_summary(train_summary_data,
                                                global_step=global_step)

                    docs_test, labels_test = dataset_manager.get_test_set(
                        FLAGS.TEST_SIZE, is_shuffled=True)
                    test_summary_data = sess.run(tf_all_summary,
                                                 feed_dict={
                                                     tf_input: docs_test,
                                                     tf_labels: labels_test
                                                 })
                    tf_test_writer.add_summary(test_summary_data,
                                               global_step=global_step)

                # Persist a checkpoint every 200 steps
                if global_step % 200 == 0:
                    path_to_save = os.path.join(CURRENT_DIR, '..',
                                                'checkpoint', experiment_name)
                    if not os.path.exists(path_to_save):
                        os.makedirs(path_to_save)
                    saved_file = saver.save(sess,
                                            save_path=os.path.join(
                                                path_to_save, 'step'),
                                            global_step=global_step,
                                            write_meta_graph=True)
                    logging.debug('Saving model at %s', saved_file)
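

# A minimal restore sketch, assuming the same graph is rebuilt beforehand and
# run() was previously called with this experiment_name so a checkpoint
# exists; the helper name is hypothetical.
def restore_latest(experiment_name, sess, saver):
    checkpoint_dir = os.path.join(CURRENT_DIR, '..', 'checkpoint',
                                  experiment_name)
    # tf.train.latest_checkpoint returns the newest checkpoint path, or None
    latest = tf.train.latest_checkpoint(checkpoint_dir)
    if latest is not None:
        saver.restore(sess, latest)
    return latest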