def main(argv=()):
  del argv  # Unused.
  if not FLAGS.server_address:
    sys.exit('A server address must be provided.')
  env_get_answers_fn = environment_client.make_environment_reward_fn(
      FLAGS.server_address, mode=FLAGS.mode)
  while True:
    questions_doc_ids = raw_input(
        'Enter question and doc id (use %%% to separate question and '
        'doc id and use ### to separate multiple questions): ')
    start_time = time.time()
    if not questions_doc_ids:
      continue
    questions = []
    doc_ids = []
    for question_doc_id in questions_doc_ids.split('###'):
      question, doc_id = question_doc_id.split('%%%')
      questions.append(question.strip())
      doc_ids.append(doc_id.strip())
    _, _, answers = env_get_answers_fn(np.array(questions), np.array(doc_ids))
    for question, answer in zip(questions, answers):
      print(u'question: {}\nanswer: {}'.format(
          question.decode('utf8'), answer.decode('utf8')))
    print('{0} questions reformulated in {1:.2f} s'.format(
        len(questions), time.time() - start_time))
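
# Note: environment_client.make_environment_reward_fn returns a callable that
# sends batched questions and doc ids to the environment server. To try this
# REPL without a live server, a hypothetical stub with the same calling
# convention could be swapped in. This is a sketch only: the names are made
# up, and the first two return values are placeholders (the loop above only
# unpacks the third, the answers array).
def make_fake_environment_reward_fn():
  def env_fn(questions, doc_ids):
    # Echo a canned answer per doc id; a real server returns model answers.
    answers = np.array(
        ['no answer found for doc {}'.format(d) for d in doc_ids])
    placeholders = np.zeros(len(questions))
    return placeholders, placeholders, answers
  return env_fn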
def __init__(self,
             hparams,
             mode,
             iterator,
             source_vocab_table,
             target_vocab_table,
             reverse_target_vocab_table=None,
             scope=None,
             extra_args=None,
             trie=None):
  """Create the model.

  Args:
    hparams: Hyperparameter configurations.
    mode: TRAIN | EVAL | INFER
    iterator: Dataset Iterator that feeds data.
    source_vocab_table: Lookup table mapping source words to ids.
    target_vocab_table: Lookup table mapping target words to ids.
    reverse_target_vocab_table: Lookup table mapping ids to target words.
      Only required in INFER mode. Defaults to None.
    scope: scope of the model.
    extra_args: model_helper.ExtraArgs, for passing customizable functions.
    trie: pygtrie.Trie to decode into.
  """
  # See the sketch after this constructor for the expected BatchedInput layout.
  assert isinstance(iterator, iterator_utils.BatchedInput)
  self.iterator = iterator
  self.mode = mode
  self.src_vocab_table = source_vocab_table
  self.tgt_vocab_table = target_vocab_table
  self.src_vocab_size = hparams.src_vocab_size
  self.tgt_vocab_size = hparams.tgt_vocab_size
  self.num_gpus = hparams.num_gpus
  self.reverse_target_vocab_table = reverse_target_vocab_table

  # extra_args: to make it flexible for adding external customizable code.
  self.single_cell_fn = None
  if extra_args:
    self.single_cell_fn = extra_args.single_cell_fn

  # Set num layers.
  self.num_encoder_layers = hparams.num_encoder_layers
  self.num_decoder_layers = hparams.num_decoder_layers
  assert self.num_encoder_layers
  assert self.num_decoder_layers

  self.trie = trie

  # Set num residual layers.
  if hasattr(hparams, 'num_residual_layers'):  # Compatible with common_test_utils.
    self.num_encoder_residual_layers = hparams.num_residual_layers
    self.num_decoder_residual_layers = hparams.num_residual_layers
  else:
    self.num_encoder_residual_layers = hparams.num_encoder_residual_layers
    self.num_decoder_residual_layers = hparams.num_decoder_residual_layers

  # Initializer.
  initializer = model_helper.get_initializer(hparams.init_op,
                                             hparams.random_seed,
                                             hparams.init_weight)
  tf.get_variable_scope().set_initializer(initializer)

  # Embeddings.
  self.init_embeddings(hparams, scope)
  self.batch_size = tf.size(self.iterator.source_sequence_length)

  # Projection.
  with tf.variable_scope(scope or 'build_network', reuse=tf.AUTO_REUSE):
    with tf.variable_scope('decoder/output_projection'):
      self.output_layer = layers_core.Dense(
          hparams.tgt_vocab_size, use_bias=False, name='output_projection')

  if hparams.use_rl:
    # Create environment function.
    self._environment_reward_fn = (
        environment_client.make_environment_reward_fn(
            hparams.environment_server, mode=hparams.environment_mode))

  ## Train graph
  res = self.build_graph(hparams, scope=scope)
  (self.loss, self.rewards, self.logits, self.final_context_state,
   self.sample_id, self.sample_words, self.sample_strings,
   train_summaries) = res

  if self.mode == tf.contrib.learn.ModeKeys.TRAIN:
    self.word_count = tf.reduce_sum(
        self.iterator.source_sequence_length) + tf.reduce_sum(
            self.iterator.target_sequence_length)

  if self.mode != tf.contrib.learn.ModeKeys.INFER:
    ## Count the number of predicted words to compute ppl.
    self.predict_count = tf.reduce_sum(self.iterator.target_sequence_length)

  self.global_step = tf.Variable(0, trainable=False)
  params = tf.trainable_variables()

  # Gradients and SGD update operation for training the model.
  # Arrange for the embedding vars to appear at the beginning.
  if self.mode == tf.contrib.learn.ModeKeys.TRAIN:
    self.learning_rate = tf.constant(hparams.learning_rate)
    # Warm-up.
    self.learning_rate = self._get_learning_rate_warmup(hparams)
    # Decay.
    self.learning_rate = self._get_learning_rate_decay(hparams)

    # Optimizer.
    if hparams.optimizer == 'sgd':
      opt = tf.train.GradientDescentOptimizer(self.learning_rate)
    elif hparams.optimizer == 'adam':
      opt = tf.train.AdamOptimizer(self.learning_rate)
    elif hparams.optimizer == 'rmsprop':
      opt = tf.train.RMSPropOptimizer(self.learning_rate)
    elif hparams.optimizer == 'adadelta':
      opt = tf.train.AdadeltaOptimizer(self.learning_rate)
    else:
      raise ValueError('Unknown optimizer type: {}'.format(hparams.optimizer))

    # Gradients.
    ## http://blog.naver.com/PostView.nhn?blogId=atelierjpro&logNo=220978930368&categoryNo=0&parentCategoryNo=0&viewDate=&currentPage=1&postListTopCurrentPage=1&from=postView
    gradients = tf.gradients(
        self.loss,
        params,
        colocate_gradients_with_ops=hparams.colocate_gradients_with_ops)

    (clipped_gradients, gradients_norm_summary,
     gradients_norm) = model_helper.gradient_clip(
         gradients, max_gradient_norm=hparams.max_gradient_norm)
    self.gradients_norm = gradients_norm

    self.update = opt.apply_gradients(
        zip(clipped_gradients, params), global_step=self.global_step)

    # Summary.
    self.train_summary = tf.summary.merge([
        tf.summary.scalar('lr', self.learning_rate),
        tf.summary.scalar('train_loss', self.loss),
    ] + train_summaries + gradients_norm_summary)

  if self.mode == tf.contrib.learn.ModeKeys.INFER:
    self.infer_summary = self._get_infer_summary(hparams)

  # Saver.
  self.saver = OptimisticRestoreSaver(
      max_to_keep=hparams.num_keep_ckpts, init_uninitialized_variables=True)

  # Print trainable variables.
  utils.print_out('# Trainable variables')
  for param in params:
    utils.print_out(' {}, {}, {}'.format(param.name, param.get_shape(),
                                         param.op.device))
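
# Note: two helpers referenced in this constructor are defined elsewhere in
# the repository. Minimal sketches, with assumptions flagged:
#
# iterator_utils.BatchedInput (asserted at the top of __init__) is, in the
# upstream TF NMT codebase, a namedtuple roughly like this (the exact field
# set is an assumption; this class relies on source_sequence_length and
# target_sequence_length):
#
#   BatchedInput = collections.namedtuple(
#       'BatchedInput',
#       ('initializer', 'source', 'target_input', 'target_output',
#        'source_sequence_length', 'target_sequence_length'))
#
# model_helper.gradient_clip presumably wraps tf.clip_by_global_norm as in
# upstream TF NMT (the summary tags below are assumptions):
#
#   def gradient_clip(gradients, max_gradient_norm):
#     clipped_gradients, gradient_norm = tf.clip_by_global_norm(
#         gradients, max_gradient_norm)
#     gradient_norm_summary = [tf.summary.scalar('grad_norm', gradient_norm)]
#     gradient_norm_summary.append(
#         tf.summary.scalar('clipped_gradient',
#                           tf.global_norm(clipped_gradients)))
#     return clipped_gradients, gradient_norm_summary, gradient_norm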
def main(argv):
  del argv  # Unused.

  if FLAGS.debug:
    random.seed(0)

  reformulator_instance = reformulator.Reformulator(
      hparams_path=FLAGS.hparams_path,
      source_prefix=FLAGS.source_prefix,
      out_dir=FLAGS.out_dir,
      environment_server_address=FLAGS.environment_server_address)
  environment_fn = environment_client.make_environment_reward_fn(
      FLAGS.environment_server_address,
      mode=FLAGS.mode,
      env_call_parallelism=FLAGS.env_sample_parallelism)
  eval_environment_fn = environment_client.make_environment_reward_fn(
      FLAGS.environment_server_address,
      mode='searchqa',
      env_call_parallelism=FLAGS.env_eval_parallelism)

  # Read data.
  questions, annotations, docid_2_answer = read_data(
      questions_file=FLAGS.train_questions,
      annotations_file=FLAGS.train_annotations,
      answers_file=FLAGS.train_data,
      preprocessing_mode=FLAGS.mode)
  dev_questions, dev_annotations, dev_docid_2_answer = read_data(
      questions_file=FLAGS.dev_questions,
      annotations_file=FLAGS.dev_annotations,
      answers_file=FLAGS.dev_data,
      preprocessing_mode=FLAGS.mode,
      max_lines=FLAGS.max_dev_examples)

  # Summary writer that writes events to a folder. TensorBoard will later read
  # from it.
  summary_writer = tf.summary.FileWriter(
      os.path.join(
          FLAGS.tensorboard_dir,
          'reformulator_and_selector_training_log_' + str(time.time())))

  if FLAGS.enable_selector_training:
    selector_model = selector.Selector()

  last_save_step = 0
  global_step = 0
  for epoch in range(FLAGS.epochs):
    for batch_id, (questions_batch, annotations_batch) in enumerate(
        batch(questions, annotations, FLAGS.batch_size_train)):
      # Run eval every num_steps_per_eval batches.
      if global_step % FLAGS.num_steps_per_eval == 0:
        if FLAGS.debug:
          print('Running eval...')
        eval_start_time = time.time()
        if not FLAGS.enable_selector_training:
          eval_f1_avg = _run_reformulator_eval(dev_questions, dev_annotations,
                                               reformulator_instance,
                                               environment_fn,
                                               FLAGS.batch_size_eval)
        else:
          eval_f1_avg = _run_eval_with_selector(
              questions=dev_questions,
              annotations=dev_annotations,
              docid_2_answer=dev_docid_2_answer,
              reformulator_instance=reformulator_instance,
              selector_model=selector_model,
              batch_size=FLAGS.batch_size_eval,
              environment_fn=eval_environment_fn)

        # Correct the average F1 score for deleted datapoints in the SearchQA
        # dataset.
        if FLAGS.mode == 'searchqa':
          eval_f1_avg = _correct_searchqa_score(eval_f1_avg, dataset='dev')

        eval_time = time.time() - eval_start_time

        misc_utils.add_summary(
            summary_writer, global_step, tag='eval_f1_avg', value=eval_f1_avg)
        misc_utils.add_summary(
            summary_writer, global_step, tag='eval_time', value=eval_time)

        if FLAGS.debug:
          print('Avg F1 on dev: {}.'.format(eval_f1_avg))
          print('Time to finish eval: {}'.format(eval_time))

      start_time = time.time()
      if FLAGS.debug:
        print('Epoch {}, Batch {}.'.format(epoch, batch_id))
        print('Question: [{}]; Id: {}'.format(questions_batch[0],
                                              annotations_batch[0]))

      # Retrieve rewrites for selector training using beam search.
      if FLAGS.enable_selector_training:
        responses_beam = reformulator_instance.reformulate(
            questions=questions_batch,
            inference_mode=reformulator_pb2.ReformulatorRequest.BEAM_SEARCH)
        # Discard answers.
        reformulations_beam = [[rf.reformulation for rf in rsp]
                               for rsp in responses_beam]

      if FLAGS.enable_reformulator_training:
        # Train reformulator model.
        if FLAGS.debug:
          print('Training reformulator...')
        reformulator_loss, f1s, reformulations = reformulator_instance.train(
            sources=questions_batch, annotations=annotations_batch)
        f1_avg = f1s.mean()

        if [] in reformulations:
          if FLAGS.debug:
            print('Found empty rewrites! Skipping this batch.')
          continue

        if FLAGS.debug:
          print('Rewrite: {}'.format(safe_string(reformulations[0])))
          print('Avg F1: {}'.format(f1_avg))
          print('Loss  : {}'.format(reformulator_loss))

        # Write the f1_avg and loss to Tensorboard.
        misc_utils.add_summary(
            summary_writer, global_step, tag='f1_avg', value=f1_avg)
        misc_utils.add_summary(
            summary_writer,
            global_step,
            tag='reformulator_loss',
            value=reformulator_loss)

      # Train selector model.
      if FLAGS.enable_selector_training:
        (selector_questions, selector_answers,
         selector_scores) = query_environment(
             original_questions=questions_batch,
             rewrites=reformulations_beam,
             annotations=annotations_batch,
             environment_fn=eval_environment_fn,
             docid_2_answer=docid_2_answer,
             token_level_f1_scores=False)

        if FLAGS.debug:
          print('Training selector...')
        train_selector_loss, train_selector_accuracy = selector_model.train(
            selector_questions, selector_answers, selector_scores)

        # Regularly save a checkpoint.
        if global_step - last_save_step >= FLAGS.steps_per_save_selector:
          selector_model.save(str(global_step))
          last_save_step = global_step
          print('Selector saved at step: {}'.format(global_step))

        if FLAGS.debug:
          print('Train Accuracy: {}'.format(train_selector_accuracy))
          print('Train Loss    : {}'.format(train_selector_loss))

        # Write the accuracy and loss to Tensorboard.
        misc_utils.add_summary(
            summary_writer,
            global_step,
            tag='train_selector_accuracy',
            value=train_selector_accuracy)
        misc_utils.add_summary(
            summary_writer,
            global_step,
            tag='train_selector_loss',
            value=train_selector_loss)

      iteration_time = time.time() - start_time
      if FLAGS.debug:
        print('Iteration time: {}'.format(iteration_time))
      misc_utils.add_summary(
          summary_writer, global_step, tag='iteration_time',
          value=iteration_time)

      # Increment the global counter.
      global_step += 1
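
# Note: the batch() and misc_utils.add_summary() helpers used above are
# defined elsewhere in the repository. Minimal sketches consistent with the
# call sites, assuming batch() simply yields aligned slices (the real
# implementation may shuffle or pad) and add_summary() mirrors the TF NMT
# utility of the same name:
def batch(questions, annotations, batch_size):
  for i in range(0, len(questions), batch_size):
    yield questions[i:i + batch_size], annotations[i:i + batch_size]

def add_summary(summary_writer, global_step, tag, value):
  # Write a single scalar event that TensorBoard can plot against step.
  summary = tf.Summary(value=[tf.Summary.Value(tag=tag, simple_value=value)])
  summary_writer.add_summary(summary, global_step)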
def main(argv):
  del argv  # Unused.

  if FLAGS.debug:
    random.seed(0)

  reformulator_instance = reformulator.Reformulator(
      hparams_path=FLAGS.hparams_path,
      source_prefix='<en> <2en> ',  # Hard-coded override of FLAGS.source_prefix.
      out_dir=FLAGS.out_dir,
      environment_server_address=FLAGS.environment_server_address)
  environment_fn = environment_client.make_environment_reward_fn(
      FLAGS.environment_server_address,
      mode=FLAGS.mode,
      env_call_parallelism=FLAGS.env_sample_parallelism)
  eval_environment_fn = environment_client.make_environment_reward_fn(
      FLAGS.environment_server_address,
      mode='searchqa',
      env_call_parallelism=FLAGS.env_eval_parallelism)

  # Read data.
  questions, annotations, docid_2_answer = read_data(
      questions_file=FLAGS.train_questions,
      annotations_file=FLAGS.train_annotations,
      answers_file=FLAGS.train_data,
      preprocessing_mode=FLAGS.mode)
  dev_questions, dev_annotations, dev_docid_2_answer = read_data(
      questions_file=FLAGS.dev_questions,
      annotations_file=FLAGS.dev_annotations,
      answers_file=FLAGS.dev_data,
      preprocessing_mode=FLAGS.mode,
      max_lines=FLAGS.max_dev_examples)

  # Inference.
  all_reformulated_question = []
  custom_questions = [
      'What is the reimbursement policies and how to claim it?'
  ]
  # Other sample questions: 'what are the ways to save tax?', 'How many casual
  # leaves one is entitled in a year?', 'why katappa killed bahubali?'
  all_reformulated_question.append(custom_questions)

  # First round: reformulate the original questions. Other inference modes:
  # GREEDY, SAMPLING, BEAM_SEARCH, TRIE_GREEDY, TRIE_SAMPLE, TRIE_BEAM_SEARCH.
  responses = reformulator_instance.reformulate(
      questions=custom_questions,
      inference_mode=reformulator_pb2.ReformulatorRequest.BEAM_SEARCH)

  # Discard answers.
  custom_reformulations = [[rf.reformulation for rf in rsp]
                           for rsp in responses]
  all_reformulated_question.append(custom_reformulations)

  # Second round: reformulate each set of reformulations again.
  print('---------------------- reformulations of reformulations ----------------------')
  for j in range(len(custom_reformulations)):
    responses_of1st_infer = reformulator_instance.reformulate(
        questions=custom_reformulations[j],
        inference_mode=reformulator_pb2.ReformulatorRequest.BEAM_SEARCH)
    custom_reformulations_of1st_infer = [[rf.reformulation for rf in rsp]
                                         for rsp in responses_of1st_infer]
    all_reformulated_question.append(custom_reformulations_of1st_infer)

  # Deduplicate and report.
  all_reformulated_question = flatten(all_reformulated_question)
  print('all_reformulated_question:', len(all_reformulated_question),
        len(set(all_reformulated_question)), set(all_reformulated_question))
  all_reformulated_question = set(all_reformulated_question)

  # Write one reformulation per line to the output file.
  with open('all_reformulated_question.txt', 'w') as outF:
    for q in all_reformulated_question:
      outF.write(q)
      outF.write('\n')
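
# Note: flatten() is used above but not defined in this file. A minimal
# sketch, assuming it recursively flattens arbitrarily nested lists (the
# accumulator above holds both a flat question list and per-question lists
# of reformulations, so one level of flattening would not be enough):
def flatten(nested):
  flat = []
  for item in nested:
    if isinstance(item, list):
      flat.extend(flatten(item))
    else:
      flat.append(item)
  return flat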