def eval_step(input_ids, target_ids):
    """Run one forward pass with ``training=False`` and return the batch loss.

    The decoder input is ``target_ids`` with the last position along axis 1
    dropped. Masks are built by ``create_masks`` from ``input_ids`` and that
    decoder input, and the model's draft and refine predictions are handed
    to ``loss_function`` together with the full ``target_ids``.

    Side effects: the loss is fed into ``train_loss``, the model summary is
    written to ``log``, and, when ``config.save_initial_weights`` is truthy,
    the model weights are saved under ``config.initial_weights``.

    NOTE(review): a second ``eval_step`` with a different signature is
    defined after this one in the file; the later definition replaces this
    one at import time -- confirm which is intended.

    Args:
        input_ids: Encoder-side batch; passed unchanged to ``create_masks``
            and to the model (presumably token ids -- confirm with caller).
        target_ids: Target batch, indexed as ``[:, :-1]``, so it must have
            at least two axes.

    Returns:
        The first value returned by ``loss_function``.
    """
    # Decoder input: every target position except the last one.
    target_inp = target_ids[:, :-1]
    _, combined_mask, dec_padding_mask = create_masks(input_ids, target_inp)

    # The attention-weight outputs are not used here.
    draft_predictions, _, refine_predictions, _ = Model(
        input_ids,
        dec_padding_mask=dec_padding_mask,
        target_ids=target_inp,
        look_ahead_mask=combined_mask,
        training=False,
    )

    # loss_function returns a pair; only its first element is needed.
    loss, _ = loss_function(
        target_ids, draft_predictions, refine_predictions, Model
    )

    # NOTE(review): this feeds the *train* loss metric from an evaluation
    # step -- confirm this is intended rather than a validation metric.
    train_loss(loss)

    # Keras' Model.summary() prints its table and returns None, so logging
    # its return value would only log "None". Send the summary text to the
    # logger through print_fn instead (assumes Model is a Keras model).
    Model.summary(print_fn=log.info)

    if config.save_initial_weights:
        initial_weights = os.path.join(
            config.initial_weights, 'initial_weights'
        )
        Model.save_weights(initial_weights)

    return loss
def eval_step(input_ids, target_ids_, target_ids, draft_mask, refine_mask):
    """Run one forward pass and return the combined evaluation loss.

    The loss is the sum of the draft-decoder sequence loss, the
    refine-decoder sequence loss (only when ``config.use_refine_decoder`` is
    truthy, otherwise ``0``) and the model's regularization losses.

    Side effects: the model summary is written to ``log`` and, when
    ``config.save_initial_weights`` is truthy, the model weights are saved
    under ``config.initial_weights``.

    Args:
        input_ids: First positional argument to the model.
        target_ids_: Second positional argument to the model (presumably the
            decoder input -- confirm with caller).
        target_ids: Targets for the loss; indexed with three subscripts, so
            it must have at least three axes.
        draft_mask: Mask passed to ``loss_function`` for the draft loss.
        refine_mask: Mask passed to ``loss_function`` for the refine loss.

    Returns:
        Draft loss + refine loss + regularization loss.
    """
    # Third positional argument is False (presumably the training flag --
    # confirm against the model's call signature). The attention-weight
    # outputs are not used here.
    draft_predictions, _, refine_predictions, _ = Model(
        input_ids, target_ids_, False
    )

    # Draft targets drop the first position along axis 1.
    draft_output_sequence_loss = loss_function(
        target_ids[:, 1:, :], draft_predictions, draft_mask
    )

    if config.use_refine_decoder:
        # NOTE(review): the refine targets drop the *last* position while
        # the draft targets drop the *first* -- confirm this asymmetry is
        # intentional.
        refine_output_sequence_loss = loss_function(
            target_ids[:, :-1, :], refine_predictions, refine_mask
        )
    else:
        refine_output_sequence_loss = 0

    # tf.add_n raises ValueError on an empty list, which is what
    # Model.losses is when no layer registers a regularizer; fall back to 0.
    model_losses = Model.losses
    regularization_loss = tf.add_n(model_losses) if model_losses else 0

    loss = (
        draft_output_sequence_loss
        + refine_output_sequence_loss
        + regularization_loss
    )

    # Keras' Model.summary() prints its table and returns None, so logging
    # its return value would only log "None". Send the summary text to the
    # logger through print_fn instead (assumes Model is a Keras model).
    Model.summary(print_fn=log.info)

    if config.save_initial_weights:
        initial_weights = os.path.join(
            config.initial_weights, 'initial_weights'
        )
        Model.save_weights(initial_weights)

    return loss