Example #1
def get_next_sentence_output(bert_config, input_tensor, labels):
    """Get loss and log probs for the next sentence prediction."""

    # Simple binary classification. Note that 0 is "next sentence" and 1 is
    # "random sentence". This weight matrix is not used after pre-training.
    with tf.compat.v1.variable_scope("cls/seq_relationship"):
        output_weights = tf.compat.v1.get_variable(
            "output_weights",
            shape=[2, bert_config.hidden_size],
            initializer=modeling.create_initializer(
                bert_config.initializer_range))
        output_bias = tf.compat.v1.get_variable(
            "output_bias",
            shape=[2],
            initializer=tf.compat.v1.zeros_initializer())

        logits = tf.matmul(input_tensor, output_weights, transpose_b=True)
        logits = tf.nn.bias_add(logits, output_bias)
        log_probs = tf.nn.log_softmax(logits, axis=-1)
        labels = tf.reshape(labels, [-1])
        one_hot_labels = tf.one_hot(labels, depth=2, dtype=tf.float32)
        per_example_loss = -tf.reduce_sum(
            input_tensor=one_hot_labels * log_probs, axis=-1)
        loss = tf.reduce_mean(input_tensor=per_example_loss)
        return (loss, per_example_loss, log_probs)
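
For context, this head is normally fed BERT's pooled [CLS] representation together with the `next_sentence_labels` feature. Below is a minimal, hedged usage sketch rather than part of the example itself: `modeling` is assumed to be the module from the reference BERT codebase, the config path is a placeholder, and placeholder tensors stand in for `model.get_pooled_output()` and the label feature; eager execution is disabled because the head builds TF1-style variables via `tf.compat.v1.get_variable`.

import tensorflow as tf
import modeling  # assumed: modeling.py from the reference BERT codebase

tf.compat.v1.disable_eager_execution()  # the head uses TF1-style variable scopes

# Placeholder inputs; in real pre-training, pooled_output would come from
# modeling.BertModel(...).get_pooled_output(). The config path is a placeholder.
bert_config = modeling.BertConfig.from_json_file("bert_config.json")
batch_size = 8
pooled_output = tf.compat.v1.placeholder(
    tf.float32, [batch_size, bert_config.hidden_size])
next_sentence_labels = tf.compat.v1.placeholder(tf.int32, [batch_size, 1])

(nsp_loss, nsp_per_example_loss, nsp_log_probs) = get_next_sentence_output(
    bert_config, pooled_output, next_sentence_labels)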
Example #2
def get_masked_lm_output(bert_config, input_tensor, output_weights, positions,
                         label_ids, label_weights):
    """Get loss and log probs for the masked LM."""
    input_tensor = gather_indexes(input_tensor, positions)

    with tf.compat.v1.variable_scope("cls/predictions"):
        # We apply one more non-linear transformation before the output layer.
        # This matrix is not used after pre-training.
        with tf.compat.v1.variable_scope("transform"):
            input_tensor = tf.compat.v1.layers.dense(
                input_tensor,
                units=bert_config.hidden_size,
                activation=modeling.get_activation(bert_config.hidden_act),
                kernel_initializer=modeling.create_initializer(
                    bert_config.initializer_range))
            input_tensor = modeling.layer_norm(input_tensor)

        # The output weights are the same as the input embeddings, but there is
        # an output-only bias for each token.
        output_bias = tf.compat.v1.get_variable(
            "output_bias",
            shape=[bert_config.vocab_size],
            initializer=tf.compat.v1.zeros_initializer())
        logits = tf.matmul(input_tensor, output_weights, transpose_b=True)
        logits = tf.nn.bias_add(logits, output_bias)
        log_probs = tf.nn.log_softmax(logits, axis=-1)

        label_ids = tf.reshape(label_ids, [-1])
        label_weights = tf.reshape(label_weights, [-1])

        one_hot_labels = tf.one_hot(label_ids,
                                    depth=bert_config.vocab_size,
                                    dtype=tf.float32)

        # The `positions` tensor might be zero-padded (if the sequence is too
        # short to have the maximum number of predictions). The `label_weights`
        # tensor has a value of 1.0 for every real prediction and 0.0 for the
        # padding predictions.
        per_example_loss = -tf.reduce_sum(
            input_tensor=log_probs * one_hot_labels, axis=[-1])
        numerator = tf.reduce_sum(input_tensor=label_weights *
                                  per_example_loss)
        denominator = tf.reduce_sum(input_tensor=label_weights) + 1e-5
        loss = numerator / denominator

    return (loss, per_example_loss, log_probs)
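
The helper `gather_indexes` called at the top of Example #2 is not shown on this page. As a point of reference, here is a sketch consistent with the reference BERT implementation (google-research/bert, run_pretraining.py): it flattens the batch and gathers the hidden vectors at the masked positions. Treat it as an assumption about the missing helper rather than the exact code used by this example.

def gather_indexes(sequence_tensor, positions):
    """Gathers the vectors at the given positions over a minibatch.

    sequence_tensor: [batch_size, seq_length, width]
    positions:       [batch_size, max_predictions_per_seq]
    Returns a tensor of shape [batch_size * max_predictions_per_seq, width].
    """
    sequence_shape = modeling.get_shape_list(sequence_tensor, expected_rank=3)
    batch_size = sequence_shape[0]
    seq_length = sequence_shape[1]
    width = sequence_shape[2]

    # Convert per-example positions into indices over the flattened batch.
    flat_offsets = tf.reshape(
        tf.range(0, batch_size, dtype=tf.int32) * seq_length, [-1, 1])
    flat_positions = tf.reshape(positions + flat_offsets, [-1])
    flat_sequence_tensor = tf.reshape(sequence_tensor,
                                      [batch_size * seq_length, width])
    return tf.gather(flat_sequence_tensor, flat_positions)

In the reference pre-training script, the outputs of the two examples are combined into a single objective as total_loss = masked_lm_loss + next_sentence_loss.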