Example #1
def transformer_prepare_decoder_right(targets, hparams, features=None):
    """Prepare one shard of the model for the decoder.

  Args:
    targets: a Tensor.
    hparams: run hyperparameters
    features: optionally pass the entire features dictionary as well.
      This is needed now for "packed" datasets.

  Returns:
    decoder_input: a Tensor, bottom of decoder stack
    decoder_self_attention_bias: a bias tensor for use in decoder self-attention
  """
    if hparams.causal_decoder_self_attention:
        # Causal attention.
        if hparams.prepend_mode == "prepend_inputs_full_attention":
            decoder_self_attention_bias = (
                common_attention.attention_bias_prepend_inputs_full_attention(
                    common_attention.embedding_to_padding(targets)))
        else:
            # Right-to-left causality: max_backward=0, max_forward=-1
            # (unlimited), so each position attends to itself and to later
            # positions only.
            decoder_self_attention_bias = (
                common_attention.attention_bias_local(
                    common_layers.shape_list(targets)[1], 0, -1))
    else:
        # Full attention.
        decoder_padding = common_attention.embedding_to_padding(targets)
        decoder_self_attention_bias = (
            common_attention.attention_bias_ignore_padding(decoder_padding))

    if features and "targets_segmentation" in features:
        # "Packed" dataset - keep the examples from seeing each other.
        targets_segmentation = features["targets_segmentation"]
        targets_position = features["targets_position"]
        decoder_self_attention_bias += common_attention.attention_bias_same_segment(
            targets_segmentation, targets_segmentation)
    else:
        targets_position = None
    if hparams.proximity_bias:
        decoder_self_attention_bias += common_attention.attention_bias_proximal(
            common_layers.shape_list(targets)[1])
    decoder_input = shift_left_3d(targets)
    if hparams.pos == "timing":
        if targets_position is not None:
            decoder_input = common_attention.add_timing_signal_1d_given_position(
                decoder_input, targets_position)
        else:
            decoder_input = common_attention.add_timing_signal_1d(
                decoder_input)
    elif hparams.pos == "emb":
        decoder_input = common_attention.add_positional_embedding(
            decoder_input, hparams.max_length, "targets_positional_embedding",
            targets_position)

    if hparams.activation_dtype == "bfloat16":
        decoder_self_attention_bias = tf.cast(decoder_self_attention_bias,
                                              tf.bfloat16)
    return (decoder_input, decoder_self_attention_bias)
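Note: the bias tensors built above are broadcast-added to the raw attention logits before the softmax, so disallowed positions receive a large negative value. Below is a minimal sketch of the attention_bias_local convention used in this example; it assumes tensor2tensor's common_attention module is importable, and the length and logits shape are made-up values for illustration only.

import tensorflow as tf
from tensor2tensor.layers import common_attention

length = 6  # hypothetical target length

# max_backward=-1 (unlimited), max_forward=0: each position attends to itself
# and to earlier positions (the usual left-to-right causal mask).
causal_bias = common_attention.attention_bias_local(length, -1, 0)

# max_backward=0, max_forward=-1 (unlimited): each position attends to itself
# and to later positions, as in the right-to-left variant above.
reverse_bias = common_attention.attention_bias_local(length, 0, -1)

# Both biases have shape [1, 1, length, length] and broadcast over the batch
# and head dimensions of the attention logits.
logits = tf.zeros([2, 4, length, length])  # hypothetical [batch, heads, q, k]
weights = tf.nn.softmax(logits + reverse_bias)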
Example #2
def _pseudolocal_bias(x):
    return common_attention.attention_bias_local(
        tf.shape(x)[1], hparams.local_attention_window,
        0 if hparams.mask_right else hparams.local_attention_window)
Example #3
def _pseudolocal_bias(x):
    return common_attention.attention_bias_local(
        tf.shape(x)[1], hparams.local_attention_window,
        hparams.local_attention_window)
Example #4
def _pseudolocal_bias(x):
  return common_attention.attention_bias_local(
      common_layers.shape_list(x)[1], hparams.local_attention_window,
      0 if hparams.mask_right else hparams.local_attention_window)
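The three snippets above are variants of the same closure; a hedged usage sketch follows, where FakeHParams and the input shape are stand-ins invented for illustration rather than the real tensor2tensor hyperparameter set.

import tensorflow as tf
from tensor2tensor.layers import common_attention, common_layers

class FakeHParams(object):
    # Stand-in for the real hparams object; only the two fields the helper
    # reads are defined here.
    local_attention_window = 3
    mask_right = True

hparams = FakeHParams()

def _pseudolocal_bias(x):
    return common_attention.attention_bias_local(
        common_layers.shape_list(x)[1], hparams.local_attention_window,
        0 if hparams.mask_right else hparams.local_attention_window)

x = tf.zeros([2, 10, 8])     # hypothetical [batch, length, depth] activations
bias = _pseudolocal_bias(x)  # [1, 1, 10, 10]: each query may look up to 3
                             # positions back and, with mask_right set, not at
                             # all to the right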