Example #1
    def prediction_loss(self, truths, palette):
        def spatial_loss(truth_features, predicted_features, space_desc):
            feature_losses = []
            for truth, prediction, spec in zip(truth_features,
                                               predicted_features,
                                               space_desc.features):
                if spec.type == FeatureType.CATEGORICAL:
                    truth = tf.transpose(truth, (0, 2, 3, 1))
                    prediction = tf.transpose(prediction, (0, 2, 3, 1))
                    feature_losses.append(
                        tf.losses.softmax_cross_entropy(truth, prediction))

                    summary_image = tf.argmax(
                        tf.concat([truth, prediction], 2), 3)
                    summary_image = tf.gather(
                        palette[space_desc.index][spec.index], summary_image)
                    tf.summary.image(spec.name, summary_image)
                else:
                    feature_losses.append(
                        tf.losses.mean_squared_error(truth, prediction))

                    summary_image = tf.concat([truth, prediction], 3)
                    tf.summary.image(spec.name,
                                     tf.transpose(summary_image, (0, 2, 3, 1)))

                tf.summary.scalar(spec.name, feature_losses[-1])

            return tf.reduce_mean(tf.stack(feature_losses))

        with tf.name_scope('prediction_loss'):
            spatial_losses = []
            for s in self.env_spec.spaces:
                with tf.name_scope(s.name):
                    loss = spatial_loss(truths[s.index],
                                        self.out_pred[s.index], s)
                    spatial_losses.append(loss)
                    tf.summary.scalar('loss', loss)

            loss = tf.reduce_mean(tf.stack(spatial_losses))
            tf.summary.scalar('loss', loss)

        return loss
Example #2
def compute_target_greedy_q(reward, gamma, next_actions, next_q_values,
                            next_states, terminals):
    """Computes the optimal target Q value with the adaptive greedy algorithm.

  This algorithm corresponds to the method "GT" in
  Ie et al. https://arxiv.org/abs/1905.12767.

  Args:
    reward: [batch_size] tensor, the immediate reward.
    gamma: float, discount factor with the usual RL meaning.
    next_actions: [batch_size, slate_size] tensor, the next slate.
    next_q_values: [batch_size, num_of_documents] tensor, the q values of the
      documents in the next step.
    next_states: [batch_size, 1 + num_of_documents] tensor, the features for the
      user and the documents in the next step.
    terminals: [batch_size] tensor, indicating if this is a terminal step.

  Returns:
    [batch_size] tensor, the target q values.
  """
    slate_size = next_actions.get_shape().as_list()[1]
    stack_number = -1
    user_obs = next_states[:, 0, :, stack_number]
    doc_obs = next_states[:, 1:, :, stack_number]

    batch_size = next_q_values.get_shape().as_list()[0]
    next_greedy_q_list = []
    for i in range(batch_size):
        s, s_no_click = score_documents_tf(user_obs[i], doc_obs[i])
        q = next_q_values[i]

        slate = select_slate_greedy(slate_size, s_no_click, s, q)
        p_selected = compute_probs_tf(slate, s, s_no_click)
        q_selected = tf.gather(q, slate)
        next_greedy_q_list.append(
            tf.reduce_sum(input_tensor=p_selected * q_selected))

    next_greedy_q_values = tf.stack(next_greedy_q_list)

    return reward + gamma * next_greedy_q_values * (
        1. - tf.cast(terminals, tf.float32))
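
This function leans on the companion helpers score_documents_tf, select_slate_greedy, and compute_probs_tf defined alongside it in the same module. A minimal call sketch, assuming those helpers are in scope; every shape and value below is an illustrative assumption, not taken from the source:

import tensorflow as tf

# Hypothetical setup: batch of 8, slates of 3 documents drawn from 10
# candidates, 4-dim observations, frame-stack size 1 (the code slices a
# 4-D next_states tensor with a trailing stack dimension).
target = compute_target_greedy_q(
    reward=tf.zeros([8]),
    gamma=0.99,
    next_actions=tf.zeros([8, 3], dtype=tf.int32),
    next_q_values=tf.random.uniform([8, 10]),
    next_states=tf.random.uniform([8, 11, 4, 1]),
    terminals=tf.zeros([8], dtype=tf.bool))  # -> [8] target q values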
Example #3
def select_slate_optimal(slate_size, s_no_click, s, q):
    """Selects the slate using exhaustive search.

  This algorithm corresponds to the method "OS" in
  Ie et al. https://arxiv.org/abs/1905.12767.

  Args:
    slate_size: int, the size of the recommendation slate.
    s_no_click: float tensor, the score for not clicking any document.
    s: [num_of_documents] tensor, the scores for clicking documents.
    q: [num_of_documents] tensor, the predicted q values for documents.

  Returns:
    [slate_size] tensor, the selected slate.
  """

    num_candidates = s.shape.as_list()[0]

    # Obtain all possible slates given current docs in the candidate set.
    mesh_args = [list(range(num_candidates))] * slate_size
    slates = tf.stack(tf.meshgrid(*mesh_args), axis=-1)
    slates = tf.reshape(slates, shape=(-1, slate_size))

    # Filter slates that include duplicates to ensure each document is picked
    # at most once.
    unique_mask = tf.map_fn(
        lambda x: tf.equal(tf.size(input=x), tf.size(input=tf.unique(x)[0])),
        slates,
        dtype=tf.bool)
    slates = tf.boolean_mask(tensor=slates, mask=unique_mask)

    slate_q_values = tf.gather(s * q, slates)
    slate_scores = tf.gather(s, slates)
    slate_normalizer = tf.reduce_sum(input_tensor=slate_scores,
                                     axis=1) + s_no_click

    slate_q_values = slate_q_values / tf.expand_dims(slate_normalizer, 1)
    slate_sum_q_values = tf.reduce_sum(input_tensor=slate_q_values, axis=1)
    max_q_slate_index = tf.argmax(input=slate_sum_q_values)
    return tf.gather(slates, max_q_slate_index, axis=0)
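
Since this function depends only on TensorFlow, a toy run is easy to sketch (all values below are made up for illustration):

import tensorflow as tf

s = tf.constant([0.5, 1.0, 0.2, 0.8])  # click scores for 4 candidate documents
q = tf.constant([1.0, 0.1, 0.7, 0.3])  # predicted q values per document
s_no_click = tf.constant(1.0)          # score of the no-click option
slate = select_slate_optimal(2, s_no_click, s, q)  # [2] tensor of document indices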
Example #4
def rotate_points_around_axis(points, rotation_angle, axis=2):
    """Rotates points around axis.

  Args:
    points: A tf.float32 tensor of size [N, 3] containing points.
    rotation_angle: A float value containing the rotation angle in radians.
    axis: A value in [0, 1, 2] for rotating around x, y, z axis.

  Returns:
    rotated_points: A tf.float32 tensor of size [N, 3] containing points.
  """
    if axis not in [0, 1, 2]:
        raise ValueError('axis is out of bounds: %d' % axis)
    c = tf.cos(rotation_angle)
    s = tf.sin(rotation_angle)
    new_points = [points[:, 0], points[:, 1], points[:, 2]]
    other_axis = list(set([0, 1, 2]) - set([axis]))
    new_points[other_axis[0]] = (points[:, other_axis[0]] * c -
                                 points[:, other_axis[1]] * s)
    new_points[other_axis[1]] = (points[:, other_axis[0]] * s +
                                 points[:, other_axis[1]] * c)
    return tf.stack(new_points, axis=1)
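
A quick sanity check, assuming the function above is in scope: rotating a point on the x-axis by 90 degrees around the z-axis should move it onto the y-axis (values are illustrative).

import math
import tensorflow as tf

points = tf.constant([[1.0, 0.0, 0.0]])
rotated = rotate_points_around_axis(points, math.pi / 2.0, axis=2)
# rotated is approximately [[0.0, 1.0, 0.0]]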
Example #5
def compute_target_sarsa(reward, gamma, next_actions, next_q_values,
                         next_states, terminals):
    """Computes the SARSA target Q value.

  Args:
    reward: [batch_size] tensor, the immediate reward.
    gamma: float, discount factor with the usual RL meaning.
    next_actions: [batch_size, slate_size] tensor, the next slate.
    next_q_values: [batch_size, num_of_documents] tensor, the q values of the
      documents in the next step.
    next_states: [batch_size, 1 + num_of_documents] tensor, the features for the
      user and the documents in the next step.
    terminals: [batch_size] tensor, indicating if this is a terminal step.

  Returns:
    [batch_size] tensor, the target q values.
  """
    stack_number = -1
    user_obs = next_states[:, 0, :, stack_number]
    doc_obs = next_states[:, 1:, :, stack_number]

    batch_size = next_q_values.get_shape().as_list()[0]
    next_sarsa_q_list = []
    for i in range(batch_size):
        s, s_no_click = score_documents_tf(user_obs[i], doc_obs[i])
        q = next_q_values[i]

        slate = tf.expand_dims(next_actions[i], 1)
        p_selected = compute_probs_tf(slate, s, s_no_click)
        q_selected = tf.gather(q, slate)
        next_sarsa_q_list.append(
            tf.reduce_sum(input_tensor=p_selected * q_selected))

    next_sarsa_q_values = tf.stack(next_sarsa_q_list)

    return reward + gamma * next_sarsa_q_values * (
        1. - tf.cast(terminals, tf.float32))
Example #6
    def true_fn(images):
        if augment_entire_batch:
            image_2 = images
            mean_color = tf.reduce_mean(image_2, axis=[1, 2], keepdims=True)
        else:
            image_1, image_2 = tf.unstack(images)
            mean_color = tf.reduce_mean(image_2, axis=[0, 1], keepdims=True)

        def body(var_img, mean_color):
            x0 = tf.random.uniform([], 0, width, dtype=tf.int32)
            y0 = tf.random.uniform([], 0, height, dtype=tf.int32)
            dx = tf.random.uniform([], min_size, max_size, dtype=tf.int32)
            dy = tf.random.uniform([], min_size, max_size, dtype=tf.int32)
            x = tf.range(width)
            x_mask = (x0 <= x) & (x < x0 + dx)
            y = tf.range(height)
            y_mask = (y0 <= y) & (y < y0 + dy)
            mask = x_mask & y_mask[:, tf.newaxis]
            mask = tf.cast(mask[:, :, tf.newaxis], image_2.dtype)
            result = var_img * (1 - mask) + mean_color * mask
            return result

        # Perform at least one erase operation.
        image_2 = body(image_2, mean_color)
        # Perform additional erase operations.
        for _ in range(max_operations - 1):
            perform_erase = tf.less(tf.random.uniform([]),
                                    probability_additional_operations)
            image_2 = tf.cond(perform_erase, lambda: body(image_2, mean_color),
                              lambda: image_2)
        if augment_entire_batch:
            images = image_2
        else:
            images = tf.stack([image_1, image_2])
        return images
Example #7
 def true_fn(images):
   image_1, image_2 = tf.unstack(images)
   image_1 = tf.image.random_brightness(image_1, max_delta)
   image_2 = tf.image.random_brightness(image_2, max_delta)
   return tf.stack([image_1, image_2])
Example #8
 def true_fn(images):
   image_1, image_2 = tf.unstack(images)
   image_1 = tf.image.random_contrast(image_1, min_bound, max_bound)
   image_2 = tf.image.random_contrast(image_2, min_bound, max_bound)
   return tf.stack([image_1, image_2])
Example #9
  def true_fn(images, flow, mask):
    angle_radian = tf.random.uniform(
        [], minval=-max_rotation, maxval=max_rotation,
        dtype=tf.float32) * math.pi / 180.0

    image_1, image_2 = tf.unstack(images)
    image_2 = rotate(image_2, angle_radian, is_flow=False, mask=None)
    images = tf.stack([image_1, image_2])

    # Compute the original size up front; it is also needed by the flow branch
    # below even when not_empty_crop is False.
    orig_height = tf.shape(images)[-3]
    orig_width = tf.shape(images)[-2]

    if not_empty_crop:
      # introduce abbreviations for shorter notation
      cos = tf.math.cos(angle_radian % math.pi)
      sin = tf.math.sin(angle_radian % math.pi)
      h = tf.cast(orig_height, tf.float32)
      w = tf.cast(orig_width, tf.float32)

      # compute required scale factor
      scale = tf.cond(tf.math.less(angle_radian % math.pi, math.pi/2.0),
                      lambda: tf.math.maximum((w/h)*sin+cos, (h/w)*sin+cos),
                      lambda: tf.math.maximum((w/h)*sin-cos, (h/w)*sin-cos))
      new_height = tf.math.floor(h / scale)
      new_width = tf.math.floor(w / scale)

      # crop image again to original size
      offset_height = tf.cast((h-new_height)/2, tf.int32)
      offset_width = tf.cast((w-new_width)/2, tf.int32)
      images = tf.image.crop_to_bounding_box(
          images,
          offset_height=offset_height,
          offset_width=offset_width,
          target_height=tf.cast(new_height, tf.int32),
          target_width=tf.cast(new_width, tf.int32))

    if flow is not None:
      # get current locations (with the origin in the image center)
      positions = _positions_center_origin(orig_height, orig_width)

      # compute augmented flow (multiply by mask to zero invalid flow locations)
      cos = tf.math.cos(angle_radian)
      sin = tf.math.sin(angle_radian)
      rotation_matrix = tf.reshape([cos, sin, -sin, cos], [2, 2])
      flow = (tf.linalg.matmul(
          (positions + flow), rotation_matrix) - positions) * mask

      if not_empty_crop:
        # crop flow and mask again to original size
        flow = tf.image.crop_to_bounding_box(
            flow,
            offset_height=offset_height,
            offset_width=offset_width,
            target_height=tf.cast(new_height, tf.int32),
            target_width=tf.cast(new_width, tf.int32))
        mask = tf.image.crop_to_bounding_box(
            mask,
            offset_height=offset_height,
            offset_width=offset_width,
            target_height=tf.cast(new_height, tf.int32),
            target_width=tf.cast(new_width, tf.int32))
    return images, flow, mask
Example #10
def random_crop(images,
                flow,
                mask,
                crop_height,
                crop_width,
                relative_offset,
                probability_crop_offset):
  """Performs a random crop with the given height and width."""
  # early return if crop_height or crop_width is not specified
  if crop_height is None or crop_width is None:
    return images, flow, mask

  orig_height = tf.shape(images)[-3]
  orig_width = tf.shape(images)[-2]

  # check if crop size fits the image size
  scale = 1.0
  ratio = tf.cast(crop_height, tf.float32) / tf.cast(orig_height, tf.float32)
  scale = tf.math.maximum(scale, ratio)
  ratio = tf.cast(crop_width, tf.float32) / tf.cast(orig_width, tf.float32)
  scale = tf.math.maximum(scale, ratio)
  # compute minimum required height
  new_height = tf.cast(
      tf.math.ceil(tf.cast(orig_height, tf.float32) * scale), tf.int32)
  new_width = tf.cast(
      tf.math.ceil(tf.cast(orig_width, tf.float32) * scale), tf.int32)
  # perform resize (scales with 1 if not required)
  images = smurf_utils.resize(images, new_height, new_width, is_flow=False)

  # compute joint offset
  max_offset_h = new_height - tf.cast(crop_height, dtype=tf.int32)
  max_offset_w = new_width - tf.cast(crop_width, dtype=tf.int32)
  joint_offset_h = tf.random.uniform([], maxval=max_offset_h+1, dtype=tf.int32)
  joint_offset_w = tf.random.uniform([], maxval=max_offset_w+1, dtype=tf.int32)

  # compute relative offset
  min_relative_offset_h = tf.math.maximum(
      joint_offset_h - relative_offset, 0)
  max_relative_offset_h = tf.math.minimum(
      joint_offset_h + relative_offset, max_offset_h)
  min_relative_offset_w = tf.math.maximum(
      joint_offset_w - relative_offset, 0)
  max_relative_offset_w = tf.math.minimum(
      joint_offset_w + relative_offset, max_offset_w)

  relative_offset_h = tf.random.uniform(
      [], minval=min_relative_offset_h, maxval=max_relative_offset_h+1,
      dtype=tf.int32)
  relative_offset_w = tf.random.uniform(
      [], minval=min_relative_offset_w, maxval=max_relative_offset_w+1,
      dtype=tf.int32)

  set_crop_offset = tf.random.uniform([]) < probability_crop_offset
  relative_offset_h = tf.cond(
      set_crop_offset, lambda: relative_offset_h, lambda: joint_offset_h)
  relative_offset_w = tf.cond(
      set_crop_offset, lambda: relative_offset_w, lambda: joint_offset_w)

  # crop both images
  image_1, image_2 = tf.unstack(images)
  image_1 = tf.image.crop_to_bounding_box(
      image_1, offset_height=joint_offset_h, offset_width=joint_offset_w,
      target_height=crop_height, target_width=crop_width)
  image_2 = tf.image.crop_to_bounding_box(
      image_2, offset_height=relative_offset_h, offset_width=relative_offset_w,
      target_height=crop_height, target_width=crop_width)
  images = tf.stack([image_1, image_2])

  if flow is not None:
    # perform resize (scales with 1 if not required)
    flow, mask = smurf_utils.resize(
        flow, new_height, new_width, is_flow=True, mask=mask)

    # crop flow and mask
    flow = tf.image.crop_to_bounding_box(
        flow,
        offset_height=joint_offset_h,
        offset_width=joint_offset_w,
        target_height=crop_height,
        target_width=crop_width)
    mask = tf.image.crop_to_bounding_box(
        mask,
        offset_height=joint_offset_h,
        offset_width=joint_offset_w,
        target_height=crop_height,
        target_width=crop_width)

    # correct flow for relative shift (/crop)
    flow_delta = tf.stack(
        [tf.cast(relative_offset_h - joint_offset_h, tf.float32),
         tf.cast(relative_offset_w - joint_offset_w, tf.float32)])
    flow = (flow - flow_delta) * mask
  return images, flow, mask, joint_offset_h, joint_offset_w
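
A hedged usage sketch: smurf_utils.resize is an external helper from the surrounding codebase, and the shapes below are illustrative assumptions rather than values from the source.

import tensorflow as tf

images = tf.random.uniform([2, 384, 512, 3])  # stacked image pair
flow = tf.random.uniform([384, 512, 2])
mask = tf.ones([384, 512, 1])
images, flow, mask, offset_h, offset_w = random_crop(
    images, flow, mask, crop_height=320, crop_width=448,
    relative_offset=8, probability_crop_offset=0.5)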
Example #11
 def false_fn(scale_height, scale_width):
   return tf.stack((scale_height, scale_width), axis=0)
Example #12
 def true_fn(scale_height, scale_width):
   scale_height *= 2 ** tf.random.uniform([], -max_strech, max_strech)
   scale_width *= 2 ** tf.random.uniform([], -max_strech, max_strech)
   return tf.stack((scale_height, scale_width), axis=0)
Example #13
 def true_fn(images):
   image_1, image_2 = tf.unstack(images)
   image_1 = potential_asymmetric_augmentations(image_1)
   image_2 = potential_asymmetric_augmentations(image_2)
   return tf.stack([image_1, image_2])
Example #14
def photometric_augmentation(images,
                             augment_color_swap=True,
                             augment_hue_shift=True,
                             augment_saturation=False,
                             augment_brightness=False,
                             augment_contrast=False,
                             augment_gaussian_noise=False,
                             augment_brightness_individual=False,
                             augment_contrast_individual=False,
                             max_delta_hue=0.5,
                             min_bound_saturation=0.8,
                             max_bound_saturation=1.2,
                             max_delta_brightness=0.1,
                             min_bound_contrast=0.8,
                             max_bound_contrast=1.2,
                             min_bound_gaussian_noise=0.0,
                             max_bound_gaussian_noise=0.02,
                             max_delta_brightness_individual=0.02,
                             min_bound_contrast_individual=0.95,
                             max_bound_contrast_individual=1.05):
  """Applies photometric augmentations to an image pair."""
  # Randomly permute colors by rolling and reversing.
  # This covers all permutations.
  if augment_color_swap:
    r = tf.random.uniform([], maxval=3, dtype=tf.int32)
    images = tf.roll(images, r, axis=-1)
    r = tf.equal(tf.random.uniform([], maxval=2, dtype=tf.int32), 1)
    images = tf.cond(pred=r,
                     true_fn=lambda: tf.reverse(images, axis=[-1]),
                     false_fn=lambda: images)

  if augment_hue_shift:
    images = tf.image.random_hue(images, max_delta_hue)

  if augment_saturation:
    images = tf.image.random_saturation(
        images, min_bound_saturation, max_bound_saturation)

  if augment_brightness:
    images = tf.image.random_brightness(images, max_delta_brightness)

  if augment_contrast:
    images = tf.image.random_contrast(
        images, min_bound_contrast, max_bound_contrast)

  if augment_gaussian_noise:
    sigma = tf.random.uniform([],
                              minval=min_bound_gaussian_noise,
                              maxval=max_bound_gaussian_noise,
                              dtype=tf.float32)
    noise = tf.random.normal(
        tf.shape(input=images), stddev=sigma, dtype=tf.float32)
    images = images + noise

  # perform relative photometric augmentation (individually per image)
  image_1, image_2 = tf.unstack(images)
  if augment_brightness_individual:
    image_1 = tf.image.random_brightness(
        image_1, max_delta_brightness_individual)
    image_2 = tf.image.random_brightness(
        image_2, max_delta_brightness_individual)

  if augment_contrast_individual:
    image_1 = tf.image.random_contrast(
        image_1, min_bound_contrast_individual, max_bound_contrast_individual)
    image_2 = tf.image.random_contrast(
        image_2, min_bound_contrast_individual, max_bound_contrast_individual)

  # clip values to ensure they stay in [0, 1] (some augmentations can violate this)
  image_1 = tf.clip_by_value(image_1, 0.0, 1.0)
  image_2 = tf.clip_by_value(image_2, 0.0, 1.0)
  return tf.stack([image_1, image_2])
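
This function is self-contained, so a minimal sketch only needs a stacked image pair with values in [0, 1] (shapes are illustrative):

import tensorflow as tf

images = tf.random.uniform([2, 64, 64, 3])  # image pair stacked on axis 0
augmented = photometric_augmentation(images, augment_gaussian_noise=True)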
Example #15
def _non_nan_mean(tensor_list):
  """Calculates the mean of a list of tensors while ignoring nans."""
  tensor = tf.stack(tensor_list)
  not_nan = tf.logical_not(tf.math.is_nan(tensor))
  return tf.reduce_mean(tf.boolean_mask(tensor, not_nan))
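
For example, in eager mode (illustrative values):

import tensorflow as tf

vals = [tf.constant(1.0), tf.constant(float('nan')), tf.constant(3.0)]
mean = _non_nan_mean(vals)  # -> 2.0; the nan entry is ignored
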
Example #16
def classification_loss_using_mask_iou_func(embeddings,
                                            logits,
                                            instance_ids,
                                            class_labels,
                                            num_samples,
                                            valid_mask=None,
                                            max_instance_id=None,
                                            similarity_strategy='dotproduct',
                                            is_balanced=True):
    """Classification loss using mask iou.

  Args:
    embeddings: A tf.float32 tensor of size [batch_size, n, f].
    logits: A tf.float32 tensor of size [batch_size, n, num_classes]. It is
      assumed that background is class 0.
    instance_ids: A tf.int32 tensor of size [batch_size, n].
    class_labels: A tf.int32 tensor of size [batch_size, n]. It is assumed
      that the background voxels are assigned to class 0.
    num_samples: An int determining the number of samples.
    valid_mask: A tf.bool tensor of size [batch_size, n] that is True when an
      element is valid and False if it needs to be ignored. By default the value
      is None which means it is not applied.
    max_instance_id: If set, instance ids larger than that value will be
      ignored. If not set, it will be computed from instance_ids tensor.
    similarity_strategy: Defines the method for computing similarity between
                         embedding vectors. Possible values are 'dotproduct' and
                         'distance'.
    is_balanced: If True, the per-voxel losses are re-weighted to have equal
      total weight for foreground vs. background voxels.

  Returns:
    A tf.float32 scalar loss tensor.
  """
    batch_size = embeddings.get_shape().as_list()[0]
    if batch_size is None:
        raise ValueError('Unknown batch size at graph construction time.')
    if max_instance_id is None:
        max_instance_id = tf.reduce_max(instance_ids)
    class_labels = tf.reshape(class_labels, [batch_size, -1, 1])
    sampled_embeddings, sampled_instance_ids, sampled_indices = (
        sampling_utils.balanced_sample(features=embeddings,
                                       instance_ids=instance_ids,
                                       num_samples=num_samples,
                                       valid_mask=valid_mask,
                                       max_instance_id=max_instance_id))
    losses = []
    for i in range(batch_size):
        embeddings_i = embeddings[i, :, :]
        instance_ids_i = instance_ids[i, :]
        class_labels_i = class_labels[i, :, :]
        logits_i = logits[i, :]
        sampled_embeddings_i = sampled_embeddings[i, :, :]
        sampled_instance_ids_i = sampled_instance_ids[i, :]
        sampled_indices_i = sampled_indices[i, :]
        sampled_class_labels_i = tf.gather(class_labels_i, sampled_indices_i)
        sampled_logits_i = tf.gather(logits_i, sampled_indices_i)
        if valid_mask is not None:
            valid_mask_i = valid_mask[i]
            embeddings_i = tf.boolean_mask(embeddings_i, valid_mask_i)
            instance_ids_i = tf.boolean_mask(instance_ids_i, valid_mask_i)
        loss_i = classification_loss_using_mask_iou_func_unbatched(
            embeddings=embeddings_i,
            instance_ids=instance_ids_i,
            sampled_embeddings=sampled_embeddings_i,
            sampled_instance_ids=sampled_instance_ids_i,
            sampled_class_labels=sampled_class_labels_i,
            sampled_logits=sampled_logits_i,
            similarity_strategy=similarity_strategy,
            is_balanced=is_balanced)
        losses.append(loss_i)
    return tf.math.reduce_mean(tf.stack(losses))
Example #17
def prepare_lidar_images_and_correspondences(
    inputs,
    resized_image_height,
    resized_image_width,
    camera_names=('front', 'front_left', 'front_right', 'side_left',
                  'side_right'),
    lidar_names=('top', 'front', 'side_left', 'side_right', 'rear')):
  """Integrates and returns the lidars, cameras and their correspondences.

  Args:
    inputs: A dictionary containing the images and point / pixel
      correspondences.
    resized_image_height: Target height of the images.
    resized_image_width: Target width of the images.
    camera_names: List of cameras to include images from.
    lidar_names: List of lidars to include point clouds from.

  Returns:
    A tf.float32 tensor of size [num_points, 3] containing point positions.
    A tf.float32 tensor of size [num_points, 1] containing point intensities.
    A tf.float32 tensor of size [num_points, 1] containing point elongations.
    A tf.float32 tensor of size [num_points, 3] containing point normals.
    A tf.float32 tensor of size [num_images, resized_image_height,
      resized_image_width, 3].
    A tf.int32 tensor of size [num_images, num_points, 2].

  Raises:
    ValueError: If camera_names or lidar_names are empty lists.
  """
  if not camera_names:
    raise ValueError('camera_names should contain at least one name.')
  if not lidar_names:
    raise ValueError('lidar_names should contain at least one name.')

  (points_position, points_intensity, points_elongation, points_normal,
   points_in_image_frame_yx, points_in_image_frame_id) = _prepare_lidar_points(
       inputs=inputs, lidar_names=lidar_names)

  images = []
  points_in_image_frame = []

  for camera_name in camera_names:
    image_key = ('cameras/%s/image' % camera_name)
    image_height = tf.shape(inputs[image_key])[0]
    image_width = tf.shape(inputs[image_key])[1]
    height_ratio = tf.cast(
        resized_image_height, dtype=tf.float32) / tf.cast(
            image_height, dtype=tf.float32)
    width_ratio = tf.cast(
        resized_image_width, dtype=tf.float32) / tf.cast(
            image_width, dtype=tf.float32)
    if tf.executing_eagerly():
      resize_method = tf.image.ResizeMethod.NEAREST_NEIGHBOR
    else:
      resize_method = tf.image.ResizeMethod.BILINEAR
      if inputs[image_key].dtype in [
          tf.int8, tf.uint8, tf.int16, tf.uint16, tf.int32, tf.int64
      ]:
        resize_method = tf.image.ResizeMethod.NEAREST_NEIGHBOR
    images.append(
        tf.image.resize(
            images=inputs[image_key],
            size=[resized_image_height, resized_image_width],
            method=resize_method,
            antialias=True))
    camera_id = tf.cast(inputs[('cameras/%s/id' % camera_name)], dtype=tf.int32)
    valid_points = tf.equal(points_in_image_frame_id, camera_id)
    valid_points = tf.tile(valid_points, [1, 2])
    point_coords = tf.cast(
        tf.cast(points_in_image_frame_yx, dtype=tf.float32) *
        tf.stack([height_ratio, width_ratio]),
        dtype=tf.int32)
    points_in_image_frame_camera = tf.where(
        valid_points, point_coords, -tf.ones_like(valid_points, dtype=tf.int32))
    points_in_image_frame.append(points_in_image_frame_camera)
  num_images = len(images)
  images = tf.stack(images, axis=0)
  images.set_shape([num_images, resized_image_height, resized_image_width, 3])
  points_in_image_frame = tf.stack(points_in_image_frame, axis=0)
  return {
      'points_position': points_position,
      'points_intensity': points_intensity,
      'points_elongation': points_elongation,
      'points_normal': points_normal,
      'view_images': {'rgb_view': images},
      'view_indices_2d': {'rgb_view': points_in_image_frame}
  }
Example #18
def flip_points(points, x_rotate, y_rotate):
    return points * tf.stack((x_rotate, y_rotate, 1), axis=0)
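
Despite the parameter names, x_rotate and y_rotate act as flip factors (+1.0 or -1.0). For example, mirroring points across the y-z plane (illustrative values):

import tensorflow as tf

points = tf.constant([[1.0, 2.0, 3.0]])
flipped = flip_points(points, x_rotate=-1.0, y_rotate=1.0)  # -> [[-1.0, 2.0, 3.0]]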