Example #1
def gather_ratios(critical_points, known_T, check_fn, LAYER, COUNT):
    this_layer_critical_points = []
    print("Gathering", COUNT, "critical points")
    for point in critical_points:
        if LAYER > 0:
            if any(np.any(np.abs(x) < 1e-5) for x in known_T.get_hidden_layers(point)):
                continue
            if CHEATING:
                if np.any(np.abs(cheat_get_inner_layers(point)[0]) < 1e-10):
                    print(cheat_get_inner_layers(point))
                    print("Looking at one I don't need to")
            
            
        if LAYER > 0 and np.sum(known_T.forward(point) != 0) <= 1:
            print("Not enough hidden values are active to get meaningful data")
            continue

        if not check_fn(point):
            #print("Check function rejected it")
            continue
        if CHEATING:
            print("What layer is this neuron on (by cheating)?",
                  [(np.min(np.abs(x)), np.argmin(np.abs(x))) for x in cheat_get_inner_layers(point)])

        tmp = query_count
        for EPS in [GRAD_EPS, GRAD_EPS/10, GRAD_EPS/100]:
            try:
                normal = get_ratios_lstsq(LAYER, [point], [range(DIM)], known_T, eps=EPS)[0].flatten()
                #normal = get_ratios([point], [range(DIM)], eps=EPS)[0].flatten()
                break
            except AcceptableFailure:
                print("Try again with smaller eps")
        else:
            # All eps values failed; skip this point rather than appending a
            # stale (or undefined) normal from a previous iteration.
            continue
        #print("LSTSQ Delta queries", query_count-tmp)

        this_layer_critical_points.append((normal, point))
        
        # coupon collector: we need nlogn points.
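        # (Illustrative: if each critical point lands on one of K neurons
        # uniformly at random, we expect about K*ln(K) draws before every
        # neuron has been witnessed at least once, which is why the caller
        # sets COUNT to roughly n log n.)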
        print("Up to", len(this_layer_critical_points), 'of', COUNT)
        if len(this_layer_critical_points) >= COUNT:
            break

    return this_layer_critical_points
def solve_layer_sign(known_T,
                     known_A0,
                     known_B0,
                     critical_points,
                     LAYER,
                     already_checked_critical_points=False,
                     only_need_positive=False,
                     l1_mask=None):
    """
    Compute the signs for one layer of the network.

    known_T is the transformation that computes up to layer K-1, with
    known_A0 and known_B0 being the layer K matrix (and bias), known up to sign.
    """
    def get_critical_points():
        print("Init")
        print(critical_points)
        for point in critical_points:
            print("Tick")
            if already_checked_critical_points or is_on_following_layer(
                    known_T, known_A0, known_B0, point):
                print("Found layer N point at ", point,
                      already_checked_critical_points)
                yield point

    get_critical_point = get_critical_points()

    print("Start looking for critical point")
    MAX_POINTS = 200
    which_point = next(get_critical_point)
    print("Done looking for critical point")

    initial_points = []
    history = []
    pts = []
    if already_checked_critical_points:
        for point in get_critical_point:
            initial_points.append(point)
            pts.append(point)
            which_polytope = get_polytope_at(known_T, known_A0, known_B0,
                                             point, False)  # [-1 1 -1]
            hidden_vector = get_hidden_at(known_T, known_A0, known_B0, LAYER,
                                          point, False)
            if CHEATING:
                layers = cheat_get_inner_layers(point)
                print('have', [(np.argmin(np.abs(x)), np.min(np.abs(x)))
                               for x in layers])
            history.append((which_polytope, hidden_vector, np.copy(point)))

    while True:
        if not already_checked_critical_points:
            history = []
            pts = []

        prev_count = -10
        good = False
        while len(pts) > prev_count + 2:
            print("======" * 10)
            print("RESTART SEARCH", len(pts), prev_count)
            print(which_point)
            prev_count = len(pts)
            more_points, done = follow_hyperplane(
                LAYER,
                which_point,
                known_T,
                known_A0,
                known_B0,
                history=history,
                only_need_positive=only_need_positive)
            pts.extend(more_points)
            if len(pts) >= MAX_POINTS:
                print("Have enough; break")
                break

            if len(pts) == 0:
                break

            neuron_values = known_T.extend_by(known_A0, known_B0).forward(pts)

            neuron_positive_count = np.sum(neuron_values > 1, axis=0)
            neuron_negative_count = np.sum(neuron_values < -1, axis=0)
            print("Counts")
            print(neuron_positive_count)
            print(neuron_negative_count)

            print("SHOULD BE DONE?", done, only_need_positive)
            if done and only_need_positive:
                good = True
                break
            if (np.all(neuron_positive_count > 0) and np.all(neuron_negative_count > 0)) or \
               (only_need_positive and np.all(neuron_positive_count > 0)):
                print("Have all the points we need (2)")
                good = True
                break

        if len(pts) < MAX_POINTS / 2 and not good:
            print("=======" * 10)
            print("Select a new point to start from")
            print("=======" * 10)
            if already_checked_critical_points:
                print("CHOOSE FROM", len(initial_points), initial_points)
                which_point = initial_points[np.random.randint(
                    len(initial_points))]
            else:
                which_point = next(get_critical_point)
        else:
            print("Abort")
            break

    critical_points = np.array(pts)  #sorted(list(set(map(tuple,pts))))

    print("Now have critical points", len(critical_points))

    if CHEATING:
        layer = [[
            np.min(np.abs(x)) for x in cheat_get_inner_layers(x[np.newaxis, :])
        ][LAYER + 1] for x in critical_points]

        #print("Which layer is zero?", sorted(layer))
        layer = np.abs(
            cheat_get_inner_layers(np.array(critical_points))[LAYER + 1])

        print(layer)

        which_is_zero = np.argmin(layer, axis=1)
        print("Which neuron is zero?", which_is_zero)

        which_is_zero = which_is_zero[0]

    print("Query count", query_count)

    K = neuron_count[LAYER + 1]
    MAX = (1 << K)
    if already_checked_critical_points:
        bounds = [(MAX - 1, MAX)]
    else:
        bounds = []
        for i in range(1024):
            bounds.append(((MAX * i) // 1024, (MAX * (i + 1)) // 1024))
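    # Each integer in [0, MAX) encodes one candidate sign assignment, with bit
    # i giving the hypothesized sign of neuron i on this layer; the 1024
    # chunks exist only to keep the multiprocessing map below load-balanced.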

    print("Created a list")

    known_hidden_so_far = known_T.forward(critical_points, with_relu=True)
    debug = False

    start_time = time.time()

    extra_args_tup = (known_A0, known_B0, LAYER, known_hidden_so_far, K, None)

    all_res = pool[0].map(is_solution_map,
                          [(bound, extra_args_tup) for bound in bounds])

    end_time = time.time()

    print("Done map, now collect results")
    print("Took", end_time - start_time, 'seconds')

    all_res = [x for y in all_res for x in y]

    scores = [r[0] for r in all_res]
    solution_attempts = sum([r[1] for r in all_res])
    total_attempts = len(all_res)

    print("Attempts at solution:", (solution_attempts), 'out of',
          total_attempts)

    std = np.std([x[0] for x in scores])
    print('std', std)
    print('median', np.median([x[0] for x in scores]))
    print('min', np.min([x[0] for x in scores]))

    return min(scores, key=lambda x: x[0])[1], critical_points
def follow_hyperplane(LAYER,
                      start_point,
                      known_T,
                      known_A,
                      known_B,
                      history=None,
                      MAX_POINTS=1e3,
                      only_need_positive=False):
    """
    This is the ugly algorithm that will let us recover sign for expansive networks.
    Assumes we have extracted up to layer K-1 correctly, and layer K up to sign.

    start_point is a neuron on layer K+1

    known_T is the transformation that computes up to layer K-1, with
    known_A and known_B being the layer K matrix up to sign.

    We're going to come up with a bunch of different inputs,
    each of which has the same critical point held constant at zero.
    """
    def choose_new_direction_from_minimize(previous_axis):
        """
        Given the current point which is at a critical point of the next
        layer neuron, compute which direction we should travel to continue
        with finding more points on this hyperplane.

        Our goal is going to be to pick a direction that lets us explore
        a new part of the space we haven't seen before.
        """

        print("Choose a new direction to travel in")
        if len(history) == 0:
            which_to_change = 0
            new_perp_dir = perp_dir
            new_start_point = start_point
            initial_signs = get_polytope_at(known_T, known_A, known_B,
                                            start_point)

            # If we're in the 1 region of the polytope then we try to make it smaller
            # otherwise make it bigger
            fn = min if initial_signs[0] == 1 else max
        else:
            neuron_values = np.array([x[1] for x in history])

            neuron_positive_count = np.sum(neuron_values > 1, axis=0)
            neuron_negative_count = np.sum(neuron_values < -1, axis=0)

            mean_plus_neuron_value = neuron_positive_count / (
                neuron_positive_count + neuron_negative_count + 1)
            mean_minus_neuron_value = neuron_negative_count / (
                neuron_positive_count + neuron_negative_count + 1)

            # we want to find values that are consistently 0 or 1
            # So map 0 -> 0 and 1 -> 0 and the middle to higher values
            if only_need_positive:
                neuron_consistency = mean_plus_neuron_value
            else:
                neuron_consistency = mean_plus_neuron_value * mean_minus_neuron_value
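            # Illustrative: a neuron seen positive at 8 points and negative at
            # 2 gets mean_plus = 8/11 and mean_minus = 2/11, a consistency of
            # about 0.13; a neuron only ever seen on one side scores 0, so the
            # argmin below selects the neuron whose other side we still need
            # to visit.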

            # Print out how much progress we've made.
            # This estimate is probably worse than Windows 95's estimated time remaining.
            # At least it's monotonic. Be thankful for that.
            print("Progress",
                  "%.1f" % int(np.mean(neuron_consistency != 0) * 100) + "%")
            print("Counts on each side of each neuron")
            print(neuron_positive_count)
            print(neuron_negative_count)

            # Choose the smallest value, which is the most consistent
            which_to_change = np.argmin(neuron_consistency)

            print("Try to explore the other side of neuron", which_to_change)

            if which_to_change != previous_axis:
                if previous_axis is not None and neuron_consistency[
                        previous_axis] == neuron_consistency[which_to_change]:
                    # If the previous thing we were working towards has the same value as this one
                    # then don't change our mind; just keep going at that one
                    # (almost always--sometimes we can get stuck, let us get unstuck)
                    which_to_change = previous_axis
                    new_start_point = start_point
                    new_perp_dir = perp_dir
                else:
                    valid_axes = np.where(
                        neuron_consistency ==
                        neuron_consistency[which_to_change])[0]

                    best = (np.inf, None, None)

                    for _, potential_hidden_vector, potential_point in history[
                            -1:]:
                        for potential_axis in valid_axes:
                            value = potential_hidden_vector[potential_axis]
                            if np.abs(value) < best[0]:
                                best = (np.abs(value), potential_axis,
                                        potential_point)

                    _, which_to_change, new_start_point = best
                    new_perp_dir = perp_dir

            else:
                new_start_point = start_point
                new_perp_dir = perp_dir

            # If we're in the 1 region of the polytope then we try to make it smaller
            # otherwise make it bigger
            fn = min if neuron_positive_count[
                which_to_change] > neuron_negative_count[
                    which_to_change] else max
            arg_fn = np.argmin if neuron_positive_count[
                which_to_change] > neuron_negative_count[
                    which_to_change] else np.argmax
            print("Changing", which_to_change, 'to flip sides because mean is',
                  mean_plus_neuron_value[which_to_change])

        val = matmul(known_T.forward(new_start_point, with_relu=True), known_A,
                     known_B)[which_to_change]

        initial_signs = get_polytope_at(known_T, known_A, known_B,
                                        new_start_point)

        # Now we're going to figure out what direction makes this biggest/smallest.
        # This doesn't take any queries; there's probably an analytical way to
        # do it, but thinking is hard, so just try 1000 random angles.

        choices = []
        for _ in range(1000):
            random_dir = np.random.normal(size=DIM)
            perp_component = np.dot(random_dir, new_perp_dir) / (np.dot(
                new_perp_dir, new_perp_dir)) * new_perp_dir
            parallel_dir = random_dir - perp_component

            # This is the direction we're going to travel in.
            go_direction = parallel_dir / np.sum(parallel_dir**2)**.5

            try:
                a_bit_further, high = binary_search_towards(
                    known_T, known_A, known_B, new_start_point, initial_signs,
                    go_direction)
            except AcceptableFailure:
                continue
            if a_bit_further is None:
                continue

            # choose a direction that makes the Kth value go down by the most
            val = matmul(
                known_T.forward(a_bit_further[np.newaxis, :], with_relu=True),
                known_A, known_B)[0][which_to_change]

            #print('\t', val, high)

            choices.append([val, new_start_point + high * go_direction])

        best_value, multiple_intersection_point = fn(choices,
                                                     key=lambda x: x[0])

        print('Value', best_value)
        return new_start_point, multiple_intersection_point, which_to_change

    ###################################################
    ### Actual code to do the sign recovery starts. ###
    ###################################################

    start_box_step = 0
    points_on_plane = []

    if CHEATING:
        layer = np.abs(
            cheat_get_inner_layers(np.array(start_point))[LAYER + 1])
        print("Layer", layer)
        which_is_zero = np.argmin(layer)

    current_change_axis = 0

    while True:
        print("\n\n")
        print("-----" * 10)

        if CHEATING:
            layer = np.abs(
                cheat_get_inner_layers(np.array(start_point))[LAYER + 1])
            #print('layer',LAYER+1, layer)
            #print('all inner layers')
            #for e in cheat_get_inner_layers(np.array(start_point)):
            #    print(e)
            which_is_zero_2 = np.argmin(np.abs(layer))

            if which_is_zero_2 != which_is_zero:
                print("STARTED WITH", which_is_zero, "NOW IS", which_is_zero_2)
                print(layer)
                raise RuntimeError("the tracked critical point moved to a different neuron")

        # Keep track of where we've been, so we can go to new places.
        which_polytope = get_polytope_at(known_T, known_A, known_B,
                                         start_point, False)  # [-1 1 -1]
        hidden_vector = get_hidden_at(known_T, known_A, known_B, LAYER,
                                      start_point, False)
        sign_at_init = sign_to_int(which_polytope)  # 0b010 -> 2

        print("Number of collected points", len(points_on_plane))
        if len(points_on_plane) > MAX_POINTS:
            return points_on_plane, False

        neuron_values = np.array([x[1] for x in history])

        neuron_positive_count = np.sum(neuron_values > 1, axis=0)
        neuron_negative_count = np.sum(neuron_values < -1, axis=0)

        if (np.all(neuron_positive_count > 0) and np.all(neuron_negative_count > 0)) or \
           (only_need_positive and np.all(neuron_positive_count > 0)):
            print("Have all the points we need (1)")
            print(query_count)
            print(neuron_positive_count)
            print(neuron_negative_count)

            neuron_values = np.array([
                get_hidden_at(known_T, known_A, known_B, LAYER, x, False)
                for x in points_on_plane
            ])

            neuron_positive_count = np.sum(neuron_values > 1, axis=0)
            neuron_negative_count = np.sum(neuron_values < -1, axis=0)

            print(neuron_positive_count)
            print(neuron_negative_count)

            return points_on_plane, True

        # 1. find a way to move along the hyperplane by computing the normal
        # direction using the ratios function. Then find a parallel direction.

        try:
            #perp_dir = get_ratios([start_point], [range(DIM)], eps=1e-4)[0].flatten()
            perp_dir = get_ratios_lstsq(0, [start_point], [range(DIM)],
                                        KnownT([], []),
                                        eps=1e-5)[0].flatten()

        except AcceptableFailure:
            print(
                "Failed to compute ratio at start point. Something very bad happened."
            )
            return points_on_plane, False

        # Record these points.
        history.append((which_polytope, hidden_vector, np.copy(start_point)))

        # We can't just pick any parallel direction. If we did, then we would
        # not end up covering much of the input space.

        # Instead, we're going to figure out which layer-1 hyperplanes are "visible"
        # from the current point. Then we're going to try and go reach all of them.

        # This is the point at which the first and second layers intersect.
        start_point, multiple_intersection_point, new_change_axis = choose_new_direction_from_minimize(
            current_change_axis)

        if new_change_axis != current_change_axis:
            start_point, multiple_intersection_point, current_change_axis = choose_new_direction_from_minimize(
                None)

        #if CHEATING:
        #    print("INIT MULTIPLE", cheat_get_inner_layers(multiple_intersection_point))

        # Refine the direction we're going to travel in---stay numerically stable.
        towards_multiple_direction = multiple_intersection_point - start_point
        step_distance = np.sum(towards_multiple_direction**2)**.5

        print("Distance we need to step:", step_distance)

        if step_distance > 1 or True:  # NOTE: the distance guard is disabled; we always refine
            mid_point = 1e-4 * towards_multiple_direction / np.sum(
                towards_multiple_direction**2)**.5 + start_point

            random_dir = np.random.normal(size=DIM)

            mid_points = do_better_sweep(mid_point,
                                         perp_dir / np.sum(perp_dir**2)**.5,
                                         low=-1e-3,
                                         high=1e-3,
                                         known_T=known_T)

            if len(mid_points) > 0:
                mid_point = mid_points[np.argmin(
                    np.sum((mid_point - mid_points)**2, axis=1))]

                towards_multiple_direction = mid_point - start_point
                towards_multiple_direction = towards_multiple_direction / np.sum(
                    towards_multiple_direction**2)**.5

                initial_signs = get_polytope_at(known_T, known_A, known_B,
                                                start_point)
                _, high = binary_search_towards(known_T, known_A, known_B,
                                                start_point, initial_signs,
                                                towards_multiple_direction)

                multiple_intersection_point = towards_multiple_direction * high + start_point

        # Find the angle of the next hyperplane
        # First, take random steps away from the intersection point
        # Then run the search algorithm to find some intersections
        # what we find will either be a layer-1 or layer-2 intersection.

        print("Now try to find the continuation direction")
        success = None
        while success is None:
            if start_box_step < 0:
                start_box_step = 0
                print("VERY BAD FAILURE")
                print("Choose a new random point to start from")
                which_point = np.random.randint(0, len(history))
                start_point = history[which_point][2]
                print("New point is", which_point)
                current_change_axis = np.random.randint(0, sizes[LAYER + 1])
                print("New axis to change", current_change_axis)
                break

            print("\tStart the box step with size", start_box_step)
            try:
                success, camefrom, stepsize = find_plane_angle(
                    known_T, known_A, known_B, multiple_intersection_point,
                    sign_at_init, start_box_step)
            except AcceptableFailure:
                # Go back to the top and try with a new start point
                print("\tOkay we need to try with a new start point")
                start_box_step = -10

            start_box_step -= 2

        if success is None:
            continue

        val = matmul(
            known_T.forward(multiple_intersection_point, with_relu=True),
            known_A, known_B)[new_change_axis]
        print("Value at multiple:", val)
        val = matmul(known_T.forward(success, with_relu=True), known_A,
                     known_B)[new_change_axis]
        print("Value at success:", val)

        if stepsize < 10:
            new_move_direction = success - multiple_intersection_point

            # We don't want to be right next to the multiple intersection point.
            # So let's binary search to find how far away we can go while remaining in this polytope.
            # Then we'll go half as far as we can maximally go.

            initial_signs = get_polytope_at(known_T, known_A, known_B, success)
            print("polytope at initial", sign_to_int(initial_signs))
            low = 0
            high = 1
            while high - low > 1e-2:
                mid = (high + low) / 2
                query_point = multiple_intersection_point + mid * new_move_direction
                next_signs = get_polytope_at(known_T, known_A, known_B,
                                             query_point)
                print(
                    "polytope at", mid, sign_to_int(next_signs), "%x" %
                    (sign_to_int(next_signs) ^ sign_to_int(initial_signs)))
                if initial_signs == next_signs:
                    low = mid
                else:
                    high = mid
            print("GO TO", mid)

            success = multiple_intersection_point + (mid /
                                                     2) * new_move_direction

            val = matmul(known_T.forward(success, with_relu=True), known_A,
                         known_B)[new_change_axis]
            print("Value at moved success:", val)

        print("Adding the points to the set of known good points")

        points_on_plane.append(start_point)

        if camefrom is not None:
            points_on_plane.append(camefrom)
        #print("Old start point", start_point)
        #print("Set to success", success)
        start_point = success
        start_box_step = max(stepsize - 1, 0)

    return points_on_plane, False
def is_on_following_layer(known_T, known_A, known_B, point):

    print("Check if the critical point is on the next layer")

    def is_on_prior_layer(query):
        print("Hidden think", known_T.get_hidden_layers(query))
        if CHEATING:
            print("Hidden real", cheat_get_inner_layers(query))
        if any(
                np.min(np.abs(layer)) < 1e-5
                for layer in known_T.get_hidden_layers(query)):
            return True
        next_hidden = known_T.extend_by(known_A, known_B).forward(query)
        print(next_hidden)
        if np.min(np.abs(next_hidden)) < 1e-4:
            return True
        return False

    if is_on_prior_layer(point):
        print("It's not, because it's on an earlier layer")
        return False

    if CHEATING:
        ls = ([np.min(np.abs(x)) for x in cheat_get_inner_layers(point)])

    initial_signs = get_polytope_at(known_T, known_A, known_B, point)

    normal = get_ratios([point], [range(DIM)], eps=GRAD_EPS)[0].flatten()
    normal = normal / np.sum(normal**2)**.5

    for tol in range(10):

        random_dir = np.random.normal(size=DIM)
        perp_component = np.dot(random_dir, normal) / (np.dot(normal,
                                                              normal)) * normal
        parallel_dir = random_dir - perp_component

        go_direction = parallel_dir / np.sum(parallel_dir**2)**.5

        _, high = binary_search_towards(known_T, known_A, known_B, point,
                                        initial_signs, go_direction)

        if CHEATING:
            print(
                cheat_get_inner_layers(point +
                                       go_direction * high / 2)[np.argmin(ls)])

        point_in_same_polytope = point + (high * .999 - 1e-4) * go_direction

        print("high", high)

        solutions = do_better_sweep(point_in_same_polytope,
                                    normal,
                                    -1e-4 * high,
                                    1e-4 * high,
                                    known_T=known_T)
        if len(solutions) >= 1:
            print("Correctly found", len(solutions))
        else:
            return False

        point_in_different_polytope = point + (high * 1.1 +
                                               1e-1) * go_direction

        solutions = do_better_sweep(point_in_different_polytope,
                                    normal,
                                    -1e-4 * high,
                                    1e-4 * high,
                                    known_T=known_T)
        if len(solutions) == 0:
            print("Correctly found", len(solutions))
        else:
            return False

    #print("I THINK IT'S ON THE NEXT LAYER")
    if CHEATING:
        soln = [np.min(np.abs(x)) for x in cheat_get_inner_layers(point)]
        print(soln)
        assert np.argmin(soln) == len(known_T.A) + 1

    return True
def find_plane_angle(known_T,
                     known_A,
                     known_B,
                     multiple_intersection_point,
                     sign_at_init,
                     init_step,
                     exponential_base=1.5):
    """
    Given an input that's at the multiple intersection point, figure out how
    to continue along the path after it bends.


                /       X    : multiple intersection point
       ......../..      ---- : layer N hyperplane
       .      /  .       |   : layer N+1 hyperplane that bends
       .     /   .    
    --------X-----------
       .    |    .
       .    |    .
       .....|.....
            |
            |

    We need to make sure to bend, and not turn onto the layer N hyperplane.

    To do this we will draw a box around the X and intersect with the planes 
    and determine the four coordinates. Then draw another box twice as big.
    
    The first layer plane will be the two points at a consistent angle.
    The second layer plane will have an inconsistent angle.

    Choose the inconsistent angle plane, and make sure we move to a new
    polytope and don't just go backwards to where we've already been.
    """
    success = None
    camefrom = None

    prev_iter_intersections = []

    while True:
        x_dir_base = np.sign(np.random.normal(size=DIM)) / DIM**.5
        y_dir_base = np.sign(np.random.normal(size=DIM)) / DIM**.5
        # When the input dimension is odd we can't have two orthogonal
        # vectors from {-1,1}^DIM
        if np.abs(np.dot(x_dir_base, y_dir_base)) <= DIM % 2:
            break

    MAX = 35

    start = [10] if init_step > 10 else []
    for stepsize in start + list(range(init_step, MAX)):
        print("\tTry stepping away", stepsize)
        x_dir = x_dir_base * (exponential_base**(stepsize - 10))
        y_dir = y_dir_base * (exponential_base**(stepsize - 10))

        # Draw the box as shown in the diagram above, and compute where
        # the critical points are.
        top = do_better_sweep(multiple_intersection_point + x_dir,
                              y_dir,
                              -1,
                              1,
                              known_T=known_T)
        bot = do_better_sweep(multiple_intersection_point - x_dir,
                              y_dir,
                              -1,
                              1,
                              known_T=known_T)
        left = do_better_sweep(multiple_intersection_point + y_dir,
                               x_dir,
                               -1,
                               1,
                               known_T=known_T)
        right = do_better_sweep(multiple_intersection_point - y_dir,
                                x_dir,
                                -1,
                                1,
                                known_T=known_T)

        intersections = top + bot + left + right

        # If we only have two critical points, and we're taking a big step,
        # then something is seriously messed up.
        # This is not an acceptable error. Just abort out and let's try to
        # do the whole thing again.
        if len(intersections) == 2 and stepsize >= 10:
            raise AcceptableFailure()

        if CHEATING:
            print("\tHAVE BOX INTERSECT COUNT", len(intersections))
            print("\t", len(left), len(right), len(top), len(bot))

        if (len(intersections) == 0 and stepsize >
                15):  # or (len(intersections) == 3 and stepsize > 5):
            # Probably we're in just a constant flat 0 region
            # At this point we're basically dead in the water.
            # Just fail up and try again.
            print("\tIt looks like we're in a flat region, raise failure")
            raise AcceptableFailure()

        # If we somehow went from almost no critical points to more than 4,
        # then we've really messed up.
        # Just fail out and let's hope next time it doesn't happen.
        if len(intersections) > 4 and len(prev_iter_intersections) < 2:
            print("\tWe didn't get enough inner points")
            if exponential_base == 1.2:
                print("\tIt didn't work a second time")
                return None, None, 0
            else:
                print("\tTry with smaller step")
                return find_plane_angle(known_T,
                                        known_A,
                                        known_B,
                                        multiple_intersection_point,
                                        sign_at_init,
                                        init_step,
                                        exponential_base=1.2)

        # This is the good, expected code-path.
        # We've seen four intersections at least twice before, and now
        # we're seeing more than 4.
        if (len(intersections) > 4
                or stepsize > 20) and len(prev_iter_intersections) >= 2:
            next_intersections = np.array(prev_iter_intersections[-1])
            intersections = np.array(prev_iter_intersections[-2])

            # Let's first figure out what points are responsible for the prior-layer neurons
            # being zero, and which are from the current-layer neuron being zero
            candidate = []
            for i, a in enumerate(intersections):
                for j, b in enumerate(intersections):
                    if i == j: continue
                    score = np.sum(
                        ((a + b) / 2 - multiple_intersection_point)**2)
                    a_to_b = b - a
                    a_to_b /= np.sum(a_to_b**2)**.5

                    variance = np.std((next_intersections - a) / a_to_b,
                                      axis=1)
                    best_variance = np.min(variance)

                    #print(i,j,score, best_variance)

                    candidate.append((best_variance, i, j))

            if sorted(candidate)[3][0] < 1e-8:
                # It looks like both lines are linear here
                # We can't distinguish what way is the next best way to go.
                print("\tFailed the box continuation finding procedure. (1)")
                print("\t", candidate)
                raise AcceptableFailure()

            # Sometimes life is just ugly, and nothing wants to work.
            # Just abort.
            err, index_0, index_1 = min(candidate)
            if err / max(candidate)[0] > 1e-5:
                return None, None, 0

            prior_layer_near_zero = np.zeros(4, dtype=bool)
            prior_layer_near_zero[index_0] = True
            prior_layer_near_zero[index_1] = True

            # Now let's walk through each of these points and check that everything looks sane.
            should_fail = False
            for critical_point, is_prior_layer_zero in zip(
                    intersections, prior_layer_near_zero):
                vs = known_T.extend_by(
                    known_A, known_B).get_hidden_layers(critical_point)
                #print("VS IS", vs)
                #print("Is prior", is_prior_layer_zero)
                #if CHEATING:
                #    print(cheat_get_inner_layers(critical_point))

                if is_prior_layer_zero:
                    # We expect the prior layer to be zero.
                    if all([np.min(np.abs(x)) > 1e-5 for x in vs]):
                        # If it looks like it's not actually zero, then brutally fail.
                        print("\tAbort 1: failed to find a valid box")
                        should_fail = True
                if any([np.min(np.abs(x)) < 1e-10 for x in vs]):
                    # The prior layer looks like it is zero here.
                    if not is_prior_layer_zero:
                        # But we didn't expect it to be zero; brutally fail.
                        print("\tAbort 2: failed to find a valid box")
                        should_fail = True
            if should_fail:
                return None, None, 0

            # Done with error checking, life is good here.
            # Find the direction that corresponds to the next direction we can move in
            # and continue our search from that point.
            for critical_point, is_prior_layer_zero in zip(
                    intersections, prior_layer_near_zero):
                sign_at_crit = sign_to_int(
                    get_polytope_at(known_T, known_A, known_B, critical_point))
                print("\tMove to", sign_at_crit, 'versus', sign_at_init,
                      is_prior_layer_zero)
                if not is_prior_layer_zero:
                    if sign_at_crit != sign_at_init:
                        success = critical_point
                        if CHEATING:
                            print('\tinner at success',
                                  cheat_get_inner_layers(success))
                        print("\tSucceeded")
                    else:
                        camefrom = critical_point

            # If we didn't get a solution, then abort out.
            # Probably what happened here is that we got more than four points
            # on the box but didn't see exactly four points on the box twice before
            # this means we should decrease the initial step size and try again.
            if success is None:
                print("\tFailed the box continuation finding procedure. (2)")
                raise AcceptableFailure()
                #assert success is not None
            break
        if len(intersections) == 4:
            prev_iter_intersections.append(intersections)
    return success, camefrom, min(stepsize, MAX - 3)
Example #7
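# A minimal sketch (an assumption, not the repository's exact implementation)
# of the helper graph_solve relies on below: process_block is taken to compare
# every row of one normalized ratio matrix against every row of another and
# return a boolean matrix marking pairs that agree on their non-NaN
# coordinates, i.e. look like the same weight row up to scaling. Assumes numpy
# is imported as np like the rest of this file; the tolerance is illustrative.
def _process_block_sketch(scaled_ratios, scaled_all_ratios, tol=1e-4):
    # (n, m, dim) tensor of coordinate-wise differences.
    diff = np.abs(scaled_ratios[:, None, :] - scaled_all_ratios[None, :, :])
    # nanmax ignores coordinates where a ratio could not be estimated; an
    # all-NaN pair yields NaN, and NaN < tol is False, so it is rejected.
    worst = np.nanmax(diff, axis=2)
    return worst < tol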
def graph_solve(all_ratios, all_criticals, expected_neurons, LAYER, debug=False):
    # 1. Load the critical points and ratios we precomputed

    all_ratios = np.array(all_ratios, dtype=np.float64)
    all_ratios_f32 = np.array(all_ratios, dtype=np.float32)
    all_criticals = np.array(all_criticals, dtype=np.float64)

    # Batch them to be sensibly sized
    ratios_group = [all_ratios_f32[i:i+1000] for i in range(0,len(all_ratios),1000)]
    criticals_group = [all_criticals[i:i+1000] for i in range(0,len(all_criticals),1000)]
                    
    # 2. Compute the similarity pairwise between the ratios we've computed

    print("Go up to", len(criticals_group))
    now = time.time()
    all_pairings = [[] for _ in range(sum(map(len,ratios_group)))]
    for batch_index,(criticals,ratios) in enumerate(zip(criticals_group, ratios_group)):
        print(batch_index)

        # Compute the all-pairs similarity
        axis = list(range(all_ratios.shape[1]))
        random.shuffle(axis)
        axis = axis[:20]
        for dim in axis:
            # We may have an error on one of the directions, so let's try all of them
            scaled_all_ratios =  all_ratios_f32 / all_ratios_f32[:,dim:dim+1]
            scaled_ratios = ratios / ratios[:,dim:dim+1]

            batch_pairings = process_block(scaled_ratios, scaled_all_ratios)
            
            # To get the offset, compute the cumulative length up to batch_index
            batch_offset = sum(map(len,ratios_group[:batch_index]))
            # And now create the graph matching ratios that are similar
            for this_batch_i,global_j in zip(*np.nonzero(np.array(batch_pairings))):
                all_pairings[this_batch_i + batch_offset].append(global_j)
    print(time.time()-now)

    graph = nx.Graph()
    # Add the edges to the graph, removing self-loops
    # Add the edges to the graph, skipping self-loops and edges between
    # adjacent indices (neighboring entries are often the same point found twice)
    graph.add_edges_from([(i,j) for i,js in enumerate(all_pairings) for j in js if abs(i-j) > 1]) 
    components = list(nx.connected_components(graph))

    sorted_components = sorted(components, key=lambda x: -len(x))

    if CHEATING:
        print('Total (unmatched) examples found:', sorted(collections.Counter(which_is_zero(LAYER, cheat_get_inner_layers(all_criticals))).items()))

    if len(components) == 0:
        print("No components found")
        raise AcceptableFailure()
    print("Graph search found", len(components), "different components with the following counts", list(map(len,sorted_components)))

    if CHEATING:
        which_neurons = [collections.Counter(which_is_zero(LAYER, cheat_get_inner_layers(all_criticals[list(orig_component)]))) for orig_component in sorted_components]
        first_index_of = [-1]*expected_neurons

        for i,items in enumerate(which_neurons):
            for item in items.keys():
                if first_index_of[item] == -1:
                    first_index_of[item] = i

        print('These components correspond to', which_neurons)
        print("With the corresponding index in the list:", first_index_of)

    previous_num_components = np.inf
    
    while previous_num_components > len(sorted_components):
        previous_num_components = len(sorted_components)
        candidate_rows = []
        candidate_components = []

        datas = [all_ratios[list(component)] for component in sorted_components]
        results = pool[0].map(ratio_normalize, datas)

        candidate_rows = [x[0] for x in results]
        candidate_components = sorted_components

        candidate_rows = np.array(candidate_rows)

        new_pairings = [[] for _ in range(len(candidate_rows))]
        
        # Re-do the pairings
        for dim in range(all_ratios.shape[1]):
            scaled_ratios = candidate_rows / candidate_rows[:,dim:dim+1]

            batch_pairings = process_block(scaled_ratios, scaled_ratios)
            
            # And now create the graph matching ratios that are similar
            for this_batch_i,global_j in zip(*np.nonzero(np.array(batch_pairings))):
                new_pairings[this_batch_i].append(global_j)
            
        graph = nx.Graph()
        # Add the edges to the graph, ALLOWING self-loops this time
        graph.add_edges_from([(i,j) for i,js in enumerate(new_pairings) for j in js]) 
        components = list(nx.connected_components(graph))

        components = [sum([list(candidate_components[y]) for y in comp],[]) for comp in components]

        sorted_components = sorted(components, key=lambda x: -len(x))

        print("After re-doing the graph, the component counts is", len(components), "with items", list(map(len,sorted_components)))

        if CHEATING:
            which_neurons = [collections.Counter(which_is_zero(LAYER, cheat_get_inner_layers(all_criticals[list(orig_component)]))) for orig_component in sorted_components]
            first_index_of = [-1]*expected_neurons
        
            for i,items in enumerate(which_neurons):
                for item in items.keys():
                    if first_index_of[item] == -1:
                        first_index_of[item] = i
            
            print('Corresponding to', which_neurons)
            print("First index:", first_index_of)
        
            print("Expected neurons", expected_neurons)


    print("Processing each connected component in turn.")
            
    resulting_examples = []
    resulting_rows = []

    skips_because_of_nan = 0
    failure = None
    
    for c_count, component in enumerate(sorted_components):
        if debug:
            print("\n")
            if c_count >= expected_neurons:
                print("WARNING: This one might be a duplicate!")
        print("On component", c_count, "with indexs", component)
        if debug and CHEATING:
            inner = cheat_get_inner_layers(all_criticals[list(component)])
            print('Corresponding to (cheating) ', which_is_zero(LAYER, inner))

        possible_matrix_rows = all_ratios[list(component)]
        
        guessed_row, normalize_axis, normalize_error = ratio_normalize(possible_matrix_rows)

        print('The guessed error in the computation is',normalize_error, 'with', len(component), 'witnesses')
        if normalize_error > .01 and len(component) <= 5:
            print("Component size less than 5 with high error; this isn't enough to be sure")
            continue
        
        print("Normalize on axis", normalize_axis)

        if len(resulting_rows):
            scaled_resulting_rows = np.array(resulting_rows)
            #print(scaled_resulting_rows.shape)
            scaled_resulting_rows /= scaled_resulting_rows[:,normalize_axis:normalize_axis+1]
            delta = np.abs(scaled_resulting_rows - guessed_row[np.newaxis,:])
            if min(np.nanmax(delta, axis=1)) < 1e-2:
                print("Likely have found this node before")
                raise RuntimeError("duplicate neuron: this row was already recovered")


        if CHEATING:
            # Check our work against the ground truth entries in the corresponding matrix
            layers = cheat_get_inner_layers(all_criticals[list(component)[0]])
            layer_vals = [np.min(np.abs(x)) for x in layers]
            which_layer = np.argmin(layer_vals)
        
            M = A[which_layer]
            which_neuron = which_is_zero(which_layer, layers)
            print("Neuron corresponds to", which_neuron)
            if which_layer != LAYER:
                which_neuron = 0
                normalize_axis = 0

            actual_row = M[:,which_neuron]/M[normalize_axis,which_neuron]
            actual_row = actual_row[:guessed_row.shape[0]]
    
            do_print_err = np.any(np.isnan(guessed_row))
    
            if which_layer == LAYER:
                error = np.max(np.abs(np.abs(guessed_row)-np.abs(actual_row)))
            else:
                error = 1e6
            print('max error', "%0.8f"%error, len(component))
            if (error > 1e-4 * len(guessed_row) and debug) or do_print_err:
                print('real ', " ".join("%2.3f"%x for x in actual_row))
                print('guess', " ".join("%2.3f"%x for x in guessed_row))
                print('gap', " ".join("%2.3f"%(np.abs(x-y)) for x,y in zip(guessed_row,actual_row)))
                #print("scale", scale)
                print("--")
                for row in possible_matrix_rows:
                    print('posbl', " ".join("%2.3f"%x for x in row/row[normalize_axis]))
                print("--")
                
                scale = 10**int(np.round(np.log(np.nanmedian(np.abs(possible_matrix_rows)))/np.log(10)))
                possible_matrix_rows /= scale
                for row in possible_matrix_rows:
                    print('posbl', " ".join("%2.3f"%x for x in row))
        if np.any(np.isnan(guessed_row)) and c_count < expected_neurons:
            print("Got NaN, need more data",len(component)/sum(map(len,components)),1/sizes[LAYER+1])
            if len(component) >= 3:
                if c_count < expected_neurons:
                    failure = GatherMoreData([all_criticals[x] for x in component])
                skips_because_of_nan += 1
            continue

        guessed_row[np.isnan(guessed_row)] = 0

        if c_count < expected_neurons and len(component) >= 3:
            resulting_rows.append(guessed_row)
            resulting_examples.append([all_criticals[x] for x in component])
        else:
            print("Don't add it to the set")


    # We set failure when something went wrong but we want to defer crashing
    # (so that we can use the partial solution)

    if len(resulting_rows)+skips_because_of_nan < expected_neurons and len(all_ratios) < DEAD_NEURON_THRESHOLD:
        print("We have not explored all neurons. Do more random search", len(resulting_rows), skips_because_of_nan, expected_neurons)
        raise AcceptableFailure(partial_solution=(np.array(resulting_rows), np.array(resulting_examples)))
    else:
        print("At this point, we just assume the neuron must be dead")
        while len(resulting_rows) < expected_neurons:
            resulting_rows.append(np.zeros_like((resulting_rows[0])))
            resulting_examples.append([np.zeros_like(resulting_examples[0][0])])

    # Here we know it's a GatherMoreData failure, but we want to only do this
    # if there was enough data for everything else
    if failure is not None:
        print("Need to raise a previously generated failure.")
        raise failure


    print("Successfully returning a solution attempt.\n")
    return resulting_examples, resulting_rows
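# A minimal sketch (an assumption, not the repository's exact implementation)
# of ratio_normalize as used above: the rows of `data` should all be noisy
# scalar multiples of one weight row, so pick a normalization axis, rescale
# every row by that coordinate, and take a NaN-aware consensus. The axis
# choice and error estimate are illustrative; numpy as np is assumed imported
# like the rest of this file.
def _ratio_normalize_sketch(data):
    data = np.asarray(data, dtype=np.float64)
    # Normalize by the coordinate with the largest typical magnitude, which
    # is the numerically safest divisor.
    axis = int(np.nanargmax(np.nanmedian(np.abs(data), axis=0)))
    scaled = data / data[:, axis:axis + 1]
    guessed_row = np.nanmedian(scaled, axis=0)
    # Spread of the witnesses around the consensus row, as the error estimate.
    error = float(np.nanmean(np.nanstd(scaled, axis=0)))
    return guessed_row, axis, error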
Example #8
def compute_layer_values(critical_points, known_T, LAYER):
    if LAYER == 0:
        COUNT = neuron_count[LAYER+1] * 3
    else:
        COUNT = int(neuron_count[LAYER+1] * np.log(sizes[LAYER+1]) * 3)


    # type: [(ratios, critical_point)]
    this_layer_critical_points = []

    partial_weights = None
    partial_biases = None

    def check_fn(point):
        if partial_weights is None:
            return True
        hidden = matmul(known_T.forward(point, with_relu=True), partial_weights.T, partial_biases)
        if np.any(np.abs(hidden) < 1e-4):
            return False
        
        return True

    
    print()
    print("Start running critical point search to find neurons on layer", LAYER)
    while True:
        print("At this iteration I have", len(this_layer_critical_points), "critical points")

        def reuse_critical_points():
            for witness in critical_points:
                yield witness
        
        this_layer_critical_points.extend(gather_ratios(reuse_critical_points(), known_T, check_fn,
                                                         LAYER, COUNT))

        print("Query count after that search:", query_count)
        print("And now up to ", len(this_layer_critical_points), "critical points")

        ## filter out duplicates
        filtered_points = []

        # Let's not add points that are identical to ones we've already done.
        for i,(ratio1,point1) in enumerate(this_layer_critical_points):
            for ratio2,point2 in this_layer_critical_points[i+1:]:
                if np.sum((point1 - point2)**2)**.5 < 1e-10:
                    break
            else:
                filtered_points.append((ratio1, point1))
        
        this_layer_critical_points = filtered_points

        print("After filtering duplicates we're down to ", len(this_layer_critical_points), "critical points")
        

        print("Start trying to do the graph solving")
        try:
            critical_groups, extracted_normals = graph_solve([x[0] for x in this_layer_critical_points],
                                                             [x[1] for x in this_layer_critical_points],
                                                             neuron_count[LAYER+1],
                                                             LAYER=LAYER,
                                                             debug=True)
            break
        except GatherMoreData as e:
            print("Graph solving failed because we didn't explore all sides of at least one neuron")
            print("Fall back to the hyperplane following algorithm in order to get more data")
            
            def mine(r):
                while len(r) > 0:
                    print("Yielding a point")
                    yield r[0]
                    r = r[1:]
                print("No more to give!")
    
            prev_T = KnownT(known_T.A[:-1], known_T.B[:-1])
            
            _, more_critical_points = sign_recovery.solve_layer_sign(prev_T, known_T.A[-1], known_T.B[-1], mine(e.data),
                                                                     LAYER-1, already_checked_critical_points=True,
                                                                     only_need_positive=True)

            print("Add more", len(more_critical_points))
            this_layer_critical_points.extend(gather_ratios(more_critical_points, known_T, check_fn,
                                                             LAYER, 1e6))
            print("Done adding")
            
            COUNT = neuron_count[LAYER+1]
        except AcceptableFailure as e:
            print("Graph solving failed; get more points")
            COUNT = neuron_count[LAYER+1]
            if hasattr(e, 'partial_solution'):

                if len(e.partial_solution[0]) > 0:
                    partial_weights, corresponding_examples = e.partial_solution
                    print("Got partial solution with shape", partial_weights.shape)
                    if CHEATING:
                        print("Corresponding to", np.argmin(np.abs(cheat_get_inner_layers([x[0] for x in corresponding_examples])[LAYER]),axis=1))
    
                    partial_biases = []
                    for weight, examples in zip(partial_weights, corresponding_examples):

                        hidden = known_T.forward(examples, with_relu=True)
                        print("hidden", np.array(hidden).shape)
                        bias = -np.median(np.dot(hidden, weight))
                        partial_biases.append(bias)
                    partial_biases = np.array(partial_biases)
                    
                
    print("Number of critical points per cluster", [len(x) for x in critical_groups])
    
    point_per_class = [x[0] for x in critical_groups]

    extracted_normals = np.array(extracted_normals).T

    # Compute the bias because we know wx+b=0
    extracted_bias = [matmul(known_T.forward(point_per_class[i], with_relu=True), extracted_normals[:,i], c=None) for i in range(neuron_count[LAYER+1])]
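    # At a critical point x for neuron i, the pre-activation is exactly zero:
    # <w_i, h(x)> + b_i = 0, so b_i = -<w_i, h(x)>. The matmul above computes
    # <w_i, h(x)>; the negation happens just below.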

    # Don't forget to negate it.
    # That's important.
    # No, I definitely didn't forget this line the first time around.
    extracted_bias = -np.array(extracted_bias)

    # For the failed-to-identify neurons, set the bias to zero
    extracted_bias *= np.any(extracted_normals != 0,axis=0)[:,np.newaxis]
        

    if CHEATING:
        # Compute how far we off from the true matrix
        real_scaled = A[LAYER]/A[LAYER][0]
        extracted_scaled = extracted_normals/extracted_normals[0]
        
        mask = []
        reorder_rows = []
        for i in range(len(extracted_bias)):
            which_idx = np.argmin(np.sum(np.abs(real_scaled - extracted_scaled[:,[i]]),axis=0))
            reorder_rows.append(which_idx)
            mask.append((A[LAYER][0,which_idx]))
    
        print('matrix norm difference', np.sum(np.abs(extracted_normals*mask - A[LAYER][:,reorder_rows])))
    else:
        mask = [1]*len(extracted_bias)
    

    return extracted_normals, extracted_bias, mask
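# Illustrative usage (a hedged sketch, not code from this file): the values
# returned above are typically folded into the running extraction as the next
# layer of the known transform, e.g.
#   A_i, B_i, _ = compute_layer_values(points, known_T, LAYER)
#   known_T = KnownT(known_T.A + [A_i], known_T.B + [B_i])
# The KnownT constructor signature is an assumption based on the
# KnownT([], []) and KnownT(known_T.A[:-1], known_T.B[:-1]) calls elsewhere in
# this file.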
Example #9
    def search(low, high):
        if debug:
            logger.log("low high", low, high, level=Logger.DEBUG)
        mid = (low + high) / 2

        y1 = f_low = memo_forward_pass(low)
        f_mid = memo_forward_pass(mid)
        y2 = f_high = memo_forward_pass(high)

        if debug:
            ncross = cheat_num_relu_crosses(
                (offset + direction * low)[np.newaxis, :],
                (offset + direction * high)[np.newaxis, :])
            logger.log("ncross", ncross, level=Logger.DEBUG)

        if debug:
            logger.log("aa", f_mid, f_high, f_low, level=Logger.DEBUG)
            logger.log("compare",
                       np.abs(f_mid - (f_high + f_low) / 2),
                       SKIP_LINEAR_TOL * ((high - low)**.5),
                       level=Logger.DEBUG)
            logger.log("really", ncross, level=Logger.DEBUG)

        if np.abs(f_mid -
                  (f_high + f_low) / 2) < SKIP_LINEAR_TOL * ((high - low)**.5):
            # We're in a linear region
            if debug:
                logger.log("Skip linear",
                           sum(ncross),
                           ncross,
                           level=Logger.DEBUG)
            return
        elif high - low < 1e-8:
            # Too close to each other
            if debug:
                logger.log("wat", ncross, level=Logger.DEBUG)
            return
        else:
            # Check if there is exactly one ReLU switching sign, or if there are multiple.
            # To do this, use the 2-linear test from Jagielski et al. 2019
            #
            #
            #             /\   <---- real_h_at_x
            #            /  \
            #           /    \
            #          /      \
            #         /        \
            #        /          \
            #       /            \
            #     low q1 x_s_b q3 high
            #
            # Use (low,q1) to estimate the direction of the first line
            # Use (high,q3) to estimate the direction of the second line
            # They should in theory intersect at (x_should_be, y_should_be)
            # Query to compute real_h_at_x and then check if that's what we get
            # Then check that we're linear from x_should_be to low, and
            # linear from x_should_be to high.
            # If it all checks out, then return the solution.
            # Otherwise recurse again.
            # (A standalone numeric sketch of this 2-linear test follows
            # this function.)

            q1 = (low + mid) * .5
            q3 = (high + mid) * .5

            f_q1 = memo_forward_pass(q1)
            f_q3 = memo_forward_pass(q3)

            m1 = (f_q1 - f_low) / (q1 - low)
            m2 = (f_q3 - f_high) / (q3 - high)

            if m1 != m2:
                d = high - low
                # alpha locates the candidate crossing as a fraction of [low, high]
                alpha = (y2 - y1 - d * m2) / (d * m1 - d * m2)

                x_should_be = low + (y2 - y1 - d * m2) / (m1 - m2)
                height_should_be = y1 + m1 * (y2 - y1 - d * m2) / (m1 - m2)

            if m1 == m2:
                # If the slopes in both directions are the same (e.g., the function
                # is flat) then we can't learn anything here and just split.
                pass
            elif np.all(.25 + 1e-5 < alpha) and np.all(
                    alpha < .75 -
                    1e-5) and np.max(x_should_be) - np.min(x_should_be) < 1e-5:
                x_should_be = np.median(x_should_be)
                real_h_at_x = memo_forward_pass(x_should_be)

                if np.all(
                        np.abs(real_h_at_x -
                               height_should_be) < SKIP_LINEAR_TOL * 100):
                    # Compute gradient on each side and check for linearity

                    eighth_left = x_should_be - 1e-4
                    eighth_right = x_should_be + 1e-4
                    grad_left = (memo_forward_pass(eighth_left) -
                                 real_h_at_x) / (eighth_left - x_should_be)
                    grad_right = (memo_forward_pass(eighth_right) -
                                  real_h_at_x) / (eighth_right - x_should_be)

                    if np.all(np.abs(grad_left - m1) > SKIP_LINEAR_TOL *
                              10) or np.all(
                                  np.abs(grad_right - m2) > SKIP_LINEAR_TOL *
                                  10):
                        if debug:
                            logger.log("it's nonlinear", level=Logger.DEBUG)
                        pass
                    else:

                        if debug:
                            logger.log("OK", ncross, level=Logger.DEBUG)
                            vals = cheat_get_inner_layers(
                                (offset + direction * x_should_be))
                            smallest = min([np.min(np.abs(v)) for v in vals])
                            logger.log("Small",
                                       smallest,
                                       vals,
                                       level=Logger.DEBUG)
                            if smallest > .01:
                                raise AssertionError(
                                    "cheating check failed: no inner layer is near zero")
                        if debug and sum(ncross) > 1:
                            logger.log("BADNESS", level=Logger.DEBUG)
                        if return_scalar:
                            relus.append(x_should_be)
                        else:
                            relus.append(offset + direction * x_should_be)
                        return

        search(low, mid)
        if return_upto_one and len(relus) > 0:
            # we're done because we just want the left-most solution; don't do more searching
            return
        search(mid, high)
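# A self-contained numeric sketch of the 2-linear test used in search() above,
# on a made-up 1-D piecewise-linear function with a single kink. We estimate a
# slope near each endpoint, intersect the two lines, and confirm the kink by
# querying the function at the predicted intersection. All names and values
# here are illustrative assumptions, not part of the attack code.
import numpy as np

KINK, M_LEFT, M_RIGHT = 0.3, 1.0, -2.0

def toy_f(x):
    # slope M_LEFT below the kink, slope M_RIGHT above it
    return M_LEFT * min(x, KINK) + M_RIGHT * max(x - KINK, 0.0)

low, high = 0.0, 1.0
mid = (low + high) / 2
q1, q3 = (low + mid) / 2, (high + mid) / 2

y1, y2 = toy_f(low), toy_f(high)
m1 = (toy_f(q1) - y1) / (q1 - low)    # slope of the line through the left end
m2 = (toy_f(q3) - y2) / (q3 - high)   # slope of the line through the right end

d = high - low
x_should_be = low + (y2 - y1 - d * m2) / (m1 - m2)  # intersection of the two lines
height_should_be = y1 + m1 * (x_should_be - low)

# With exactly one ReLU crossing in the interval, the true function passes
# through the predicted intersection, so the test accepts x_should_be.
assert abs(toy_f(x_should_be) - height_should_be) < 1e-9
assert abs(x_should_be - KINK) < 1e-9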
def get_ratios_lstsq(LAYER, critical_points, N, known_T, debug=False, eps=1e-5):
    """
    Do the same thing as get_ratios, but works when we can't directly control where we want to query.
    
    This means we can't directly choose orthogonal directions, and so we're going
    to just pick random ones and then use least-squares to do it
    """
    #pickle.dump((LAYER, critical_points, N, known_T, debug, eps),
    #            open("/tmp/save.p","wb"))
    ratios = []
    for i,point in enumerate(critical_points):
        if CHEATING:
            layers = cheat_get_inner_layers(point)
            layer_vals = [np.min(np.abs(x)) for x in layers]
            which_layer = np.argmin(layer_vals)
            #print("real zero", np.argmin(np.abs(layers[0])))
            which_neuron = which_is_zero(which_layer, layers)
            #print("Which neuron?", which_neuron)

            real = A[which_layer][:,which_neuron]/A[which_layer][0,which_neuron]
        
        # We're going to create a system of linear equations
        # d_matrix is going to hold the inputs,
        # and ys is going to hold the resulting learned outputs
        d_matrix = []
        ys = []

        # Query on (number of active hidden units)+2 random points,
        # so that we have redundancy for the least squares solution.
        for _ in range(np.sum(known_T.forward(point) != 0) + 2):
            # 1. Choose a random direction
            d = np.sign(np.random.normal(0,1,point.shape))
            d_matrix.append(d)

            # 2. See what the second partial derivative in this direction is
            ratio_val = get_second_grad_unsigned(point, d, eps, eps/3)

            # 3. Get the sign correct
            if len(ys) > 0:
                # When we have at least one y value already we need to orient this
                # one so that they all point the same way.
                # We are given |f(x+d1)| and |f(x+d2)|.
                # Compute |f(x+d1+d2)|. Then either
                #   |f(x+d1+d2)| = |f(x+d1)| + |f(x+d2)|
                # or
                #   |f(x+d1+d2)| = |f(x+d1)| - |f(x+d2)|
                # or
                #   |f(x+d1+d2)| = |f(x+d2)| - |f(x+d1)|
                # (A toy numeric check of this identity follows this function.)
                both_ratio_val = get_second_grad_unsigned(point, (d+d_matrix[0])/2, eps, eps/3)

                positive_error = abs(abs(ys[0]+ratio_val)/2 - abs(both_ratio_val))
                negative_error = abs(abs(ys[0]-ratio_val)/2 - abs(both_ratio_val))

                if positive_error > 1e-4 and negative_error > 1e-4:
                    print("Probably something is borked")
                    print("d^2(e(i))+d^2(e(j)) != d^2(e(i)+e(j))", positive_error, negative_error)
                    raise AcceptableFailure()

                
                if negative_error < positive_error:
                    ratio_val *= -1
            
            ys.append(ratio_val)

        d_matrix = np.array(d_matrix)
        # Now we need to compute the system of equations
        # We have to figure out what the vectors look like in hidden space,
        # so compute that precisely
        h_matrix = np.array(known_T.forward_at(point, d_matrix))

            
        # Which dimensions do we lose?
        column_is_zero = np.mean(np.abs(h_matrix)<1e-8,axis=0) > .5
        assert np.all((known_T.forward(point, with_relu=True) == 0) == column_is_zero)

        #print(h_matrix.shape)

        # Solve the least squares problem to get the solution.
        # This is equal to solving for the ratios of the weight vector.
        soln, *rest = np.linalg.lstsq(np.array(h_matrix, dtype=np.float32),
                                      np.array(ys, dtype=np.float32),
                                      rcond=1e-5)

        # Set the columns we know to be wrong to NaN so that it's obvious these
        # entries aren't meaningful; this helps us distinguish genuine errors
        # from the kind we can't avoid because of zero gradients.
        soln[column_is_zero] = np.nan

        ratios.append(soln)
        
    return ratios
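# A toy numeric check of the sign-orientation identity used in get_ratios_lstsq
# above. The probe only ever observes |w . d| for an unknown weight vector w
# (all values below are made-up assumptions): given |w.d1|, |w.d2|, and
# |w.(d1+d2)/2|, exactly one of the two sign hypotheses is consistent, which
# reveals whether w.d1 and w.d2 share a sign.
import numpy as np

w = np.array([0.7, -1.3, 0.4, 2.1])        # hidden; only |w . d| is observable
d1 = np.array([1.0, -1.0, 1.0, 1.0])       # sign directions, as in the loop above
d2 = np.array([-1.0, 1.0, 1.0, -1.0])

u1, u2 = abs(w @ d1), abs(w @ d2)          # unsigned measurements
u12 = abs(w @ (d1 + d2)) / 2               # measurement along the averaged direction

positive_error = abs((u1 + u2) / 2 - u12)      # residual if w.d1, w.d2 share a sign
negative_error = abs(abs(u1 - u2) / 2 - u12)   # residual if they have opposite signs

same_sign = positive_error < negative_error
assert same_sign == (np.sign(w @ d1) == np.sign(w @ d2))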