Exemplo n.º 1
0
def attack_whitebox(sess, model, attack_method, X, Y, **kwargs):
    # remove the file format
    dataset = DATA.CUR_DATASET_NAME

    logger.info('Crafting adversarial examples using {} method...'.format(
        attack_method.upper()))
    X_adv = None

    if (attack_method == ATTACK.FGSM):
        eps = kwargs.get('eps', 0.25)
        attack_params = {
            'eps': eps,
            'ord': np.inf,
            'clip_min': 0.,
            'clip_max': 1.
        }
        logger.info('{}: (eps={})'.format(attack_method.upper(), eps))

        start_time = time.time()
        X_adv, Y = whitebox.generate_art(model, X, Y, attack_method, dataset,
                                         attack_params)
        # X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset, attack_params)
        duration = time.time() - start_time
        logger.info('Time cost for generation: {}'.format(duration))

    elif (attack_method == ATTACK.BIM):
        # iterative fast gradient method
        eps = kwargs.get('eps', 0.25)
        nb_iter = kwargs.get('nb_iter', 100)
        ord = kwargs.get('ord', np.inf)
        """
        Cleverhans requires an eps_iter that is smaller than the eps. 
        By default, eps_iter=0.05, so, update eps_iter for small epsilons.
        """
        if eps < 0.005:
            eps_iter = 0.001
        elif eps < 0.05:
            eps_iter = 0.005
        else:
            # for big enough eps, use the default setting
            eps_iter = 0.05
        attack_params = {
            'eps': eps,
            'eps_iter': eps_iter,
            'nb_iter': nb_iter,
            'ord': ord,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, nb_iter={}, eps={})'.format(
            attack_method.upper(), ord, nb_iter, eps))
        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)

        duration = time.time() - start_time
        print('Time cost: {}'.format(duration))
    elif (attack_method == ATTACK.DEEPFOOL):
        # Images for inception classifier are normalized to be in [0, 255] interval.
        # max_iterations = kwargs.get('max_iterations', 100)
        max_iterations = 100
        ord = kwargs.get('ord', 2)
        overshoot = kwargs.get('overshoot', 1.0)

        attack_params = {
            'ord': ord,
            'max_iterations': max_iterations,
            'nb_candidate': Y.shape[1],
            'overshoot': overshoot,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (max_iterations={})'.format(attack_method.upper(),
                                                     max_iterations))
        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        print('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_L2):
        ord = 2
        binary_search_steps = kwargs.get('binary_search_steps', 10)
        batch_size = kwargs.get('cw_batch_size', 2)
        initial_const = kwargs.get('initial_const', 10)
        learning_rate = kwargs.get('learning_rate', 0.1)
        max_iterations = kwargs.get('max_iterations', 100)

        attack_params = {
            'batch_size': batch_size,
            'binary_search_steps': binary_search_steps,
            'initial_const': initial_const,
            'learning_rate': learning_rate,
            'max_iterations': max_iterations,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, max_iterations={})'.format(
            attack_method.upper(), ord, max_iterations))

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_Linf):
        ord = np.inf

        decrease_factor = kwargs.get('decrease_factor', 0.9)
        initial_const = kwargs.get('initial_const', 1e-5)
        learning_rate = kwargs.get('learning_rate', 0.1)
        largest_const = kwargs.get('largest_const', 2e+1)
        max_iterations = kwargs.get('max_iterations', 1000)
        reduce_const = False
        const_factor = 3.0

        attack_params = {
            # 'descrease_factor': decrease_factor,
            'initial_const': initial_const,
            'learning_rate': learning_rate,
            'max_iterations': max_iterations,
            'largest_const': largest_const,
            'reduce_const': reduce_const,
            'const_factor': const_factor,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, max_iterations={})'.format(
            attack_method.upper(), ord, max_iterations))

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_L0):
        max_iterations = kwargs.get('max_iterations', 1000)
        initial_const = kwargs.get('initial_const', 10)
        largest_const = kwargs.get('largest_const', 15)

        attack_params = {
            'max_iterations': max_iterations,
            'initial_const': initial_const,
            'largest_const': largest_const
        }

        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method,
                                     attack_params)

    elif (attack_method == ATTACK.JSMA):
        theta = kwargs.get('theta', 0.6)
        gamma = kwargs.get('gamma', 0.5)
        attack_params = {
            'theta': theta,
            'gamma': gamma,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (theta={}, gamma={})'.format(attack_method.upper(),
                                                      theta, gamma))
        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.PGD):
        eps = kwargs.get('eps', 0.1)
        nb_iter = kwargs.get('nb_iter', 250)
        eps_iter = kwargs.get('eps_iter', eps / nb_iter)

        attack_params = {
            'eps': eps,
            'clip_min': 0.,
            'clip_max': 1.,
            'nb_iter': nb_iter,
            'eps_iter': eps_iter
        }

        start_time = time.time()
        # X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset, attack_params)
        X_adv, Y = whitebox.generate_art(model, X, Y, attack_method, dataset,
                                         attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.ONE_PIXEL):
        # one-pixel was implemented separately.
        targeted = kwargs.get('targeted', False)
        pixel_counts = kwargs.get('pixel_counts', 3)
        max_iter = kwargs.get('max_iter', 10)
        pop_size = kwargs.get('pop_size', 10)

        attack_params = {
            'targeted': targeted,
            'pixel_counts': pixel_counts,
            'max_iter': max_iter,
            'pop_size': pop_size,
            'clip_min': 0.,
            'clip_max': 1.,
        }

        start_time = time.monotonic()
        X_adv, Y = one_pixel.generate(model, X, Y, attack_params)
        duration = time.monotonic() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.MIM):
        eps = kwargs.get('eps', 0.3)
        eps_iter = kwargs.get('eps_iter', 0.06)
        nb_iter = kwargs.get('nb_iter', 10)
        decay_factor = kwargs.get('decay_factor', 1.0)
        y_target = kwargs.get('y_target', None)

        attack_params = {
            'eps': eps,
            'eps_iter': eps_iter,
            'nb_iter': nb_iter,
            'ord': np.inf,
            'decay_factor': decay_factor,
            'y_target': y_target,
            'clip_min': 0.,
            'clip_max': 1.
        }

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    print('*** SHAPE: {}'.format(np.asarray(X_adv).shape))

    return X_adv, Y
Exemplo n.º 2
0
def get_adversarial_examples(model_name, attack_method, X, Y, **kwargs):
    # remove the file format
    model_name = model_name.split('.')[0]
    dataset = DATA.CUR_DATASET_NAME

    if ((not os.path.isfile('{}/{}.h5'.format(PATH.MODEL, model_name))) and
        (not os.path.isfile('{}/{}.json'.format(PATH.MODEL, model_name)))):
        raise FileNotFoundError(
            'Could not file target mode [{}].'.format(model_name))

    config = tf.ConfigProto(intra_op_parallelism_threads=4,
                            inter_op_parallelism_threads=4)

    sess = tf.Session(config=config)
    keras.backend.set_session(sess)

    model = load_model(model_name)

    logger.info('Crafting adversarial examples using {} method...'.format(
        attack_method.upper()))
    X_adv = None

    if (attack_method == ATTACK.FGSM):
        eps = kwargs.get('eps', 0.25)
        attack_params = {
            'eps': eps,
            'ord': np.inf,
            'clip_min': 0.,
            'clip_max': 1.
        }
        logger.info('{}: (eps={})'.format(attack_method.upper(), eps))

        start_time = time.time()
        X_adv, Y = whitebox.generate_art(model, X, Y, attack_method, dataset,
                                         attack_params)
        # X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset, attack_params)
        duration = time.time() - start_time
        logger.info('Time cost for generation: {}'.format(duration))

    elif (attack_method == ATTACK.BIM):
        # iterative fast gradient method
        eps = kwargs.get('eps', 0.25)
        nb_iter = kwargs.get('nb_iter', 100)
        ord = kwargs.get('ord', np.inf)
        """
        Cleverhans requires an eps_iter that is smaller than the eps. 
        By default, eps_iter=0.05, so, update eps_iter for small epsilons.
        """
        if eps < 0.005:
            eps_iter = 0.001
        elif eps < 0.05:
            eps_iter = 0.005
        else:
            # for big enough eps, use the default setting
            eps_iter = 0.05
        attack_params = {
            'eps': eps,
            'eps_iter': eps_iter,
            'nb_iter': nb_iter,
            'ord': ord,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, nb_iter={}, eps={})'.format(
            attack_method.upper(), ord, nb_iter, eps))
        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)

        duration = time.time() - start_time
        print('Time cost: {}'.format(duration))
    elif (attack_method == ATTACK.DEEPFOOL):
        # Images for inception classifier are normalized to be in [0, 255] interval.
        # max_iterations = kwargs.get('max_iterations', 100)
        # keras.backend.set_learning_phase(True)
        max_iterations = 50
        ord = kwargs.get('ord', 2)
        overshoot = kwargs.get('overshoot', 0.02)

        attack_params = {
            'ord': ord,
            'max_iterations': max_iterations,
            'nb_candidate': int(Y.shape[1] / 2),
            'overshoot': overshoot,
            'clip_min': 0.,
            'clip_max': 255.
        }

        print(attack_params)
        logger.info('{}: (max_iterations={})'.format(attack_method.upper(),
                                                     max_iterations))

        X *= 255.
        Y *= 255

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)

        X /= 255.
        Y /= 255.
        X_adv /= 255.

        duration = time.time() - start_time
        print('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_L2):
        ord = 2
        binary_search_steps = kwargs.get('binary_search_steps', 10)
        batch_size = kwargs.get('cw_batch_size', 2)
        initial_const = kwargs.get('initial_const', 10)
        learning_rate = kwargs.get('learning_rate', 0.1)
        max_iterations = kwargs.get('max_iterations', 100)

        attack_params = {
            'batch_size': batch_size,
            'binary_search_steps': binary_search_steps,
            'initial_const': initial_const,
            'learning_rate': learning_rate,
            'max_iterations': max_iterations,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, max_iterations={})'.format(
            attack_method.upper(), ord, max_iterations))

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_Linf):
        ord = np.inf

        decrease_factor = kwargs.get('decrease_factor', 0.9)
        initial_const = kwargs.get('initial_const', 1e-5)
        learning_rate = kwargs.get('learning_rate', 0.1)
        largest_const = kwargs.get('largest_const', 2e+1)
        max_iterations = kwargs.get('max_iterations', 1000)
        reduce_const = False
        const_factor = 3.0

        attack_params = {
            # 'descrease_factor': decrease_factor,
            'initial_const': initial_const,
            'learning_rate': learning_rate,
            'max_iterations': max_iterations,
            'largest_const': largest_const,
            'reduce_const': reduce_const,
            'const_factor': const_factor,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (ord={}, max_iterations={})'.format(
            attack_method.upper(), ord, max_iterations))

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.CW_L0):
        max_iterations = kwargs.get('max_iterations', 1000)
        initial_const = kwargs.get('initial_const', 10)
        largest_const = kwargs.get('largest_const', 15)

        attack_params = {
            'max_iterations': max_iterations,
            'initial_const': initial_const,
            'largest_const': largest_const
        }

        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method,
                                     attack_params)

    elif (attack_method == ATTACK.JSMA):
        theta = kwargs.get('theta', 0.6)
        gamma = kwargs.get('gamma', 0.5)
        attack_params = {
            'theta': theta,
            'gamma': gamma,
            'clip_min': 0.,
            'clip_max': 1.
        }

        logger.info('{}: (theta={}, gamma={})'.format(attack_method.upper(),
                                                      theta, gamma))
        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.PGD):
        eps = kwargs.get('eps', 0.3)
        nb_iter = kwargs.get('nb_iter', 40)
        eps_iter = kwargs.get('eps_iter', 0.01)

        attack_params = {
            'eps': eps,
            'clip_min': 0.,
            'clip_max': 1.,
            'nb_iter': nb_iter,
            'eps_iter': eps_iter
        }

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.ONE_PIXEL):
        # one-pixel was implemented separately.
        targeted = kwargs.get('targeted', False)
        pixel_counts = kwargs.get('pixel_counts', 3)
        max_iter = kwargs.get('max_iter', 10)
        pop_size = kwargs.get('pop_size', 10)

        attack_params = {
            'targeted': targeted,
            'pixel_counts': pixel_counts,
            'max_iter': max_iter,
            'pop_size': pop_size,
            'clip_min': 0.,
            'clip_max': 1.,
        }

        start_time = time.monotonic()
        X_adv, Y = one_pixel.generate(model, X, Y, attack_params)
        duration = time.monotonic() - start_time
        logger.info('Time cost: {}'.format(duration))

    elif (attack_method == ATTACK.MIM):
        eps = kwargs.get('eps', 0.3)
        eps_iter = kwargs.get('eps_iter', 0.06)
        nb_iter = kwargs.get('nb_iter', 10)
        decay_factor = kwargs.get('decay_factor', 0.5)
        y_target = kwargs.get('y_target', None)

        attack_params = {
            'eps': eps,
            'eps_iter': eps_iter,
            'nb_iter': nb_iter,
            'ord': np.inf,
            'decay_factor': decay_factor,
            'y_target': y_target,
            'clip_min': 0.,
            'clip_max': 1.
        }

        start_time = time.time()
        X_adv, Y = whitebox.generate(sess, model, X, Y, attack_method, dataset,
                                     attack_params)
        duration = time.time() - start_time
        logger.info('Time cost: {}'.format(duration))

    print('*** SHAPE: {}'.format(np.asarray(X_adv).shape))

    del model
    sess.close()

    return X_adv, Y