Example #1
    def step(self, features, labels, lrate):
        # Define the GradientTape context
        with tf.GradientTape(
                persistent=True
        ) as tape:  # Below we add an extra variable for IBP
            tape.watch(self.posterior_mean)
            predictions = self.model(features)
            if self.robust_train == 0:
                worst_case = predictions  # no robust training: the worst case is just the prediction
                loss = self.loss_func(labels, predictions)
            elif int(self.robust_train) == 1:
                # Get interval bounds on the logits via IBP
                logit_l, logit_u = analyzers.IBP(
                    self,
                    features,
                    self.model.trainable_variables,
                    eps=self.epsilon)
                # TODO: remove the hardcoded class depth (10)
                v1 = tf.one_hot(labels, depth=10)
                v2 = 1 - tf.one_hot(labels, depth=10)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u),
                                         tf.math.multiply(v1, logit_l))
                # Apply the final activation to get worst-case probabilities
                worst_case = self.model.layers[-1].activation(worst_case)
                # Calculate the loss
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)
            elif int(self.robust_train) == 2:
                # Craft adversarial inputs with FGSM
                features_adv = analyzers.FGSM(self,
                                              features,
                                              self.attack_loss,
                                              eps=self.epsilon,
                                              num_models=-1)
                # Get predictions on the adversarial inputs
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)

        # Get the gradients
        weight_gradient = tape.gradient(loss, self.model.trainable_variables)

        # Plain SGD step on the flat weight list
        weights = self.model.get_weights()
        new_weights = []
        for i in range(len(weight_gradient)):
            wg = tf.math.multiply(weight_gradient[i], lrate)
            new_weights.append(tf.math.subtract(weights[i], wg))

        self.model.set_weights(new_weights)
        self.posterior_mean = new_weights

        self.train_loss(loss)
        self.train_metric(labels, predictions)
        #self.train_rob(labels, worst_case)
        return self.posterior_mean, self.posterior_var
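The worst-case logit construction in the IBP branch above recurs in every example, so here is a minimal self-contained sketch of just that step. The bound values and `n_classes` below are made up for illustration; `n_classes` replaces the hardcoded depth of 10.

import tensorflow as tf

# For the true class take the lower logit bound; for every other class
# take the upper bound. This is the worst case for the classifier.
n_classes = 3
labels = tf.constant([0, 2])                      # made-up batch of labels
logit_l = tf.constant([[2.0, -1.0, 0.5],          # made-up lower bounds
                       [0.1, 0.3, 1.8]])
logit_u = logit_l + 0.7                           # made-up upper bounds

v1 = tf.one_hot(labels, depth=n_classes)          # mask for the true class
v2 = 1.0 - v1                                     # mask for all other classes
worst_case = v2 * logit_u + v1 * logit_l
worst_probs = tf.nn.softmax(worst_case)           # worst-case probabilities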
Example #2
    def step(self, features, labels, lrate):

        # Define the GradientTape context
        with tf.GradientTape(
                persistent=True
        ) as tape:  # Below we add an extra variable for IBP
            tape.watch(self.posterior_mean)
            predictions = self.model(features)
            if self.robust_train == 0:
                loss = losses.normal_potential_energy(labels, predictions,
                                                      self.prior_mean,
                                                      self.prior_var, self.q,
                                                      self.loss_func)
            elif int(self.robust_train) == 1:
                # Get interval bounds on the logits via IBP
                logit_l, logit_u = analyzers.IBP(
                    self,
                    features,
                    self.model.trainable_variables,
                    eps=self.epsilon)
                # TODO: remove the hardcoded class depth (10)
                v1 = tf.one_hot(labels, depth=10)
                v2 = 1 - tf.one_hot(labels, depth=10)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u),
                                         tf.math.multiply(v1, logit_l))
                # Apply the final activation to get worst-case probabilities
                worst_case = self.model.layers[-1].activation(worst_case)
                # Calculate the loss
                loss = losses.robust_potential_energy(
                    labels, predictions, self.prior_mean, self.prior_var,
                    self.q, self.loss_func, worst_case, self.robust_lambda)
            elif int(self.robust_train) == 2:
                # Craft adversarial inputs with FGSM
                features_adv = analyzers.FGSM(self,
                                              features,
                                              self.attack_loss,
                                              eps=self.epsilon,
                                              num_models=-1)
                # Get predictions on the adversarial inputs
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss = losses.robust_potential_energy(
                    labels, predictions, self.prior_mean, self.prior_var,
                    self.q, self.loss_func, worst_case, self.robust_lambda)

        # Get the gradients
        weight_gradient = tape.gradient(loss, self.model.trainable_variables)

        # Update the momentum variable
        temp_p = []
        for i in range(len(weight_gradient)):
            wg = tf.math.multiply(weight_gradient[i], lrate)
            # TODO: check the sign; momentum updates usually subtract the gradient
            temp_p.append(tf.math.add(self.p[i], wg))
        self.p = np.asarray(temp_p)

        self.train_loss(loss)
        self.train_metric(labels, predictions)
        #self.train_rob(labels, worst_case)
        return self.posterior_mean, self.posterior_var
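A hedged sketch of what a Gaussian-prior potential energy of the kind `losses.normal_potential_energy` appears to compute; the library's actual signature and constant factors may differ, and `nll_fn` is a hypothetical stand-in for `self.loss_func`.

import tensorflow as tf

def potential_energy(labels, predictions, weights, prior_mean, prior_var, nll_fn):
    # Data term: the negative log-likelihood -log p(D | w)
    nll = nll_fn(labels, predictions)
    # Prior term: -log p(w) for a diagonal Gaussian prior, up to a constant
    prior = 0.0
    for w, mu, var in zip(weights, prior_mean, prior_var):
        prior += tf.reduce_sum(tf.square(w - mu) / (2.0 * var))
    return nll + prior

# Made-up demo values
labels = tf.constant([0, 1])
preds = tf.constant([[0.8, 0.2], [0.3, 0.7]])
weights = [tf.constant([0.5, -0.5])]
pm, pv = [tf.zeros(2)], [tf.ones(2)]
nll = lambda y, p: tf.reduce_mean(
    tf.keras.losses.sparse_categorical_crossentropy(y, p))
energy = potential_energy(labels, preds, weights, pm, pv, nll)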
Example #3
    def step(self, features, labels, lrate):
        # OPTIMIZATION PARAMETERS:
        alpha = lrate
        beta_1 = self.beta_1
        beta_2 = self.beta_2
        lam = self.lam

        N = self.N  # dataset size

        self.posterior_mean = self.model.get_weights()

        v1 = tf.one_hot(labels, depth=10)
        v2 = 1 - tf.one_hot(labels, depth=10)

        init_weights = []
        for i in range(len(self.posterior_mean)):
            # Sample weights: w = mean + eps / (sqrt(N * var) + lam)
            scale = tf.math.reciprocal(
                tf.math.add(tf.math.sqrt(N * self.posterior_var[i]), lam))
            sample = tf.random.normal(shape=self.posterior_var[i].shape,
                                      mean=0,
                                      stddev=1.0)
            init_weights.append(
                tf.math.add(self.posterior_mean[i],
                            tf.math.multiply(scale, sample)))

        self.model.set_weights(init_weights)

        with tf.GradientTape(persistent=True) as tape:
            # Get the probabilities
            predictions = self.model(features)
            # Calculate the loss
            if (int(self.robust_train) == 0):
                loss = self.loss_func(labels, predictions)
            elif (int(self.robust_train) == 1):
                logit_l, logit_u = analyzers.IBP(
                    self,
                    features,
                    self.model.trainable_variables,
                    eps=self.epsilon)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u),
                                         tf.math.multiply(v1, logit_l))
                worst_case = self.model.layers[-1].activation(worst_case)
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)
                #self.train_rob(labels, worst_case)
            elif (int(self.robust_train) == 2):
                features_adv = analyzers.FGSM(self,
                                              features,
                                              self.attack_loss,
                                              eps=self.epsilon,
                                              num_models=-1)
                # Get the probabilities
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)

        weight_gradient = tape.gradient(loss, self.model.trainable_variables)
        g = np.asarray(weight_gradient)
        sq_grad = []
        for i in range(len(weight_gradient)):
            sq_grad.append(
                tf.math.multiply(weight_gradient[i], weight_gradient[i]))
            # Momentum on the gradient plus the Gaussian-prior term lam * mean / N
            self.m[i] = (beta_1 * self.m[i]) + ((1 - beta_1) * (g[i] + (
                (lam * self.posterior_mean[i]) / N)))
            # Exponential moving average of the squared gradient
            self.posterior_var[i] = (beta_2 * self.posterior_var[i]) + (
                (1 - beta_2) * (sq_grad[i]))

        sq_grad = np.asarray(sq_grad)
        self.m = np.asarray(self.m)
        self.posterior_var = np.asarray(self.posterior_var)

        for i in range(len(weight_gradient)):
            m_ = self.m[i] / (1 - beta_1)  # bias-corrected momentum
            s_ = np.sqrt(self.posterior_var[i]) + lam / N  # preconditioner
            self.posterior_mean[i] = self.posterior_mean[i] - (alpha *
                                                               (m_ / s_))

        self.model.set_weights(self.posterior_mean)
        self.train_loss(loss)
        self.train_metric(labels, predictions)
        return self.posterior_mean, self.posterior_var
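The sampling step at the top of this example draws weights with standard deviation 1 / (sqrt(N * var) + lam) around the posterior mean. A small self-contained sketch of the same arithmetic, with made-up numbers:

import tensorflow as tf

N, lam = 60000.0, 1.0                   # made-up dataset size and prior precision
mean = tf.constant([0.1, -0.2])         # made-up posterior mean
var = tf.constant([0.05, 0.02])         # made-up posterior variance estimate

scale = 1.0 / (tf.sqrt(N * var) + lam)  # per-weight standard deviation
sample = mean + scale * tf.random.normal(mean.shape)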
Example #4
    def step(self, features, labels, lrate):
        """
        One Bayes-by-Backprop (BBB) step: sample weights from the variational
        posterior, compute the (robust) KL loss, and update mean and variance.
        """
        init_weights = []
        noise_used = []
        for i in range(len(self.posterior_mean)):
            noise = tf.random.normal(shape=self.posterior_var[i].shape,
                                     mean=tf.zeros(
                                         self.posterior_var[i].shape),
                                     stddev=1.0)
            var_add = tf.multiply(softplus(self.posterior_var[i]), noise)
            w = tf.math.add(self.posterior_mean[i], var_add)
            noise_used.append(noise)
            init_weights.append(w)
        self.model.set_weights(init_weights)

        # Define the GradientTape context
        with tf.GradientTape(
                persistent=True
        ) as tape:  # Below we add an extra variable for IBP
            tape.watch(self.posterior_mean)
            tape.watch(self.posterior_var)
            #tape.watch(init_weights)
            if self.robust_train == 0:
                predictions = self.model(features)
                worst_case = predictions  # no robust training: the worst case is just the prediction
                loss, kl_comp = losses.KL_Loss(labels, predictions,
                                               self.model.trainable_variables,
                                               self.prior_mean, self.prior_var,
                                               self.posterior_mean,
                                               self.posterior_var,
                                               self.loss_func, self.kl_weight)
            elif int(self.robust_train) == 1:
                predictions = self.model(features)
                # Get interval bounds on the logits via IBP
                logit_l, logit_u = analyzers.IBP(
                    self,
                    features,
                    self.model.trainable_variables,
                    eps=self.epsilon)
                # TODO: remove the hardcoded class depth (10)
                v1 = tf.one_hot(labels, depth=10)
                v2 = 1 - tf.one_hot(labels, depth=10)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u),
                                         tf.math.multiply(v1, logit_l))

                # Apply the final activation to get worst-case probabilities
                worst_case = self.model.layers[-1].activation(worst_case)
                # Calculate the loss
                loss, kl_comp = losses.robust_KL_Loss(
                    labels, predictions, self.model.trainable_variables,
                    self.prior_mean, self.prior_var, self.posterior_mean,
                    self.posterior_var, self.loss_func, self.kl_weight,
                    worst_case, self.robust_lambda)

            # NOTE: this branch is currently broken.
            elif int(self.robust_train) == 2:
                predictions = self.model(features)
                features_adv = analyzers.FGSM(self,
                                              features,
                                              self.attack_loss,
                                              eps=self.epsilon,
                                              num_models=-1)
                # Get the probabilities
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss, kl_comp = losses.robust_KL_Loss(
                    labels, predictions, self.model.trainable_variables,
                    self.prior_mean, self.prior_var, self.posterior_mean,
                    self.posterior_var, self.loss_func, self.kl_weight,
                    worst_case, self.robust_lambda)

        # Get the gradients
        weight_gradient = tape.gradient(loss, self.model.trainable_variables)
        mean_gradient = tape.gradient(loss, self.posterior_mean)
        var_gradient = tape.gradient(loss, self.posterior_var)
        #init_gradient = tape.gradient(loss, init_weights)

        posti_mean_grad = []
        posti_var_grad = []
        # TODO: make the weight and init gradients the same variable and retest
        for i in range(len(mean_gradient)):
            #weight_gradient[i] = tf.math.add(weight_gradient[i], init_gradient[i])
            weight_gradient[i] = tf.cast(weight_gradient[i], 'float32')
            mean_gradient[i] = tf.cast(mean_gradient[i], 'float32')
            f = tf.math.add(weight_gradient[i], mean_gradient[i])
            posti_mean_grad.append(f)
            # Chain rule for the std parameter: d softplus(rho)/d rho = sigmoid(rho),
            # so the variance gradient picks up noise * sigmoid(rho) * dL/dw
            v = tf.math.divide(
                noise_used[i],
                1 + tf.math.exp(tf.math.multiply(self.posterior_var[i], -1)))
            v = tf.math.multiply(v, weight_gradient[i])
            v = tf.math.add(v, var_gradient[i])
            posti_var_grad.append(v)

        # Apply the gradient updates to the variational parameters
        new_posti_var = []
        new_posti_mean = []
        for i in range(len(mean_gradient)):
            pdv = tf.math.multiply(posti_var_grad[i], lrate)
            pdm = tf.math.multiply(posti_mean_grad[i], lrate)
            v = tf.math.subtract(self.posterior_var[i], pdv)
            m = tf.math.subtract(self.posterior_mean[i], pdm)
            new_posti_var.append(v)
            new_posti_mean.append(m)

        self.train_loss(loss)
        self.train_metric(labels, predictions)
        #self.train_rob(labels, worst_case)
        self.kl_component(kl_comp)
        self.posterior_mean = new_posti_mean
        self.posterior_var = new_posti_var
        return new_posti_mean, new_posti_var
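Because the sampled weights are pushed in with `set_weights`, the example above has to stitch the chain rule together by hand. As a sanity check, here is a hedged sketch of the same reparameterization, w = mu + softplus(rho) * eps, where the tape differentiates through the sample directly; the loss is made up, and `rho` plays the role of `posterior_var` above.

import tensorflow as tf

mu = tf.Variable([0.2, -0.5])                 # variational mean
rho = tf.Variable([-3.0, -3.0])               # pre-softplus std parameter
eps = tf.random.normal(mu.shape)              # fixed noise sample

with tf.GradientTape() as tape:
    w = mu + tf.math.softplus(rho) * eps      # reparameterized weight sample
    loss = tf.reduce_sum(tf.square(w - 1.0))  # made-up loss for illustration

# d loss/d rho = d loss/d w * eps * sigmoid(rho), matching the manual
# noise / (1 + exp(-rho)) factor in the example above
grad_mu, grad_rho = tape.gradient(loss, [mu, rho])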
Example #5
    def step(self, features, labels, lrate):
        alpha = lrate
        beta_1 = self.beta_1
        beta_2 = self.beta_2
        lam = self.lam

        posti_var = self.posterior_var
        posti_mean = self.posterior_mean

        N = float(self.batch_size)  # batch size

        with tf.GradientTape(persistent=True) as tape:
            # Get the probabilities
            predictions = self.model(features)
            # Calculate the loss
            if (int(self.robust_train) == 0):
                loss = self.loss_func(labels, predictions)
            elif (int(self.robust_train) == 1):
                logit_l, logit_u = analyzers.IBP(
                    self,
                    features,
                    self.model.trainable_variables,
                    eps=self.epsilon)
                v1 = tf.one_hot(labels, depth=10)
                v2 = 1 - tf.one_hot(labels, depth=10)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u),
                                         tf.math.multiply(v1, logit_l))
                worst_case = self.model.layers[-1].activation(worst_case)
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)
                #self.train_rob(labels, worst_case)
            elif (int(self.robust_train) == 2):
                features_adv = analyzers.FGSM(self,
                                              features,
                                              self.attack_loss,
                                              eps=self.epsilon,
                                              num_models=-1)
                # Get the probabilities
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss = self.loss_func(labels, predictions, worst_case,
                                      self.robust_lambda)

        weight_gradient = tape.gradient(loss, self.model.trainable_variables)
        g = np.asarray(weight_gradient)

        sq_grad = []
        for i in range(len(weight_gradient)):
            sq_grad.append(
                tf.math.multiply(weight_gradient[i], weight_gradient[i]))
            # Momentum on the gradient plus the Gaussian-prior term lam * mean / N
            self.m[i] = (beta_1 * self.m[i]) + ((1 - beta_1) *
                                                (g[i] +
                                                 ((lam * posti_mean[i]) / N)))
            # Exponential moving average of the squared gradient
            posti_var[i] = (beta_2 * posti_var[i]) + ((1 - beta_2) *
                                                      (sq_grad[i]))

        sq_grad = np.asarray(sq_grad)
        self.m = np.asarray(self.m)
        posti_var = np.asarray(posti_var)

        for i in range(len(weight_gradient)):
            m_ = self.m[i] / (1 - beta_1)  # bias-corrected momentum
            s_ = np.sqrt(posti_var[i]) + lam / N  # preconditioner
            posti_mean[i] = posti_mean[i] - (alpha * (m_ / s_))

        self.model.set_weights(posti_mean)
        self.train_loss(loss)
        self.train_metric(labels, predictions)
        return posti_mean, posti_var
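The update in this example is an Adam-style rule with a Gaussian-prior term folded into the momentum. A single-parameter trace with made-up numbers, mirroring the loop above:

import numpy as np

g, mu, s, m = 0.4, 0.1, 0.05, 0.0          # made-up gradient, mean, variance, momentum
beta_1, beta_2 = 0.9, 0.999
lam, N, alpha = 1.0, 128.0, 0.01           # prior precision, batch size, step size

m = beta_1 * m + (1 - beta_1) * (g + lam * mu / N)  # momentum with prior term
s = beta_2 * s + (1 - beta_2) * g ** 2              # squared-gradient average
m_hat = m / (1 - beta_1)                            # one-step bias correction
mu = mu - alpha * m_hat / (np.sqrt(s) + lam / N)    # preconditioned mean update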
Example #6
    def step(self, features, labels, lrate):
        # OPTIMIZATION PARAMETERS:
        alpha = lrate
        beta_1 = self.beta_1
        beta_2 = self.beta_2
        lam = self.lam

        N = 60000  # dataset size

        self.posterior_mean = self.model.get_weights()

        init_weights = []
        for i in range(len(self.posterior_mean)):
            # Sample weights: w = mean + eps / (sqrt(N * var) + lam)
            scale = tf.math.reciprocal(
                tf.math.add(tf.math.sqrt(N * self.posterior_var[i]), lam))
            sample = tf.random.normal(shape=self.posterior_var[i].shape,
                                      mean=0, stddev=1.0)
            init_weights.append(
                tf.math.add(self.posterior_mean[i],
                            tf.math.multiply(scale, sample)))

        self.model.set_weights(init_weights)
        
        with tf.GradientTape(persistent=True) as tape:
            # Get the probabilities
            predictions = self.model(features)
            # Calculate the loss
            if int(self.robust_train) == 0:
                loss = self.loss_func(labels, predictions)
            elif int(self.robust_train) == 1:
                logit_l, logit_u = analyzers.IBP(self, features, self.model.trainable_variables, eps=self.epsilon)
                v1 = tf.one_hot(labels, depth=10)
                v2 = 1 - tf.one_hot(labels, depth=10)
                worst_case = tf.math.add(tf.math.multiply(v2, logit_u), tf.math.multiply(v1, logit_l))
                worst_case = self.model.layers[-1].activation(worst_case)
                loss = self.loss_func(labels, predictions, worst_case, self.robust_lambda)
            elif int(self.robust_train) == 2:
                features_adv = analyzers.FGSM(self, features, self.attack_loss, eps=self.epsilon, num_models=-1)
                # Get predictions on the adversarial inputs
                worst_case = self.model(features_adv)
                # Calculate the loss
                loss = self.loss_func(labels, predictions, worst_case, self.robust_lambda)
                
        weight_gradient = tape.gradient(loss, self.model.trainable_variables)
        g = np.asarray(weight_gradient)
       
        # Process the gradient according to the reparameterization given by
        # Khan et al. (arXiv:2002.10060) [ICML 2020]
        g_mu = []
        g_s = []
        m_hat = []
        s_hat = []
        t = alpha
        for i in range(len(g)):
            g_mu.append((lam / N) * self.posterior_mean[i] + g[i])
            g_s_comp2 = tf.math.multiply((N * self.posterior_var[i]), (init_weights[i] - self.posterior_mean[i]))
            g_s_comp2 = tf.math.multiply(g_s_comp2, g[i])
            g_s.append((lam / N) - self.posterior_var[i] + g_s_comp2)
            # Standard momentum update
            self.m[i] = (beta_1 * self.m[i]) + ((1 - beta_1) * g_mu[i])
            m_hat.append(self.m[i] / (1 - beta_1))
            s_hat.append(self.posterior_var[i] / (1 - beta_2))

        # Apply the updates to the mean and variance
        for i in range(len(g)):
            self.posterior_mean[i] = self.posterior_mean[i] - t * (m_hat[i] / s_hat[i])
            comp_1 = 0.5 * ((1 - beta_2) ** 2) * g_s[i]
            recip = tf.math.multiply(tf.math.reciprocal(self.posterior_var[i]), g_s[i])
            self.posterior_var[i] = self.posterior_var[i] + tf.math.multiply(comp_1, recip)

        self.model.set_weights(self.posterior_mean)
        self.train_loss(loss)
        self.train_metric(labels, predictions)
        return self.posterior_mean, self.posterior_var
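Finally, a scalar trace of the reparameterized mean and variance updates in this last example, following its reading of Khan et al. (arXiv:2002.10060); the numbers are made up, and this only mirrors the arithmetic above, not the full derivation.

N, lam, beta_1, beta_2, t = 60000.0, 1.0, 0.9, 0.999, 0.01
mu, s, m = 0.1, 0.05, 0.0      # made-up posterior mean, variance, momentum
g, w = 0.4, 0.12               # made-up gradient and sampled weight

g_mu = (lam / N) * mu + g                      # mean gradient with prior term
g_s = (lam / N) - s + (N * s) * (w - mu) * g   # reparameterized variance gradient
m = beta_1 * m + (1 - beta_1) * g_mu           # momentum update
m_hat = m / (1 - beta_1)
s_hat = s / (1 - beta_2)
mu = mu - t * (m_hat / s_hat)                  # mean step
s = s + 0.5 * (1 - beta_2) ** 2 * g_s * (g_s / s)  # variance step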