Example #1
    def generate_gradient(self, input, target):
        target = TensorBase(np.array(target).astype('float64'))
        input = TensorBase(np.array(input).astype('float64'))
        pred = self.forward(input)

        target_v = target

        if(self.pubkey is not None and self.encrypted):
            target_v = self.pubkey.encrypt(target_v)

        output_grad = (pred - target_v)

        weight_grad = TensorBase(np.zeros_like(self.weights.data))

        if(self.encrypted):
            weight_grad = weight_grad.encrypt(self.pubkey)

        for i in range(len(input)):
            if(input[i] != 1 and input[i] != 0):
                weight_grad[i] += (output_grad[0] * input[i])
            elif(input[i] == 1):
                weight_grad[i] += output_grad[0]
            else:
                pass  # input == 0: nothing to add for this weight

        return weight_grad
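
For reference, the quantity this loop assembles is essentially the textbook squared-error gradient of a linear model: the outer product of the input with the prediction error, with the multiplication skipped when input[i] is 1 and the whole term skipped when it is 0. A minimal plain-NumPy sketch of the unencrypted equivalent (a standalone helper with assumed names, not part of PySyft):

import numpy as np

def plain_gradient(weights, x, y):
    # weights: (n_inputs, n_labels), x: (n_inputs,), y: (n_labels,)
    x, y = np.asarray(x, dtype=float), np.asarray(y, dtype=float)
    pred = x @ weights               # linear forward pass, same result as forward()
    return np.outer(x, pred - y)     # d( 0.5 * ||pred - y||^2 ) / d(weights)
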
Example #2
File: linear.py Project: kaushiksk/PySyft
    def batch_update(self, minibatch, alpha):
        """Performs one weight update from a minibatch of inputs and targets.
        Should be called through learn() for default parameters.
        """
        weight_update = TensorBase(np.zeros(self.weights.data.shape))
        if (self.encrypted):
            weight_update = weight_update.encrypt(self.pubkey)
        for (x, y) in zip(*minibatch):
            weight_update += self.generate_gradient(x, y)
        self.weights -= weight_update * (alpha / len(minibatch[0]))
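
Here minibatch is expected to be a pair (inputs, targets); the per-example gradients are summed and the step is scaled by alpha divided by the batch size. A hedged usage sketch, assuming the full LinearClassifier from Example #4 below (which defines batch_update), unencrypted weights, and made-up data:

model = LinearClassifier(n_inputs=4, n_labels=2)    # capsule_client left as None
inputs = [[1, 0, 1, 1], [0, 1, 1, 0]]               # one row per example
targets = [[1, 0], [0, 1]]

# zip(*minibatch) pairs each input row with its target; the summed gradient
# is scaled by alpha / len(inputs) before being subtracted from the weights.
model.batch_update((inputs, targets), alpha=0.5)
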
Example #3
class LinearClassifier():
    """This class is a basic linear classifier with functionality to
    encrypt/decrypt weights according to any of the homomorphic encryption
    schemes in syft.he. It also contains the logic to make predictions when
    in an encrypted state.

    TODO: create a generic interface for ML models that this class implements.

    TODO: minibatching in the "learn" API. The greater the batch size, the more
    iterations should be doable before the homomorphic encryption noise grows
    too much to be decrypted.
    """

    def __init__(self, n_inputs=4, n_labels=2, desc=""):

        self.desc = desc

        self.n_inputs = n_inputs
        self.n_labels = n_labels

        self.weights = TensorBase(np.zeros((n_inputs, n_labels)))

        self.pubkey = None
        self.encrypted = False

    def encrypt(self, pubkey):
        """iterates through each weight and encrypts it

        TODO: check that weights are actually decrypted

        """

        self.encrypted = True
        self.pubkey = pubkey
        self.weights = self.weights.encrypt(pubkey)
        return self

    def decrypt(self, seckey):
        """iterates through each weight and decrypts it

        TODO: check that weights are actually encrypted

        """
        self.encrypted = False
        self.weights = self.weights.decrypt(seckey)
        return self

    def forward(self, input):

        """Makes a prediction based on input. If the network is encrypted, the
        prediction is also encrypted and vice versa."""

        pred = self.weights[0] * input[0]
        for j, each_inp in enumerate(input[1:]):
            if(each_inp == 1):
                pred = pred + self.weights[j + 1]
            elif(each_inp != 0):
                pred = pred + (self.weights[j + 1] * input[j + 1])

        return pred

    def learn(self, input, target, alpha=0.5):
        """Updates weights based on input and target prediction. Note, updating
        weights increases the noise in the encrypted weights and will
        eventually require the weights to be re-encrypted.

        TODO: minibatching
        TODO: instead of storing weights, store aggregated weight updates (and
        optionally use them in "forward").
        """

        weight_update = self.generate_gradient(input, target)
        self.weights -= weight_update * alpha

        return weight_update

    def evaluate(self, inputs, targets):
        """accepts a list of inputs and a list of targets - returns the mean
        squared error scaled by a fixed amount and converted to an integer."""

        scale = 1000

        if(self.encrypted):
            return "not yet supported... but will in the future"
        else:

            loss = 0
            for i, row in enumerate(inputs):
                pred = self.forward(row)
                true = targets[i]
                diff = (pred - true)
                loss += (diff * diff).to_numpy()
            return int((loss[0] * scale) / float(len(inputs)))

    def __str__(self):
        left = "Linear Model (" + str(self.n_inputs) + ","
        return left + str(self.n_labels) + "): " + str(self.desc)

    def __repr__(self):
        return self.__str__()

    def generate_gradient(self, input, target):
        target = TensorBase(np.array(target).astype('float64'))
        input = TensorBase(np.array(input).astype('float64'))
        pred = self.forward(input)

        target_v = target

        if(self.pubkey is not None and self.encrypted):
            target_v = self.pubkey.encrypt(target_v)

        output_grad = (pred - target_v)

        weight_grad = TensorBase(np.zeros_like(self.weights.data))

        if(self.encrypted):
            weight_grad = weight_grad.encrypt(self.pubkey)

        for i in range(len(input)):
            if(input[i] != 1 and input[i] != 0):
                weight_grad[i] += (output_grad[0] * input[i])
            elif(input[i] == 1):
                weight_grad[i] += output_grad[0]
            else:
                pass  # input == 0: nothing to add for this weight

        return weight_grad
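
A minimal plaintext usage sketch of this class (illustrative data; assumes np and TensorBase are imported as in linear.py):

model = LinearClassifier(n_inputs=4, n_labels=2, desc="demo")
inputs = [[1, 0, 1, 1], [0, 1, 1, 0], [1, 1, 0, 0]]
targets = [[1, 0], [0, 1], [1, 0]]

for x, y in zip(inputs, targets):
    model.learn(x, y, alpha=0.1)            # one gradient step per example

print(model)                                # Linear Model (4,2): demo
print(model.evaluate(inputs, targets))      # scaled-integer MSE over the set
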
Example #4
File: linear.py Project: kaushiksk/PySyft
class LinearClassifier(AbstractModel):
    """
        This class is a basic linear classifier with functionality to
        encrypt/decrypt weights according to any of the homomorphic encryption
        schemes in syft.he. It also contains the logic to make predictions when
        in an encrypted state.
    """
    def __init__(self, n_inputs=4, n_labels=2, desc="", capsule_client=None):
        self.desc = desc

        self.n_inputs = n_inputs
        self.n_labels = n_labels

        self.weights = TensorBase(np.random.rand(n_inputs, n_labels))

        self.pubkey = None
        self.encrypted = False
        self.capsule = capsule_client

    def encrypt(self):
        """iterates through each weight and encrypts it
        """

        if self.encrypted:
            return self

        self.pubkey = self.capsule.keygen()
        self.weights = self.weights.encrypt(self.pubkey)
        self.encrypted = self.weights.encrypted

        return self

    def decrypt(self):
        """iterates through each weight and decrypts it
        """
        if not self.pubkey:
            raise KeyException("Public key was not generated.")

        if not self.encrypted:
            return self

        self.weights = self.capsule.decrypt(self.weights, self.pubkey.id)
        self.encrypted = self.weights.encrypted
        return self

    def forward(self, input):
        """Makes a prediction based on input. If the network is encrypted, the
        prediction is also encrypted and vice versa.
        """
        pred = self.weights[0] * input[0]
        for j, each_inp in enumerate(input[1:]):
            if (each_inp == 1):
                pred = pred + self.weights[j + 1]
            elif (each_inp != 0):
                pred = pred + (self.weights[j + 1] * input[j + 1])

        return pred

    def learn(self,
              input,
              target,
              alpha=0.5,
              batchsize=32,
              encrypt_interval=16):
        """Updates weights based on input and target prediction. Note, updating
        weights increases the noise in the encrypted weights and will
        eventually require the weights to be re-encrypted.

        TODO: instead of storing weights, store aggregated weight updates (and
        optionally use them in "forward").
        """
        input_batches = [
            input[i:i + batchsize] for i in range(0, len(input), batchsize)
        ]
        target_batches = [
            target[i:i + batchsize] for i in range(0, len(target), batchsize)
        ]
        for epoch_count, minibatch in enumerate(
                zip(input_batches, target_batches)):
            self.batch_update(minibatch, alpha)
            if self.encrypted and (epoch_count > encrypt_interval) and (
                    epoch_count % encrypt_interval == 0):
                self.weights = self.capsule.bootstrap(self.weights,
                                                      self.pubkey.id)

    def batch_update(self, minibatch, alpha):
        """Performs one weight update from a minibatch of inputs and targets.
        Should be called through learn() for default parameters.
        """
        weight_update = TensorBase(np.zeros(self.weights.data.shape))
        if (self.encrypted):
            weight_update = weight_update.encrypt(self.pubkey)
        for (x, y) in zip(*minibatch):
            weight_update += self.generate_gradient(x, y)
        self.weights -= weight_update * (alpha / len(minibatch[0]))

    def evaluate(self, inputs, targets):
        """accepts a list of inputs and a list of targets - returns the mean
        squared error scaled by a fixed amount and converted to an integer.
        """
        scale = 1000

        if (self.encrypted):
            return "not yet supported... but will in the future"
        else:

            loss = 0
            for i, row in enumerate(inputs):
                pred = self.forward(row)
                true = targets[i]
                diff = (pred - true)
                loss += (diff * diff).to_numpy()
            return int((loss[0] * scale) / float(len(inputs)))

    def __str__(self):
        left = "Linear Model (" + str(self.n_inputs) + ","
        return left + str(self.n_labels) + "): " + str(self.desc)

    def generate_gradient(self, input, target):
        target = TensorBase(np.array(target).astype('float64'))
        input = TensorBase(np.array(input).astype('float64'))
        pred = self.forward(input)

        target_v = target

        if (self.pubkey is not None and self.encrypted):
            target_v = self.pubkey.encrypt(target_v)

        output_grad = (pred - target_v)

        weight_grad = TensorBase(np.zeros_like(self.weights.data))

        if (self.encrypted):
            weight_grad = weight_grad.encrypt(self.pubkey)

        for i in range(len(input)):
            if (input[i] != 1 and input[i] != 0):
                weight_grad[i] += (output_grad[0] * input[i])
            elif (input[i] == 1):
                weight_grad[i] += output_grad[0]
            else:
                pass  # input == 0: nothing to add for this weight

        return weight_grad
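
For completeness, a plaintext usage sketch of this variant; the data is illustrative, capsule_client is left as None so encrypt() and the bootstrap branch never run, and AbstractModel is assumed to add no constructor requirements:

model = LinearClassifier(n_inputs=4, n_labels=2, desc="demo")
inputs = [[1, 0, 1, 0]] * 64 + [[0, 1, 0, 1]] * 64
targets = [[1, 0]] * 64 + [[0, 1]] * 64

# learn() slices the 128 examples into four minibatches of 32 and calls
# batch_update() once per minibatch; because self.encrypted is False, the
# periodic capsule.bootstrap() re-encryption step is skipped.
model.learn(inputs, targets, alpha=0.5, batchsize=32, encrypt_interval=16)
print(model.evaluate(inputs, targets))
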