# Imports used below; 'utils' is the project module providing load_array/save_array.
import errno
import os

import numpy as np
import tensorflow as tf

from activations import Activations
import utils


class FeedForwardNeuralNetwork():

    def __init__(self, config):
        self.config = config
        self.activations = Activations()
        self.inputs = tf.placeholder(tf.float32,
                                     shape=(1, self.config['input_size']))
        # Total number of weights and biases for all layers.
        self.params_size = (
            self.config['input_size'] * self.config['n_nodes_per_layer']
        ) + self.config['n_nodes_per_layer'] + self.config['n_hidden_layers'] * (
            self.config['n_nodes_per_layer']**2 +
            self.config['n_nodes_per_layer']) + (
                self.config['n_nodes_per_layer'] *
                self.config['output_size']) + self.config['output_size']
        self.params = tf.placeholder(tf.float32)

    def model(self):
        """ Builds Tensorflow graph

        Returns:
            (tensor): Output Tensor for the graph
        """
        start = 0
        # Input layer.
        weights = tf.reshape(
            self.params[start:self.config['input_size'] *
                        self.config['n_nodes_per_layer']],
            [self.config['input_size'], self.config['n_nodes_per_layer']])
        start += self.config['input_size'] * self.config['n_nodes_per_layer']
        biases = tf.reshape(
            self.params[start:start + self.config['n_nodes_per_layer']],
            [self.config['n_nodes_per_layer']])
        start += self.config['n_nodes_per_layer']
        hidden_layer = self.activations.resolve_activation(
            self.config['hidden_layer_activation'])(tf.add(
                tf.matmul(self.inputs, weights), biases))

        # Hidden layers.
        for i in range(self.config['n_hidden_layers']):
            weights = tf.reshape(
                self.params[start:start + self.config['n_nodes_per_layer'] *
                            self.config['n_nodes_per_layer']],
                [
                    self.config['n_nodes_per_layer'],
                    self.config['n_nodes_per_layer']
                ])
            start += self.config['n_nodes_per_layer'] * self.config[
                'n_nodes_per_layer']
            biases = tf.reshape(
                self.params[start:start + self.config['n_nodes_per_layer']],
                [self.config['n_nodes_per_layer']])
            start += self.config['n_nodes_per_layer']
            hidden_layer = self.activations.resolve_activation(
                self.config['hidden_layer_activation'])(tf.add(
                    tf.matmul(hidden_layer, weights), biases))

        # Output layer.
        weights = tf.reshape(
            self.params[start:start + self.config['n_nodes_per_layer'] *
                        self.config['output_size']],
            [self.config['n_nodes_per_layer'], self.config['output_size']])
        start += self.config['n_nodes_per_layer'] * self.config['output_size']
        biases = tf.reshape(
            self.params[start:start + self.config['output_size']],
            [self.config['output_size']])
        start += self.config['output_size']
        output_layer = tf.scalar_mul(
            self.config['output_scale'],
            self.activations.resolve_activation(
                self.config['output_activation'])(tf.add(
                    tf.matmul(hidden_layer, weights), biases)))
        return output_layer

    def init_master_params(self, from_file=False, filepath=None):
        """ Computes initial random gaussian values for master weights and biases

        Returns:
            (float array): Random gaussian values for neural network weights and biases
        """
        if from_file:
            master_params = utils.load_array(filepath)
            if len(master_params) != self.params_size:
                err_msg = "Params from (" + filepath + ") does not match the network shape."
                raise ValueError(err_msg)
            return master_params

        master_params = []
        weights = np.random.normal(
            0, 1, self.config['input_size'] * self.config['n_nodes_per_layer'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
        master_params += list(biases)
        for i in range(self.config['n_hidden_layers']):
            weights = np.random.normal(
                0, 1, self.config['n_nodes_per_layer'] *
                self.config['n_nodes_per_layer'])
            master_params += list(weights)
            biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
            master_params += list(biases)
        weights = np.random.normal(
            0, 1,
            self.config['n_nodes_per_layer'] * self.config['output_size'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['output_size'])
        master_params += list(biases)
        return master_params

    def save(self, filedir, filename, master_params):
        try:
            os.makedirs(filedir)
        except OSError as e:
            if e.errno != errno.EEXIST:
                raise
        return utils.save_array(filedir + filename, master_params)

    def feed_dict(self, inputs, params):
        """ Fills the feed_dict for the Tensorflow graph

        Returns:
            (dict): Feed_dict filled with given values for placeholders
        """
        return {self.inputs: inputs, self.params: params}
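# Usage sketch (illustrative, not part of the original module): build the graph
# for a small network and evaluate it once on a random input with freshly drawn
# master parameters. The config values and the 'sigmoid' activation name are
# assumptions about what Activations.resolve_activation accepts.
if __name__ == '__main__':
    example_config = {
        'input_size': 4,
        'n_nodes_per_layer': 8,
        'n_hidden_layers': 2,
        'output_size': 1,
        'output_scale': 1.0,
        'hidden_layer_activation': 'sigmoid',
        'output_activation': 'sigmoid',
    }
    network = FeedForwardNeuralNetwork(example_config)
    output = network.model()
    master_params = network.init_master_params()
    with tf.Session() as sess:
        x = np.random.normal(0, 1, size=(1, example_config['input_size']))
        print(sess.run(output, feed_dict=network.feed_dict(x, master_params)))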
class BatchNormalizationNeuralNetwork():

    def __init__(self, config):
        self.config = config
        self.activations = Activations()
        self.inputs = tf.placeholder(tf.float32,
                                     shape=(1, self.config['input_size']))
        params_size = (
            self.config['input_size'] * self.config['n_nodes_per_layer']
        ) + self.config['n_nodes_per_layer'] + 2 * self.config[
            'input_size'] + self.config['n_hidden_layers'] * (
                self.config['n_nodes_per_layer']**2 +
                self.config['n_nodes_per_layer'] +
                2 * self.config['n_nodes_per_layer']) + (
                    self.config['n_nodes_per_layer'] *
                    self.config['output_size']) + self.config[
                        'output_size'] + 2 * self.config['n_nodes_per_layer']
        self.params = tf.placeholder(tf.float32, shape=(params_size))
        self.learning_rate = self.config['learning_rate']
        self.keep_rate = self.config['keep_rate']

    def model(self):
        """ Builds Tensorflow graph

        Returns:
            (tensor): Output Tensor for the graph
        """
        start = 0
        nodes_per_layer = self.config['n_nodes_per_layer']
        input_size = self.config['input_size']
        activation = self.config['hidden_layer_activation']
        num_hidden_layers = self.config['n_hidden_layers']
        output_size = self.config['output_size']
        output_scale = self.config['output_scale']
        output_activation = self.config['output_activation']

        weights = tf.reshape(self.params[start:input_size * nodes_per_layer],
                             [input_size, nodes_per_layer])
        start += input_size * nodes_per_layer
        biases = tf.reshape(self.params[start:start + nodes_per_layer],
                            [nodes_per_layer])
        start += nodes_per_layer
        mean, var = tf.nn.moments(weights, [1], keep_dims=True)
        stddev = tf.sqrt(var)
        weights = tf.div(tf.subtract(weights, mean), stddev)
        gamma = tf.reshape(self.params[start:start + input_size],
                           [input_size, 1])
        start += input_size
        beta = tf.reshape(self.params[start:start + input_size],
                          [input_size, 1])
        start += input_size
        weights = tf.add(tf.multiply(gamma, weights), beta)
        hidden_layer = self.activations.resolve_activation(activation)(tf.add(
            tf.matmul(self.inputs, weights), biases))

        for i in range(num_hidden_layers):
            weights = tf.reshape(
                self.params[start:start + nodes_per_layer * nodes_per_layer],
                [nodes_per_layer, nodes_per_layer])
            start += nodes_per_layer * nodes_per_layer
            biases = tf.reshape(self.params[start:start + nodes_per_layer],
                                [nodes_per_layer])
            start += nodes_per_layer
            # Add batch normalization by subtracting the mean and dividing by the std dev
            mean, var = tf.nn.moments(weights, [1], keep_dims=True)
            stddev = tf.sqrt(var)
            weights = tf.div(tf.subtract(weights, mean), stddev)
            gamma = tf.reshape(self.params[start:start + nodes_per_layer],
                               [nodes_per_layer, 1])
            start += nodes_per_layer
            beta = tf.reshape(self.params[start:start + nodes_per_layer],
                              [nodes_per_layer, 1])
            start += nodes_per_layer
            weights = tf.add(tf.multiply(gamma, weights), beta)
            hidden_layer = self.activations.resolve_activation(activation)(
                tf.add(tf.matmul(hidden_layer, weights), biases))
            hidden_layer = tf.nn.dropout(hidden_layer, self.keep_rate)

        weights = tf.reshape(
            self.params[start:start + nodes_per_layer * output_size],
            [nodes_per_layer, output_size])
        start += nodes_per_layer * output_size
        biases = tf.reshape(self.params[start:start + output_size],
                            [output_size])
        start += output_size
        mean, var = tf.nn.moments(weights, [1], keep_dims=True)
        stddev = tf.sqrt(var)
        weights = tf.div(tf.subtract(weights, mean), stddev)
        gamma = tf.reshape(self.params[start:start + nodes_per_layer],
                           [nodes_per_layer, 1])
        start += nodes_per_layer
        beta = tf.reshape(self.params[start:start + nodes_per_layer],
                          [nodes_per_layer, 1])
        start += nodes_per_layer
        weights = tf.add(tf.multiply(gamma, weights), beta)
        output_layer = tf.scalar_mul(
            output_scale,
            self.activations.resolve_activation(output_activation)(tf.add(
                tf.matmul(hidden_layer, weights), biases)))
        return output_layer

    def init_master_params(self):
        """ Computes initial random gaussian values for master weights and biases

        Returns:
            (float array): Random gaussian values for neural network weights and biases
        """
        master_params = []
        weights = np.random.normal(
            0, 1, self.config['input_size'] * self.config['n_nodes_per_layer'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
        master_params += list(biases)
        master_params += [1 for i in range(self.config['input_size'])]
        master_params += [0 for i in range(self.config['input_size'])]
        for i in range(self.config['n_hidden_layers']):
            weights = np.random.normal(
                0, 1, self.config['n_nodes_per_layer'] *
                self.config['n_nodes_per_layer'])
            master_params += list(weights)
            biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
            master_params += list(biases)
            master_params += [
                1 for i in range(self.config['n_nodes_per_layer'])
            ]
            master_params += [
                0 for i in range(self.config['n_nodes_per_layer'])
            ]
        weights = np.random.normal(
            0, 1,
            self.config['n_nodes_per_layer'] * self.config['output_size'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['output_size'])
        master_params += list(biases)
        master_params += [1 for i in range(self.config['n_nodes_per_layer'])]
        master_params += [0 for i in range(self.config['n_nodes_per_layer'])]
        return master_params

    def feed_dict(self, inputs, params):
        """ Fills the feed_dict for the Tensorflow graph

        Returns:
            (dict): Feed_dict filled with given values for placeholders
        """
        return {self.inputs: inputs, self.params: params}
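# Worked example (illustrative): the flat parameter vector holds, per layer,
# the weights, biases and the gamma/beta pair used by the normalization step.
# For input_size=3, n_nodes_per_layer=4, n_hidden_layers=1, output_size=2:
#   input layer : 3*4 weights + 4 biases + 3 gammas + 3 betas = 22
#   hidden layer: 4*4 weights + 4 biases + 4 gammas + 4 betas = 28
#   output layer: 4*2 weights + 2 biases + 4 gammas + 4 betas = 18
# i.e. 68 values in total, matching the params_size expression in __init__.
# The quick check below (config values are assumptions) confirms that
# init_master_params produces exactly that many values.
if __name__ == '__main__':
    check_config = {
        'input_size': 3, 'n_nodes_per_layer': 4, 'n_hidden_layers': 1,
        'output_size': 2, 'output_scale': 1.0,
        'hidden_layer_activation': 'sigmoid', 'output_activation': 'sigmoid',
        'learning_rate': 0.01, 'keep_rate': 0.9,
    }
    bn_network = BatchNormalizationNeuralNetwork(check_config)
    assert len(bn_network.init_master_params()) == 68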
def main():
    # Read the file containing the pairs used for testing.
    pairs = lfw.read_pairs(os.path.join(FLAGS.facenet_dir, 'data/pairs.txt'))
    # Get the paths for the corresponding images.
    lfw_dir = os.path.join(os.getenv('FACENET_DIR'), FLAGS.lfw_dir)
    paths, _ = lfw.get_paths(lfw_dir, pairs)
    # Remove duplicates.
    paths = list(set(paths))

    if not os.path.exists(FLAGS.out_dir):
        os.makedirs(FLAGS.out_dir)

    # Will store an Activation object for each layer for each channel.
    # The key is layer_name, the value is a list of 'Activations' objects, one per channel.
    activations = {}

    with tf.Graph().as_default() as graph:
        # Load .pb model file.
        # It is a "frozen" model, where all variables are replaced with constants.
        load_model(FLAGS.model_path)

        # If you don't know which layers to use, print them out.
        if FLAGS.print_all_names:
            all_names = [n.name for n in graph.as_graph_def().node]
            for name in all_names:
                print('%s:0' % name)
            return

        images_ph = graph.get_tensor_by_name("input:0")
        phase_train_ph = graph.get_tensor_by_name("phase_train:0")
        height, width, channels = IMAGE_SHAPE[1:]

        # Get all the features we want to visualize.
        layers_names = FLAGS.layers
        layers = [
            tf.get_default_graph().get_tensor_by_name(x) for x in layers_names
        ]

        with tf.Session() as sess:

            # 1. Run through all images and find the best for each layer.
            #    'Activation' class is used in this loop.
            for i in ProgressBar()(range(
                    min(len(paths) // FLAGS.batch_size, FLAGS.batches))):
                start_index = i * FLAGS.batch_size
                end_index = min((i + 1) * FLAGS.batch_size,
                                FLAGS.batches * FLAGS.batch_size)
                paths_batch = paths[start_index:end_index]

                # Run a forward pass with normalized images.
                images = facenet.load_data(paths_batch, False, False, height)
                features = sess.run(layers,
                                    feed_dict={
                                        images_ph: images,
                                        phase_train_ph: False
                                    })
                images_uint8 = facenet.load_data(
                    paths_batch, False, False, height,
                    do_prewhiten=False).astype(np.uint8)

                for ilayer, layer_name in enumerate(layers_names):
                    # Lazy initialization.
                    num_channels = min(FLAGS.num_channels,
                                       features[ilayer].shape[3])
                    if layer_name not in activations:
                        activations[layer_name] = [
                            Activations(FLAGS.num_samples)
                            for i in range(num_channels)
                        ]
                    # Update activations.
                    for ichannel in range(num_channels):
                        activations[layer_name][ichannel].update(
                            images_uint8,
                            features=features[ilayer][:, :, :, ichannel])

            # 2. Run through layers and visualize images for the best features.
            #    'Recfield' class is used in this loop with 'Activation' class.
            for layer, layer_name in zip(layers, layers_names):
                # Compute receptive field for this layer and show statistics.
                forward = lambda x: sess.run([layer],
                                             feed_dict={
                                                 images_ph: x,
                                                 phase_train_ph: False
                                             })
                recfield = ReceptiveField(IMAGE_SHAPE, forward)
                print(layer_name, 'feature map is of shape', layer.get_shape(),
                      'and has receptive field', recfield.max())

                for ichannel in range(len(activations[layer_name])):
                    image, crop = activations[layer_name][ichannel].retrieve(
                        recfield)
                    if ichannel == 0:
                        images = image
                        crops = crop
                    else:
                        images = np.concatenate((images, image), axis=1)
                        crops = np.concatenate((crops, crop), axis=1)

                filename = layer_name.replace('/', '-').replace(':', '')
                cv2.imwrite(
                    os.path.join(FLAGS.out_dir, '%s-full.jpg' % filename),
                    images)  #[:,:,::-1])
                cv2.imwrite(
                    os.path.join(FLAGS.out_dir, '%s-crop.jpg' % filename),
                    crops)  #[:,:,::-1])
""" #%% #used librariies and packages import numpy as np import matplotlib.pyplot as plt from activations import Activations from sklearn.datasets import make_moons #%% #%% #Global variables X, y = make_moons() activation = Activations() #%% #%% def scatter(X, y): fig, ax = plt.subplots() for i, j in enumerate(np.unique(y)): ax.scatter(X[y == j, 0], X[y == j, 1]) #%%
class FeedForwardNeuralNetwork():

    def __init__(self, config):
        self.config = config
        self.activations = Activations()
        self.inputs = tf.placeholder(tf.float32, shape=(1, self.config['input_size']))
        params_size = (self.config['input_size'] * self.config['n_nodes_per_layer']) \
            + self.config['n_nodes_per_layer'] \
            + self.config['n_hidden_layers'] * (self.config['n_nodes_per_layer']**2
                                                + self.config['n_nodes_per_layer']) \
            + (self.config['n_nodes_per_layer'] * self.config['output_size']) \
            + self.config['output_size']
        self.params = tf.placeholder(tf.float32)

    def model(self):
        """ Builds Tensorflow graph

        Returns:
            (tensor): Output Tensor for the graph
        """
        start = 0
        weights = tf.reshape(
            self.params[start:self.config['input_size'] * self.config['n_nodes_per_layer']],
            [self.config['input_size'], self.config['n_nodes_per_layer']])
        start += self.config['input_size'] * self.config['n_nodes_per_layer']
        biases = tf.reshape(self.params[start:start + self.config['n_nodes_per_layer']],
                            [self.config['n_nodes_per_layer']])
        start += self.config['n_nodes_per_layer']
        hidden_layer = self.activations.resolve_activation(
            self.config['hidden_layer_activation'])(
                tf.add(tf.matmul(self.inputs, weights), biases))

        for i in range(self.config['n_hidden_layers']):
            weights = tf.reshape(
                self.params[start:start + self.config['n_nodes_per_layer']
                            * self.config['n_nodes_per_layer']],
                [self.config['n_nodes_per_layer'], self.config['n_nodes_per_layer']])
            start += self.config['n_nodes_per_layer'] * self.config['n_nodes_per_layer']
            biases = tf.reshape(self.params[start:start + self.config['n_nodes_per_layer']],
                                [self.config['n_nodes_per_layer']])
            start += self.config['n_nodes_per_layer']
            hidden_layer = self.activations.resolve_activation(
                self.config['hidden_layer_activation'])(
                    tf.add(tf.matmul(hidden_layer, weights), biases))

        weights = tf.reshape(
            self.params[start:start + self.config['n_nodes_per_layer']
                        * self.config['output_size']],
            [self.config['n_nodes_per_layer'], self.config['output_size']])
        start += self.config['n_nodes_per_layer'] * self.config['output_size']
        biases = tf.reshape(self.params[start:start + self.config['output_size']],
                            [self.config['output_size']])
        start += self.config['output_size']
        output_layer = tf.scalar_mul(
            self.config['output_scale'],
            self.activations.resolve_activation(self.config['output_activation'])(
                tf.add(tf.matmul(hidden_layer, weights), biases)))
        return output_layer

    def init_master_params(self):
        """ Computes initial random gaussian values for master weights and biases

        Returns:
            (float array): Random gaussian values for neural network weights and biases
        """
        master_params = []
        weights = np.random.normal(
            0, 1, self.config['input_size'] * self.config['n_nodes_per_layer'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
        master_params += list(biases)
        for i in range(self.config['n_hidden_layers']):
            weights = np.random.normal(
                0, 1, self.config['n_nodes_per_layer'] * self.config['n_nodes_per_layer'])
            master_params += list(weights)
            biases = np.random.normal(0, 1, self.config['n_nodes_per_layer'])
            master_params += list(biases)
        weights = np.random.normal(
            0, 1, self.config['n_nodes_per_layer'] * self.config['output_size'])
        master_params += list(weights)
        biases = np.random.normal(0, 1, self.config['output_size'])
        master_params += list(biases)
        return master_params

    def feed_dict(self, inputs, params):
        """ Fills the feed_dict for the Tensorflow graph

        Returns:
            (dict): Feed_dict filled with given values for placeholders
        """
        return {self.inputs: inputs, self.params: params}
# Imports used below. CostFunctions, InitData and Activations are provided by the
# project's own modules (their import paths are not shown in this excerpt).
import time

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from IPython.display import display


class LogReg:  # Logistic regression class

    def __init__(self,
                 # Specify cost function to calculate with
                 cost='cross_entropy'):
        self.cost = CostFunctions(cost)  # Init cross_entropy cost function
        self.initdata = InitData()  # Init data set
        self.act = Activations("sigmoid")

    def GD(self, X, y, lr=1, tol=1e-2, rnd_seed=False):
        # Gradient descent method
        print("Doing GD for logreg")
        n = len(y)
        costs = []  # Initializing cost list
        if (rnd_seed):
            np.random.seed(int(time.time()))  # seed numpy RNG with the time stamp
        self.beta = np.random.randn(X.shape[1], 1)  # Drawing initial random beta values
        y = y.reshape(X.shape[0], 1)

        i = 0
        t = 1
        while t > tol:  # Do gradient descent while the gradient norm is above the tolerance
            if (i == 0):
                tar = X @ self.beta  # Calculate current prediction
                # no need in calculating again for each iteration
            gradient = 1.0 / n * (X.T @ (self.act.f(tar) - y))  # Calculate gradient
            self.beta -= lr * gradient  # Calculate perturbation to beta
            tar = X @ self.beta
            costs.append(self.cost.f(tar, y))  # Save cost of new beta
            t = np.linalg.norm(gradient)  # Calculate norm of gradient
            i += 1
            if i > 1e5:  # If descent takes too long, break.
                print("This takes way too long, %d iterations, with learning rate %e"
                      % (i, lr))
                break
        print("Gradient solver has converged after %d iterations" % i)
        #plt.plot(range(iter), costs)
        #plt.show()
        return self.beta, costs

    def SGD(self, X, y, lr=0.01, tol=1e-4):
        # Stochastic gradient descent method
        print("Doing SGD for logreg")
        n = len(y)
        costs = []  # Initializing cost list
        self.beta = np.random.randn(X.shape[1], 1)  # Drawing initial random beta values

        i = 0
        t = 1
        while t > tol:  # Do gradient descent while the gradient norm is above the tolerance
            cost = 0
            for j in range(n):
                idx = np.random.randint(0, n)  # Choose random data row
                X_ = X[idx, :].reshape(1, X.shape[1])  # Select random data row
                y_ = y[idx].reshape(1, 1)  # select corresponding prediction
                b = X_ @ self.beta  # Calculate current prediction
                gradient = 1 / n * (X_.T @ (self.act.f(b) - y_))  # Calculate gradient
                self.beta -= lr * gradient  # Calculate perturbation to beta
                tar = X_ @ self.beta
                cost += self.cost.f(tar, y_)  # Save cost of new beta
            costs.append(cost)  # Save cost of new beta
            t = np.linalg.norm(gradient)  # Calculate norm of gradient  # Fix this for SGD
            i += 1
            if i > 1e5:  # If descent takes too long, break.
                print("This takes way too long, %d iterations, with learning rate %e"
                      % (i, lr))
                break
        print("Stochastic gradient solver has converged after %d iterations" % i)
        return self.beta, costs

    # Stochastic gradient descent method with batches
    def SGD_batch(self,
                  X,
                  y,
                  lr=0.01,
                  tol=1e-4,
                  n_iter=1,
                  batch_size=100,
                  n_epoch=100,
                  rnd_seed=False,
                  adj_lr=False,
                  rnd_batch=False,
                  verbosity=0,
                  lambda_r=0.0,
                  new_per_iter=False):
        # lambda_r = lambda value for the ridge regularization term in the cost function.
        print("Doing SGD for logreg")
        n = len(y)
        costs = []  # Initializing cost list
        if (rnd_seed):
            np.random.seed(int(time.time()))
        self.beta = np.random.randn(X.shape[1], 1)  # Drawing initial random beta values
        tar = X @ self.beta
        min_cost = self.cost.f(tar, y) + lambda_r * np.sum(self.beta**2)  # Save cost of new beta
        best_beta = self.beta.copy()

        # adjustable learning rate
        if (adj_lr):
            t0 = 5 * n
            #t0 = n
            lr0 = lr

        # We do several SGD searches with new batches for each search, with new searches
        # starting from the previous endpoint
        betas = np.zeros(shape=(X.shape[1] + 1, n_iter))
        # array to store the best betas with corresponding cost per iteration
        for i in range(n_iter):
            if (new_per_iter):
                self.beta = np.random.randn(X.shape[1], 1)
                tar = X @ self.beta
                min_cost = self.cost.f(tar, y) + lambda_r * np.sum(self.beta**2)
                best_beta = self.beta.copy()

            if (verbosity > 0):
                print('  search %i of %i' % (i + 1, n_iter))

            # Data is (semi) sorted on age after index ~15000,
            # dividing into batches based on index is therefore potentially not random.
            # We therefore have 2 options, (1) draw batch_size random values for each
            # iteration 'j', or (2) split data into m batches before starting
            m = int(n / batch_size)
            if (rnd_batch):
                nbatch = []
                nbatch.append(batch_size)
                idx = 0
            else:
                batch_idx, nbatch = self.split_batch(n, m)
            for k in range(n_epoch):
                if (verbosity > 1):
                    print('    epoch %i of %i' % (k + 1, n_epoch))
                for j in range(m):
                    if (rnd_batch):
                        # draw batch_size random values instead
                        idx_arr = np.random.randint(0, n, batch_size)  # Choose random data rows
                    else:
                        idx = np.random.randint(0, m)
                        idx_arr = batch_idx[idx, :nbatch[idx]]
                    X_ = X[idx_arr, :].reshape(nbatch[idx], X.shape[1])  # Select batch data
                    y_ = y[idx_arr].reshape(nbatch[idx], 1)  # select corresponding prediction
                    b = X_ @ self.beta  # Calculate current prediction
                    gradient = (X_.T @ (self.act.f(b) - y_)) \
                        + 2.0 * lambda_r * self.beta  # Calculate gradient
                    if (adj_lr):
                        # as iterations increase, the step size in beta is reduced
                        lr = (lr0 * t0) / (t0 + k * n + j * batch_size)
                    self.beta = self.beta - lr * gradient  # Calculate perturbation to beta

                # after each epoch we compute the cost (majority of runtime)
                tar = X @ self.beta
                # calculate total cost (This takes a long time!!). Has support for ridge
                cost = self.cost.f(tar, y) + lambda_r * np.sum(self.beta**2)
                costs.append(cost)  # Save cost of new beta
                if (cost < min_cost):
                    min_cost = cost
                    best_beta = self.beta.copy()

            betas[:X.shape[1], i] = best_beta[:, 0].copy()
            betas[X.shape[1], i] = min_cost.copy()

        # if we draw new initial betas per iteration, we need to find the beta giving the
        # smallest cost of all iterations. If not, then the final best_beta is the one
        # we're after
        if (new_per_iter):
            idx = np.argmin(betas[X.shape[1], :])  # find index with lowest cost
            self.beta[:, 0] = betas[:X.shape[1], idx].copy()  # beta with the lowest total cost
        else:
            self.beta = best_beta.copy()  # finally return beta with the lowest total cost
        return best_beta, costs, betas

    def predict(self, X, betas=[]):
        # Calculates probabilities and onehots for y
        if (len(betas) > 0):
            beta = betas.copy()
        else:
            beta = self.beta.copy()
        print("Predicting y using logreg")
        # Returns probabilities
        self.yprobs = self.act.f(X @ beta)
        self.yPred = (self.yprobs > 0.5).astype(int)
        self.y_pred_onehot = self.initdata.onehotencoder.fit_transform(
            self.yPred.reshape(-1, 1))  # Converts to onehot
        return self.yPred

    def sklearn_alternative(self, XTrain, yTrain, XTest, yTest):
        # Does SKLEARN method
        print("Doing logreg using sklearn")
        # Setting up grid search for optimal parameters of Logistic regression
        from sklearn.linear_model import LogisticRegression
        from sklearn.model_selection import GridSearchCV
        from sklearn.metrics import classification_report

        lambdas = np.logspace(-5, 7, 13)
        parameters = [{'C': 1. / lambdas, "solver": ["lbfgs"]}]  #*len(parameters)}]
        scoring = ['accuracy', 'roc_auc']
        logReg = LogisticRegression()
        # Finds best hyperparameters, then does regression.
        gridSearch = GridSearchCV(logReg,
                                  parameters,
                                  cv=5,
                                  scoring=scoring,
                                  refit='roc_auc')

        # Fit stuff
        gridSearch.fit(XTrain, yTrain.ravel())
        yTrue, yPred = yTest, gridSearch.predict(XTest)
        print(classification_report(yTrue, yPred))
        rep = pd.DataFrame(
            classification_report(yTrue, yPred, output_dict=True)).transpose()
        display(rep)

        logreg_df = pd.DataFrame(gridSearch.cv_results_)  # Shows behaviour of CV
        display(logreg_df[[
            'param_C', 'mean_test_accuracy', 'rank_test_accuracy',
            'mean_test_roc_auc', 'rank_test_roc_auc'
        ]])

        logreg_df.plot(x='param_C',
                       y='mean_test_accuracy',
                       yerr='std_test_accuracy',
                       logx=True)
        logreg_df.plot(x='param_C',
                       y='mean_test_roc_auc',
                       yerr='std_test_roc_auc',
                       logx=True)
        plt.show()

    def own_classification_report(self,
                                  ytrue,
                                  pred,
                                  threshold=0.5,
                                  return_f1=False,
                                  return_ac=False):
        tp = 0
        tn = 0
        fp = 0
        fn = 0
        pred = np.where(pred > threshold, 1, 0)
        for i in range(len(ytrue)):
            if (pred[i] == 1 and ytrue[i] == 1):
                tp += 1
            elif (pred[i] == 1 and ytrue[i] == 0):
                fp += 1
            elif (pred[i] == 0 and ytrue[i] == 0):
                tn += 1
            elif (pred[i] == 0 and ytrue[i] == 1):
                fn += 1
        pcp = np.sum(np.where(pred == 1, 1, 0))  # predicted positives
        pcn = np.sum(np.where(pred == 0, 1, 0))  # predicted negatives
        cp = np.sum(np.where(ytrue == 1, 1, 0))  # true positives in data
        cn = np.sum(np.where(ytrue == 0, 1, 0))  # true negatives in data
        ppv = [tn * 1.0 / pcn, tp * 1.0 / pcp]  # precision per class
        trp = [tn * 1.0 / cn, tp * 1.0 / cp]  # recall per class
        ac = (tp + tn) * 1.0 / (cp + cn)  # accuracy
        f1 = [
            2.0 * ppv[0] * trp[0] / (ppv[0] + trp[0]),
            2.0 * ppv[1] * trp[1] / (ppv[1] + trp[1])
        ]
        if return_f1:
            if return_ac:
                return (f1[0] * cn + f1[1] * cp) / (cn + cp), ac
            else:
                return (f1[0] * cn + f1[1] * cp) / (cn + cp)
        if return_ac:
            return ac

        print("              precision    recall  f1-score   true number   predicted number")
        print()
        print("           0      %5.3f     %5.3f     %5.3f   %8i   %16i"
              % (ppv[0], trp[0], f1[0], cn, pcn))
        print("           1      %5.3f     %5.3f     %5.3f   %8i   %16i"
              % (ppv[1], trp[1], f1[1], cp, pcp))
        print()
        print("    accuracy                          %5.3f   %8i"
              % ((tp + tn) * 1.0 / (cp + cn), cp + cn))
        print("   macro avg      %5.3f     %5.3f     %5.3f   %8i"
              % ((ppv[0] + ppv[1]) / 2.0, (trp[0] + trp[1]) / 2.0,
                 (f1[0] + f1[1]) / 2.0, cn + cp))
        print("weighted avg      %5.3f     %5.3f     %5.3f   %8i"
              % ((ppv[0] * cn + ppv[1] * cp) / (cn + cp),
                 (trp[0] * cn + trp[1] * cp) / (cn + cp),
                 (f1[0] * cn + f1[1] * cp) / (cn + cp), cn + cp))
        print()
        return

    def split_batch(self, n, m):
        if (m > n):
            print('m > n in split_batch')
            exit()
        # maximum batch size
        if (np.mod(n, m) == 0):
            n_m = n // m
        else:
            n_m = n // m + 1
        idx_arr = np.zeros(shape=(m, n_m), dtype='int')
        n_ms = np.zeros(shape=(m), dtype='int')
        if (m == n):
            #n_m=1
            idx_arr[:, 0] = np.arange(0, m, dtype='int')
            n_ms += 1
            return idx_arr, n_ms
        arr = np.arange(0, n, dtype='int')
        n_left = n
        for i in range(n):
            m_i = np.mod(i, m)  # group number
            nm_i = i // m  # index in group
            n_ms[m_i] = nm_i + 1  # update number of values in group
            ind = np.random.randint(n_left)  # draw random sample in data that is left
            idx_arr[m_i, nm_i] = arr[ind].copy()  # add index of data point to batch m_i
            arr[ind:n_left - 1] = arr[ind + 1:n_left].copy()  # remove data point from what is left
            n_left -= 1
        return idx_arr, n_ms

    def print_beta(self, cols=[], betas=np.zeros(shape=(1, 1))):
        if (betas.shape[1] > 2):
            std_b = np.std(betas, axis=1)
            mean_b = np.mean(betas, axis=1)
        print('------- Beta values -------')
        print()
        if (betas.shape[1] > 2):
            print('   best fit         std        mean   data label')
        else:
            print('      value   data label')
        for i in range(len(self.beta)):
            if i >= len(cols):
                if (betas.shape[1] > 2):
                    print(' %11.6f %11.6f %11.6f'
                          % (self.beta[i, 0], std_b[i], mean_b[i]))
                else:
                    print(' %11.6f' % (self.beta[i, 0]))
            else:
                if (betas.shape[1] > 2):
                    print(' %11.6f %11.6f %11.6f   %s'
                          % (self.beta[i, 0], std_b[i], mean_b[i], cols[i]))
                else:
                    print(' %11.6f   %s' % (self.beta[i, 0], cols[i]))
        print()
        return

    def plot_cumulative(self, X, y, p=[], beta=[], label='',
                        plt_ar=True, return_ar=False):
        if (len(p) == 0):
            if (len(beta) == 0):
                beta = self.beta
            p = self.act.f(X @ beta)
        if (not label == ''):
            lab = '_' + label
        else:
            # make a date and time stamp
            t = time.ctime()
            ta = t.split()
            hms = ta[3].split(':')
            label = ta[4] + '_' + ta[1] + ta[2] + '_' + hms[0] + hms[1] + hms[2]
            lab = '_' + label
        temp_p = p[:, 0].copy()
        nd = len(temp_p)
        nt = np.sum(y)
        model_pred = np.zeros(nd + 1)
        for i in range(len(temp_p)):
            idx = np.argmax(temp_p)
            model_pred[i + 1] = model_pred[i] + y[idx, 0]
            temp_p[idx] = -1.0
        x_plt = np.arange(nd + 1)
        best_y = np.arange(nd + 1)
        best_y[nt:] = nt
        baseline = (1.0 * nt) / nd * x_plt
        ar = 1.0 * np.sum(model_pred - baseline) / np.sum(best_y - baseline)
        if return_ar:
            return ar
        xtick = []
        if (nd < 2000):
            j = 500
            nm = 2001
        else:
            j = 4000
            nm = 16000
        for k in range(0, nm, j):
            xtick.append(k)
            if (k > nd):
                break
        if (label == 'lift'):
            xtick = [0, nt, nd]
            xtick_lab = ['0', r'$N_t$', r'$N_d$']
            ytick = [0, nt]
            ytick_lab = ['0', r'$N_t$']
        plt.figure(1, figsize=(7, 7))
        plt.plot(x_plt, best_y, label='Best fit', color=plt.cm.tab10(0))
        plt.plot(x_plt, model_pred, label='Model', color=plt.cm.tab10(1))
        plt.plot(x_plt, baseline, label='Baseline', color=plt.cm.tab10(7))
        plt.legend(loc='lower right', fontsize=22)
        plt.xlabel('Number of total data', fontsize=22)
        if (label == 'lift'):
            plt.xticks(xtick, xtick_lab, fontsize=18)
            plt.yticks(ytick, ytick_lab, fontsize=18)
        else:
            plt.xticks(xtick, fontsize=18)
            plt.yticks(fontsize=18)
        plt.ylabel('Cumulative number of target data', fontsize=22)
        if (plt_ar):
            plt.text(nd * 0.55, nt * 0.4, 'area ratio = %5.3f' % (ar), fontsize=20)
        plt.savefig('plots/cumulative_plot' + lab + '.pdf',
                    bbox_inches='tight', pad_inches=0.02)
        plt.clf()
        return

    def print_beta_to_file(self, beta=[], label='', d_label=[]):
        if (len(beta) == 0):
            beta = self.beta
        if (not label == ''):
            label = '_' + label
        else:
            # make a date and time stamp
            t = time.ctime()
            ta = t.split()
            hms = ta[3].split(':')
            label = '_' + ta[4] + '_' + ta[1] + ta[2] + '_' + hms[0] + hms[1] + hms[2]
        filename = 'beta_values/beta' + label + '.txt'
        f = open(filename, 'w')
        for i in range(len(beta)):
            if i >= len(d_label):
                f.write(' %11.6f\n' % (self.beta[i, 0]))
            else:
                f.write(' %11.6f   %s\n' % (self.beta[i, 0], d_label[i]))
        f.close()

    def unit_test(self):
        XTrain = np.zeros(shape=(100, 3))
        XTest = XTrain.copy()
        yTrain = np.zeros(shape=(100, 1))
        yTest = yTrain.copy()
        XTrain[:50, 0] = 1.0
        XTrain[50:, 0] = -1.0
        XTrain[:, 0] *= 1.0 / np.std(XTrain[:, 0])  # unit variance
        XTrain[:, 1:] = np.random.normal(0, 1, size=(100, 2))
        yTrain[:50, 0] = 1.0
        yTrain[50:, 0] = 0.0
        yTrain[0, 0] = 0.0  # to not get infinities
        yTrain[-1, 0] = 1.0
        yTest = yTrain.copy()
        XTest[:, 0] = XTrain[:, 0].copy()
        XTest[:, 1:] = np.random.normal(0, 1, size=(100, 2))
        lrs = [0.01]

        beta, costs = self.GD(XTrain, yTrain.ravel(), lr=lrs[0], rnd_seed=True, tol=1e-2)
        # Fit using GD. This can be looped over for best lambda (i.e. learning rate 'lr').
        print('Unit test with GD')
        print('Beta values')
        self.print_beta(betas=beta)
        print('Training data')
        yPred = self.predict(XTrain, betas=beta)  # predict
        self.own_classification_report(yTrain, yPred)
        print('Test data')
        yPred = self.predict(XTest, betas=beta)  # predict
        self.own_classification_report(yTest, yPred)

        beta, costs, betas = self.SGD_batch(XTrain,
                                            yTrain.ravel(),
                                            lr=lrs[0],
                                            adj_lr=True,
                                            rnd_seed=True,
                                            batch_size=10,
                                            n_epoch=50,
                                            verbosity=1,
                                            n_iter=10,
                                            new_per_iter=False)
        # Fit using SGD. This can be looped over for best lambda (i.e. learning rate 'lr').
        print('Unit test with SGD')
        print('Beta values')
        self.print_beta(betas=beta)
        print('Training data')
        yPred = self.predict(XTrain, betas=beta)  # predict
        self.own_classification_report(yTrain, yPred)
        print('Test data')
        yPred = self.predict(XTest, betas=beta)  # predict
        self.own_classification_report(yTest, yPred)
        exit()
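# Usage sketch (illustrative, not from the original module): fit the logistic
# regression with plain gradient descent on a small synthetic problem and print
# the classification report. The intercept column in X_toy and the toy labels
# are assumptions; CostFunctions, InitData and Activations are expected to be
# available from the project's own modules, as in the class above.
if __name__ == '__main__':
    np.random.seed(0)
    n_samples = 200
    X_toy = np.ones(shape=(n_samples, 3))  # first column acts as an intercept
    X_toy[:, 1:] = np.random.normal(0, 1, size=(n_samples, 2))
    y_toy = (X_toy[:, 1] + X_toy[:, 2] > 0).astype(float).reshape(-1, 1)

    logreg = LogReg(cost='cross_entropy')
    beta, costs = logreg.GD(X_toy, y_toy.ravel(), lr=0.1, tol=1e-2)
    y_pred = logreg.predict(X_toy)
    logreg.own_classification_report(y_toy, y_pred)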
def main():
    if not os.path.exists(FLAGS.out_dir):
        os.makedirs(FLAGS.out_dir)

    # Will store an Activation object for each layer for each channel.
    # The key is layer_name, the value is a list of 'Activations' objects, one per channel.
    activations = {}

    with tf.Graph().as_default():
        inputs, _ = cifar10.inputs(eval_data=False)  # Training set.
        imshape = inputs.get_shape().as_list()
        print('Image shape:', imshape)

        # Logits takes images_ph, not inputs, so that we can feed a generated image.
        images_ph = tf.placeholder(dtype=tf.float32, shape=imshape)
        logits = cifar10.inference(images_ph)

        # If you don't know which layers to use, print them out.
        if FLAGS.print_all_names:
            all_names = [n.name for n in tf.get_default_graph().as_graph_def().node]
            for name in all_names:
                print('%s:0' % name)
            return

        # Get all the features we want to visualize.
        layers_names = FLAGS.layers.split(',')
        layers = [tf.get_default_graph().get_tensor_by_name(x) for x in layers_names]

        # Add an op to save and restore the variables.
        saver = tf.train.Saver()

        with tf.Session() as sess:
            coord = tf.train.Coordinator()
            threads = tf.train.start_queue_runners(sess=sess, coord=coord)

            latest_checkpoint = tf.train.latest_checkpoint(FLAGS.train_dir)
            assert latest_checkpoint is not None
            saver.restore(sess, latest_checkpoint)

            # 1. Run through all images and find the best for each layer.
            #    'Activation' class is used in this loop.
            for i in ProgressBar()(range(FLAGS.batches)):
                # Get a batch of images.
                images = sess.run(inputs)
                images_uint8 = np.stack([
                    ((im - im.min()) / (im.max() - im.min()) * 255.).astype(np.uint8)
                    for im in images])

                # Run a forward pass with normalized images.
                features = sess.run(layers, feed_dict={images_ph: images})

                for ilayer, layer_name in enumerate(layers_names):
                    # Lazy initialization.
                    num_channels = min(FLAGS.num_channels, features[ilayer].shape[3])
                    if layer_name not in activations:
                        activations[layer_name] = [
                            Activations(FLAGS.num_samples) for i in range(num_channels)]
                    # Update activations for each channel.
                    for ichannel in range(num_channels):
                        activations[layer_name][ichannel].update(
                            images_uint8, features=features[ilayer][:, :, :, ichannel])

            # 2. Run through layers and visualize images for the best features.
            #    'Recfield' class is used in this loop with 'Activation' class.
            for layer, layer_name in zip(layers, layers_names):
                forward = lambda x: sess.run([layer], feed_dict={images_ph: x})
                # Compute receptive field for this layer and show statistics.
                recfield = ReceptiveField(inputs.get_shape().as_list(), forward)
                print(layer_name, 'feature map is of shape', layer.get_shape(),
                      'and has receptive field', recfield.max())

                for ichannel in range(len(activations[layer_name])):
                    image, crop = activations[layer_name][ichannel].retrieve(recfield)
                    if ichannel == 0:
                        images = image
                        crops = crop
                    else:
                        images = np.concatenate((images, image), axis=1)
                        crops = np.concatenate((crops, crop), axis=1)

                filename = layer_name.replace('/', '-').replace(':', '')
                cv2.imwrite(os.path.join(FLAGS.out_dir, '%s-full.jpg' % filename),
                            images[:, :, ::-1])
                cv2.imwrite(os.path.join(FLAGS.out_dir, '%s-crop.jpg' % filename),
                            crops[:, :, ::-1])

            coord.request_stop()
            coord.join(threads)