class BanditSegNet:
    ''' Network described by
            https://arxiv.org/pdf/1511.00561.pdf '''
    def load_vgg_weights(self):
        """ Use the VGG model trained on
            imagent dataset as a starting point for training """
        vgg_path = "models/imagenet-vgg-verydeep-19.mat"
        vgg_mat = scipy.io.loadmat(vgg_path)

        self.vgg_params = np.squeeze(vgg_mat['layers'])
        self.layers = ('conv1_1', 'relu1_1', 'conv1_2', 'relu1_2', 'pool1',
                       'conv2_1', 'relu2_1', 'conv2_2', 'relu2_2', 'pool2',
                       'conv3_1', 'relu3_1', 'conv3_2', 'relu3_2', 'conv3_3',
                       'relu3_3', 'conv3_4', 'relu3_4', 'pool3', 'conv4_1',
                       'relu4_1', 'conv4_2', 'relu4_2', 'conv4_3', 'relu4_3',
                       'conv4_4', 'relu4_4', 'pool4', 'conv5_1', 'relu5_1',
                       'conv5_2', 'relu5_2', 'conv5_3', 'relu5_3', 'conv5_4',
                       'relu5_4')

    def __init__(self, num_classes=11):
        self.num_classes = num_classes
        self.load_vgg_weights()
        self.build()

        # Begin a TensorFlow session
        config = tf.ConfigProto(allow_soft_placement=True)
        self.session = tf.Session(config=config)
        self.session.run(tf.global_variables_initializer())
        self.session.run(tf.local_variables_initializer())

        # Make saving trained weights and biases possible
        self.saver = tf.train.Saver(max_to_keep=5,
                                    keep_checkpoint_every_n_hours=1)
        self.checkpoint_directory = './checkpoints/'

        # Set up logging
        self.logger = Logger()

    def vgg_weight_and_bias(self, name, W_shape, b_shape):
        """ 
            Initializes weights and biases to the pre-trained VGG model.
            
            Args:
                name: name of the layer for which you want to initialize weights
                W_shape: expected shape of the weights tensor
                b_shape: expected shape of the bias tensor
            Returns:
                w_var: initialized weight variable
                b_var: initialized bias variable
        """
        if name not in self.layers:
            return self.weight_variable(W_shape), self.bias_variable(b_shape)
        else:
            w, b = self.vgg_params[self.layers.index(name)][0][0][0][0]
            init_w = tf.constant(value=np.transpose(w, (1, 0, 2, 3)),
                                 dtype=tf.float32,
                                 shape=W_shape)
            init_b = tf.constant(value=b.reshape(-1),
                                 dtype=tf.float32,
                                 shape=b_shape)
            w_var = tf.Variable(init_w)
            b_var = tf.Variable(init_b)
            return w_var, b_var

    def weight_variable(self, shape):
        initial = tf.truncated_normal(shape, stddev=0.1)
        return tf.Variable(initial)

    def bias_variable(self, shape):
        initial = tf.constant(0.1, shape=shape)
        return tf.Variable(initial)

    def pool_layer(self, x):
        return tf.nn.max_pool_with_argmax(x,
                                          ksize=[1, 2, 2, 1],
                                          strides=[1, 2, 2, 1],
                                          padding='SAME')

    def unpool(self, pool, ind, ksize=[1, 2, 2, 1], scope='unpool'):
        """ Unpooling layer after max_pool_with_argmax.
        Args:
            pool: max pooled output tensor
            ind: argmax indices
            ksize: the same ksize that was passed to the pooling op
        Return:
            unpool: unpooling tensor
        """
        with tf.variable_scope(scope):
            # Pool shape: BATCH_SIZE * ENCODED_HEIGHT * ENCODED_WIDTH * NUM_CHANNELS
            input_shape = tf.shape(pool)
            output_shape = [
                input_shape[0], input_shape[1] * ksize[1],
                input_shape[2] * ksize[2], input_shape[3]
            ]

            flat_input_size = tf.cumprod(input_shape)[-1]
            flat_output_shape = tf.stack([
                output_shape[0],
                output_shape[1] * output_shape[2] * output_shape[3]
            ])

            pool_ = tf.reshape(pool, tf.stack([flat_input_size]))
            batch_range = tf.range(tf.cast(output_shape[0], tf.int64),
                                   dtype=ind.dtype)
            reshape_shape = tf.stack([input_shape[0], 1, 1, 1])
            reshaped_batch_range = tf.reshape(batch_range, shape=reshape_shape)

            b = tf.ones_like(ind) * reshaped_batch_range
            b = tf.reshape(b, tf.stack([flat_input_size, 1]))
            ind_ = tf.reshape(ind, tf.stack([flat_input_size, 1]))
            ind_ = tf.concat([b, ind_], 1)

            ret = tf.scatter_nd(ind_,
                                pool_,
                                shape=tf.cast(flat_output_shape, tf.int64))
            ret = tf.reshape(ret, tf.stack(output_shape))
            return ret

    def conv_layer_with_bn(self,
                           x,
                           W_shape,
                           train_phase,
                           name,
                           padding='SAME'):
        b_shape = W_shape[3]
        W, b = self.vgg_weight_and_bias(name, W_shape, [b_shape])
        convolved_output = tf.nn.conv2d(
            x, W, strides=[1, 1, 1, 1], padding=padding) + b
        batch_norm = tf.contrib.layers.batch_norm(convolved_output,
                                                  is_training=train_phase)
        return tf.nn.relu(batch_norm)

    def build(self):
        # Declare input placeholders
        self.x = tf.placeholder(tf.float32, shape=(None, None, None, 3))
        self.y = tf.placeholder(tf.int64, shape=(None, None, None))
        self.propensity = tf.placeholder(tf.float32, shape=(None, None, None))
        self.delta = tf.placeholder(tf.float32, shape=[])
        self.lagrange_mult = tf.placeholder(tf.float32, shape=[])
        self.train_phase = tf.placeholder(tf.bool, name='train_phase')
        self.rate = tf.placeholder(tf.float32, shape=[])

        # First encoder
        conv_1_1 = self.conv_layer_with_bn(self.x, [3, 3, 3, 64],
                                           self.train_phase, 'conv1_1')
        conv_1_2 = self.conv_layer_with_bn(conv_1_1, [3, 3, 64, 64],
                                           self.train_phase, 'conv1_2')
        pool_1, pool_1_argmax = self.pool_layer(conv_1_2)

        # Second encoder
        conv_2_1 = self.conv_layer_with_bn(pool_1, [3, 3, 64, 128],
                                           self.train_phase, 'conv2_1')
        conv_2_2 = self.conv_layer_with_bn(conv_2_1, [3, 3, 128, 128],
                                           self.train_phase, 'conv2_2')
        pool_2, pool_2_argmax = self.pool_layer(conv_2_2)

        # Third encoder
        conv_3_1 = self.conv_layer_with_bn(pool_2, [3, 3, 128, 256],
                                           self.train_phase, 'conv3_1')
        conv_3_2 = self.conv_layer_with_bn(conv_3_1, [3, 3, 256, 256],
                                           self.train_phase, 'conv3_2')
        conv_3_3 = self.conv_layer_with_bn(conv_3_2, [3, 3, 256, 256],
                                           self.train_phase, 'conv3_3')
        pool_3, pool_3_argmax = self.pool_layer(conv_3_3)

        # Fourth encoder
        conv_4_1 = self.conv_layer_with_bn(pool_3, [3, 3, 256, 512],
                                           self.train_phase, 'conv4_1')
        conv_4_2 = self.conv_layer_with_bn(conv_4_1, [3, 3, 512, 512],
                                           self.train_phase, 'conv4_2')
        conv_4_3 = self.conv_layer_with_bn(conv_4_2, [3, 3, 512, 512],
                                           self.train_phase, 'conv4_3')
        pool_4, pool_4_argmax = self.pool_layer(conv_4_3)

        # Fifth encoder
        conv_5_1 = self.conv_layer_with_bn(pool_4, [3, 3, 512, 512],
                                           self.train_phase, 'conv5_1')
        conv_5_2 = self.conv_layer_with_bn(conv_5_1, [3, 3, 512, 512],
                                           self.train_phase, 'conv5_2')
        conv_5_3 = self.conv_layer_with_bn(conv_5_2, [3, 3, 512, 512],
                                           self.train_phase, 'conv5_3')
        pool_5, pool_5_argmax = self.pool_layer(conv_5_3)

        # First decoder
        unpool_5 = self.unpool(pool_5, pool_5_argmax)
        deconv_5_3 = self.conv_layer_with_bn(unpool_5, [3, 3, 512, 512],
                                             self.train_phase, 'deconv5_3')
        deconv_5_2 = self.conv_layer_with_bn(deconv_5_3, [3, 3, 512, 512],
                                             self.train_phase, 'deconv5_2')
        deconv_5_1 = self.conv_layer_with_bn(deconv_5_2, [3, 3, 512, 512],
                                             self.train_phase, 'deconv5_1')

        # Second decoder
        unpool_4 = self.unpool(deconv_5_1, pool_4_argmax)
        deconv_4_3 = self.conv_layer_with_bn(unpool_4, [3, 3, 512, 512],
                                             self.train_phase, 'deconv4_3')
        deconv_4_2 = self.conv_layer_with_bn(deconv_4_3, [3, 3, 512, 512],
                                             self.train_phase, 'deconv4_2')
        deconv_4_1 = self.conv_layer_with_bn(deconv_4_2, [3, 3, 512, 256],
                                             self.train_phase, 'deconv4_1')

        # Third decoder
        unpool_3 = self.unpool(deconv_4_1, pool_3_argmax)
        deconv_3_3 = self.conv_layer_with_bn(unpool_3, [3, 3, 256, 256],
                                             self.train_phase, 'deconv3_3')
        deconv_3_2 = self.conv_layer_with_bn(deconv_3_3, [3, 3, 256, 256],
                                             self.train_phase, 'deconv3_2')
        deconv_3_1 = self.conv_layer_with_bn(deconv_3_2, [3, 3, 256, 128],
                                             self.train_phase, 'deconv3_1')

        # Fourth decoder
        unpool_2 = self.unpool(deconv_3_1, pool_2_argmax)
        deconv_2_2 = self.conv_layer_with_bn(unpool_2, [3, 3, 128, 128],
                                             self.train_phase, 'deconv2_2')
        deconv_2_1 = self.conv_layer_with_bn(deconv_2_2, [3, 3, 128, 64],
                                             self.train_phase, 'deconv2_1')

        # Fifth decoder
        unpool_1 = self.unpool(deconv_2_1, pool_1_argmax)
        deconv_1_2 = self.conv_layer_with_bn(unpool_1, [3, 3, 64, 64],
                                             self.train_phase, 'deconv1_2')
        deconv_1_1 = self.conv_layer_with_bn(deconv_1_2, [3, 3, 64, 32],
                                             self.train_phase, 'deconv1_1')

        # Produce class scores
        # score_1 dimensions: BATCH_SIZE * HEIGHT * WIDTH * NUM_CLASSES
        score_1 = self.conv_layer_with_bn(deconv_1_1,
                                          [1, 1, 32, self.num_classes],
                                          self.train_phase, 'score_1')

        # Compute Empirical Risk Minimization loss
        logits = tf.reshape(score_1, (-1, self.num_classes))
        softmaxed = tf.nn.softmax(logits)
        numerator = tf.multiply(softmaxed, (self.delta - self.lagrange_mult))

        # Reshape the propensities from (BATCH, H*W, NUM_CLASSES),
        # e.g. (5, 153600, 11), to (BATCH*H*W, NUM_CLASSES), e.g. (768000, 11)
        propensity_shape = tf.shape(self.propensity)
        flat_prop_size = tf.cumprod(propensity_shape)[-2]
        propensity_ = tf.reshape(self.propensity,
                                 tf.stack([flat_prop_size, self.num_classes]))

        # Loss of information possible here? Should be fine.
        self.loss = tf.reduce_mean(self.lagrange_mult +
                                   tf.divide(numerator, propensity_))
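
        # Reading of the objective above (an interpretation, not a claim from
        # the referenced paper): it is an inverse-propensity-scored estimate
        # of the logged loss, roughly
        #     mean(lambda + softmax(logits) * (delta - lambda) / propensity)
        # where delta is the logged feedback, propensity is the logging
        # policy's per-pixel action probability, and lagrange_mult (lambda)
        # acts as a baseline/translation term.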

        # Declare optimizer
        optimizer = tf.train.AdamOptimizer(self.rate)
        self.train_step = optimizer.minimize(self.loss)

        # Metrics
        self.prediction = tf.argmax(score_1, axis=3, name="prediction")
        self.accuracy = tf.contrib.metrics.accuracy(self.prediction,
                                                    self.y,
                                                    name='accuracy')
        self.mean_IoU = tf.contrib.metrics.streaming_mean_iou(self.prediction,
                                                              self.y,
                                                              self.num_classes,
                                                              name='mean_IoU')

    def restore_session(self):
        global_step = 0

        if not os.path.exists(self.checkpoint_directory):
            raise IOError(self.checkpoint_directory + ' does not exist.')

        path = tf.train.get_checkpoint_state(self.checkpoint_directory)
        if path is not None:
            self.saver.restore(self.session, path.model_checkpoint_path)
            global_step = int(path.model_checkpoint_path.split('-')[-1])

        return global_step

    def train(self,
              dataset_dir,
              feedback_dir,
              lagrange=0.8,
              num_iterations=10000,
              learning_rate=0.1,
              batch_size=5):

        current_step = self.restore_session()

        bdr = BatchDatasetReader(dataset_dir,
                                 480,
                                 320,
                                 current_step,
                                 batch_size,
                                 trainval_only=True)
        bfr = BanditFeedbackReader(feedback_dir, current_step)

        # Begin Training
        for i in range(current_step, num_iterations):

            # One training step
            images, ground_truths = bdr.next_training_batch()
            deltas, propensities = bfr.next_item_batch()

            feed_dict = {
                self.x: images,
                self.y: ground_truths,
                self.propensity: propensities,
                self.delta: np.mean(deltas),
                self.lagrange_mult: lagrange,
                self.train_phase: 1,
                self.rate: learning_rate
            }

            print('run train step: ' + str(i))
            self.train_step.run(session=self.session, feed_dict=feed_dict)

            # Print loss every 10 iterations
            if i % 10 == 0:
                train_loss = self.session.run(self.loss, feed_dict=feed_dict)
                print("Step: %d, Train_loss:%g" % (i, train_loss))

            # Evaluate, log, and checkpoint every 100 iterations
            if i % 100 == 0:
                images, ground_truths = bdr.next_training_batch()

                feed_dict = {
                    self.x: images,
                    self.y: ground_truths,
                    self.propensity: propensities,
                    self.delta: np.mean(deltas),
                    self.lagrange_mult: lagrange,
                    self.train_phase: 1,
                    self.rate: learning_rate
                }

                val_loss = self.session.run(self.loss, feed_dict=feed_dict)
                val_accuracy = self.session.run(self.accuracy,
                                                feed_dict=feed_dict)
                val_mean_IoU, update_op = self.session.run(self.mean_IoU,
                                                           feed_dict=feed_dict)
                print("%s ---> Validation_loss: %g" %
                      (datetime.datetime.now(), val_loss))
                print("%s ---> Validation_accuracy: %g" %
                      (datetime.datetime.now(), val_accuracy))

                self.logger.log("%s ---> Number of epochs: %g\n" %
                                (datetime.datetime.now(),
                                 math.floor((i * batch_size) / bdr.num_train)))
                self.logger.log("%s ---> Number of iterations: %g\n" %
                                (datetime.datetime.now(), i))
                self.logger.log("%s ---> Validation_loss: %g\n" %
                                (datetime.datetime.now(), val_loss))
                self.logger.log("%s ---> Validation_accuracy: %g\n" %
                                (datetime.datetime.now(), val_accuracy))
                self.logger.log_for_graphing(i, val_loss, val_accuracy,
                                             val_mean_IoU)

                # Save the model variables
                self.saver.save(self.session,
                                self.checkpoint_directory + 'segnet',
                                global_step=i)

            # Graph training statistics every 1000 iterations
            if i % 1000 == 0:
                self.logger.graph_training_stats()
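

# Hypothetical usage sketch for BanditSegNet; 'data/CamVid' is an assumed
# dataset path, while 'logged_bandit_feedback/' matches the directory that
# SegNetLogger.build_contextual_feedback_log writes below.
#
#     net = BanditSegNet(num_classes=11)
#     net.train(dataset_dir='data/CamVid',
#               feedback_dir='logged_bandit_feedback/',
#               lagrange=0.8,
#               num_iterations=10000,
#               learning_rate=0.1,
#               batch_size=5)
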
class SegNetLogger:
    ''' Network described by
            https://arxiv.org/pdf/1511.00561.pdf '''

    def load_vgg_weights(self):
        """ Use the VGG model trained on
            imagent dataset as a starting point for training """
        vgg_path = "models/imagenet-vgg-verydeep-19.mat"
        vgg_mat = scipy.io.loadmat(vgg_path)

        self.vgg_params = np.squeeze(vgg_mat['layers'])
        self.layers = ('conv1_1', 'relu1_1', 'conv1_2', 'relu1_2', 'pool1',
                        'conv2_1', 'relu2_1', 'conv2_2', 'relu2_2', 'pool2',
                        'conv3_1', 'relu3_1', 'conv3_2', 'relu3_2', 'conv3_3',
                        'relu3_3', 'conv3_4', 'relu3_4', 'pool3',
                        'conv4_1', 'relu4_1', 'conv4_2', 'relu4_2', 'conv4_3',
                        'relu4_3', 'conv4_4', 'relu4_4', 'pool4',
                        'conv5_1', 'relu5_1', 'conv5_2', 'relu5_2', 'conv5_3',
                        'relu5_3', 'conv5_4', 'relu5_4')

    def __init__(self, num_classes=11):
        self.num_classes = num_classes
        self.load_vgg_weights()
        self.build()

        # Begin a TensorFlow session
        config = tf.ConfigProto(allow_soft_placement=True)
        self.session = tf.Session(config=config)
        self.session.run(tf.global_variables_initializer())
        self.session.run(tf.local_variables_initializer())

        # Make saving trained weights and biases possible
        self.saver = tf.train.Saver(max_to_keep=5,
                                    keep_checkpoint_every_n_hours=1)
        self.checkpoint_directory = './checkpoints/'

        self.logger = Logger()
        # Add summary logging capability
        """
        self.train_writer = tf.summary.FileWriter('./summaries' + '/train', 
                                                  self.session.graph)
        self.val_writer = tf.summary.FileWriter('./summaries' + '/val', 
                                                 self.session.graph)
        """


    def vgg_weight_and_bias(self, name, W_shape, b_shape):
        """ 
            Initializes weights and biases to the pre-trained VGG model.
            
            Args:
                name: name of the layer for which you want to initialize 
                      weights
                W_shape: expected shape of the weights tensor
                b_shape: expected shape of the bias tensor
            Returns:
                w_var: initialized weight variable
                b_var: initialized bias variable
        """
        if name not in self.layers:
            return self.weight_variable(W_shape), self.bias_variable(b_shape)
        else:
            w, b = self.vgg_params[self.layers.index(name)][0][0][0][0]
            init_w = tf.constant(value=np.transpose(w, (1, 0, 2, 3)), 
                                 dtype=tf.float32, shape=W_shape)
            init_b = tf.constant(value=b.reshape(-1), dtype=tf.float32, 
                                 shape=b_shape)
            w_var = tf.Variable(init_w)
            b_var = tf.Variable(init_b)
            return w_var, b_var 

    def weight_variable(self, shape):
        initial = tf.truncated_normal(shape, stddev=0.1)
        return tf.Variable(initial)

    def bias_variable(self, shape):
        initial = tf.constant(0.1, shape=shape)
        return tf.Variable(initial)

    def pool_layer(self, x):
        return tf.nn.max_pool_with_argmax(x, ksize=[1, 2, 2, 1], 
                                          strides=[1, 2, 2, 1], padding='SAME')

    def unpool(self, pool, ind, ksize=[1, 2, 2, 1], scope='unpool'):
        """ Unpooling layer after max_pool_with_argmax.
        Args:
            pool: max pooled output tensor
            ind: argmax indices
            ksize: the same ksize that was passed to the pooling op
        Return:
            unpool: unpooling tensor
        """
        with tf.variable_scope(scope):
            input_shape = tf.shape(pool)
            output_shape = [input_shape[0], 
                            input_shape[1] * ksize[1], 
                            input_shape[2] * ksize[2], 
                            input_shape[3]]

            flat_input_size = tf.cumprod(input_shape)[-1]
            flat_output_shape = tf.stack([output_shape[0], output_shape[1] 
                                                           * output_shape[2] 
                                                           * output_shape[3]])

            pool_ = tf.reshape(pool, tf.stack([flat_input_size]))
            batch_range = tf.range(tf.cast(output_shape[0], tf.int64), 
                                   dtype=ind.dtype)
            reshape_shape = tf.stack([input_shape[0], 1, 1, 1])
            reshaped_batch_range = tf.reshape(batch_range, 
                                              shape=reshape_shape)

            b = tf.ones_like(ind) * reshaped_batch_range
            b = tf.reshape(b, tf.stack([flat_input_size, 1]))
            ind_ = tf.reshape(ind, tf.stack([flat_input_size, 1]))
            ind_ = tf.concat([b, ind_], 1)

            ret = tf.scatter_nd(ind_, pool_, shape=tf.cast(flat_output_shape, 
                                                           tf.int64))
            ret = tf.reshape(ret, tf.stack(output_shape))
            return ret

    def conv_layer_with_bn(self, x, W_shape, train_phase, name, 
                           padding='SAME'):
        b_shape = W_shape[3]
        W, b = self.vgg_weight_and_bias(name, W_shape, [b_shape])
        convolved_output = tf.nn.conv2d(x, W, strides=[1,1,1,1], 
                                        padding=padding) + b
        batch_norm = tf.contrib.layers.batch_norm(convolved_output, 
                                                  is_training=train_phase)
        return tf.nn.relu(batch_norm)

    def build(self):
        # Declare placeholders
        self.x = tf.placeholder(tf.float32, shape=(None, None, None, 3))
        # self.y dimensions = BATCH_SIZE * HEIGHT * WIDTH
        self.y = tf.placeholder(tf.int64, shape=(None, None, None))
        expected = tf.expand_dims(self.y, -1)
        self.train_phase = tf.placeholder(tf.bool, name='train_phase')
        self.rate = tf.placeholder(tf.float32, shape=[])

        # First encoder
        conv_1_1 = self.conv_layer_with_bn(self.x, [3, 3, 3, 64], 
                                           self.train_phase, 'conv1_1')
        conv_1_2 = self.conv_layer_with_bn(conv_1_1, [3, 3, 64, 64], 
                                           self.train_phase, 'conv1_2')
        pool_1, pool_1_argmax = self.pool_layer(conv_1_2)

        # Second encoder
        conv_2_1 = self.conv_layer_with_bn(pool_1, [3, 3, 64, 128], 
                                           self.train_phase, 'conv2_1')
        conv_2_2 = self.conv_layer_with_bn(conv_2_1, [3, 3, 128, 128], 
                                           self.train_phase, 'conv2_2')
        pool_2, pool_2_argmax = self.pool_layer(conv_2_2)

        # Third encoder
        conv_3_1 = self.conv_layer_with_bn(pool_2, [3, 3, 128, 256], 
                                           self.train_phase, 'conv3_1')
        conv_3_2 = self.conv_layer_with_bn(conv_3_1, [3, 3, 256, 256], 
                                           self.train_phase, 'conv3_2')
        conv_3_3 = self.conv_layer_with_bn(conv_3_2, [3, 3, 256, 256], 
                                           self.train_phase, 'conv3_3')
        pool_3, pool_3_argmax = self.pool_layer(conv_3_3)

        # Fourth encoder
        conv_4_1 = self.conv_layer_with_bn(pool_3, [3, 3, 256, 512], 
                                           self.train_phase, 'conv4_1')
        conv_4_2 = self.conv_layer_with_bn(conv_4_1, [3, 3, 512, 512], 
                                           self.train_phase, 'conv4_2')
        conv_4_3 = self.conv_layer_with_bn(conv_4_2, [3, 3, 512, 512], 
                                           self.train_phase, 'conv4_3')
        pool_4, pool_4_argmax = self.pool_layer(conv_4_3)

        # Fifth encoder
        conv_5_1 = self.conv_layer_with_bn(pool_4, [3, 3, 512, 512], 
                                           self.train_phase, 'conv5_1')
        conv_5_2 = self.conv_layer_with_bn(conv_5_1, [3, 3, 512, 512], 
                                           self.train_phase, 'conv5_2')
        conv_5_3 = self.conv_layer_with_bn(conv_5_2, [3, 3, 512, 512], 
                                           self.train_phase, 'conv5_3')
        pool_5, pool_5_argmax = self.pool_layer(conv_5_3)

        # First decoder
        unpool_5 = self.unpool(pool_5, pool_5_argmax)
        deconv_5_3 = self.conv_layer_with_bn(unpool_5, [3, 3, 512, 512], 
                                             self.train_phase, 'deconv5_3')
        deconv_5_2 = self.conv_layer_with_bn(deconv_5_3, [3, 3, 512, 512], 
                                             self.train_phase, 'deconv5_2')
        deconv_5_1 = self.conv_layer_with_bn(deconv_5_2, [3, 3, 512, 512], 
                                             self.train_phase, 'deconv5_1')

        # Second decoder
        unpool_4 = self.unpool(deconv_5_1, pool_4_argmax)
        deconv_4_3 = self.conv_layer_with_bn(unpool_4, [3, 3, 512, 512], 
                                             self.train_phase, 'deconv4_3')
        deconv_4_2 = self.conv_layer_with_bn(deconv_4_3, [3, 3, 512, 512], 
                                             self.train_phase, 'deconv4_2')
        deconv_4_1 = self.conv_layer_with_bn(deconv_4_2, [3, 3, 512, 256], 
                                             self.train_phase, 'deconv4_1')

        # Third decoder
        unpool_3 = self.unpool(deconv_4_1, pool_3_argmax)
        deconv_3_3 = self.conv_layer_with_bn(unpool_3, [3, 3, 256, 256], 
                                             self.train_phase, 'deconv3_3')
        deconv_3_2 = self.conv_layer_with_bn(deconv_3_3, [3, 3, 256, 256], 
                                             self.train_phase, 'deconv3_2')
        deconv_3_1 = self.conv_layer_with_bn(deconv_3_2, [3, 3, 256, 128], 
                                             self.train_phase, 'deconv3_1')

        # Fourth decoder
        unpool_2 = self.unpool(deconv_3_1, pool_2_argmax)
        deconv_2_2 = self.conv_layer_with_bn(unpool_2, [3, 3, 128, 128], 
                                             self.train_phase, 'deconv2_2')
        deconv_2_1 = self.conv_layer_with_bn(deconv_2_2, [3, 3, 128, 64], 
                                             self.train_phase, 'deconv2_1')

        # Fifth decoder
        unpool_1 = self.unpool(deconv_2_1, pool_1_argmax)
        deconv_1_2 = self.conv_layer_with_bn(unpool_1, [3, 3, 64, 64], 
                                             self.train_phase, 'deconv1_2')
        deconv_1_1 = self.conv_layer_with_bn(deconv_1_2, [3, 3, 64, 32], 
                                             self.train_phase, 'deconv1_1')

        # Produce class scores
        # score_1 dimensions: BATCH_SIZE * HEIGHT * WIDTH * NUM_CLASSES
        score_1 = self.conv_layer_with_bn(deconv_1_1, 
                                          [1, 1, 32, self.num_classes], 
                                          self.train_phase, 
                                          'score_1')
        logits = tf.reshape(score_1, (-1, self.num_classes))

        # Prepare network outputs
        cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
            labels=tf.reshape(expected, [-1]), 
            logits=logits, 
            name='x_entropy')
        self.loss = tf.reduce_mean(cross_entropy, name='x_entropy_mean')
        optimizer = tf.train.AdamOptimizer(self.rate)
        self.train_step = optimizer.minimize(self.loss)
        
        # Metrics
        self.prediction = tf.argmax(score_1, axis=3, name="prediction")
        self.accuracy = tf.contrib.metrics.accuracy(self.prediction, 
                                                    self.y, 
                                                    name='accuracy')
        self.mean_IoU = tf.contrib.metrics.streaming_mean_iou(self.prediction, 
                                                    self.y,
                                                    self.num_classes, 
                                                    name='mean_IoU')

        self.propensity = tf.nn.softmax(logits)


    def restore_session(self):
        global_step = 0

        if not os.path.exists(self.checkpoint_directory):
            raise IOError(self.checkpoint_directory + ' does not exist.')

        path = tf.train.get_checkpoint_state(self.checkpoint_directory)
        if path is not None:
            self.saver.restore(self.session, path.model_checkpoint_path)
            global_step = int(path.model_checkpoint_path.split('-')[-1])

        return global_step


    def train(self, dataset_directory, num_iterations=10000, learning_rate=0.1, 
              batch_size=5):
        current_step = self.restore_session()

        bdr = BatchDatasetReader(dataset_directory, 480, 320, current_step, 
                                 batch_size, trainval_only=True)

        # Begin Training
        for i in range(current_step, num_iterations):

            # One training step
            images, ground_truths = bdr.next_training_batch()
            feed_dict = {self.x: images, self.y: ground_truths, 
                         self.train_phase: 1, self.rate: learning_rate}
            print('run train step: ' + str(i))
            self.train_step.run(session=self.session, feed_dict=feed_dict)

            # Print loss every 10 iterations
            if i % 10 == 0:
                train_loss = self.session.run(self.loss, feed_dict=feed_dict)
                print("Step: %d, Train_loss:%g" % (i, train_loss))

            # Evaluate on the validation set every 100 iterations
            if i % 100 == 0:
                # Feed into network
                images, ground_truths = bdr.next_val_batch()
                feed_dict = {self.x: images, self.y: ground_truths, 
                             self.train_phase: 1, self.rate: learning_rate}

                # Get metrics and print them
                val_loss = self.session.run(self.loss, feed_dict=feed_dict)
                val_accuracy = self.session.run(self.accuracy, 
                                                feed_dict=feed_dict)
                val_mean_IoU, update_op = self.session.run(self.mean_IoU, 
                                                feed_dict=feed_dict)
                print("%s ---> Validation_loss: %g" % (datetime.datetime.now(), 
                                                       val_loss))
                print("%s ---> Validation_accuracy: %g" % 
                      (datetime.datetime.now(), val_accuracy))

                # Log stuff
                self.logger.log("%s ---> Number of epochs: %g\n" % 
                                (datetime.datetime.now(), 
                                 math.floor((i * batch_size)/bdr.num_train)))
                self.logger.log("%s ---> Number of iterations: %g\n" % 
                                 (datetime.datetime.now(), i))
                self.logger.log("%s ---> Validation_loss: %g\n" % 
                                 (datetime.datetime.now(), val_loss))
                self.logger.log("%s ---> Validation_accuracy: %g\n" % 
                                 (datetime.datetime.now(), val_accuracy))
                self.logger.log_for_graphing(i, val_loss, val_accuracy, 
                                             val_mean_IoU)

                # Save the model variables
                self.saver.save(self.session, 
                                self.checkpoint_directory + 'segnet', 
                                global_step=i)

            # Graph training statistics every 1000 iterations
            if i % 1000 == 0:
                self.logger.graph_training_stats()


    def build_contextual_feedback_log(self, dataset_directory, 
                                      learning_rate=0.1):

        # Get trained weights and biases
        current_step = self.restore_session()

        DESIRED_LOG_SIZE_MULTIPLIER = 1

        output_dir = "./logged_bandit_feedback/"
        if not os.path.exists(output_dir):
            os.makedirs(output_dir) 

        log = []
        dr = ValDatasetReader(480, 320, dataset_directory)
        for j in range(DESIRED_LOG_SIZE_MULTIPLIER):

            for i in range(dr.val_data_size):

                i = (dr.val_data_size * j) + i

                image, ground_truth, image_file = dr.next_val_pair()

                feed_dict = {self.x: [image], self.y: [ground_truth], 
                             self.train_phase: 1, self.rate: learning_rate}

                loss = self.session.run(self.loss, feed_dict=feed_dict)
                propensity = self.session.run(self.propensity, 
                                              feed_dict=feed_dict)

                log.append((i, loss, propensity))
                print(i)

                if i % 100 == 0 and i != 0:
                    with open(output_dir + 'log-' + str(int(i/100)), 'wb') as fp:
                        pickle.dump(log, fp)
                        log = []


        with open(output_dir + 'meta', 'a') as metafile:
            metafile.write("size, " + str(dr.val_data_size * 
                                          DESIRED_LOG_SIZE_MULTIPLIER))
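

# Hypothetical two-stage usage sketch for SegNetLogger; 'data/CamVid' is an
# assumed dataset path, and './logged_bandit_feedback/' is the directory the
# method above actually writes to.
#
#     logger_net = SegNetLogger(num_classes=11)
#     logger_net.train('data/CamVid', num_iterations=10000,
#                      learning_rate=0.1, batch_size=5)
#     # Replay the validation set through the trained network and persist
#     # (index, loss, propensity) tuples for later bandit training.
#     logger_net.build_contextual_feedback_log('data/CamVid')
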
class InvariantNet:
    def __init__(self, dataset_directory, num_classes=11):

        self.num_classes = num_classes
        self.load_vgg_weights()
        self.build()

        # Begin a TensorFlow session
        config = tf.ConfigProto(allow_soft_placement=True)
        self.session = tf.Session(config=config)
        self.session.run(tf.global_variables_initializer())
        self.session.run(tf.local_variables_initializer())

        # Make saving trained weights and biases possible
        self.saver = tf.train.Saver(max_to_keep=5,
                                    keep_checkpoint_every_n_hours=1)
        self.checkpoint_directory = './checkpoints/'

        self.logger = Logger()

    def load_vgg_weights(self):
        """ Use the VGG model trained on
            imagent dataset as a starting point for training """
        vgg_path = "models/imagenet-vgg-verydeep-19.mat"
        vgg_mat = scipy.io.loadmat(vgg_path)

        self.vgg_params = np.squeeze(vgg_mat['layers'])
        self.layers = ('conv1_1', 'relu1_1', 'conv1_2', 'relu1_2', 'pool1',
                       'conv2_1', 'relu2_1', 'conv2_2', 'relu2_2', 'pool2',
                       'conv3_1', 'relu3_1', 'conv3_2', 'relu3_2', 'conv3_3',
                       'relu3_3', 'conv3_4', 'relu3_4', 'pool3', 'conv4_1',
                       'relu4_1', 'conv4_2', 'relu4_2', 'conv4_3', 'relu4_3',
                       'conv4_4', 'relu4_4', 'pool4', 'conv5_1', 'relu5_1',
                       'conv5_2', 'relu5_2', 'conv5_3', 'relu5_3', 'conv5_4',
                       'relu5_4')

    def vgg_weight_and_bias(self, name, W_shape, b_shape):
        """ 
            Initializes weights and biases to the pre-trained VGG model.
            
            Args:
                name: name of the layer for which you want to initialize weights
                W_shape: expected shape of the weights tensor
                b_shape: expected shape of the bias tensor
            Returns:
                w_var: initialized weight variable
                b_var: initialized bias variable
        """
        if name not in self.layers:
            return self.weight_variable(W_shape), \
                   self.bias_variable(b_shape)
        else:
            w, b = self.vgg_params[self.layers.index(name)][0][0][0][0]
            init_w = tf.constant(value=np.transpose(w, (1, 0, 2, 3)),
                                 dtype=tf.float32,
                                 shape=W_shape)
            init_b = tf.constant(value=b.reshape(-1),
                                 dtype=tf.float32,
                                 shape=b_shape)
            w_var = tf.Variable(init_w)
            b_var = tf.Variable(init_b)
            return w_var, b_var

    def weight_variable(self, shape, is_trainable=True):
        initial = tf.truncated_normal(shape, stddev=0.1)
        return tf.Variable(initial, trainable=is_trainable)

    def bias_variable(self, shape, is_trainable=True):
        initial = tf.constant(0.1, shape=shape)
        return tf.Variable(initial, trainable=is_trainable)

    def pool_layer(self, x):
        return tf.nn.max_pool_with_argmax(x,
                                          ksize=[1, 2, 2, 1],
                                          strides=[1, 2, 2, 1],
                                          padding='SAME')

    def unpool(self, pool, ind, ksize=[1, 2, 2, 1], scope='unpool'):
        """ 
            Unpooling layer after max_pool_with_argmax.

            Args:
                pool: max pooled output tensor
                ind: argmax indices
                ksize: the same ksize that was passed to the pooling op
            Return:
                unpool: unpooling tensor
        """
        with tf.variable_scope(scope):
            input_shape = tf.shape(pool)
            output_shape = [
                input_shape[0], input_shape[1] * ksize[1],
                input_shape[2] * ksize[2], input_shape[3]
            ]

            flat_input_size = tf.cumprod(input_shape)[-1]
            flat_output_shape = tf.stack([
                output_shape[0],
                output_shape[1] * output_shape[2] * output_shape[3]
            ])

            pool_ = tf.reshape(pool, tf.stack([flat_input_size]))
            batch_range = tf.range(tf.cast(output_shape[0], tf.int64),
                                   dtype=ind.dtype)
            reshape_shape = tf.stack([input_shape[0], 1, 1, 1])
            reshaped_batch_range = tf.reshape(batch_range, shape=reshape_shape)

            b = tf.ones_like(ind) * reshaped_batch_range
            b = tf.reshape(b, tf.stack([flat_input_size, 1]))
            ind_ = tf.reshape(ind, tf.stack([flat_input_size, 1]))
            ind_ = tf.concat([b, ind_], 1)

            ret = tf.scatter_nd(ind_,
                                pool_,
                                shape=tf.cast(flat_output_shape, tf.int64))
            ret = tf.reshape(ret, tf.stack(output_shape))
            return ret

    def conv_layer_with_bn(self, x, W_shape, name, padding='SAME'):
        b_shape = W_shape[3]
        W, b = self.vgg_weight_and_bias(name, W_shape, [b_shape])
        convolved_output = tf.nn.conv2d(
            x, W, strides=[1, 1, 1, 1], padding=padding) + b
        batch_norm = tf.contrib.layers.batch_norm(convolved_output,
                                                  is_training=True)
        return tf.nn.relu(batch_norm)

    def dynamic_filtering(self, pool_5):
        df = self.gen_dynamic_filter(self.theta,
                                     pool_5,
                                     filter_shape=[3, 3, 512, 512])
        pool_5 = self.dynamic_conv_layer(pool_5,
                                         filter_shape=[3, 3, 512, 512],
                                         dynamic_filter=df,
                                         name="conv_d")
        return pool_5

    def gen_dynamic_filter(self, theta, pooled_layer, filter_shape):
        """ 
            filter_shape=[3, 3, 512, 512]
            pooled_layer shape = NUM_BATCHES * HEIGHT * WIDTH * 512
        """
        # print(pooled_layer.get_shape())
        # pooled_layer shape = NUM_BATCHES(?) * 10 * 15 * 512

        feature_map = tf.reduce_mean(pooled_layer, axis=3)
        # print(feature_map.get_shape())
        # feature_map shape = NUM_BATCHES(?) * HEIGHT * WIDTH

        length = feature_map.get_shape()[1] * feature_map.get_shape()[2]
        # print(length)
        # length = HEIGHT * WIDTH = 150

        features = tf.reshape(feature_map, [-1, int(length)])
        # print(features.get_shape())
        # features shape = NUM_BATCHES(?) * 150
        num_batches = tf.shape(features)[0]
        """
        Theta with Reduce Mean

        theta = theta/20
        theta = tf.expand_dims(theta, 0)
        theta = tf.expand_dims(theta, 1)
        theta = tf.expand_dims(theta, 2)
        features = tf.expand_dims(features, 2)
        theta = tf.tile(theta, tf.stack([tf.shape(features)[0], features.get_shape()[1], 1]))
        features = tf.concat([features, theta], 2)
        features = tf.reduce_mean(features, axis=2)
        """
        """
        Theta with append
        """
        theta = theta / 20
        theta = tf.expand_dims(theta, 0)
        theta = tf.expand_dims(theta, 1)
        theta = tf.tile(theta, tf.stack([tf.shape(features)[0], 1]))
        features = tf.concat([features, theta], 1)
        # print(features.get_shape())

        fc1 = tf.contrib.layers.fully_connected(features, 64)
        fc2 = tf.contrib.layers.fully_connected(fc1, 128)
        fc3 = tf.contrib.layers.fully_connected(fc2,
                                                filter_shape[0] *
                                                filter_shape[1],
                                                activation_fn=None)
        fc3 = tf.reduce_mean(fc3, axis=0)
        filt = tf.reshape(fc3, filter_shape[0:2])
        filt = tf.expand_dims(filt, 2)
        filt = tf.expand_dims(filt, 3)
        filt = tf.tile(filt, [1, 1, filter_shape[2], filter_shape[3]])
        return filt

    def dynamic_conv_layer(self,
                           bottom,
                           filter_shape,
                           dynamic_filter,
                           name,
                           strides=[1, 1, 1, 1],
                           padding="SAME"):
        # init_w = tf.truncated_normal(filter_shape, stddev=0.2)
        init_b = tf.constant_initializer(value=0.0, dtype=tf.float32)
        filt = tf.get_variable(name="%s_w" % name,
                               shape=filter_shape,
                               initializer=tf.truncated_normal_initializer,
                               dtype=tf.float32)
        filt = tf.add(filt, dynamic_filter)
        conv = tf.nn.conv2d(bottom,
                            filter=filt,
                            strides=strides,
                            padding=padding,
                            name=name)
        bias = tf.get_variable(name="%s_b" % name,
                               initializer=init_b,
                               shape=[filter_shape[-1]],
                               dtype=tf.float32)
        return tf.nn.bias_add(conv, bias)

    def build(self):
        with tf.device('/gpu:0'):
            # Declare placeholders
            # self.x dimensions = BATCH_SIZE * HEIGHT * WIDTH * NUM_CHANNELS
            # TODO: Make flexible for image sizes
            self.x = tf.placeholder(tf.float32, shape=[None, 320, 480, 3])
            # self.y dimensions = BATCH_SIZE * HEIGHT * WIDTH
            self.y = tf.placeholder(tf.int64, shape=[None, 320, 480])
            expected = tf.expand_dims(self.y, -1)
            self.is_trainable = tf.placeholder(tf.bool, name='is_trainable')
            self.rate = tf.placeholder(tf.float32, shape=[])
            self.theta = tf.placeholder(tf.float32, shape=[], name='theta')

            # First encoder
            # conv_1_1 shape = BATCH_SIZE * HEIGHT * WIDTH * 64
            conv_1_1 = self.conv_layer_with_bn(self.x, [3, 3, 3, 64],
                                               'conv1_1')
            conv_1_2 = self.conv_layer_with_bn(conv_1_1, [3, 3, 64, 64],
                                               'conv1_2')
            pool_1, pool_1_argmax = self.pool_layer(conv_1_2)

            # Second encoder
            conv_2_1 = self.conv_layer_with_bn(pool_1, [3, 3, 64, 128],
                                               'conv2_1')
            conv_2_2 = self.conv_layer_with_bn(conv_2_1, [3, 3, 128, 128],
                                               'conv2_2')
            pool_2, pool_2_argmax = self.pool_layer(conv_2_2)

            # Third encoder
            conv_3_1 = self.conv_layer_with_bn(pool_2, [3, 3, 128, 256],
                                               'conv3_1')
            conv_3_2 = self.conv_layer_with_bn(conv_3_1, [3, 3, 256, 256],
                                               'conv3_2')
            conv_3_3 = self.conv_layer_with_bn(conv_3_2, [3, 3, 256, 256],
                                               'conv3_3')
            pool_3, pool_3_argmax = self.pool_layer(conv_3_3)

            # Fourth encoder
            conv_4_1 = self.conv_layer_with_bn(pool_3, [3, 3, 256, 512],
                                               'conv4_1')
            conv_4_2 = self.conv_layer_with_bn(conv_4_1, [3, 3, 512, 512],
                                               'conv4_2')
            conv_4_3 = self.conv_layer_with_bn(conv_4_2, [3, 3, 512, 512],
                                               'conv4_3')
            pool_4, pool_4_argmax = self.pool_layer(conv_4_3)

            # Fifth encoder
            conv_5_1 = self.conv_layer_with_bn(pool_4, [3, 3, 512, 512],
                                               'conv5_1')
            conv_5_2 = self.conv_layer_with_bn(conv_5_1, [3, 3, 512, 512],
                                               'conv5_2')
            conv_5_3 = self.conv_layer_with_bn(conv_5_2, [3, 3, 512, 512],
                                               'conv5_3')
            # pool_5 shape = BATCH_SIZE * HEIGHT * WIDTH * 512
            pool_5, pool_5_argmax = self.pool_layer(conv_5_3)

            # Apply dynamic filtering only for non-street-view training
            # (is_trainable == False); otherwise pass pool_5 through unchanged
            pool_5 = tf.cond(self.is_trainable,
                             lambda: pool_5,
                             lambda: self.dynamic_filtering(pool_5))

            # First decoder
            unpool_5 = self.unpool(pool_5, pool_5_argmax)
            deconv_5_3 = self.conv_layer_with_bn(unpool_5, [3, 3, 512, 512],
                                                 'deconv5_3')
            deconv_5_2 = self.conv_layer_with_bn(deconv_5_3, [3, 3, 512, 512],
                                                 'deconv5_2')
            deconv_5_1 = self.conv_layer_with_bn(deconv_5_2, [3, 3, 512, 512],
                                                 'deconv5_1')

            # Second decoder
            unpool_4 = self.unpool(deconv_5_1, pool_4_argmax)
            deconv_4_3 = self.conv_layer_with_bn(unpool_4, [3, 3, 512, 512],
                                                 'deconv4_3')
            deconv_4_2 = self.conv_layer_with_bn(deconv_4_3, [3, 3, 512, 512],
                                                 'deconv4_2')
            deconv_4_1 = self.conv_layer_with_bn(deconv_4_2, [3, 3, 512, 256],
                                                 'deconv4_1')

            # Third decoder
            unpool_3 = self.unpool(deconv_4_1, pool_3_argmax)
            deconv_3_3 = self.conv_layer_with_bn(unpool_3, [3, 3, 256, 256],
                                                 'deconv3_3')
            deconv_3_2 = self.conv_layer_with_bn(deconv_3_3, [3, 3, 256, 256],
                                                 'deconv3_2')
            deconv_3_1 = self.conv_layer_with_bn(deconv_3_2, [3, 3, 256, 128],
                                                 'deconv3_1')

            # Fourth decoder
            unpool_2 = self.unpool(deconv_3_1, pool_2_argmax)
            deconv_2_2 = self.conv_layer_with_bn(unpool_2, [3, 3, 128, 128],
                                                 'deconv2_2')
            deconv_2_1 = self.conv_layer_with_bn(deconv_2_2, [3, 3, 128, 64],
                                                 'deconv2_1')

            # Fifth decoder
            unpool_1 = self.unpool(deconv_2_1, pool_1_argmax)
            deconv_1_2 = self.conv_layer_with_bn(unpool_1, [3, 3, 64, 64],
                                                 'deconv1_2')
            deconv_1_1 = self.conv_layer_with_bn(deconv_1_2, [3, 3, 64, 32],
                                                 'deconv1_1')

            # Produce class scores
            # score_1 dimensions: BATCH_SIZE * HEIGHT * WIDTH * NUM_CLASSES
            score_1 = self.conv_layer_with_bn(deconv_1_1,
                                              [1, 1, 32, self.num_classes],
                                              'score_1')
            logits = tf.reshape(score_1, (-1, self.num_classes))

            # Prepare network outputs
            cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
                labels=tf.reshape(expected, [-1]),
                logits=logits,
                name='x_entropy')
            self.loss = tf.reduce_mean(cross_entropy, name='x_entropy_mean')
            optimizer = tf.train.AdamOptimizer(self.rate)
            self.train_step = optimizer.minimize(self.loss)

            # Metrics
            self.prediction = tf.argmax(score_1, axis=3, name="prediction")
            self.accuracy = tf.contrib.metrics.accuracy(self.prediction,
                                                        self.y,
                                                        name='accuracy')
            self.mean_IoU = tf.contrib.metrics.streaming_mean_iou(
                self.prediction, self.y, self.num_classes, name='mean_IoU')

    def restore_session(self):
        global_step = 0

        if not os.path.exists(self.checkpoint_directory):
            raise IOError(self.checkpoint_directory + ' does not exist.')

        path = tf.train.get_checkpoint_state(self.checkpoint_directory)
        if path is not None:
            self.saver.restore(self.session, path.model_checkpoint_path)
            global_step = int(path.model_checkpoint_path.split('-')[-1])

        return global_step

    def train(self,
              num_iterations,
              theta,
              is_trainable,
              dataset_directory,
              learning_rate=0.1,
              batch_size=5):
        """
            Args:
                num_iterations
                theta: View perspective number

        """
        current_step = self.restore_session()

        bdr = BatchDatasetReader(dataset_directory, 480, 320, current_step,
                                 batch_size)

        # Begin Training
        for i in range(current_step, num_iterations):

            # One training step
            images, ground_truths = bdr.next_training_batch()

            # Train Phase Guide
            # is_trainable = True : street view training
            # is_trainable = False : non-street view training, freeze weights
            feed_dict = {
                self.x: images,
                self.y: ground_truths,
                self.is_trainable: is_trainable,
                self.theta: theta,
                self.rate: learning_rate
            }
            print('run train step: ' + str(i))
            self.train_step.run(session=self.session, feed_dict=feed_dict)

            # Print loss every 10 iterations
            if i % 10 == 0:
                train_loss = self.session.run(self.loss, feed_dict=feed_dict)
                print("Step: %d, Train_loss:%g" % (i, train_loss))

            # Evaluate on the validation set every 100 iterations
            if i % 100 == 0:
                images, ground_truths = bdr.next_val_batch()
                num_training_images = bdr.num_train

                # Make a validation prediction
                feed_dict = {
                    self.x: images,
                    self.y: ground_truths,
                    self.is_trainable: is_trainable,
                    self.theta: theta,
                    self.rate: learning_rate
                }
                val_loss = self.session.run(self.loss, feed_dict=feed_dict)
                val_accuracy = self.session.run(self.accuracy,
                                                feed_dict=feed_dict)
                val_mean_IoU, update_op = self.session.run(self.mean_IoU,
                                                           feed_dict=feed_dict)

                print("%s ---> Validation_loss: %g" %
                      (datetime.datetime.now(), val_loss))
                print("%s ---> Validation_accuracy: %g" %
                      (datetime.datetime.now(), val_accuracy))

                self.logger.log("%s ---> Number of epochs: %g\n" %
                                (datetime.datetime.now(),
                                 math.floor(
                                     (i * batch_size) / num_training_images)))
                self.logger.log("%s ---> Number of iterations: %g\n" %
                                (datetime.datetime.now(), i))
                self.logger.log("%s ---> Validation_loss: %g\n" %
                                (datetime.datetime.now(), val_loss))
                self.logger.log("%s ---> Validation_accuracy: %g\n" %
                                (datetime.datetime.now(), val_accuracy))
                self.logger.log_for_graphing(i, val_loss, val_accuracy,
                                             val_mean_IoU)

                # Save the model variables
                self.saver.save(self.session,
                                self.checkpoint_directory + 'DFSegNet',
                                global_step=i)

            # Run a quick test pass and graph training statistics every 1000 iterations
            if i % 1000 == 0:
                self.test(theta, is_trainable, dataset_directory, 1e-2)
                self.logger.graph_training_stats()

    def test(self, theta, is_trainable, dataset_directory, learning_rate):

        current_step = self.restore_session()

        dr = DatasetReader(480, 320, dataset_directory)

        for i in range(min(dr.test_data_size, 10)):
            image, ground_truth = dr.next_test_pair()

            feed_dict = {
                self.x: [image],
                self.y: [ground_truth],
                self.is_trainable: is_trainable,
                self.theta: theta,
                self.rate: learning_rate
            }
            segmentation = np.squeeze(
                self.session.run(self.prediction, feed_dict=feed_dict))

            dp = DataPostprocessor()
            dp.write_out(i, image, segmentation, ground_truth, current_step)
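

if __name__ == '__main__':
    # Hypothetical driver sketch: 'data/CamVid' and theta=0.0 are assumptions
    # used only for illustration.
    net = InvariantNet('data/CamVid', num_classes=11)
    # Street-view phase: is_trainable=True trains the full network. A later
    # non-street-view phase would pass is_trainable=False so the dynamic
    # filtering branch is used instead (see the Train Phase Guide comment
    # in train()).
    net.train(num_iterations=10000,
              theta=0.0,
              is_trainable=True,
              dataset_directory='data/CamVid',
              learning_rate=0.1,
              batch_size=5)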