model.py

#Model file

import numpy as np
import tensorflow as tf
from tensorflow.python.ops.parallel_for import gradients

FLAGS = tf.app.flags.FLAGS

def complex_add(x, y):
    xr, xi = tf.real(x), tf.imag(x)
    yr, yi = tf.real(y), tf.imag(y)
    return tf.complex(xr + yr, xi + yi)

def complex_mul(x, y):
    xr, xi = tf.real(x), tf.imag(x)
    yr, yi = tf.real(y), tf.imag(y)
    return tf.complex(xr*yr - xi*yi, xr*yi + xi*yr)

def stack_k(x, axis, k):

    list_x = []
    for i in range(k):
        list_x.append(x)

    out = tf.stack(list_x, axis)

    return out


#DOWNSAMPLING
#DOWNSAMPLING
def downsample(x, mask):

    mask_kspace = tf.cast(mask, tf.complex64)
    data_kspace = Fourier(x, separate_complex=True)
    out = mask_kspace * data_kspace

    return out


#UPSAMPLING
def upsample(x, mask):

    image_complex = tf.ifft2d(x)
    image_size = [FLAGS.batch_size, FLAGS.sample_size, FLAGS.sample_size_y] #tf.shape(image_complex)

    #get real and imaginary parts
    image_real = tf.reshape(tf.real(image_complex), [image_size[0], image_size[1], image_size[2], 1])
    image_imag = tf.reshape(tf.imag(image_complex), [image_size[0], image_size[1], image_size[2], 1])

    out = tf.concat([image_real, image_imag], 3)

    return out


class Model:
    """A neural network model.

    Currently only supports a feedforward architecture."""
    
    def __init__(self, name, features):
        self.name = name
        self.outputs = [features]

    def _get_layer_str(self, layer=None):
        if layer is None:
            layer = self.get_num_layers()
        
        return '%s_L%03d' % (self.name, layer+1)

    def _get_num_inputs(self):
        return int(self.get_output().get_shape()[-1])

    def _glorot_initializer(self, prev_units, num_units, stddev_factor=1.0):
        """Initialization in the style of Glorot 2010.

        stddev_factor should be 1.0 for linear activations, and 2.0 for ReLUs"""
        stddev  = np.sqrt(stddev_factor / np.sqrt(prev_units*num_units))
        return tf.truncated_normal([prev_units, num_units],
                                    mean=0.0, stddev=stddev)

    def _glorot_initializer_conv2d(self, prev_units, num_units, mapsize, stddev_factor=1.0):
        """Initialization in the style of Glorot 2010.

        stddev_factor should be 1.0 for linear activations, and 2.0 for ReLUs"""

        stddev  = np.sqrt(stddev_factor / (np.sqrt(prev_units*num_units)*mapsize*mapsize))
        return tf.truncated_normal([mapsize, mapsize, prev_units, num_units],
                                    mean=0.0, stddev=stddev)

    def get_num_layers(self):
        return len(self.outputs)

    def add_batch_norm(self, scale=False):
        """Adds a batch normalization layer to this model.

        See ArXiv 1502.03167v3 for details."""

        # TBD: This appears to be very flaky, often raising InvalidArgumentError internally
        with tf.variable_scope(self._get_layer_str()):
            out = tf.contrib.layers.batch_norm(self.get_output(), scale=scale)
        
        self.outputs.append(out)
        return self

    def add_flatten(self):
        """Transforms the output of this network to a 1D tensor"""

        with tf.variable_scope(self._get_layer_str()):
            batch_size = int(self.get_output().get_shape()[0])
            out = tf.reshape(self.get_output(), [batch_size, -1])

        self.outputs.append(out)
        return self

    def add_dense(self, num_units, stddev_factor=1.0):
        """Adds a dense linear layer to this model.

        Uses Glorot 2010 initialization assuming linear activation."""
        
        assert len(self.get_output().get_shape()) == 2, "Previous layer must be 2-dimensional (batch, channels)"

        with tf.variable_scope(self._get_layer_str()):
            prev_units = self._get_num_inputs()
            
            # Weight term
            initw   = self._glorot_initializer(prev_units, num_units,
                                               stddev_factor=stddev_factor)
            weight  = tf.get_variable('weight', initializer=initw)

            # Bias term
            initb   = tf.constant(0.0, shape=[num_units])
            bias    = tf.get_variable('bias', initializer=initb)

            # Output of this layer
            out     = tf.matmul(self.get_output(), weight) + bias

        self.outputs.append(out)
        return self

    def add_sigmoid(self):
        """Adds a sigmoid (0,1) activation function layer to this model."""

        with tf.variable_scope(self._get_layer_str()):
            prev_units = self._get_num_inputs()
            out = tf.nn.sigmoid(self.get_output())
        
        self.outputs.append(out)
        return self

    def add_softmax(self):
        """Adds a softmax operation to this model"""

        with tf.variable_scope(self._get_layer_str()):
            this_input = tf.square(self.get_output())
            reduction_indices = list(range(1, len(this_input.get_shape())))
            acc = tf.reduce_sum(this_input, reduction_indices=reduction_indices, keep_dims=True)
            out = this_input / (acc+FLAGS.epsilon)
            #out = tf.verify_tensor_all_finite(out, "add_softmax failed; is sum equal to zero?")
        
        self.outputs.append(out)
        return self

    def add_relu(self):
        """Adds a ReLU activation function to this model"""

        with tf.variable_scope(self._get_layer_str()):
            out = tf.nn.relu(self.get_output())

        self.outputs.append(out)
        return self        

    def add_elu(self):
        """Adds a ELU activation function to this model"""

        with tf.variable_scope(self._get_layer_str()):
            out = tf.nn.elu(self.get_output())

        self.outputs.append(out)
        return self      

    def add_lrelu(self, leak=.2):
        """Adds a leaky ReLU (LReLU) activation function to this model"""

        with tf.variable_scope(self._get_layer_str()):
            t1  = .5 * (1 + leak)
            t2  = .5 * (1 - leak)
            out = t1 * self.get_output() + \
                  t2 * tf.abs(self.get_output())
            
        self.outputs.append(out)
        return self

    def add_conv2d(self, num_units, mapsize=1, stride=1, stddev_factor=1.0):
        """Adds a 2D convolutional layer."""

        assert len(self.get_output().get_shape()) == 4 and "Previous layer must be 4-dimensional (batch, width, height, channels)"
        
        with tf.variable_scope(self._get_layer_str()):
            prev_units = self._get_num_inputs()
            
            # Weight term and convolution
            initw  = self._glorot_initializer_conv2d(prev_units, num_units,
                                                     mapsize,
                                                     stddev_factor=stddev_factor)
            weight = tf.get_variable('weight', initializer=initw)
            out    = tf.nn.conv2d(self.get_output(), weight,
                                  strides=[1, stride, stride, 1],
                                  padding='SAME')

            # Bias term
            initb  = tf.constant(0.0, shape=[num_units])
            bias   = tf.get_variable('bias', initializer=initb)
            out    = tf.nn.bias_add(out, bias)  #?????!!!
            
        self.outputs.append(out)
        return self


    def add_fullconnect2d(self, num_units, stddev_factor=1.0):
        """Adds a 2D convolutional layer."""

        assert len(self.get_output().get_shape()) == 4 and "Previous layer must be 4-dimensional (batch, width, height, channels)"
        
        with tf.variable_scope(self._get_layer_str()):
            prev_units = self._get_num_inputs()
            
            # Weight term and full connection
            #initw  = self._glorot_initializer_conv2d(prev_units, num_units,
                                                     #mapsize,
                                                     #stddev_factor=stddev_factor)
            weight = tf.get_variable('weight', initializer=initw)
            out = tf.contrib.layers.fully_connected(self.get_output(), num_units, activation_fn=None, normalizer_fn=None, normalizer_params=None, 
                                                    weights_initializer=initializers.xavier_initializer(),
                                                    weights_regularizer=None,
                                                    biases_initializer=tf.zeros_initializer(),
                                                    biases_regularizer=None,
                                                    reuse=None,
                                                    variables_collections=None,
                                                    outputs_collections=None,
                                                    trainable=True,
                                                    scope=None)    #activation_fn=tf.nn.relu


            #out    = tf.nn.conv2d(self.get_output(), weight,
                                  #strides=[1, stride, stride, 1],
                                  #padding='SAME')

            # Bias term
            initb  = tf.constant(0.0, shape=[num_units])
            bias   = tf.get_variable('bias', initializer=initb)
            out    = tf.nn.bias_add(out, bias)
            
        self.outputs.append(out)
        return self


    def add_conv2d_transpose(self, num_units, mapsize=1, stride=1, stddev_factor=1.0):
        """Adds a transposed 2D convolutional layer"""

        assert len(self.get_output().get_shape()) == 4 and "Previous layer must be 4-dimensional (batch, width, height, channels)"

        with tf.variable_scope(self._get_layer_str()):
            prev_units = self._get_num_inputs()
            
            # Weight term and convolution
            initw  = self._glorot_initializer_conv2d(prev_units, num_units,
                                                     mapsize,
                                                     stddev_factor=stddev_factor)
            weight = tf.get_variable('weight', initializer=initw)
            weight = tf.transpose(weight, perm=[0, 1, 3, 2])
            prev_output = self.get_output()
            output_shape = [FLAGS.batch_size,
                            int(prev_output.get_shape()[1]) * stride,
                            int(prev_output.get_shape()[2]) * stride,
                            num_units]
            out = tf.nn.conv2d_transpose(self.get_output(), weight,
                                            output_shape=output_shape,
                                            strides=[1, stride, stride, 1],
                                            padding='SAME')

            # Bias term
            initb  = tf.constant(0.0, shape=[num_units])
            bias   = tf.get_variable('bias', initializer=initb)
            out    = tf.nn.bias_add(out, bias)
            
        self.outputs.append(out)
        return self

  
    def add_sum(self, term):
        """Adds a layer that sums the top layer with the given term"""

        with tf.variable_scope(self._get_layer_str()):
            prev_shape = self.get_output().get_shape()
            term_shape = term.get_shape()
            #print("%s %s" % (prev_shape, term_shape))
            assert prev_shape == term_shape and "Can't sum terms with a different size"
            out = tf.add(self.get_output(), term)
        
        self.outputs.append(out)
        return self


    def get_output(self):
        """Returns the output from the topmost layer of the network"""
        return self.outputs[-1]

    def get_variable(self, layer, name):
        """Returns a variable given its layer and name.

        The variable must already exist."""

        scope      = self._get_layer_str(layer)
        collection = tf.get_collection(tf.GraphKeys.VARIABLES, scope=scope)

        for var in collection:
            if var.name[:-2] == scope+'/'+name:
                return var

        return None

    def get_all_layer_variables(self, layer):
        """Returns all variables in the given layer"""
        scope = self._get_layer_str(layer)
        return tf.get_collection(tf.GraphKeys.VARIABLES, scope=scope)


    def gradients_out_in(output,input_img):
        return tf.gradients(output, input_img)


def _discriminator_model(sess, features, disc_input, layer_output_skip=5, hybrid_disc=0):

    # update 05092017, hybrid_disc consider whether to use hybrid space for discriminator
    # to study the kspace distribution/smoothness properties

    # Fully convolutional model
    mapsize = 3
    layers  = [8,16,32,64]   #[64, 128, 256, 512]   #[8,16]   #[8, 16, 32, 64]#

    old_vars = tf.global_variables()#tf.all_variables() , all_variables() are deprecated

    # augment data to hybrid domain = image+kspace
    if hybrid_disc>0:
        disc_size = tf.shape(disc_input)#disc_input.get_shape()
        # print(disc_size)        
        disc_kspace = Fourier(disc_input, separate_complex=False)
        disc_kspace_real = tf.cast(tf.real(disc_kspace), tf.float32)
        # print(disc_kspace_real)
        disc_kspace_real = tf.reshape(disc_kspace_real, [disc_size[0],disc_size[1],disc_size[2],1])
        disc_kspace_imag = tf.cast(tf.imag(disc_kspace), tf.float32)
        # print(disc_kspace_imag)        
        disc_kspace_imag = tf.reshape(disc_kspace_imag, [disc_size[0],disc_size[1],disc_size[2],1])
        disc_kspace_mag = tf.cast(tf.abs(disc_kspace), tf.float32)
        # print(disc_kspace_mag)
        disc_kspace_mag = tf.log(disc_kspace_mag)
        disc_kspace_mag = tf.reshape(disc_kspace_mag, [disc_size[0],disc_size[1],disc_size[2],1])
        if hybrid_disc == 1:
            disc_hybird = tf.concat(axis = 3, values = [disc_input * 2-1, disc_kspace_imag])
        else:
            disc_hybird = tf.concat(axis = 3, values = [disc_input * 2-1, disc_kspace_imag, disc_kspace_real, disc_kspace_imag])
    else:
        disc_hybird = disc_input #2 * disc_input - 1


    print('shape_disc_hybrid', disc_hybird.get_shape())

    print(hybrid_disc, 'discriminator input dimensions: {0}'.format(disc_hybird.get_shape()))
    model = Model('DIS', disc_hybird)        

    for layer in range(len(layers)):
        nunits = layers[layer]
        stddev_factor = 2.0

        model.add_conv2d(nunits, mapsize=mapsize, stride=2, stddev_factor=stddev_factor)
        model.add_batch_norm()
        model.add_relu()

    # Finalization a la "all convolutional net"
    model.add_conv2d(nunits, mapsize=mapsize, stride=1, stddev_factor=stddev_factor)
    model.add_batch_norm()
    model.add_relu()

    model.add_conv2d(nunits, mapsize=1, stride=1, stddev_factor=stddev_factor)
    model.add_batch_norm()
    model.add_relu()

    # Linearly map to real/fake and return average score
    # (softmax will be applied later)
    model.add_conv2d(1, mapsize=1, stride=1, stddev_factor=stddev_factor)  #1 for magnitude input images
    model.add_mean()

    new_vars  = tf.global_variables()#tf.all_variables() , all_variables() are deprecated
    disc_vars = list(set(new_vars) - set(old_vars))

    #select output
    output_layers = model.outputs[0:]  #[model.outputs[0]] + model.outputs[1:-1][::layer_output_skip] + [model.outputs[-1]]

    return model.get_output(), disc_vars, output_layers

def conv(batch_input, out_channels, stride=2, size_kernel=4):
    with tf.variable_scope("conv"):
        in_channels = batch_input.get_shape()[3]
        filter = tf.get_variable("filter", [size_kernel, size_kernel, in_channels, out_channels], dtype=tf.float32, initializer=tf.random_normal_initializer(0, 0.02))
        # [batch, in_height, in_width, in_channels], [filter_width, filter_height, in_channels, out_channels]
        #     => [batch, out_height, out_width, out_channels]
        padded_input = tf.pad(batch_input, [[0, 0], [1, 1], [1, 1], [0, 0]], mode="CONSTANT")
        conv = tf.nn.conv2d(padded_input, filter, [1, stride, stride, 1], padding="VALID")
        return conv

def deconv(batch_input, out_channels, size_kernel=3):
    with tf.variable_scope("deconv"):
        batch, in_height, in_width, in_channels = [int(d) for d in batch_input.get_shape()]
        filter = tf.get_variable("filter", [size_kernel, size_kernel, out_channels, in_channels], dtype=tf.float32, initializer=tf.random_normal_initializer(0, 0.02))
        # [batch, in_height, in_width, in_channels], [filter_width, filter_height, out_channels, in_channels]
        #     => [batch, out_height, out_width, out_channels]
        conv = tf.nn.conv2d_transpose(batch_input, filter, [batch, in_height * 2, in_width * 2, out_channels], [1, 2, 2, 1], padding="SAME")
        return conv        

def lrelu(x, a = 0.3):
    with tf.name_scope("lrelu"):
        return tf.maximum(x, tf.multiply(x, a))
        # adding these together creates the leak part and linear part
        # then cancels them out by subtracting/adding an absolute value term
        # leak: a*x/2 - a*abs(x)/2
        # linear: x/2 + abs(x)/2

        # this block looks like it has 2 inputs on the graph unless we do this

def batchnorm(input):
    with tf.variable_scope("batchnorm"):
        # this block looks like it has 3 inputs on the graph unless we do this
        input = tf.identity(input)

        channels = input.get_shape()[3]
        offset = tf.get_variable("offset", [channels], dtype=tf.float32, initializer=tf.zeros_initializer())
        scale = tf.get_variable("scale", [channels], dtype=tf.float32, initializer=tf.random_normal_initializer(1.0, 0.02))
        mean, variance = tf.nn.moments(input, axes=[0, 1, 2], keep_dims=False)
        variance_epsilon = 1e-5
        normalized = tf.nn.batch_normalization(input, mean, variance, offset, scale, variance_epsilon=variance_epsilon)
        return normalized      

def Fourier(x, separate_complex=True):    
    x = tf.cast(x, tf.complex64)
    if separate_complex:
        x_complex = x[:,:,:,0]+1j*x[:,:,:,1]
    else:
        x_complex = x
    x_complex = tf.reshape(x_complex,x_complex.get_shape()[:3])
    y_complex = tf.fft2d(x_complex)
    print('using Fourier, input dim {0}, output dim {1}'.format(x.get_shape(), y_complex.get_shape()))
    # x = tf.cast(x, tf.complex64)
    # y = tf.fft3d(x)
    # y = y[:,:,:,-1]
    return y_complex


def jacobian_func(fx, x, parallel_iterations=10):
    '''
    Given a tensor fx, which is a function of x, vectorize fx (via tf.reshape(fx, [-1])),
    and then compute the jacobian of each entry of fx with respect to x.
    Specifically, if x has shape (m,n,...,p), an d fx has L entries (tf.size(fx)=L), then
    the output will be (L,m,n,...,p), where output[i] will be (m,n,...,p), with each entry denoting the
    gradient of output[i] wrt the corresponding element of x.
    '''
    return map(lambda fxi: tf.gradients(fxi, x)[0],
               tf.reshape(fx, [-1]),
               dtype=x.dtype,
               parallel_iterations=parallel_iterations)


def variational_autoencoder(sess,features,labels,masks,train_phase,z_val,print_bool, channels = 2,layer_output_skip = 5):
    print("Use variational autoencoder model")
    old_vars = tf.global_variables()

    print("Input shape", features.shape)
    print("Input type", type(features))

    activation = lrelu
    keep_prob = 0.6
    n_latent = 1024
    batch_size = FLAGS.batch_size
    img = 0
    mn = 0
    sd = 0
    z = 0
    x1 = 0
    x2 = 0
    x3 = 0
    x4 = 0

    sing_vals = tf.zeros([64,1])
 

    #features = tf.image.resize_images(features,[160,128])
    print(features.shape)   #(b_size,160,128,2)


    num_filters = 64
    encoder_layers = []

    with tf.variable_scope("var_encoder"):
        x1 = tf.layers.conv2d(features,filters = num_filters,kernel_size = 5,strides = 2,padding = "same")
      #  x1 = tf.contrib.layers.batch_norm(x1,activation_fn = activation)
      #  x1 = tf.nn.dropout(x1, keep_prob)
        encoder_layers.append(x1)
        #size = (b_size,80,64,128)


        x2 = tf.layers.conv2d(x1, filters=num_filters*2, kernel_size=5, strides=2, padding='same')
      #  x2 = tf.contrib.layers.batch_norm(x2,activation_fn = activation)
      #  x2 = tf.nn.dropout(x2, keep_prob)
        encoder_layers.append(x2)
        #size = (b_size,40,32,256)

        x3 = tf.layers.conv2d(x2, filters=num_filters*4, kernel_size=5, strides=2, padding='same', activation=activation)
      #  x3 = tf.contrib.layers.batch_norm(x3,activation_fn = activation)
      #  x3 = tf.nn.dropout(x3, keep_prob)
        encoder_layers.append(x3)
        #size = (b_size,20,16,512)

        x4 = tf.layers.conv2d(x3, filters=num_filters*8, kernel_size=5, strides=2, padding='same', activation=activation)
      #  x4 = tf.contrib.layers.batch_norm(x4,activation_fn = activation)
      #  x4 = tf.nn.dropout(x4, keep_prob)
        encoder_layers.append(x4)
        #size = (b_size,10,8,1024)

        
        x = tf.contrib.layers.flatten(x4)
        #size = (b_size,10*8*1024)

        mn = tf.layers.dense(x, units=n_latent)
        #mn = tf.contrib.layers.batch_norm(mn,activation_fn = tf.identity)  
        #size = (b_size,1024)

        sd = tf.layers.dense(x, units=n_latent)
        #sd = tf.contrib.layers.batch_norm(sd,activation_fn = tf.nn.softplus)
        #sd = tf.add(sd,1e-6)
        #size = (b_size,1024)

        epsilon = tf.random_normal(tf.stack([batch_size, n_latent]))

        #z  = tf.add(mn, tf.multiply(epsilon, tf.sqrt(tf.exp(sd))))
        z = tf.add(mn,tf.multiply(epsilon,tf.exp(sd)))

    def f1(): return z
    def f2(): return z_val

    decoder_input = tf.cond(train_phase, f1, f2)

    with tf.variable_scope("var_decoder"):
        num_for_dense = num_filters * 4 * 5 * 8
        decoder_input.set_shape([batch_size,n_latent])
        x = tf.layers.dense(decoder_input, units=num_for_dense, activation=lrelu)   #(b_size,1024*10*8)
        x = tf.reshape(x, [-1,5,4,num_filters*8])  #(b_size,10,8,1024)
        x = tf.add(x,x4)


        #upsample
        x = tf.layers.conv2d_transpose(x, filters=num_filters*4, kernel_size=5, strides=2, padding='same')
       # x = tf.contrib.layers.batch_norm(x,activation_fn = activation)
       # x = tf.nn.dropout(x, keep_prob)
        x = tf.add(x,x3)
        #size = (b_size,20,16,512)


        x = tf.layers.conv2d_transpose(x, filters=num_filters*2, kernel_size=5, strides=2, padding='same')
       # x = tf.contrib.layers.batch_norm(x,activation_fn = activation)
       # x = tf.nn.dropout(x, keep_prob)
        x = tf.add(x,x2)
        #size = (b_size,40,32,256)


        x = tf.layers.conv2d_transpose(x, filters=num_filters, kernel_size=5, strides=2, padding='same')
       # x = tf.contrib.layers.batch_norm(x,activation_fn = activation)
        x = tf.add(x,x1)
        #size = (b_size,80,64,128)


        x = tf.layers.conv2d_transpose(x, filters=channels, kernel_size=5, strides=2, padding='same',activation = tf.nn.sigmoid)
        img = x

    # gradient stuff


        def g1():
            temp_grad = tf.gradients(img,features)
            print("IMAGE SHAPE", img)
            print("FEATURE SHAPE", features)

            jacobian = jacobian_func(img,features)

            #jacobian = gradients.jacobian(img,features)

            #print("Testing Shape",jacobian)


            gradient_slice = jacobian[0][0,:,:,0]
            #gradient_slice = temp_grad[0][0,:,:,0]


            sing_vals = tf.linalg.svd(tf.reshape(gradient_slice,[80,64]),compute_uv = False)
            #sing_vals = tf.zeros([64,1])
            
            return sing_vals

        def g2():
            return tf.ones([64,1])
       #     return 1
            ### Do Nothing

        sing_vals = tf.cond(print_bool,g1,g2)


        #size = (b_size,160,128,2)

    ### Data consistency
    #img = tf.image.resize_images(img,[320,256])

    def l1():
        return img
        masks_comp = 1.0 - masks
        correct_kspace = downsample(labels, masks) + downsample(img, masks_comp)
        correct_image = upsample(correct_kspace, masks)
        return correct_image

    def l2():
        return img
        masks_comp = 1.0 - masks
        correct_kspace = downsample(labels, masks) + downsample(img, masks_comp)
        correct_image = upsample(correct_kspace, masks)
        return correct_image
        
    
    output = tf.cond(train_phase,l1,l2)


    output_layers = [output]

    new_vars = tf.global_variables()
    gen_vars = list(set(new_vars) - set(old_vars))

    print("Output shape", output.shape)
    print("Output type", type(output))

    return output, gen_vars, output_layers, mn, sd, sing_vals


def create_model(sess, features, labels, masks, architecture):
    # sess: TF sesson
    # features: input, for SR/CS it is the input image
    # labels: output, for SR/CS it is the groundtruth image
    # architecture: aec for encode-decoder, resnet for upside down 
    # Generator
    rows      = int(features.get_shape()[1])
    cols      = int(features.get_shape()[2])
    channels  = int(features.get_shape()[3])
    n_latent = 1024
    temp_zeros = tf.zeros([FLAGS.batch_size,n_latent],tf.float32)

    #print('channels', features.get_shape())

    gene_minput = tf.placeholder_with_default(features, shape=[FLAGS.batch_size, rows, cols, channels])
    label_minput = tf.placeholder_with_default(tf.zeros([FLAGS.batch_size, rows, cols, channels]), shape=[FLAGS.batch_size, rows, cols, channels])
    train_phase = tf.placeholder_with_default(True, shape=())
    z_val = tf.placeholder_with_default(temp_zeros, shape= temp_zeros.shape)
    print_bool = tf.placeholder_with_default(False, shape=())

    features = gene_minput

    architecture = 'vae' #only deal with the variational autoencoder


    # TBD: Is there a better way to instance the generator?
    if architecture == 'vae':
        function_generator = lambda x,y,z,w,t,a,p: variational_autoencoder(x,y,z,w,t,a,p)
    

    gene_var_list = []
    gene_Var_list = []
    gene_layers_list = []
    gene_mlayers_list = []
    gene_output_list = []
    gene_moutput_list = []
    mask_list = []
    mask_list_0 = []
    eta = []

    kappa = []
    nmse = []

    with tf.variable_scope('gene_layer') as scope:

        gene_output = features
        gene_moutput = gene_minput

        for i in range(FLAGS.num_iteration):

             #train
             gene_output, gene_var_list, gene_layers, mn, sd, sing_vals = function_generator(sess, gene_output, labels, masks,train_phase,z_val,print_bool)
             #gene_output, gene_var_list, gene_layers = function_generator(sess, gene_output, labels, masks,train_phase)
             gene_layers_list.append(gene_layers)
             gene_output_list.append(gene_output)
             if i == 0:
                gene_Var_list = gene_var_list

             
             scope.reuse_variables()
             
             #test
             gene_moutput, _ , gene_mlayers, mn1, sd1, sing_vals1= function_generator(sess, gene_moutput, label_minput, masks,train_phase,z_val,print_bool)
             #gene_moutput, _ , gene_mlayers = function_generator(sess, gene_moutput, label_minput, masks,train_phase)
             gene_mlayers_list.append(gene_mlayers)
             gene_moutput_list.append(gene_moutput)
             #mask_list.append(gene_mlayers[3])

             scope.reuse_variables()
             #evaluate at the groun-truth solution
             gene_moutput_0, _ , gene_mlayers_0, mn2, sd2, sing_vals2 = function_generator(sess, label_minput, label_minput, masks,train_phase,z_val,print_bool)


    #eta = tf.zeros([4,4]) #eta_1 + eta_2
                    
    #Discriminator with real data
    gene_output_complex = tf.complex(gene_output[:,:,:,0], gene_output[:,:,:,1])
    gene_output_real = tf.abs(gene_output_complex)
    gene_output_real = tf.reshape(gene_output_real, [FLAGS.batch_size, rows, cols, 1])   #gene_output

    labels_complex = tf.complex(labels[:,:,:,0], labels[:,:,:,1])
    labels_real = tf.abs(labels_complex)
    labels_real = tf.reshape(labels_real, [FLAGS.batch_size, rows, cols, 1])   #gene_output

    disc_real_input = tf.identity(labels_real, name='disc_real_input')


    # TBD: Is there a better way to instance the discriminator?
    with tf.variable_scope('disc') as scope:
        print('hybrid_disc', FLAGS.hybrid_disc)
        disc_real_output, disc_var_list, disc_layers = \
                _discriminator_model(sess, features, disc_real_input, hybrid_disc=FLAGS.hybrid_disc)

        scope.reuse_variables()

            
        disc_fake_output, _, _ = _discriminator_model(sess, features, gene_output_real, hybrid_disc=FLAGS.hybrid_disc)


    return [sing_vals,mn, sd, gene_minput, label_minput, gene_moutput, gene_moutput_list,
            gene_output, gene_output_list, gene_Var_list, gene_layers_list, gene_mlayers_list, mask_list, mask_list_0,
            disc_real_output, disc_fake_output, disc_var_list, train_phase,print_bool, z_val,disc_layers, eta, nmse, kappa]   


def create_generator_loss(disc_output, gene_output, gene_output_list, features, labels, masks,mn,sd):
    
    # Cross entropy GAN cost
    cross_entropy = tf.nn.sigmoid_cross_entropy_with_logits(logits=disc_output, labels=tf.ones_like(disc_output))
    gene_ce_loss  = tf.reduce_mean(cross_entropy, name='gene_ce_loss')

    # LS GAN cost
    ls_loss = tf.square(disc_output - tf.ones_like(disc_output))
    gene_ls_loss  = tf.reduce_mean(ls_loss, name='gene_ls_loss')

    # I.e. does the result look like the feature?
    # K = int(gene_output.get_shape()[1])//int(features.get_shape()[1])
    # assert K == 2 or K == 4 or K == 8    
    # downscaled = _downscale(gene_output, K)


    # soft data-consistency loss
    #image_size = [128, 128]
    #K=2
    gene_dc_loss = 0
    for j in range(FLAGS.num_iteration):
    	gene_dc_loss =  gene_dc_loss + tf.cast(tf.reduce_mean(tf.square(tf.abs(downsample(labels - gene_output_list[j], masks))), name='gene_dc_loss'), tf.float32)

    gene_dc_norm = tf.cast(tf.reduce_mean(tf.square(tf.abs(downsample(labels, masks))), name='gene_dc_norm'), tf.float32)
    gene_dc_loss = gene_dc_loss / (gene_dc_norm * FLAGS.num_iteration)


    #generator MSE loss summed up over different copies
    gene_l2_loss = 0
    gene_l1_loss = 0
    for j in range(FLAGS.num_iteration):

        gene_l2_loss =  gene_l2_loss + tf.cast(tf.reduce_mean(tf.square(tf.abs(gene_output_list[j] - labels)), name='gene_l2_loss'), tf.float32)
        gene_l1_loss =  gene_l2_loss + tf.cast(tf.reduce_mean(tf.abs(gene_output_list[j] - labels), name='gene_l2_loss'), tf.float32)
    
     
    '''
    # mse loss
    gene_l1_loss  = tf.cast(tf.reduce_mean(tf.abs(gene_output - labels), name='gene_l1_loss'), tf.float32)
    gene_l2_loss  = tf.cast(tf.reduce_mean(tf.square(tf.abs(gene_output - labels)), name='gene_l2_loss'), tf.float32)
    '''

    # mse loss
    gene_mse_loss = tf.add(FLAGS.gene_l1l2_factor * gene_l1_loss, 
                        (1.0 - FLAGS.gene_l1l2_factor) * gene_l2_loss, name='gene_mse_loss')


    print("GENE",gene_output)
    print("LABEL",labels)
    print("LOSS",gene_mse_loss)


    # Add in KL divergence term to enforce normal constraint

    latent_loss = tf.reduce_mean(-0.5 * tf.reduce_sum(1.0 + sd - tf.square(mn) - tf.exp(sd), 1))

    gene_mse_loss = gene_mse_loss #+ 1e-4 * latent_loss

    #ssim loss
    gene_ssim_loss = loss_DSSIS_tf11(labels, gene_output)
    gene_mixmse_loss = tf.add(FLAGS.gene_ssim_factor * gene_ssim_loss, 
                            (1.0 - FLAGS.gene_ssim_factor) * gene_mse_loss, name='gene_mixmse_loss')
    
    # generator fool descriminator loss: gan LS or log loss
    #gene_fool_loss = tf.add(FLAGS.gene_ls_factor * gene_ls_loss,
        #                   FLAGS.gene_log_factor * gene_ce_loss, name='gene_fool_loss')

    gene_fool_loss = -tf.reduce_mean(disc_output)

    # non-mse loss = fool-loss + data consisntency loss
    gene_non_mse_l2     = gene_fool_loss  #tf.add((1.0 - FLAGS.gene_dc_factor) * gene_fool_loss,
                           #FLAGS.gene_dc_factor * gene_dc_loss, name='gene_nonmse_l2')
       
    gene_mse_factor  = tf.placeholder(dtype=tf.float32, name='gene_mse_factor')

    #total loss = fool-loss + data consistency loss + mse forward-passing loss
    #gene_loss     = tf.add((1.0 - FLAGS.gene_mse_factor) * gene_non_mse_l2, 
                            #FLAGS.gene_mse_factor * gene_mixmse_loss, name='gene_loss')

    #gene_mse_factor as a parameter
    #gene_loss  = tf.add((1.0 - gene_mse_factor) * gene_non_mse_l2,
                                  #gene_mse_factor * gene_mixmse_loss, name='gene_loss')

    gene_loss_pre  = tf.add((1.0 - gene_mse_factor) * gene_non_mse_l2,
                                  gene_mse_factor * gene_mixmse_loss, name='gene_loss')

    gene_loss = tf.add(FLAGS.gene_dc_factor * gene_dc_loss,
                                  (1.0 - FLAGS.gene_dc_factor) * gene_loss_pre, name='gene_loss')

    #list of loss
    list_gene_lose = [gene_mixmse_loss, gene_mse_loss, gene_l2_loss, gene_l1_loss, gene_ssim_loss, # regression loss
                        gene_dc_loss, gene_fool_loss, gene_non_mse_l2, gene_loss]


    # log to tensorboard
    #tf.summary.scalar('gene_non_mse_loss', gene_non_mse_l2)
    tf.summary.scalar('gene_fool_loss', gene_non_mse_l2)
    tf.summary.scalar('gene_dc_loss', gene_dc_loss)
    #tf.summary.scalar('gene_ls_loss', gene_ls_loss)
    tf.summary.scalar('gene_L1_loss', gene_mixmse_loss)


    return gene_loss, gene_dc_loss, gene_fool_loss, gene_mse_loss, list_gene_lose, gene_mse_factor
    

def create_discriminator_loss(disc_real_output, disc_fake_output, real_data = None, fake_data = None):
    ls_loss_real = tf.square(disc_real_output - tf.ones_like(disc_real_output))
    disc_real_loss = tf.reduce_mean(ls_loss_real, name='disc_real_loss')

    ls_loss_fake = tf.square(disc_fake_output)
    disc_fake_loss = tf.reduce_mean(ls_loss_fake, name='disc_fake_loss')

        # log to tensorboard
    tf.summary.scalar('disc_real_loss',disc_real_loss)
    tf.summary.scalar('disc_fake_loss',disc_fake_loss)
    return disc_real_loss, disc_fake_loss
    
    
def create_optimizers(gene_loss, gene_var_list,
                      disc_loss, disc_var_list):    
    # TBD: Does this global step variable need to be manually incremented? I think so.
    global_step    = tf.Variable(0, dtype=tf.int64,   trainable=False, name='global_step')
    learning_rate  = tf.placeholder(dtype=tf.float32, name='learning_rate')
    
    gene_opti = tf.train.AdamOptimizer(learning_rate=learning_rate,
                                       beta1=FLAGS.learning_beta1,
                                       name='gene_optimizer')
    disc_opti = tf.train.AdamOptimizer(learning_rate=learning_rate,
                                       beta1=FLAGS.learning_beta1,
                                       name='disc_optimizer')
     

    gene_minimize = gene_opti.minimize(gene_loss, var_list=gene_var_list, name='gene_loss_minimize', global_step=global_step)
    
    disc_minimize = disc_opti.minimize(disc_loss, var_list=disc_var_list, name='disc_loss_minimize', global_step=global_step)
    
    return (global_step, learning_rate, gene_minimize,disc_minimize)