Example #1
import datetime
import glob
import os
import pickle
import subprocess as sp

import numpy as np
import torch
import torch.optim as optim
import torchvision
from torch.autograd import Variable

# DCGAN and utils are project-local modules (not shown in this snippet)

class CelebA(object):
    """Implement DCGAN for CelebA dataset"""
    def __init__(self, train_params, ckpt_params, gan_params):
        # Training parameters
        self.root_dir = train_params['root_dir']
        self.gen_dir = train_params['gen_dir']
        self.batch_size = train_params['batch_size']
        self.train_len = train_params['train_len']
        self.learning_rate = train_params['learning_rate']
        self.momentum = train_params['momentum']
        self.optim = train_params['optim']
        self.use_cuda = train_params['use_cuda']

        # Checkpoint parameters (when, where)
        self.batch_report_interval = ckpt_params['batch_report_interval']
        self.ckpt_path = ckpt_params['ckpt_path']
        self.save_stats_interval = ckpt_params['save_stats_interval']

        # Create directories if they don't exist
        if not os.path.isdir(self.ckpt_path):
            os.mkdir(self.ckpt_path)
        if not os.path.isdir(self.gen_dir):
            os.mkdir(self.gen_dir)

        # GAN parameters
        self.gan_type = gan_params['gan_type']
        self.latent_dim = gan_params['latent_dim']
        self.n_critic = gan_params['n_critic']

        # Total number of batches per epoch (report interval should divide this)
        self.num_batches = self.train_len // self.batch_size

        # Build the model and optimizers
        self.compile()

    def compile(self):
        """Compile model (loss function, optimizers, etc.)"""

        # Create new GAN
        self.gan = DCGAN(self.gan_type, self.latent_dim, self.batch_size,
                         self.use_cuda)

        # Set optimizers for generator and discriminator
        if self.optim == 'adam':
            # Note: self.momentum holds the (beta1, beta2) tuple for Adam
            self.G_optimizer = optim.Adam(self.gan.G.parameters(),
                                          lr=self.learning_rate,
                                          betas=self.momentum)
            self.D_optimizer = optim.Adam(self.gan.D.parameters(),
                                          lr=self.learning_rate,
                                          betas=self.momentum)

        elif self.optim == 'rmsprop':
            self.G_optimizer = optim.RMSprop(self.gan.G.parameters(),
                                             lr=self.learning_rate)
            self.D_optimizer = optim.RMSprop(self.gan.D.parameters(),
                                             lr=self.learning_rate)

        else:
            raise NotImplementedError('Unsupported optimizer: {}'.format(self.optim))

        # CUDA support
        if torch.cuda.is_available() and self.use_cuda:
            self.gan = self.gan.cuda()

        # Create fixed latent variables for inference while training
        self.latent_vars = [self.gan.create_latent_var(1) for _ in range(100)]

    def save_stats(self, stats):
        """Save model statistics"""

        fname_pkl = '{}/{}-stats.pkl'.format(self.ckpt_path, self.gan_type)
        print('Saving model statistics to: {}'.format(fname_pkl))
        with open(fname_pkl, 'wb') as fp:
            pickle.dump(stats, fp)

    def eval(self, n, epoch=None, while_training=False):
        """Sample examples from generator's distribution"""

        # Evaluation mode
        self.gan.G.eval()

        # Montage size (square)
        m = int(np.sqrt(n))

        # Predict images to see progress
        for i in range(n):
            # Reuse fixed latent variables to keep random process intact
            if while_training:
                img = self.gan.generate_img(self.latent_vars[i])
            else:
                img = self.gan.generate_img()
            img = utils.unnormalize(img.squeeze())
            fname_in = '{}/test{:d}.png'.format(self.ckpt_path, i)
            torchvision.utils.save_image(img, fname_in)
        # Stitch samples into an m x m grid (requires ImageMagick's montage)
        suffix = str(epoch + 1) if epoch is not None else ''
        stack = 'montage {0}/test* -tile {1}x{1} -geometry 64x64+1+1 ' \
                '{0}/epoch{2}.png'.format(self.ckpt_path, m, suffix)
        sp.call(stack.split())
        for f in glob.glob('{}/test*'.format(self.ckpt_path)):
            os.remove(f)

    def train(self, nb_epochs, data_loader):
        """Train model on data"""

        # Initialize tracked quantities and prepare everything
        G_all_losses, D_all_losses = [], []
        utils.format_hdr(self.gan, self.root_dir, self.train_len)
        start = datetime.datetime.now()

        g_iter, d_iter = 0, 0

        # Train
        for epoch in range(nb_epochs):
            print('EPOCH {:d} / {:d}'.format(epoch + 1, nb_epochs))
            G_losses, D_losses = utils.AvgMeter(), utils.AvgMeter()
            start_epoch = datetime.datetime.now()

            avg_time_per_batch = utils.AvgMeter()
            # Mini-batch SGD
            for batch_idx, (x, _) in enumerate(data_loader):

                # Critic update ratio (WGAN heuristic: extra critic updates
                # early in training and periodically thereafter)
                if self.gan_type == 'wgan':
                    n_critic = 20 if g_iter < 50 or (g_iter + 1) % 500 == 0 \
                        else self.n_critic
                else:
                    n_critic = self.n_critic

                # Training mode
                self.gan.G.train()

                # Skip the incomplete final batch to simplify the code
                if x.size(0) != self.batch_size:
                    break
                batch_start = datetime.datetime.now()

                # Print progress bar
                utils.progress_bar(batch_idx, self.batch_report_interval,
                                   G_losses.avg, D_losses.avg)

                x = Variable(x)
                if torch.cuda.is_available() and self.use_cuda:
                    x = x.cuda()

                # Update discriminator
                D_loss, fake_imgs = self.gan.train_D(x, self.D_optimizer,
                                                     self.batch_size)
                D_losses.update(D_loss, self.batch_size)
                d_iter += 1

                # Update generator
                if batch_idx % n_critic == 0:
                    G_loss = self.gan.train_G(self.G_optimizer,
                                              self.batch_size)
                    G_losses.update(G_loss, self.batch_size)
                    g_iter += 1

                batch_end = datetime.datetime.now()
                batch_time = int(
                    (batch_end - batch_start).total_seconds() * 1000)
                avg_time_per_batch.update(batch_time)

                # Report model statistics
                if (batch_idx % self.batch_report_interval == 0 and batch_idx) or \
                        self.batch_report_interval == self.num_batches:
                    G_all_losses.append(G_losses.avg)
                    D_all_losses.append(D_losses.avg)
                    utils.show_learning_stats(batch_idx, self.num_batches,
                                              G_losses.avg, D_losses.avg,
                                              avg_time_per_batch.avg)
                    for meter in (G_losses, D_losses, avg_time_per_batch):
                        meter.reset()
                    self.eval(100, epoch=epoch, while_training=True)

                # Save stats
                if batch_idx % self.save_stats_interval == 0 and batch_idx:
                    stats = dict(G_loss=G_all_losses, D_loss=D_all_losses)
                    self.save_stats(stats)

            # Save model
            utils.clear_line()
            print('Elapsed time for epoch: {}'.format(
                utils.time_elapsed_since(start_epoch)))
            self.gan.save_model(self.ckpt_path, epoch)
            self.eval(100, epoch=epoch, while_training=True)

        # Print elapsed time
        elapsed = utils.time_elapsed_since(start)
        print('Training done! Total elapsed time: {}\n'.format(elapsed))

        return G_loss, D_loss
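A hypothetical usage sketch for the trainer above; the dictionary keys match the constructor, but every concrete value and the DataLoader setup are illustrative assumptions.

# Sketch: wiring up the CelebA trainer (all values are illustrative)
train_params = {'root_dir': 'data/celeba', 'gen_dir': 'generated',
                'batch_size': 64, 'train_len': 202599,
                'learning_rate': 2e-4, 'momentum': (0.5, 0.999),
                'optim': 'adam', 'use_cuda': True}
ckpt_params = {'batch_report_interval': 100, 'ckpt_path': 'checkpoints',
               'save_stats_interval': 500}
gan_params = {'gan_type': 'dcgan', 'latent_dim': 100, 'n_critic': 1}

model = CelebA(train_params, ckpt_params, gan_params)
# data_loader: a torch.utils.data.DataLoader yielding (image, label) batches
model.train(nb_epochs=25, data_loader=data_loader)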
Example #2
    parser.add_argument('-v', '--video', help='turn frames into video/gif',
        action='store_true')
    excl = parser.add_mutually_exclusive_group()
    excl.add_argument('-l', '--latent', metavar=('S0', 'S1'),
        help='interpolate in latent space (random seeds s0 & s1)', nargs=2, type=int)
    excl.add_argument('-s', '--screen', metavar=('S0', 'S1'),
        help='interpolate in screen space (random seeds s0 & s1)', nargs=2, type=int)
    parser.add_argument('-lp', '--latent-play', metavar='S',
        help='play in latent space', type=int)
    args = parser.parse_args()

    # Compile GAN and load model (either on CPU or GPU)
    gan = DCGAN(gan_type=args.type, use_cuda=args.cuda)
    gan.eval()
    if torch.cuda.is_available() and args.cuda:
        gan = gan.cuda()
    gan.load_model(filename=args.pretrained, use_cuda=args.cuda)

    # Make directory if it doesn't exist yet
    if not os.path.isdir(args.dir):
        os.mkdir(args.dir)

    # Create random tensors from seeds
    if args.latent or args.screen:
        s0, s1 = args.latent if args.latent else args.screen
        space = 'latent' if args.latent else 'screen'
        print('Interpolating random seeds {:d} & {:d} in {} space...'.format(s0, s1, space))
        z0 = gan.create_latent_var(1, s0)
        z1 = gan.create_latent_var(1, s1)

        # Interpolate
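The interpolation step itself is truncated above. Below is a minimal sketch of the latent branch, reusing generate_img and utils.unnormalize from Example #1; the frame count and output naming are assumptions.

import numpy as np
import torchvision
import utils  # project-local, as in Example #1

# Sketch: walk linearly from z0 to z1, rendering one frame per step
n_frames = 60  # assumption; any frame count works
for i, alpha in enumerate(np.linspace(0, 1, n_frames)):
    z = (1 - alpha) * z0 + alpha * z1  # convex combination of latent codes
    img = utils.unnormalize(gan.generate_img(z).squeeze())
    torchvision.utils.save_image(img, '{}/frame{:03d}.png'.format(args.dir, i))

The screen-space branch would instead generate the two endpoint images once and blend them pixel-wise with the same alpha schedule.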
Example #3
# Note: DCGAN is a project-local class; its import is omitted in this snippet
from utils import provide_visual_samples
from constants import use_cuda

import torch
import json

if __name__ == "__main__":

    with open('params.json') as f:
        params = json.load(f)

    objective_type = params['objective_type']
    update_ratio = params['update_ratio']
    learning_rate = params['learning_rate']
    betas = tuple(params['betas'])
    fake_input_dim = params['fake_input_dim']
    batch_size = params['batch_size']
    n_epochs = params['n_epochs']

    model = DCGAN(generator_type=params['generator_type'])

    # Load pretrained weights (expects '<model.name>.pt' in the working dir)
    model.load_state_dict(torch.load(model.name + '.pt'))

    if use_cuda:
        model = model.cuda()

    provide_visual_samples(model,
                           fake_input_dim=fake_input_dim,
                           batch_size=batch_size)
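For reference, a params.json consistent with the keys this script reads might look like the following; every value here is an illustrative assumption.

{
    "objective_type": "wgan",
    "update_ratio": 5,
    "learning_rate": 0.0002,
    "betas": [0.5, 0.999],
    "fake_input_dim": 100,
    "batch_size": 64,
    "n_epochs": 25,
    "generator_type": "dcgan"
}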
class CelebA(object):
    """Implement DCGAN for CelebA dataset"""
    def __init__(self, train_params, ckpt_params, gan_params):
        # Training parameters
        self.root_dir = train_params['root_dir']
        self.batch_size = train_params['batch_size']
        self.train_len = train_params['train_len']
        self.learning_rate = train_params['learning_rate']
        self.momentum = train_params['momentum']
        self.optim = train_params['optim']
        self.use_cuda = train_params['use_cuda']

        # Checkpoint parameters (when, where)
        self.batch_report_interval = ckpt_params['batch_report_interval']
        self.ckpt_path = ckpt_params['ckpt_path']
        self.save_stats_interval = ckpt_params['save_stats_interval']

        # Create directory if it doesn't exist
        if not os.path.isdir(self.ckpt_path):
            os.mkdir(self.ckpt_path)

        # GAN parameters
        self.gan_type = gan_params['gan_type']
        self.latent_dim = gan_params['latent_dim']
        self.n_critic = gan_params['n_critic']

        # Total number of batches per epoch (report interval should divide this)
        self.num_batches = self.train_len // self.batch_size

        self.compile()

        # Frequency weight, annealed from ~0 to 1 over training (see train())
        self.freq_weight = 0

    def compile(self):
        """Compile model (loss function, optimizers, etc.)"""

        # Create new GAN
        self.gan = DCGAN(self.gan_type, self.latent_dim, self.batch_size,
                         self.use_cuda)

        # Set optimizers for generator and discriminator
        if self.optim == 'adam':
            # Note: self.momentum holds the (beta1, beta2) tuple for Adam
            self.G_optimizer = optim.Adam(self.gan.G.parameters(),
                                          lr=self.learning_rate,
                                          betas=self.momentum)
            self.D_optimizer = optim.Adam(self.gan.D.parameters(),
                                          lr=self.learning_rate,
                                          betas=self.momentum)

        elif self.optim == 'rmsprop':
            self.G_optimizer = optim.RMSprop(self.gan.G.parameters(),
                                             lr=self.learning_rate)
            self.D_optimizer = optim.RMSprop(self.gan.D.parameters(),
                                             lr=self.learning_rate)

        else:
            raise NotImplementedError('Unsupported optimizer: {}'.format(self.optim))

        # CUDA support
        if torch.cuda.is_available() and self.use_cuda:
            self.gan = self.gan.cuda()

    def save_stats(self, stats):
        """Save model statistics"""

        fname_pkl = '{}/{}-stats.pkl'.format(self.ckpt_path, self.gan_type)
        print('Saving model statistics to: {}'.format(fname_pkl))
        with open(fname_pkl, 'wb') as fp:
            pickle.dump(stats, fp)

    def test(self, epoch):
        """Generate samples from the generator checkpoint of a given epoch"""
        fname_gen_pt = '{}/{}-gen-epoch-{}.pt'.format(self.ckpt_path,
                                                      self.gan_type, epoch + 1)
        self.gan.load_model(fname_gen_pt)

        directory = '{}/testing/{}'.format(self.ckpt_path, epoch + 1)
        if not os.path.exists(directory):
            os.makedirs(directory)

        # Evaluation mode
        self.gan.G.eval()
        # Generate and save n samples
        n = 10000
        for i in range(n):
            img = self.gan.generate_img()
            img = utils.unnormalize(img.squeeze())
            fname_in = '{}/{:d}_test.png'.format(directory, i)
            torchvision.utils.save_image(img, fname_in)

    def train(self, nb_epochs, data_loader):
        """Train model on data"""

        # Initialize tracked quantities and prepare everything
        G_all_losses, D_all_losses = [], []
        utils.format_hdr(self.gan, self.root_dir, self.train_len)
        start = datetime.datetime.now()

        g_iter, d_iter = 0, 0

        # Train
        for epoch in range(nb_epochs):
            print('EPOCH {:d} / {:d}'.format(epoch + 1, nb_epochs))
            G_losses, D_losses = utils.AvgMeter(), utils.AvgMeter()
            start_epoch = datetime.datetime.now()

            avg_time_per_batch = utils.AvgMeter()
            # Mini-batch SGD
            for batch_idx, (x, _) in enumerate(data_loader):

                # Critic update ratio (WGAN heuristic: extra critic updates
                # early in training and periodically thereafter)
                if self.gan_type == 'wgan':
                    n_critic = 20 if g_iter < 50 or (g_iter + 1) % 500 == 0 \
                        else self.n_critic
                else:
                    n_critic = self.n_critic

                # Training mode
                self.gan.G.train()

                # Skip the incomplete final batch to simplify the code
                if x.size(0) != self.batch_size:
                    break
                batch_start = datetime.datetime.now()

                # Print progress bar
                utils.progress_bar(batch_idx, self.batch_report_interval,
                                   G_losses.avg, D_losses.avg)

                x = Variable(x)
                if torch.cuda.is_available() and self.use_cuda:
                    x = x.cuda()

                # Anneal frequency weight linearly over epochs
                self.freq_weight = (epoch + 1) / nb_epochs
                # Update discriminator
                D_loss, fake_imgs = self.gan.train_D(x, self.freq_weight,
                                                     self.D_optimizer,
                                                     self.batch_size)
                D_losses.update(D_loss, self.batch_size)
                d_iter += 1

                # Update generator
                if batch_idx % n_critic == 0:
                    G_loss = self.gan.train_G(self.freq_weight,
                                              self.G_optimizer,
                                              self.batch_size)
                    G_losses.update(G_loss, self.batch_size)
                    g_iter += 1

                batch_end = datetime.datetime.now()
                batch_time = int(
                    (batch_end - batch_start).total_seconds() * 1000)
                avg_time_per_batch.update(batch_time)

                # Report model statistics
                if (batch_idx % self.batch_report_interval == 0 and batch_idx) or \
                        self.batch_report_interval == self.num_batches:
                    G_all_losses.append(G_losses.avg)
                    D_all_losses.append(D_losses.avg)
                    utils.show_learning_stats(batch_idx, self.num_batches,
                                              G_losses.avg, D_losses.avg,
                                              avg_time_per_batch.avg)
                    for meter in (G_losses, D_losses, avg_time_per_batch):
                        meter.reset()

                # Save stats
                if batch_idx % self.save_stats_interval == 0 and batch_idx:
                    stats = dict(G_loss=G_all_losses, D_loss=D_all_losses)
                    self.save_stats(stats)

            # Save model
            utils.clear_line()
            print('Elapsed time for epoch: {}'.format(
                utils.time_elapsed_since(start_epoch)))
            self.gan.save_model(self.ckpt_path, epoch, False)
            # Generate test samples from this epoch's checkpoint
            self.test(epoch)

        # Print elapsed time
        elapsed = utils.time_elapsed_since(start)
        print('Training done! Total elapsed time: {}\n'.format(elapsed))

        return G_loss, D_loss
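Both trainers lean on utils.AvgMeter for running averages. Below is a minimal sketch consistent with how it is called here (update(val, n), .avg, .reset()); the real project-local class may differ.

class AvgMeter(object):
    """Running-average tracker (sketch; actual utils.AvgMeter may differ)"""
    def __init__(self):
        self.reset()

    def reset(self):
        self.sum, self.count, self.avg = 0.0, 0, 0.0

    def update(self, val, n=1):
        # Accumulate a value observed over n samples
        self.sum += val * n
        self.count += n
        self.avg = self.sum / self.count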