Example #1
import os
from collections import deque

import torch

# `ensure_dir` and `Logger` are project-local helpers assumed to be in scope.


class RLSolverBase(object):
    def __init__(self, env, model, optimizer, criterion, reward_func, config):
        super(RLSolverBase, self).__init__()
        self.config = config
        self.env = env
        self.model = model
        self.optimizer, self.criterion, self.reward_func = optimizer, criterion, reward_func
        ensure_dir(config.save_dir)
        self.logger = Logger()
        self.start_episode, self.step, self.update_step = 1, 0, 0
        self.device = torch.device('cpu')
        if config.use_cuda and torch.cuda.is_available():
            from torch.backends import cudnn
            cudnn.benchmark = True
            self.device = torch.device('cuda:0')
            self.model = self.model.to(self.device)
        self.memory = deque(maxlen=10000)

    def train_q_learning(self):
        """
        Q-learning training loop: run episodes, log results, save checkpoints.
        """
        for episode in range(self.start_episode, self.config.episode + 1):
            result = self._train_episode(episode)
            self.logger.add_entry(result)
            if episode % self.config.display_interval == 0:
                print(result)
            if episode % self.config.save_interval == 0:
                self._save_checkpoint(episode)

    def _save_checkpoint(self, episode):
        """
        save results
        """
        arch = self.model.__name__
        state = {
            'episode': episode,
            'logger': self.logger,
            'arch': arch,
            'state_dict': self.model.state_dict(),
            'optimizer': self.optimizer.state_dict()
        }
        filename = os.path.join(self.config.save_dir,
                                '{}_episode{}.pth.tar'.format(arch, episode))
        print("save checkpoint: {} ...".format(filename))
        torch.save(state, filename)
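
`train_q_learning` depends on a `_train_episode` hook that this base class leaves to subclasses. Below is a minimal sketch of one possible implementation, assuming the classic Gym `reset`/`step` API, an epsilon-greedy policy, and a `reward_func(state, action, reward, next_state, done)` signature; these, along with `config.epsilon`, `config.batch_size`, and `config.gamma`, are assumptions rather than part of the original code:

import random

class DQNSolver(RLSolverBase):
    def _train_episode(self, episode):
        state, total_reward, done = self.env.reset(), 0.0, False
        while not done:
            # epsilon-greedy action selection over the Q-network's outputs
            if random.random() < self.config.epsilon:
                action = self.env.action_space.sample()
            else:
                with torch.no_grad():
                    obs = torch.as_tensor(state, dtype=torch.float32,
                                          device=self.device).unsqueeze(0)
                    action = int(self.model(obs).argmax(dim=1).item())
            next_state, reward, done, _ = self.env.step(action)
            reward = self.reward_func(state, action, reward, next_state, done)
            self.memory.append((state, action, reward, next_state, done))
            state, total_reward = next_state, total_reward + reward
            self.step += 1
            # fit the Q-network on a random minibatch from the replay buffer
            if len(self.memory) >= self.config.batch_size:
                batch = random.sample(self.memory, self.config.batch_size)
                s, a, r, s2, d = (torch.as_tensor(x, dtype=torch.float32,
                                                  device=self.device)
                                  for x in zip(*batch))
                q = self.model(s).gather(1, a.long().unsqueeze(1)).squeeze(1)
                with torch.no_grad():
                    target = r + self.config.gamma * self.model(s2).max(1)[0] * (1 - d)
                loss = self.criterion(q, target)
                self.optimizer.zero_grad()
                loss.backward()
                self.optimizer.step()
                self.update_step += 1
        return {'episode': episode, 'reward': total_reward}
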
Example #2
from collections import OrderedDict

import numpy as np
import matplotlib.pyplot as plt

# `accuracy`, `eval_model`, the MNIST loader helpers, `model`, `loss`,
# `logger`, `root`, and `use_cuda` are assumed to be defined earlier.

metric = accuracy
train_loader = mnist_train_loader(root, 200)
val_loader = mnist_validate_loader(root, 200)
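
# Assumption (not in the original snippet): param1 and param2 are the state
# dicts of two independently trained copies of the same architecture, e.g.:
#   param1 = torch.load('run1_best.pth.tar', map_location='cpu')['state_dict']
#   param2 = torch.load('run2_best.pth.tar', map_location='cpu')['state_dict']
# The loop below evaluates the model along the straight line between them.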

for alpha in np.arange(-1.0, 2.0, 0.02):
    alpha = float(alpha)
    param = OrderedDict(
        (k, (1 - alpha) * param1[k] + alpha * param2[k]) for k in param1)
    model.load_state_dict(param)

    log = {'alpha': alpha}
    res = eval_model(model, train_loader, loss, metric, use_cuda)
    log.update({'loss': res[0], 'accuracy': res[1]})
    res = eval_model(model, val_loader, loss, metric, use_cuda)
    log.update({'val_loss': res[0], 'val_accuracy': res[1]})
    logger.add_entry(log)

x = [entry['alpha'] for entry in logger.entries.values()]
y1_train = [entry['loss'] for entry in logger.entries.values()]
y2_train = [entry['accuracy'] for entry in logger.entries.values()]
y1_val = [entry['val_loss'] for entry in logger.entries.values()]
y2_val = [entry['val_accuracy'] for entry in logger.entries.values()]
fig, ax1 = plt.subplots(figsize=(10, 10))
ax1.semilogy(x, y1_train, 'b', label='train')
ax1.semilogy(x, y1_val, 'b--', label='val')
ax1.legend(loc="best")
ax1.set_xlabel('alpha', color='b')
ax1.set_ylabel('cross_entropy', color='b')
ax2 = ax1.twinx()
ax2.plot(x, y2_train, 'r')
ax2.plot(x, y2_val, 'r--')
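
The snippet ends before labeling the accuracy axis or rendering the figure; a minimal completion (the output filename is illustrative, not from the original):

ax2.set_ylabel('accuracy', color='r')
fig.tight_layout()
fig.savefig('interpolation.png')  # or plt.show()
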
Example #3
import math
import os
import shutil

import torch

# `ensure_dir` and `Logger` are the same project-local helpers as above.


class SolverBase(object):
    def __init__(self, model, optimizer, loss, metrics, config):
        super(SolverBase, self).__init__()
        self.config = config
        ensure_dir(config.save_dir)
        self.model, self.optimizer, self.loss, self.metrics = model, optimizer, loss, metrics
        self.logger = Logger()
        self.min_loss = math.inf
        self.identity = type(model).__name__  # class name, used for filenames
        self.start_epoch = 1
        self.device = torch.device('cpu')
        if config.use_cuda and torch.cuda.is_available():
            from torch.backends import cudnn
            cudnn.benchmark = True
            self.device = torch.device('cuda:0')
            self.model.to(self.device)
        if config.resume:
            self._resume_checkpoint(config.resume)

    def train(self):
        """
        Run the training loop from start_epoch through config.epochs.
        """
        for epoch in range(self.start_epoch, self.config.epochs + 1):
            result = self._train_epoch(epoch)
            log = {'epoch': epoch}
            for key, value in result.items():
                if key == 'metrics':
                    for i, metric in enumerate(self.metrics):
                        log[metric.__name__] = result['metrics'][i]
                elif key == 'val_metrics':
                    for i, metric in enumerate(self.metrics):
                        log['val_' + metric.__name__] = result['val_metrics'][i]
                else:
                    log[key] = value

            self._save_log(log)
            # NOTE: checkpoints (and the '_best' copy) are only written every
            # `save_freq` epochs, so the true best epoch can be missed.
            if epoch % self.config.save_freq == 0:
                self._save_checkpoint(epoch, log['loss'])

    def _train_epoch(self, epoch):
        """
        Training logic for an epoch

        :param epoch: Current epoch number
        """
        raise NotImplementedError

    def _save_log(self, result):
        """
        Save the result to the logger (for plotting or printing).
        """
        self.logger.add_entry(result)
        if self.config.verbosity >= 1:
            # skip the verbose 'full_loss' entry when printing
            print({k: v for k, v in result.items()
                   if k != 'full_loss'})

    def _save_checkpoint(self, epoch, loss):
        """
        save model (include state)
        """
        if loss < self.min_loss:
            self.min_loss = loss
        arch = self.model.__name__
        state = {
            'epoch': epoch,
            'params_num': self.model.params_num(),
            'logger': self.logger,
            'arch': arch,
            'state_dict': self.model.state_dict(),
            'optimizer': {
                name: optimizer.state_dict()
                for name, optimizer in self.optimizer.items()
            } if isinstance(self.optimizer, dict) else
            self.optimizer.state_dict(),
            'min_loss': self.min_loss
        }
        filename = os.path.join(
            self.config.save_dir,
            self.identity + '_epoch{:02d}.pth.tar'.format(epoch))
        print("save checkpoint: {} ...".format(filename))
        torch.save(state, filename)
        if loss == self.min_loss:
            shutil.copyfile(
                filename,
                os.path.join(self.config.save_dir,
                             self.identity + '_best.pth.tar'))

    def _resume_checkpoint(self, resume_path):
        """
        resume training from resume_path
        """
        print("Loading checkpoint: {} ...".format(resume_path))
        checkpoint = torch.load(resume_path, map_location=self.device)
        self.start_epoch = checkpoint['epoch'] + 1
        self.min_loss = checkpoint['min_loss']
        self.model.load_state_dict(checkpoint['state_dict'])
        if isinstance(self.optimizer, dict):
            # the checkpoint stores per-optimizer state under the 'optimizer' key
            for name, state in checkpoint['optimizer'].items():
                self.optimizer[name].load_state_dict(state)
        else:
            self.optimizer.load_state_dict(checkpoint['optimizer'])
        self.logger = checkpoint['logger']
        print("Checkpoint '{}' (epoch {}) loaded".format(
            resume_path, self.start_epoch))
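
`train` expects `_train_epoch` to return a dict with `loss`, `metrics`, and `val_metrics` keys whose lists line up with `self.metrics`. A minimal sketch of a concrete subclass, assuming a single optimizer and `train_loader`/`val_loader` arguments; the loaders, their `(data, target)` batch layout, and the metric call signature are assumptions, not part of the original code:

class ClassifierSolver(SolverBase):
    def __init__(self, model, optimizer, loss, metrics, config,
                 train_loader, val_loader):
        super(ClassifierSolver, self).__init__(model, optimizer, loss,
                                               metrics, config)
        self.train_loader, self.val_loader = train_loader, val_loader

    def _train_epoch(self, epoch):
        # one optimization pass over the training set
        self.model.train()
        total_loss, sums = 0.0, [0.0] * len(self.metrics)
        for data, target in self.train_loader:
            data, target = data.to(self.device), target.to(self.device)
            self.optimizer.zero_grad()
            output = self.model(data)
            batch_loss = self.loss(output, target)
            batch_loss.backward()
            self.optimizer.step()
            total_loss += batch_loss.item()
            for i, metric in enumerate(self.metrics):
                sums[i] += metric(output, target)
        n = len(self.train_loader)

        # evaluation pass over the validation set
        self.model.eval()
        val_loss, val_sums = 0.0, [0.0] * len(self.metrics)
        with torch.no_grad():
            for data, target in self.val_loader:
                data, target = data.to(self.device), target.to(self.device)
                output = self.model(data)
                val_loss += self.loss(output, target).item()
                for i, metric in enumerate(self.metrics):
                    val_sums[i] += metric(output, target)
        m = len(self.val_loader)

        return {'loss': total_loss / n,
                'metrics': [s / n for s in sums],
                'val_loss': val_loss / m,
                'val_metrics': [s / m for s in val_sums]}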