###################################################################
    # TEST
    # plot cost
    fig = plt.figure()
    plt.semilogy(train_costs)
    plt.show(block=False)
    fig.savefig('./eval/' + eval_prefix + '/' + eval_prefix + '_cost.png')

    fig = plt.figure()
    plt.semilogy(val_errs)
    plt.show(block=False)
    fig.savefig('./eval/' + eval_prefix + '/' + eval_prefix + '_errs.png')

    # save results
    poseNet.save("./eval/{}/net_{}.pkl".format(eval_prefix, eval_prefix))
    # poseNet.load("./eval/{}/net_{}.pkl".format(eval_prefix,eval_prefix))

    # add prior to network
    cfg = HiddenLayerParams(inputDim=(batchSize, train_gt3D_embed.shape[1]),
                            outputDim=(batchSize,
                                       numpy.prod(train_gt3D.shape[1:])),
                            activation=None)
    pcalayer = HiddenLayer(rng,
                           poseNet.layers[-1].output,
                           cfg,
                           copyLayer=None,
                           layerNum=len(poseNet.layers))
    pcalayer.W.set_value(pca.components_)
    pcalayer.b.set_value(pca.mean_)
    poseNet.layers.append(pcalayer)
Пример #2
0
Файл: train.py Проект: zgq91/BB8
class Network:
    def __init__(self):
        self.type = 1  # 1 = Regressor
        self.network_model = '0'  # 0 = Tiny BB8, 1 = BB8 - VGG arch.

        self.batch_size = 128
        self.optimizer = 'MOMENTUM'
        self.learning_rate = 0.001
        self.steps = []
        self.scales = []
        self.nb_epoch = 300

        self.network = None
        self.trainer = None
        self.network_name = None
        self.save_path = './'

        self.validation_size = 5000
        self.train_set_para = None

        self.config = None
        self.nb_process = 10

    def setup_from_config(self):
        if self.config is not None:
            with open(self.config, 'r') as f:
                config = yaml.load(f)
                for key in config.keys():
                    value = config[key]
                    print('set {0} to {1}'.format(key, value))
                    setattr(self, key, value)

    def update(self):
        self.setup_from_config()
        self.print_type()

        sys.path.insert(0,
                        self.train_set_para[:self.train_set_para.rindex('/')])
        self.create_training = __import__(
            self.train_set_para[self.train_set_para.rindex('/') + 1:],
            fromlist=['init', 'pre_create_data', 'create_data', 'get_dim'])
        self.create_training.init()

        self.regressor()

    def regressor(self):

        regressorNetType = regressorNetType = int(self.network_model)
        batch_size = int(self.batch_size)
        learning_rate = float(self.learning_rate)
        optimizer = self.optimizer

        assert len(self.steps) == len(self.scales)
        n_chan, h_in, w_in, output_dim = self.create_training.get_dim()
        assert n_chan is not None
        assert h_in is not None
        assert w_in is not None
        assert output_dim is not None
        nb_training = int(self.nb_training)

        rng = np.random.RandomState(23455)
        #theano.config.compute_test_value = 'warn'
        theano.config.exception_verbosity = 'high'

        regressorNetParams = PoseRegNetParams(type=regressorNetType,
                                              n_chan=n_chan,
                                              w_in=w_in,
                                              h_in=h_in,
                                              batchSize=batch_size,
                                              output_dim=output_dim)

        self.network = PoseRegNet(rng, cfgParams=regressorNetParams)
        if regressorNetType == 1:
            self.network.load_vgg()
        print(self.network)

        regressorNetTrainingParams = PoseRegNetTrainingParams()
        regressorNetTrainingParams.batch_size = batch_size
        regressorNetTrainingParams.learning_rate = learning_rate
        if self.scales != []:
            scales = [float(s) for s in self.scales.split()]
            regressorNetTrainingParams.learning_rate_scales = scales
        if self.steps != []:
            steps = [int(s) for s in self.steps.split()]
            regressorNetTrainingParams.learning_rate_steps = steps

        regressorNetTrainingParams.optimizer = optimizer

        self.trainer = PoseRegNetTrainer(self.network,
                                         regressorNetTrainingParams, rng)

        self.trainer.setup_para(nb_training,
                                n_chan,
                                h_in,
                                w_in,
                                output_dim,
                                type='regressor')
        self.create_training.pre_create_data()

    def train(self):
        self.trainer.train(n_epochs=int(self.nb_epoch), storeFilters=True)

    def train_para(self):
        self.trainer.train_para(int(self.nb_epoch),
                                self.create_training.create_data,
                                int(self.nb_process))

    def save(self):
        if self.network_name is None:
            self.network_name += "_model"
            self.network_name += str(self.network_model)
            self.network_name += "_epoch"
            self.network_name += str(self.nb_epoch)

        self.network.save(join(self.save_path, self.network_name + ".weight"))
        f = file(join(self.save_path, self.network_name + ".cfg"), 'wb')
        cPickle.dump(self.network.cfgParams,
                     f,
                     protocol=cPickle.HIGHEST_PROTOCOL)
        f.close()

    def print_type(self):
        if int(self.type) == 1:
            print('*****************************************************')
            print('*                    REGRESSOR                      *')
            print('*****************************************************')
        else:
            assert False, 'It is not implemented'