def __init__(self, imH=128, imW=416, pyramid_layer_num=5, max_itr_num=20):
    """Set up the direct-VO module: helper layers plus per-level pixel grids.

    Args:
        imH, imW: input image height/width at the finest pyramid level.
        pyramid_layer_num: number of pyramid levels to build.
        max_itr_num: default cap on LK iterations (stored for later use).
    """
    super(DirectVO, self).__init__()
    self.max_itr_num = max_itr_num
    self.imH = imH
    self.imW = imW
    self.pyramid_layer_num = pyramid_layer_num

    # Helper sub-modules used throughout the optimisation.
    self.twist2mat_batch_func = Twist2Mat()
    self.img_gradient_func = GradientLayer()
    self.pyramid_func = ImagePyramidLayer(
        chan=3, pyramid_layer_num=self.pyramid_layer_num)
    self.laplacian_func = LaplacianLayer()

    # Per-level pixel coordinate grids, registered as buffers so they move
    # with the module across devices but are not trained.
    x_pyramid, y_pyramid = self.pyramid_func.get_coords(self.imH, self.imW)
    for level in range(self.pyramid_layer_num):
        x_buf = torch.from_numpy(x_pyramid[level]).float()
        y_buf = torch.from_numpy(y_pyramid[level]).float()
        self.register_buffer('x_' + str(level), x_buf)
        self.register_buffer('y_' + str(level), y_buf)

    # Reusable constants: a zero scalar and the 3x3 identity.
    self.register_buffer('o', torch.zeros(1, 1))
    self.register_buffer('E', torch.eye(3))
def __init__(self, img_size=None, smooth_term='lap'):
    """Build the LKVO kernel: depth network plus direct-VO pose solver.

    Args:
        img_size: [height, width] of the input frames; defaults to
            [128, 416]. Uses a ``None`` sentinel instead of a mutable list
            default, which would be shared across all instances.
        smooth_term: name of the smoothness cost to use (e.g. 'lap').
    """
    super(LKVOKernel, self).__init__()
    if img_size is None:
        img_size = [128, 416]
    self.img_size = img_size
    self.fliplr_func = FlipLR(imW=img_size[1], dim_w=3)
    self.vo = DirectVO(imH=img_size[0], imW=img_size[1],
                       pyramid_layer_num=5)
    self.depth_net = VggDepthEstimator(img_size)
    # Single-channel pyramid; presumably for (inverse) depth maps —
    # TODO(review): confirm against callers.
    self.pyramid_func = ImagePyramidLayer(chan=1, pyramid_layer_num=5)
    self.smooth_term = smooth_term
def __init__(self, img_size=None, smooth_term='lap', use_expl_mask=False):
    """Build the SfM kernel: depth network, pose network, and VO helper.

    Args:
        img_size: [height, width] of the input frames; defaults to
            [128, 416]. Uses a ``None`` sentinel instead of a mutable list
            default, which would be shared across all instances.
        smooth_term: name of the smoothness cost to use (e.g. 'lap').
        use_expl_mask: if True, use ``PoseExpNet`` (pose + explainability
            mask) instead of the plain ``PoseNet``.
    """
    super(SfMKernel, self).__init__()
    if img_size is None:
        img_size = [128, 416]
    self.img_size = img_size
    self.fliplr_func = FlipLR(imW=img_size[1], dim_w=3)
    self.vo = DirectVO(imH=img_size[0], imW=img_size[1],
                       pyramid_layer_num=4)
    self.depth_net = VggDepthEstimator(img_size)
    if use_expl_mask:
        self.pose_net = PoseExpNet(3)
    else:
        self.pose_net = PoseNet(3)
    # Single-channel pyramid; presumably for (inverse) depth maps —
    # TODO(review): confirm against callers.
    self.pyramid_func = ImagePyramidLayer(chan=1, pyramid_layer_num=4)
    self.smooth_term = smooth_term
    self.use_expl_mask = use_expl_mask
class DirectVO(nn.Module):
    """Direct visual odometry via coarse-to-fine inverse-compositional
    Lucas-Kanade alignment.

    The module precomputes, per pyramid level, the normalized pixel grid,
    reference image gradients, and the LK Jacobian/Hessian terms
    (``init_lk_terms``), then iteratively regresses a 6-DoF twist update
    (``LKregress``) and warps source frames toward the reference frame
    (``warp_batch_func``).  It also provides several photometric and
    depth-smoothness losses used for training.

    NOTE(review): the original file was whitespace-mangled; indentation here
    is reconstructed from the code's semantics.
    """

    def __init__(self, imH=128, imW=416, pyramid_layer_num=5, max_itr_num=20):
        """Create helper layers and register per-level coordinate buffers."""
        super(DirectVO, self).__init__()
        self.max_itr_num = max_itr_num
        self.imH = imH
        self.imW = imW
        self.pyramid_layer_num = pyramid_layer_num
        # Helper sub-modules: twist -> rotation matrix, image gradients,
        # image pyramid construction, and a Laplacian filter.
        self.twist2mat_batch_func = Twist2Mat()
        self.img_gradient_func = GradientLayer()
        self.pyramid_func = ImagePyramidLayer(
            chan=3, pyramid_layer_num=self.pyramid_layer_num)
        self.laplacian_func = LaplacianLayer()
        # Per-level pixel coordinate grids; buffers so they follow the
        # module's device but are not trained.
        x_pyramid, y_pyramid = self.pyramid_func.get_coords(self.imH, self.imW)
        for i in range(self.pyramid_layer_num):
            self.register_buffer('x_' + str(i),
                                 torch.from_numpy(x_pyramid[i]).float())
            self.register_buffer('y_' + str(i),
                                 torch.from_numpy(y_pyramid[i]).float())
        # Reusable constants: zero scalar and 3x3 identity.
        self.register_buffer('o', torch.zeros(1, 1))
        self.register_buffer('E', torch.eye(3))

    def setCamera(self, cx, cy, fx, fy):
        """Store pinhole intrinsics (principal point cx,cy; focals fx,fy)."""
        self.camparams = dict(fx=fx, fy=fy, cx=cx, cy=cy)

    def init(self, ref_frame_pyramid, inv_depth_pyramid):
        """Bind the reference frame/inverse-depth pyramids and precompute
        the LK terms.  Each reference frame is expected as 3 x H x W and
        must match the spatial size of the inverse depth at every level.
        """
        assert (self.pyramid_layer_num == len(inv_depth_pyramid))
        self.inv_depth_pyramid = inv_depth_pyramid
        self.ref_frame_pyramid = ref_frame_pyramid
        for i in range(self.pyramid_layer_num):
            assert (self.ref_frame_pyramid[i].size(-1)
                    == inv_depth_pyramid[i].size(-1))
            assert (self.ref_frame_pyramid[i].size(-2)
                    == inv_depth_pyramid[i].size(-2))
        self.init_lk_terms()

    def init_lk_terms(self):
        """Precompute, per level: normalized camera coordinates, reference
        image gradients (scaled by level focal length), the Jacobian dI/dp,
        and invH * dIdp^T used by the Gauss-Newton step in ``LKregress``.
        Requires ``setCamera`` and ``init`` to have been called.
        """
        self.xy_pyramid = []
        self.ref_imgrad_x_pyramid = []
        self.ref_imgrad_y_pyramid = []
        self.invH_pyramid = []
        self.dIdp_pyramid = []
        self.invH_dIdp_pyramid = []
        for i in range(self.pyramid_layer_num):
            _, h, w = self.ref_frame_pyramid[i].size()
            # Normalized camera coordinates: (u - cx) / fx, (v - cy) / fy.
            x = (Variable(getattr(self, 'x_' + str(i)))
                 - self.camparams['cx']) / self.camparams['fx']
            y = (Variable(getattr(self, 'y_' + str(i)))
                 - self.camparams['cy']) / self.camparams['fy']
            X, Y = meshgrid(x, y)
            # 2 x N stack of all pixel coordinates at this level.
            xy = torch.cat((X.view(1, X.numel()), Y.view(1, Y.numel())), 0)
            self.xy_pyramid.append(xy)
            # Image gradients of the reference frame, rescaled by the
            # per-level focal length (fx / 2**i, fy / 2**i).
            imgrad_x, imgrad_y = self.img_gradient_func(
                self.ref_frame_pyramid[i])
            self.ref_imgrad_x_pyramid.append(imgrad_x
                                             * (self.camparams['fx'] / 2**i))
            self.ref_imgrad_y_pyramid.append(imgrad_y
                                             * (self.camparams['fy'] / 2**i))
            # Precompute terms for the LK regression step.
            dIdp = self.compute_dIdp(self.ref_imgrad_x_pyramid[i],
                                     self.ref_imgrad_y_pyramid[i],
                                     self.inv_depth_pyramid[i],
                                     self.xy_pyramid[i])
            self.dIdp_pyramid.append(dIdp)
            # Gauss-Newton normal equations: invH = (J^T J)^-1.
            invH = inv(dIdp.t().mm(dIdp))
            self.invH_pyramid.append(invH)
            self.invH_dIdp_pyramid.append(invH.mm(dIdp.t()))

    def init_xy_pyramid(self, ref_frames_pyramid):
        """Compute only the normalized coordinate pyramid (no gradients or
        LK terms); lighter-weight companion to ``init_lk_terms``.
        """
        self.xy_pyramid = []
        self.ref_imgrad_x_pyramid = []
        self.ref_imgrad_y_pyramid = []
        for i in range(self.pyramid_layer_num):
            _, h, w = ref_frames_pyramid[i].size()
            x = (Variable(getattr(self, 'x_' + str(i)))
                 - self.camparams['cx']) / self.camparams['fx']
            y = (Variable(getattr(self, 'y_' + str(i)))
                 - self.camparams['cy']) / self.camparams['fy']
            X, Y = meshgrid(x, y)
            xy = torch.cat((X.view(1, X.numel()), Y.view(1, Y.numel())), 0)
            self.xy_pyramid.append(xy)

    def compute_dIdp(self, imgrad_x, imgrad_y, inv_depth, xy):
        """Build the (k*N) x 6 Jacobian of image intensity w.r.t. the 6-DoF
        pose parameters (3 rotation + 3 translation), via the chain rule:
        dI/dp = dI/dx * dx/dp + dI/dy * dy/dp.

        Args:
            imgrad_x, imgrad_y: k x h x w image gradients.
            inv_depth: inverse depth at each pixel.
            xy: 2 x N normalized pixel coordinates (N == h * w).
        """
        k, h, w = imgrad_x.size()
        _, pt_num = xy.size()
        assert (h * w == pt_num)
        feat_dim = pt_num * k
        x = xy[0, :].view(pt_num, 1)
        y = xy[1, :].view(pt_num, 1)
        xty = x * y
        # Column of zeros, broadcast from the registered zero buffer.
        O = Variable(self.o).expand(pt_num, 1)
        inv_depth_ = inv_depth.view(pt_num, 1)
        # Analytic derivatives of the projected coordinates w.r.t. the
        # twist parameters (rotation first, then translation).
        dxdp = torch.cat(
            (-xty, 1 + x**2, -y, inv_depth_, O, -inv_depth_.mul(x)), 1)
        dydp = torch.cat(
            (-1 - y**2, xty, x, O, inv_depth_, -inv_depth_.mul(y)), 1)
        imgrad_x_ = imgrad_x.view(feat_dim, 1).expand(feat_dim, 6)
        imgrad_y_ = imgrad_y.view(feat_dim, 1).expand(feat_dim, 6)
        dIdp = imgrad_x_.mul(dxdp.repeat(k, 1)) + \
            imgrad_y_.mul(dydp.repeat(k, 1))
        return dIdp

    def LKregress(self, invH_dIdp, mask, It):
        """One Gauss-Newton step: dp = (J^T J)^-1 J^T * (mask * It).

        Args:
            invH_dIdp: precomputed 6 x (k * pt_num) matrix from
                ``init_lk_terms``.
            mask: batch_size x pt_num validity mask.
            It: batch temporal (photometric) error, batch_size x k x pt_num.

        Returns:
            batch_size x 6 pose update.
        """
        batch_size, pt_num = mask.size()
        _, k, _ = It.size()
        feat_dim = k * pt_num
        invH_dIdp_ = invH_dIdp.view(1, 6, feat_dim).expand(batch_size, 6,
                                                           feat_dim)
        mask_ = mask.view(batch_size, 1, pt_num).expand(batch_size, k, pt_num)
        # (A commented-out Huber-weighted variant existed here; plain
        # masked least squares is what is actually used.)
        dp = invH_dIdp_.bmm((mask_ * It).view(batch_size, feat_dim, 1))
        return dp.view(batch_size, 6)

    def warp_batch(self, img_batch, level_idx, R_batch, t_batch):
        """Warp ``img_batch`` using the stored reference inverse depth at
        ``level_idx``; thin wrapper around ``warp_batch_func``.
        """
        return self.warp_batch_func(img_batch,
                                    self.inv_depth_pyramid[level_idx],
                                    level_idx, R_batch, t_batch)

    def warp_batch_func(self, img_batch, inv_depth, level_idx, R_batch,
                        t_batch):
        """Warp a batch of images into the reference view.

        Projects the reference pixels through (R, t) with the given inverse
        depth, then bilinearly samples ``img_batch`` at the warped
        locations.

        Returns:
            (sampled pixels, in-view mask); the mask also zeroes points
            whose projected depth is not strictly positive.
        """
        batch_size, k, h, w = img_batch.size()
        xy = self.xy_pyramid[level_idx]
        _, N = xy.size()
        # xyz = R * [x; y; 1] + t * inv_depth  (homogeneous transform with
        # the inverse-depth parameterization, split to avoid building the
        # explicit ones-row).
        xyz = R_batch[:, :, 0:2].bmm(xy.view(1, 2, N).expand(batch_size, 2, N))\
            + R_batch[:, :, 2:3].expand(batch_size, 3, N)\
            + t_batch.view(batch_size, 3, 1).expand(batch_size, 3, N) \
            * inv_depth.view(-1, 1, N).expand(batch_size, 3, N)
        # Clamp depth away from zero before the perspective divide.
        z = xyz[:, 2:3, :].clamp(min=1e-10)
        xy_warp = xyz[:, 0:2, :] / z.expand(batch_size, 2, N)
        # Back to pixel coordinates, expressed as an offset from the level's
        # pixel grid and rescaled to this pyramid level.
        u_warp = (
            (xy_warp[:, 0, :] * self.camparams['fx'] + self.camparams['cx'])
            - getattr(self, 'x_' + str(level_idx))[0]).view(batch_size, N) \
            / 2**level_idx
        v_warp = (
            (xy_warp[:, 1, :] * self.camparams['fy'] + self.camparams['cy'])
            - getattr(self, 'y_' + str(level_idx))[0]).view(batch_size, N) \
            / 2**level_idx
        Q, in_view_mask = grid_bilinear_sampling(img_batch, u_warp, v_warp)
        return Q, in_view_mask * (z.view_as(in_view_mask) > 1e-10).float()

    def compute_phtometric_loss(self, ref_frames_pyramid, src_frames_pyramid,
                                ref_inv_depth_pyramid, src_inv_depth_pyramid,
                                rot_mat_batch, trans_batch,
                                use_ssim=True, levels=None,
                                ref_expl_mask_pyramid=None,
                                src_expl_mask_pyramid=None):
        """Bidirectional photometric loss between reference and source
        frames (L1 on color, optionally blended with SSIM at the finest
        level), masked by visibility and optional explainability masks.

        NOTE(review): name keeps the original "phtometric" spelling for
        caller compatibility.
        NOTE(review): the pyramid lists below are built in the order of
        ``levels`` but later indexed by ``level_idx`` — this only lines up
        when ``levels`` is a prefix range starting at 0; confirm callers.
        """
        bundle_size = rot_mat_batch.size(0) + 1
        # Inverse transforms, for warping in the opposite direction.
        inv_rot_mat_batch, inv_trans_batch = inv_rigid_transformation(
            rot_mat_batch, trans_batch)
        src_pyramid = []
        ref_pyramid = []
        depth_pyramid = []
        if levels is None:
            levels = range(self.pyramid_layer_num)
        use_expl_mask = not (ref_expl_mask_pyramid is None \
            or src_expl_mask_pyramid is None)
        if use_expl_mask:
            expl_mask_pyramid = []
            for level_idx in levels:
                ref_mask = ref_expl_mask_pyramid[level_idx].unsqueeze(
                    0).repeat(bundle_size - 1, 1, 1)
                src_mask = src_expl_mask_pyramid[level_idx]
                expl_mask_pyramid.append(torch.cat((ref_mask, src_mask), 0))
        # Basically loops over the number of pyramid levels (5 by default).
        for level_idx in levels:
            ref_frame = ref_frames_pyramid[level_idx].unsqueeze(0).repeat(
                bundle_size - 1, 1, 1, 1)
            src_frame = src_frames_pyramid[level_idx]
            ref_depth = ref_inv_depth_pyramid[level_idx].unsqueeze(0).repeat(
                bundle_size - 1, 1, 1)
            src_depth = src_inv_depth_pyramid[level_idx]
            # Concatenate both directions (ref->src and src->ref) so one
            # warp call handles forward and backward consistency; pixel
            # values are scaled by 1/127.5 (maps [0,255] to [0,2]).
            ref_pyramid.append(torch.cat((ref_frame, src_frame), 0) / 127.5)
            src_pyramid.append(torch.cat((src_frame, ref_frame), 0) / 127.5)
            depth_pyramid.append(torch.cat((ref_depth, src_depth), 0))
        # Stack forward and inverse transforms to match the concatenation.
        rot_mat = torch.cat((rot_mat_batch, inv_rot_mat_batch), 0)
        trans = torch.cat((trans_batch, inv_trans_batch), 0)
        loss = 0
        frames_warp_pyramid = []
        ref_frame_warp_pyramid = []
        for level_idx in levels:
            _, h, w = depth_pyramid[level_idx].size()
            warp_img, in_view_mask = self.warp_batch_func(
                src_pyramid[level_idx], depth_pyramid[level_idx], level_idx,
                rot_mat, trans)
            warp_img = warp_img.view((bundle_size - 1) * 2, IMG_CHAN, h, w)
            if use_expl_mask:
                mask = in_view_mask.view(-1, h,
                                         w) * expl_mask_pyramid[level_idx]
            else:
                mask = in_view_mask
            mask_expand = mask.view((bundle_size - 1) * 2, 1, h, w).expand(
                (bundle_size - 1) * 2, IMG_CHAN, h, w)
            # Masked L1 photometric error.
            rgb_loss = ((ref_pyramid[level_idx] - warp_img).abs()
                        * mask_expand).mean()
            if use_ssim and level_idx < 1:
                # SSIM only at the finest level; blended 85/15 with L1.
                warp_mu, warp_sigma = compute_img_stats(warp_img)
                ref_mu, ref_sigma = compute_img_stats(ref_pyramid[level_idx])
                ssim = compute_SSIM(ref_pyramid[level_idx], ref_mu, ref_sigma,
                                    warp_img, warp_mu, warp_sigma)
                # SSIM output is cropped by 1 pixel on each border, hence
                # the [1:-1, 1:-1] slice of the mask.
                ssim_loss = (ssim * mask_expand[:, :, 1:-1, 1:-1]).mean()
                loss += .85 * ssim_loss + .15 * rgb_loss
            else:
                loss += rgb_loss
        return loss

    def compute_smoothness_cost(self, inv_depth):
        """Mean absolute Laplacian of the inverse depth."""
        x = self.laplacian_func(inv_depth)
        return x.mean()

    def compute_image_aware_laplacian_smoothness_cost(self, depth, img):
        """Depth Laplacian weighted down where the image (scaled by 1/255)
        has strong second-order structure (edge-aware smoothness).
        """
        img_lap = self.laplacian_func(img / 255, do_normalize=False)
        depth_lap = self.laplacian_func(depth, do_normalize=False)
        x = (-img_lap.mean(1)).exp() * (depth_lap)
        return x.mean()

    def compute_image_aware_2nd_smoothness_cost(self, depth, img):
        """Mean absolute second-order depth gradients (xx, xy, yx, yy).

        NOTE(review): ``img_lap`` is computed but never used, so despite
        the name this cost is NOT image-aware — confirm intent.
        """
        img_lap = self.laplacian_func(img / 255, do_normalize=False)
        depth_grad_x, depth_grad_y = gradient(depth, do_normalize=False)
        depth_grad_x2, depth_grad_xy = gradient(depth_grad_x,
                                                do_normalize=False)
        depth_grad_yx, depth_grad_y2 = gradient(depth_grad_y,
                                                do_normalize=False)
        return depth_grad_x2.abs().mean() \
            + depth_grad_xy.abs().mean() + depth_grad_yx.abs().mean() \
            + depth_grad_y2.abs().mean()

    def compute_image_aware_1st_smoothness_cost(self, depth, img):
        """First-order depth smoothness weighted by exp(-|image gradient|),
        handling both unbatched (dim()==3) and batched inputs.
        """
        depth_grad_x, depth_grad_y = gradient(depth, do_normalize=False)
        img_grad_x, img_grad_y = gradient(img / 255, do_normalize=False)
        if img.dim() == 3:
            # Unbatched: average image gradients over the channel axis.
            weight_x = torch.exp(-img_grad_x.abs().mean(0))
            weight_y = torch.exp(-img_grad_y.abs().mean(0))
            cost = ((depth_grad_x.abs() * weight_x)[:-1, :]
                    + (depth_grad_y.abs() * weight_y)[:, :-1]).mean()
        else:
            # Batched: channel axis is dim 1.
            weight_x = torch.exp(-img_grad_x.abs().mean(1))
            weight_y = torch.exp(-img_grad_y.abs().mean(1))
            cost = ((depth_grad_x.abs() * weight_x)[:, :-1, :]
                    + (depth_grad_y.abs() * weight_y)[:, :, :-1]).mean()
        return cost

    def multi_scale_smoothness_cost(self, inv_depth_pyramid, levels=None):
        """Sum of plain Laplacian smoothness costs over pyramid levels,
        each attenuated by 1 / 2**level.
        """
        cost = 0
        if levels is None:
            levels = range(self.pyramid_layer_num)
        for level_idx in levels:
            inv_depth = inv_depth_pyramid[level_idx]
            if inv_depth.dim() == 4:
                # Drop a singleton channel dimension if present.
                inv_depth = inv_depth.squeeze(1)
            cost += self.compute_smoothness_cost(inv_depth) / (2**level_idx)
        return cost

    def multi_scale_image_aware_smoothness_cost(self, inv_depth_pyramid,
                                                img_pyramid, levels=None,
                                                type='lap'):
        """Sum of image-aware smoothness costs over pyramid levels,
        attenuated by 1 / 2**level.

        Args:
            type: 'lap', '1st', or '2nd' — which cost variant to use.
                (Parameter name shadows the ``type`` builtin; kept for
                caller compatibility.)

        NOTE(review): for an unrecognized ``type`` this only prints and
        then adds a stale/undefined ``c`` — likely a latent NameError.
        """
        cost = 0
        if levels is None:
            levels = range(self.pyramid_layer_num)
        for level_idx in levels:
            inv_depth = inv_depth_pyramid[level_idx]
            if inv_depth.dim() == 4:
                inv_depth = inv_depth.squeeze(1)
            if type == 'lap':
                c = self.compute_image_aware_laplacian_smoothness_cost(
                    inv_depth, img_pyramid[level_idx])
            elif type == '1st':
                c = self.compute_image_aware_1st_smoothness_cost(
                    inv_depth, img_pyramid[level_idx])
            elif type == '2nd':
                c = self.compute_image_aware_2nd_smoothness_cost(
                    inv_depth, img_pyramid[level_idx])
            else:
                print("%s not implemented!" % (type))
            cost += (c / (2**level_idx))
        return cost

    def update(self, frames_pyramid, max_itr_num=10):
        """Coarse-to-fine LK pose estimation starting from identity.

        Iterates from the coarsest to the finest level; at each level runs
        up to ``max_itr_num`` Gauss-Newton iterations, accepting updates
        per frame only when they reduce the photometric cost.

        Returns:
            (rot_mat_batch, trans_batch, frames_pyramid).
        """
        frame_num, k, h, w = frames_pyramid[0].size()
        # Start from identity rotation and zero translation; *_prev hold
        # the last state to roll back to when an iteration diverges.
        trans_batch = Variable(self.o).expand(frame_num, 3).contiguous()
        trans_batch_prev = Variable(self.o).expand(frame_num, 3).contiguous()
        rot_mat_batch = Variable(self.E).unsqueeze(0).expand(frame_num, 3,
                                                             3).contiguous()
        rot_mat_batch_prev = Variable(self.E).unsqueeze(0).expand(
            frame_num, 3, 3).contiguous()
        pixel_warp = []
        in_view_mask = []
        cur_time = timer()
        for level_idx in range(self.pyramid_layer_num - 1, -1, -1):
            # Per-frame best cost so far at this level (init very large).
            max_photometric_cost = self.o.squeeze().expand(frame_num) + 10000
            for i in range(max_itr_num):
                pixel_warp, in_view_mask = self.warp_batch(
                    frames_pyramid[level_idx], level_idx, rot_mat_batch,
                    trans_batch)
                # Temporal gradient: warped source minus reference.
                temporal_grad = pixel_warp - self.ref_frame_pyramid[
                    level_idx].view(3, -1).unsqueeze(0).expand_as(pixel_warp)
                photometric_cost, min_perc_in_view = \
                    compute_photometric_cost_norm(temporal_grad.data,
                                                  in_view_mask.data)
                # Abort the level if too few pixels remain in view.
                if min_perc_in_view < .5:
                    break
                if (photometric_cost < max_photometric_cost).max() > 0:
                    # At least one frame improved: remember the current
                    # state and compute a new incremental update.
                    trans_batch_prev = trans_batch
                    rot_mat_batch_prev = rot_mat_batch
                    dp = self.LKregress(
                        invH_dIdp=self.invH_dIdp_pyramid[level_idx],
                        mask=in_view_mask, It=temporal_grad)
                    # Inverse-compositional update: apply the negated twist.
                    d_rot_mat_batch = self.twist2mat_batch_func(-dp[:, 0:3])
                    trans_batch_new = d_rot_mat_batch.bmm(
                        trans_batch.view(frame_num, 3,
                                         1)).view(frame_num, 3) - dp[:, 3:6]
                    rot_mat_batch_new = d_rot_mat_batch.bmm(rot_mat_batch)
                    trans_list = []
                    rot_list = []
                    # Per-frame accept/reject of the new pose.
                    # NOTE(review): loop variable ``k`` shadows the channel
                    # count unpacked above.
                    for k in range(frame_num):
                        if photometric_cost[k] < max_photometric_cost[k]:
                            rot_list.append(rot_mat_batch_new[k:k + 1, :, :])
                            trans_list.append(trans_batch_new[k:k + 1, :])
                            max_photometric_cost[k] = photometric_cost[k]
                        else:
                            rot_list.append(rot_mat_batch[k:k + 1, :, :])
                            trans_list.append(trans_batch[k:k + 1, :])
                    rot_mat_batch = torch.cat(rot_list, 0)
                    trans_batch = torch.cat(trans_list, 0)
                else:
                    break
            # Roll back to the last recorded state for this level.
            # NOTE(review): this also discards the final accepted update of
            # the level — confirm this is the intended behavior.
            rot_mat_batch = rot_mat_batch_prev
            trans_batch = trans_batch_prev
        return rot_mat_batch, trans_batch, frames_pyramid

    def update_with_init_pose(self, frames_pyramid, rot_mat_batch,
                              trans_batch, max_itr_num=10):
        """Same coarse-to-fine LK refinement as ``update`` but starting
        from a caller-supplied initial pose; uses the transposed-twist form
        for the incremental rotation.

        Returns:
            (rot_mat_batch, trans_batch).
        """
        frame_num, k, h, w = frames_pyramid[0].size()
        trans_batch_prev = trans_batch
        rot_mat_batch_prev = rot_mat_batch
        pixel_warp = []
        in_view_mask = []
        cur_time = timer()
        for level_idx in range(len(frames_pyramid) - 1, -1, -1):
            max_photometric_cost = self.o.squeeze().expand(frame_num) + 10000
            for i in range(max_itr_num):
                pixel_warp, in_view_mask = self.warp_batch(
                    frames_pyramid[level_idx], level_idx, rot_mat_batch,
                    trans_batch)
                temporal_grad = pixel_warp - self.ref_frame_pyramid[
                    level_idx].view(3, -1).unsqueeze(0).expand_as(pixel_warp)
                photometric_cost, min_perc_in_view = \
                    compute_photometric_cost_norm(temporal_grad.data,
                                                  in_view_mask.data)
                if min_perc_in_view < .5:
                    break
                if (photometric_cost < max_photometric_cost).max() > 0:
                    trans_batch_prev = trans_batch
                    rot_mat_batch_prev = rot_mat_batch
                    dp = self.LKregress(
                        invH_dIdp=self.invH_dIdp_pyramid[level_idx],
                        mask=in_view_mask, It=temporal_grad)
                    # Equivalent inverse update via transpose of the twist
                    # rotation (rotation matrices: inverse == transpose).
                    d_rot_mat_batch = self.twist2mat_batch_func(
                        dp[:, 0:3]).transpose(1, 2)
                    trans_batch_new = d_rot_mat_batch.bmm(
                        trans_batch.view(frame_num, 3,
                                         1)).view(frame_num, 3) - dp[:, 3:6]
                    rot_mat_batch_new = d_rot_mat_batch.bmm(rot_mat_batch)
                    trans_list = []
                    rot_list = []
                    for k in range(frame_num):
                        if photometric_cost[k] < max_photometric_cost[k]:
                            rot_list.append(rot_mat_batch_new[k:k + 1, :, :])
                            trans_list.append(trans_batch_new[k:k + 1, :])
                            max_photometric_cost[k] = photometric_cost[k]
                        else:
                            rot_list.append(rot_mat_batch[k:k + 1, :, :])
                            trans_list.append(trans_batch[k:k + 1, :])
                    rot_mat_batch = torch.cat(rot_list, 0)
                    trans_batch = torch.cat(trans_list, 0)
                else:
                    break
            # Roll back to the last recorded state for this level (see the
            # matching NOTE in ``update``).
            rot_mat_batch = rot_mat_batch_prev
            trans_batch = trans_batch_prev
        return rot_mat_batch, trans_batch

    def forward(self, ref_frame_pyramid, src_frame_pyramid,
                ref_inv_depth_pyramid, max_itr_num=10):
        """Bind the reference pyramids, then estimate the source-frame
        poses; returns (rot_mat_batch, trans_batch).
        """
        self.init(ref_frame_pyramid=ref_frame_pyramid,
                  inv_depth_pyramid=ref_inv_depth_pyramid)
        rot_mat_batch, trans_batch, src_frames_pyramid = self.update(
            src_frame_pyramid, max_itr_num=max_itr_num)
        return rot_mat_batch, trans_batch