moving_object_detection_alg.py

'''Functions for identifying moving object in almost static scene'''
import time
import os.path
import sys
#import matplotlib.pyplot as plt
import cPickle as pickle
import numpy as np
import cv2
import class_objects as co
import hand_segmentation_alg as hsa
import action_recognition_alg as ara
from scipy import ndimage
import array
import logging
LOG = logging.getLogger('__name__')
CH = logging.StreamHandler()
CH.setFormatter(logging.Formatter(
    '%(funcName)20s()(%(lineno)s)-%(levelname)s:%(message)s'))
LOG.addHandler(CH)
LOG.setLevel('INFO')

class Mog2(object):
    '''
    Implementation for handling of depth video
    '''

    def __init__(self, remove_noise=True,
                 gmm_num=co.CONST['gmm_num'],
                   bg_ratio=co.CONST['bg_ratio'],
                   var_thres=co.CONST['var_thres'],
                   history=co.CONST['history']):
        self.initialize(gmm_num, bg_ratio, var_thres, history)
        self.sync_count = -1
        self.kernel = np.ones((5, 5), np.uint8)
        self.init_num = co.CONST['calib_secs']*30
        self.valid_img = None
        self.untrusty_pixels = None
        self.initial_background = None
        self.initial_im_set = []
        self.filtered_data = None
        self.mog2_examples = []
    def initialize(self,
                   gmm_num=co.CONST['gmm_num'],
                   bg_ratio=co.CONST['bg_ratio'],
                   var_thres=co.CONST['var_thres'],
                   history=co.CONST['history']):
        cv2.ocl.setUseOpenCL(False)
        self.fgbg = cv2.createBackgroundSubtractorMOG2(history=int(history),
                                                       varThreshold=var_thres,
                                                       detectShadows=True)
        # self.fgbg.setNMixtures(int(gmm_num))
        self.fgbg.setBackgroundRatio(bg_ratio)
        self.fgbg.setComplexityReductionThreshold(0.9)
        self.preprocessed_examples = []
        self.raw_examples = []
        self.threshold = None

    def get_valid_data(self, img):
        return (img > 0).astype(bool)

    def run(self, save_example=False, data=None):
        '''
        Run detection
        '''
        self.sync_count += 1

        if data is None:
            LOG.warning('MOG2: Reading data from co.data.depth_im')
            data = co.data.depth_im.copy()
        if self.filtered_data is None:
            self.filtered_data = np.zeros_like(data)
        if self.sync_count < self.init_num:
            self.initial_im_set.append(data)
            if self.valid_img is None:
                self.valid_img = np.zeros_like(data)
            flag = self.get_valid_data(data)
            self.valid_img[flag] = data[flag]
            return None
        elif self.sync_count == self.init_num:
            self.initial_background = np.median(
                np.array(self.initial_im_set), axis=0)
            self.untrusty_pixels = (np.abs(self.initial_background -
                                           self.valid_img) >= 10)
            self.untrusty_pool = np.array(self.initial_im_set)[:,
                                                               self.untrusty_pixels]
        if save_example:
            co.draw_oper.save_pure_image(self.untrusty_pixels, 'untrusty_pixels.png')
        untrusty_pixels = self.untrusty_pixels.copy()
        untrusty_pixels[untrusty_pixels] = (
            np.sum(data[self.untrusty_pixels] == self.untrusty_pool,
                         axis=0)).astype(bool)
        if save_example:
            co.draw_oper.save_pure_image(untrusty_pixels, 'mod_untrusty_pixels.png')
        if save_example:
            self.raw_examples.append(data)
        flag = (np.logical_not(self.get_valid_data(data)) +
                untrusty_pixels).astype(bool)
        self.filtered_data = data.copy()
        self.filtered_data[flag] = self.valid_img[flag]
        inp = self.filtered_data
        if save_example:
            self.preprocessed_examples.append(inp)
        mog2_res = self.fgbg.apply(inp.astype(np.float32), 0.8)
        mog2_res = (mog2_res == 127).astype(np.uint8)
        if save_example:
            self.mog2_examples.append(mog2_res*255)
        return mog2_res

    def reset(self):
        self.fgbg = None
        self.sync_count = -1
        self.preprocessed_examples = []
        self.raw_examples = []
        '''
        if display:
            found_objects_mask[found_objects_mask > 0] = 255
            found_objects_mask[filtered_image > 0] = 125
            found_objects_mask = found_objects_mask.astype(np.uint8)
            co.im_results.images.append(found_objects_mask)
            co.im_results.images.append((found_objects_mask > 0)*filtered_image)
        co.meas.found_objects_mask = (filtered_image > 0).astype(np.uint8)
        '''


def detection_by_scene_segmentation():
    '''Detection of moving object by using Distortion field of centers of mass
    of background objects'''
    if co.counters.im_number == 0:
        co.segclass.needs_segmentation = 1
        if not co.segclass.exists_previous_segmentation:
            print 'No existing previous segmentation. The initialisation will delay...'
        else:
            print 'Checking similarity..'
            old_im = co.meas.background
            check_if_segmented = np.sqrt(np.sum(
                (co.data.depth_im[co.meas.trusty_pixels.astype(bool)].astype(float) -
                 old_im[co.meas.trusty_pixels.astype(bool)].astype(float))**2))
            print 'Euclidean Distance of old and new background is ' +\
                str(check_if_segmented)
            print 'Minimum Distance to approve previous segmentation is ' +\
                str(co.CONST['similar_bg_min_dist'])
            if check_if_segmented < co.CONST['similar_bg_min_dist']:
                print 'No need to segment again'
                co.segclass.needs_segmentation = 0
            else:
                print 'Segmentation is needed'

    if co.segclass.needs_segmentation and co.counters.im_number >= 1:
        if co.counters.im_number == (co.CONST['framerate'] *
                                     co.CONST['calib_secs'] - 1):
            co.segclass.flush_previous_segmentation()
            co.segclass.nz_objects.image = np.zeros_like(co.data.depth_im) - 1
            co.segclass.z_objects.image = np.zeros_like(co.data.depth_im) - 1
            levels_num = 8
            levels = np.linspace(np.min(co.data.depth_im[co.data.depth_im > 0]), np.max(
                co.data.depth_im), levels_num)
            co.segclass.segment_values = np.zeros_like(co.data.depth_im)
            for count in range(levels_num - 1):
                co.segclass.segment_values[(co.data.depth_im >= levels[count]) *
                                           (co.data.depth_im <= levels[count + 1])] = count + 1

        elif co.counters.im_number == (co.CONST['framerate'] *
                                       co.CONST['calib_secs']):
            co.segclass.nz_objects.count = -1
            co.segclass.z_objects.count = -1
            co.segclass.segment_values = co.segclass.segment_values * co.meas.trusty_pixels
            for val in np.unique(co.segclass.segment_values):
                objs = np.ones_like(co.data.depth_im) * \
                    (val == co.segclass.segment_values)
                labeled, nr_objects =\
                    ndimage.label(objs * co.edges.calib_frame)
                lbls = np.arange(1, nr_objects + 1)
                if val > 0:
                    ndimage.labeled_comprehension(objs, labeled, lbls,
                                                  co.segclass.nz_objects.process, float, 0,
                                                  True)
                else:
                    ndimage.labeled_comprehension(objs, labeled, lbls,
                                                  co.segclass.z_objects.process,
                                                  float, 0, True)
            for (points, pixsize,
                 xsize, ysize) in (co.segclass.nz_objects.untrusty +
                                   co.segclass.z_objects.untrusty):
                co.segclass.z_objects.count += 1
                co.segclass.z_objects.image[
                    tuple(points)] = co.segclass.z_objects.count
                co.segclass.z_objects.pixsize.append(pixsize)
                co.segclass.z_objects.xsize.append(xsize)
                co.segclass.z_objects.ysize.append(ysize)

            print 'Found or partitioned',\
                co.segclass.nz_objects.count +\
                co.segclass.z_objects.count + 2, 'background objects'
            co.segclass.needs_segmentation = 0
            with open(co.CONST['segmentation_data'] + '.pkl', 'wb') as output:
                pickle.dump((co.segclass, co.meas), output, -1)
            print 'Saved segmentation data for future use.'
    elif (not co.segclass.needs_segmentation) and co.counters.im_number >= 2:
        if not co.segclass.initialised_centers:
            try:
                co.segclass.nz_objects.find_object_center(1)
            except BaseException as err:
                print 'Centers initialisation Exception'
                raise err
            try:
                co.segclass.z_objects.find_object_center(0)
            except BaseException as err:
                print 'Centers initialisation Exception'
                raise err
            co.segclass.initialise_neighborhoods()
            co.segclass.initialised_centers = 1
        else:
            try:
                co.segclass.nz_objects.find_object_center(1)
            except BaseException as err:
                print 'Centers calculation Exception'
                raise err
        if co.segclass.nz_objects.center.size > 0:
            co.segclass.nz_objects.find_centers_displacement()
            co.meas.found_objects_mask = co.segclass.find_objects()

            points_on_im = co.data.depth3d.copy()
            # points_on_im[np.sum(points_on_im,axis=2)==0,:]=np.array([1,0,1])
            for calc, point1, point2 in zip(
                    co.segclass.nz_objects.centers_to_calculate,
                    co.segclass.nz_objects.initial_center,
                    co.segclass.nz_objects.center):
                if point1[0] != -1:
                    if calc:
                        cv2.arrowedLine(points_on_im,
                                        (point1[1], point1[0]),
                                        (point2[1], point2[0]), [0, 1, 0], 2, 1)
                    else:
                        cv2.arrowedLine(points_on_im,
                                        (point1[1], point1[0]),
                                        (point2[1], point2[0]), [0, 0, 1], 2, 1)
            struct_el = cv2.getStructuringElement(
                cv2.MORPH_ELLIPSE, tuple(2 * [5]))
            co.meas.found_objects_mask = cv2.morphologyEx(
                co.meas.found_objects_mask.astype(np.uint8), cv2.MORPH_CLOSE, struct_el)
            struct_el = cv2.getStructuringElement(
                cv2.MORPH_ELLIPSE, tuple(2 * [10]))
            co.meas.found_objects_mask = cv2.morphologyEx(
                co.meas.found_objects_mask.astype(np.uint8), cv2.MORPH_OPEN, struct_el)
            hand_patch, hand_patch_pos = hsa.main_process(
                co.meas.found_objects_mask.astype(
                    np.uint8), co.meas.all_positions, 1)
            co.meas.hand_patch = hand_patch
            co.meas.hand_patch_pos = hand_patch_pos
            if len(co.im_results.images) == 1:
                co.im_results.images.append(
                    (255 * co.meas.found_objects_mask).astype(np.uint8))
            co.im_results.images.append(points_on_im)
            # elif len(co.im_results.images)==2:
            #    co.im_results.images[1][co.im_results.images[1]==0]=(255*points_on_im).astype(np.uint8)[co.im_results.images[1]==0]
            # if hand_points.shape[1]>1:
            #    points_on_im[tuple(hand_points.T)]=[1,0,0]
            # co.im_results.images.append(points_on_im)
            return 1


def extract_background_values():
    '''function to extract initial background values from initial_im_set'''
    _, _, im_num = co.data.initial_im_set.shape
    valid_freq = np.zeros(co.data.initial_im_set[:, :, 0].shape)
    co.meas.background = np.zeros(co.data.initial_im_set[:, :, 0].shape)
    initial_nonzero_im_set = np.zeros(co.data.initial_im_set.shape)
    valid_values = np.zeros_like(co.meas.background)
    co.meas.all_positions = np.fliplr(cv2.findNonZero(np.ones_like(
        co.meas.background, dtype=np.uint8)).squeeze()).reshape(co.meas.background.shape + (2,))
    for count in range(im_num):
        valid_values[
            co.data.initial_im_set[:, :, count] > 0
        ] = co.data.initial_im_set[:, :, count][
            co.data.initial_im_set[:, :, count] > 0]
        co.meas.background = co.meas.background + \
            co.data.initial_im_set[:, :, count]
        valid_freq[co.data.initial_im_set[:, :, count] != 0] += 1

        initial_nonzero_im_set[:, :, count] += co.data.initial_im_set[
            :, :, count] != 0
    co.meas.valid_values = (valid_values * 255).astype(np.uint8)

    co.meas.trusty_pixels = (
        (valid_freq) == np.max(valid_freq)).astype(np.uint8)
    valid_freq[valid_freq == 0] = 1
    co.meas.background = co.meas.background / valid_freq

    return valid_freq, initial_nonzero_im_set, im_num


def init_noise_model():
    '''Compute Initial Background and Noise Estimate from the first im_num
     images with no moving object presence'''

    valid_freq, initial_nonzero_im_set, im_num = extract_background_values()
    # Assume Noise dependency from location

    cv2.imwrite('Background.jpg', (255 * co.meas.background).astype(int))
    cv2.imwrite('Validfreq.jpg', (255 * valid_freq /
                                  float(np.max(valid_freq))).astype(int))
    noise_deviation = np.zeros_like(co.data.depth_im)
    for c_im in range(im_num):
        # Remove white pixels from co.data.initial_im_set
        noise_deviation0 = ((co.meas.background -
                             co.data.initial_im_set[:, :, c_im]) *
                            initial_nonzero_im_set[:, :, c_im])
        noise_deviation0 = noise_deviation0 * noise_deviation0
        noise_deviation = noise_deviation + noise_deviation0
    noise_deviation = np.sqrt(noise_deviation / valid_freq)
    cv2.imwrite('noise_deviation.jpg', (255 * noise_deviation /
                                        np.max(noise_deviation)).astype(int))

    noise_deviation = np.minimum(noise_deviation, 0.2)
    noise_deviation = np.maximum(
        noise_deviation, co.CONST['lowest_pixel_noise_deviation'])
    max_background_thres = co.meas.background + noise_deviation
    cv2.imwrite('Max_Background.jpg', (255 * max_background_thres).astype(int))
    cv2.imwrite('Zero_Background.jpg', (255 *
                                        (co.meas.background == 0)).astype(int))
    min_background_thres = (co.meas.background - noise_deviation) * \
        ((co.meas.background - noise_deviation) > 0)
    cv2.imwrite('Min_Background.jpg', (255 * min_background_thres).astype(int))
    print "Recognition starts now"
    return min_background_thres, max_background_thres


def find_moving_object():
    '''Find the biggest moving object in scene'''
    found_object0 = np.ones(co.data.depth_im.shape)
    min_background_thres, max_background_thres = co.models.noise_model
    co.masks.background = np.logical_and(np.logical_or((co.data.depth_im > max_background_thres), (
        co.data.depth_im < min_background_thres)), co.data.depth_im != 0)

    co.im_results.images += [co.masks.background, co.data.depth_im]
    found_object0[co.masks.background] = co.data.depth_im[co.masks.background]
    laplacian = cv2.Laplacian(found_object0, cv2.CV_64F)
    found_object0[np.abs(laplacian) > co.thres.lap_thres] = 1.0
    # Remove also 0 values
    found_object0[found_object0 == 0.0] = 1.0
    # Isolate considered Object by choosing a contour from the ones found
    thresh = np.zeros(found_object0.shape, dtype=np.uint8)
    thresh[found_object0 < 1] = 255
    co.meas.contours_areas = []
    _, co.scene_contours, _ = cv2.findContours(
        thresh.copy(), cv2.RETR_TREE, cv2.CHAIN_APPROX_NONE)
    if not co.scene_contours:
        return "No Contours Found", [], [], []
    for i, count1 in enumerate(co.scene_contours):
        area = cv2.contourArea(count1)
        co.meas.contours_areas.append(area)
    # Sort co.scene_contours by area
    sorted_contours = sorted(zip(co.meas.contours_areas, co.scene_contours),
                             key=lambda x: x[0], reverse=True)

    sorted_contours = [x for (_, x) in sorted_contours]
    mask = np.zeros(co.data.depth_im.shape, np.uint8)
    sorted_depth = np.zeros(co.CONST['max_contours_num'])
    for i in range(min(len(co.scene_contours), co.CONST['max_contours_num'] - 1)):
        # Find mean depth for each shape matching each contour
        mask[:] = 0
        cv2.drawContours(mask, sorted_contours, 0, 255, -1)
        sorted_depth[i] = np.mean(co.data.depth_im[mask > 0])
    if (co.meas.aver_depth == []) | (co.meas.aver_depth == 0):
        co.meas.aver_depth = sorted_depth[0]
    match = (sorted_depth < (co.meas.aver_depth + co.thres.depth_thres)
             ) & (sorted_depth > (co.meas.aver_depth - co.thres.depth_thres))
    if np.sum(match[:]) == 0:
        chosen_contour = sorted_contours[0]
        chosen_depth = sorted_depth[0]
        matched = 0
    else:
        found_match = np.fliplr(cv2.findNonZero(match).squeeze())
        # the following line might want debugging
        matched = found_match[0, 0]
        chosen_contour = sorted_contours[matched]
        chosen_depth = sorted_depth[matched]
    if np.abs(chosen_depth - co.meas.aver_depth) < co.meas.aver_depth:
        co.counters.outlier_time = 0
        co.data.depth_mem.append(chosen_depth)
        co.counters.aver_count += 1
        if co.counters.aver_count > co.CONST['running_mean_depth_count']:
            co.meas.aver_depth = ((chosen_depth -
                                   co.data.depth_mem[
                                       co.counters.aver_count -
                                       co.CONST['running_mean_depth_count']] +
                                   co.meas.aver_depth *
                                   co.CONST['running_mean_depth_count']) /
                                  co.CONST['running_mean_depth_count'])
        else:
            co.meas.aver_depth = (chosen_depth + co.meas.aver_depth *
                                  (co.counters.aver_count - 1)) / co.counters.aver_count
    else:
        co.counters.outlier_time += 1
    if co.counters.outlier_time == co.CONST['outlier_shape_time'] * co.CONST['framerate']:
        co.counters.aver_count = 1
        co.meas.aver_depth = chosen_depth
        co.data.depth_mem = []
        co.data.depth_mem.append(chosen_depth)
    final_mask = np.zeros(co.data.depth_im.shape, np.uint8)
    cv2.drawContours(final_mask, sorted_contours, matched, 255, -1)
    if np.array(chosen_contour).squeeze().shape[0] <= 5:
        return "Arm not found", [], [], []
    return final_mask, chosen_contour, sorted_contours, matched