recorder.py
#!/usr/bin/python
import cv2, cv
import numpy
import subprocess
import time
import freenect
import random
import threading
import copy
import datetime
import serial
from api import Api
from gui import Gui, Color
from gui.vector import V
from motion import MotionDetector
import calibration
import settings
DEBUG = settings.DEBUG
SHOW_WINDOW = settings.SHOW_WINDOW
class Recorder(object):
def __init__(self, num_frames=settings.BUFFER_LENGTH, limit_fps=None):
if SHOW_WINDOW:
cv2.namedWindow("preview")
self.last_video_frame = None
self.num_frames = num_frames
self.frames = [None] * self.num_frames
self.current_jpg_frame = None
self.buffer_index = 0
self.keep_running = True
self.frame_rate = 0
self.last_frame = time.time()
self.limit_fps = limit_fps
self.api = Api(self)
self.api_lock = threading.Lock()
self.motion_detector = MotionDetector()
self.ser = serial.Serial('/dev/ttyUSB0', 9600, timeout=1)
self.encoding_subprocesses = []
self.last_serial_command = None
self.encoding_started = datetime.datetime.now()
if settings.UI_ENABLED:
if settings.UI_RESOLUTION:
self.gui = Gui(width=settings.UI_RESOLUTION[0], height=settings.UI_RESOLUTION[1])
else:
self.gui = Gui()
# Test recording button
base_state = (
self.gui.recording_button,
[150, 150, 90],
{}
)
hover_state = (
self.gui.recording_button,
[150, 150, 90],
{'highlight':True}
)
active_state = (
self.gui.recording_button,
[150, 150, 90],
{'active':True}
)
            callback = lambda: self.log("triggered")  # was: self.calibrate
self.gui.add_element(element_id=2, base_state=base_state, hover_state=hover_state, active_state=active_state, callback=callback)
base_state = (
self.gui.button,
[100, 100, 200, 30, 'Yeah buttons Baby'],
{}
)
hover_state = (
self.gui.button,
[98, 98, 204, 34, 'Yeah buttons Baby'],
{'fill_color': Color(0.95, 0.95, 0.95), 'bold':True}
)
active_state = (
self.gui.button,
[98, 98, 204, 34, 'Yeah buttons Baby'],
{'fill_color': Color(0.9, 0.9, 0.9), 'bold': True}
)
callback = self.calibrate
#self.gui.add_element(element_id=1, base_state=base_state, hover_state=hover_state, active_state=active_state, callback=callback)
self.gui.update()
else:
self.gui = None
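    # 'f' and 's' are single-byte commands for the device on /dev/ttyUSB0,
    # presumably an LED controller animating while encoding is in progress.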
def start_encoding_animation(self):
self.encoding_started = datetime.datetime.now()
self.last_serial_command = 'f'
self.ser.write('f')
def stop_encoding_animation(self):
if self.last_serial_command != 's':
self.last_serial_command = 's'
self.ser.write('s')
def log(self, text):
print text
def array(self, image):
return numpy.asarray(image[:,:])
def threshold(self, grayscale_array, low, high, value=1):
grayscale_array = value * numpy.logical_and(grayscale_array >= low, grayscale_array < high)
return grayscale_array
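    # A worked example for threshold() above (hypothetical values): pixels
    # inside [low, high) are kept and scaled to `value`, so
    # threshold(numpy.array([10, 130, 250]), 100, 200, value=255)
    # returns array([0, 255, 0]).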
def update_frame_rate(self):
# FIXME: save some kind of average for the fps
self.frame_diff = time.time() - self.last_frame
if self.limit_fps:
minimum_frame_diff = 1.0/self.limit_fps
if self.frame_diff < minimum_frame_diff:
time.sleep(minimum_frame_diff - self.frame_diff)
self.frame_diff = time.time() - self.last_frame
self.frame_rate = 1.0/self.frame_diff
self.last_frame = time.time()
if DEBUG:
print "FPS: %s" % round(self.frame_rate)
def buffer_frame(self, frame):
(retval, jpg_frame) = cv2.imencode(".jpg", frame, (cv.CV_IMWRITE_JPEG_QUALITY, 50))
jpg_frame = jpg_frame.tostring()
self.current_jpg_frame = jpg_frame
self.frames[self.buffer_index] = jpg_frame
if self.buffer_index >= self.num_frames - 1:
self.buffer_index = 0
else:
self.buffer_index += 1
def get_ordered_buffer(self):
""" Returns buffer in correct frame order """
return copy.copy(self.frames[self.buffer_index:]+self.frames[:self.buffer_index])
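    # Ring-buffer example (hypothetical frames): with num_frames=4, after
    # buffering f0..f5 the slots hold [f4, f5, f2, f3] and buffer_index is 2,
    # so get_ordered_buffer() returns [f2, f3, f4, f5], the order ffmpeg
    # expects below.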
def loop(self):
while self.keep_running:
self.update_frame_rate()
self.handle_events()
self.handle_frame()
if self.gui:
self.gui.update()
def _save_buffer_to_video(self):
        # FIXME: make the output filename and encoder options configurable
output_file = datetime.datetime.now().strftime("pool-%Y-%m-%d %H:%M:%S.avi")
cmdstring = ('ffmpeg',
'-r', '%d' % int(round(self.frame_rate)),
'-f','image2pipe',
'-vcodec', 'mjpeg',
'-i', 'pipe:',
'-c:v', 'libx264',
'-preset', 'fast',
'-crf', '23',
output_file
)
p = subprocess.Popen(cmdstring, stdin=subprocess.PIPE)
self.encoding_subprocesses.append(p)
for jpg_frame in self.get_ordered_buffer():
if jpg_frame is not None:
p.stdin.write(jpg_frame)
p.stdin.close()
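    # The pipe above is roughly this shell pipeline (illustrative only; the
    # frame rate and output name vary at runtime):
    #   cat *.jpg | ffmpeg -r 30 -f image2pipe -vcodec mjpeg -i pipe: \
    #       -c:v libx264 -preset fast -crf 23 out.avi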
def save_buffer_to_video(self):
t = threading.Thread(target=self._save_buffer_to_video)
t.daemon = True
t.start()
self.start_encoding_animation()
def to_grayscale(self, image):
tmp = cv.CreateImage(cv.GetSize(image), image.depth, 1)
cv.CvtColor(image, tmp,cv.CV_BGR2GRAY)
image = self.array(tmp)
return image
def calibrate(self):
print "calibrate"
self.gui.fill(Color(1, 1, 1))
self.gui.update()
time.sleep(0.2)
white_frame = self.to_grayscale(self.capture_frame(as_array=False))
self.gui.fill(Color(0, 0, 0))
self.gui.update()
time.sleep(0.2)
black_frame = self.to_grayscale(self.capture_frame(as_array=False))
self._calibrate(white_frame, black_frame)
def _calibrate(self, white_frame, black_frame):
""" Fill gui with white, capture a frame, fill with black, capture another frame.
Substract the images and calculate a threshold, generate a gradient to get the borders.
Calculate a transformation matrix that converts from the coordinates on the frame to screen coordinates.
"""
height, width = white_frame.shape
# Calculate threshold and gradient to end up with an image with just the border of the screen as white pixels
diff_frame = cv2.subtract(white_frame, black_frame)
threshold_frame = cv2.threshold(diff_frame, settings.CALIBRATION_THRESHOLD, 255, cv2.THRESH_BINARY)[1]
gradient_frame = cv2.Laplacian(threshold_frame, cv2.CV_64F)
gradient_frame = self.threshold(gradient_frame, 255, 256, 255.0)
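        # The Laplacian of the binary threshold image is non-zero only where
        # the intensity changes, so keeping values in [255, 256) leaves white
        # pixels that trace the outline of the detected screen region.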
cv2.imwrite("white.jpg", white_frame)
cv2.imwrite("black.jpg", black_frame)
cv2.imwrite("diff.jpg", diff_frame)
cv2.imwrite("threshold.jpg", threshold_frame)
cv2.imwrite("gradient.jpg", gradient_frame)
self.gui.fill(Color(1, 1, 1))
self.gui.update()
# Get list of all white pixels in the gradient as [(y,x), (y,x), ...]
border_candidate_points = numpy.transpose(gradient_frame.nonzero())
if not border_candidate_points.any():
return
borders = {}
for border in ['left', 'right', 'top', 'bottom']:
borders[border] = {
'count': 0,
'mean': V(0,0),
'vectors': []
}
        # Sample up to 500 random candidate points and classify them
        for _ in range(0, 500):
raw_y, raw_x = random.choice(border_candidate_points)
can = V(raw_x, raw_y)
up = down = left = right = None
# Walk along a 13x13 square path around the point and look for other border points
try:
for x in range(-6, 7):
                    for y in [-6, 6]:  # rows at the top and bottom of the 13x13 square
if gradient_frame[can.y+y][can.x+x] == 255:
if y < 0:
down = can + (x,y)
else:
up = can + (x,y)
for y in range(-6, 7):
                    for x in [-6, 6]:  # columns at the left and right of the square
if gradient_frame[can.y+y][can.x+x] == 255:
if x < 0:
left = can + (x,y)
else:
right = can + (x,y)
except IndexError:
continue
# If two opposing sides of the square have border points, and all three points are roughly on a line
# then assume this is an actual proper point on the screen border
point_found = False
if up and down and not left and not right:
p = up - can
q = V(down.x - can.x, can.y - down.y)
point_found = True
elif left and right and not up and not down:
p = V(can.x-left.x, left.y-can.y)
q = V(right.x-can.x, can.y-right.y)
point_found = True
if point_found:
                # Test whether the three points are roughly collinear:
                # p*q/(|p||q|) is the cosine of the angle between p and q,
                # and > 0.95 allows roughly 18 degrees of deviation
                if p*q/(p.abs()*q.abs()) > 0.95:
# For now, we will simply assume that the image is roughly centered,
# i.e. that the left edge is on the left half of the screen, etc
if up and down:
if can.x < width/2:
border = 'left'
else:
border = 'right'
else:
if can.y < height/2:
border = 'top'
else:
border = 'bottom'
borders[border]['count'] += 1
borders[border]['mean'] += can
borders[border]['vectors'].append(can)
# Paint discovered border point on original black frame for debugging
black_frame[can.y][can.x] = 255
else:
black_frame[can.y][can.x] = 128
cv2.imwrite("debug.jpg", black_frame)
# Go through list of discovered border points and calculate vectors for the borders
self.gui.draw_image_slow(black_frame)
for (border_name, border) in borders.items():
            if not border['count']:
                # Abort calibration: no points were found for this border
                self.gui.update()
                return
# Divide mean vector by number of vectors to get actual mean for this border
real_mean = border['real_mean'] = border['mean']/border['count']
# Calculate mean direction of border
direction_mean = V(0,0)
direction_count = 0
for vector in border['vectors']:
if not vector:
continue
direction_vector = real_mean - vector
if (direction_vector+direction_mean).abs() < direction_mean.abs():
direction_vector = -direction_vector
direction_mean += direction_vector
direction_count += 1
border['direction_mean'] = direction_mean = direction_mean/direction_count
added = real_mean + direction_mean
colors = {
'left': Color(255, 0, 0),
'right': Color(0, 255, 0),
'top': Color(255, 255, 0),
'bottom': Color(0, 0, 255)
}
self.gui.draw_line(real_mean.x, real_mean.y, added.x, added.y, stroke_color = colors[border_name])
self.gui.draw_circle((real_mean.x, real_mean.y), 5, stroke_color = colors[border_name])
corners = {}
# Calculate corners from border intersections
for border1, border2 in [('top', 'left'), ('top', 'right'), ('bottom', 'left'), ('bottom', 'right')]:
o1 = borders[border1]['real_mean']
d1 = borders[border1]['direction_mean']
o2 = borders[border2]['real_mean']
d2 = borders[border2]['direction_mean']
corner = V.intersection(o1, d1, o2, d2)
if not corner:
self.gui.update()
return
print corner
corners[border1+"_"+border2] = corner
self.gui.draw_circle((corner.x, corner.y), 10, Color(255, 0, 255))
print corners
        # Calculate the transformation matrix that maps a camera pixel (y, x)
        # to the corresponding point in screen coordinates
self.gui.calibration_matrix = calibration.calibration_transformation_matrix(width, height, self.gui.width, self.gui.height, corners)
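        # Sanity check: map points 10 px inside each detected corner through
        # the matrix; the small green circles drawn below should land just
        # inside the corresponding screen corners.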
m = self.gui.calibration_matrix
b = corners['top_left']
p = m[b.y+10][b.x+10]
self.gui.draw_circle((p.x, p.y), 3, stroke_color = Color(0,1,0))
b = corners['top_right']
p = m[b.y+10][b.x-10]
self.gui.draw_circle((p.x, p.y), 3, stroke_color = Color(0,1,0))
b = corners['bottom_left']
p = m[b.y-10][b.x+10]
self.gui.draw_circle((p.x, p.y), 3, stroke_color = Color(0,1,0))
b = corners['bottom_right']
p = m[b.y-10][b.x-10]
self.gui.draw_circle((p.x, p.y), 3, stroke_color = Color(0,1,0))
self.gui.update()
print "Calibration successful."
def handle_custom_event(self, event):
""" Child classes can override this to do additional event handling. """
pass
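    # Sketch of the hook above (hypothetical key binding):
    #
    #   class MyRecorder(CVCaptureRecorder):
    #       def handle_custom_event(self, event):
    #           if event.key == 'd':
    #               print "custom key pressed"
    #
    # KinectRecorder below uses this hook to toggle its video overlay.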
def handle_events(self):
        # Handle serial button presses
while self.ser.inWaiting():
if self.ser.readline().strip() == 'press':
print "saving video"
self.save_buffer_to_video()
# Check on subprocesses
still_running = []
for p in self.encoding_subprocesses:
print p.poll()
if p.poll() is None:
still_running.append(p)
self.encoding_subprocesses = still_running
if not self.encoding_subprocesses and datetime.datetime.now() - self.encoding_started > datetime.timedelta(seconds=1):
self.stop_encoding_animation()
# Handle Api events
with self.api_lock:
for event in self.api.events:
if event == "save":
                    self.save_buffer_to_video()
elif event == "quit":
self.keep_running = False
self.api.events = []
if self.gui:
event = self.gui.process_events()
if event.key == 'c':
self.calibrate()
self.gui.redraw_elements()
elif event.key == 'p':
self.keep_running = False
elif event.key == 'f':
matrix = numpy.zeros((640, 480))
matrix[150:160, 150:160] = 1
self.gui.trigger_event_matrix(matrix, event_type="mouse_move")
else:
self.handle_custom_event(event)
def debugging_output(self, frame):
if DEBUG:
print "Buffer index: %s" % self.buffer_index
if SHOW_WINDOW:
cv2.imshow("preview", frame)
def capture_frame(self, as_array=True):
raise NotImplementedError()
def handle_frame(self, *args, **kwargs):
raise NotImplementedError()
def start(self):
raise NotImplementedError()
class CVCaptureRecorder(Recorder):
def __init__(self, num_frames=settings.BUFFER_LENGTH, limit_fps=None):
super(CVCaptureRecorder, self).__init__(num_frames, limit_fps)
self.capture = cv.CaptureFromCAM(0)
cv.SetCaptureProperty(self.capture, cv.CV_CAP_PROP_FRAME_WIDTH, 640)
cv.SetCaptureProperty(self.capture, cv.CV_CAP_PROP_FRAME_HEIGHT, 480)
        if self.capture:
            # Grab (and discard) a first frame to make sure the device works
            frame = cv.QueryFrame(self.capture)
        else:
            raise Exception("Could not open video device")
def capture_frame(self, as_array=True):
frame = cv.QueryFrame(self.capture)
if not as_array:
return frame
frame_array = numpy.asarray(frame[:,:])
return frame_array
def handle_frame(self):
frame = self.capture_frame(as_array=False)
frame_array = numpy.asarray(frame[:,:])
self.motion_detector.update(frame)
self.debugging_output(frame_array)
if not self.api.video_locked:
self.buffer_frame(frame_array)
class KinectRecorder(Recorder):
def __init__(self, num_frames=settings.BUFFER_LENGTH, limit_fps=None):
super(KinectRecorder, self).__init__(num_frames, limit_fps)
# Kinect depth layers
self.layers = settings.TOUCH_LAYERS
self.overlay_video = settings.OVERLAY_VIDEO
# Helper images to display depth overlay over video feed
self.gray_image = None
self.temp_image = None
# Kinect loop settings
self.dev = None
self.ctx = None
self.led_state = 0
self.tilt = 0
self.post_video_callbacks = []
self.post_depth_callbacks = []
# Calibration settings
self.calibration_state = None
    def calibrate(self):
        # Calibration runs as a small state machine driven by post-video
        # callbacks, so each capture happens on a fresh frame after the
        # gui has actually been redrawn
        if not self.calibration_state:
print "calibrate"
self.gui.fill(Color(1, 1, 1))
self.gui.update()
time.sleep(0.2)
self.calibration_state = 'prepare'
self.post_video_callbacks.append(self.calibrate)
elif self.calibration_state == 'prepare':
self.calibration_state = 'capture_white'
self.post_video_callbacks.append(self.calibrate)
elif self.calibration_state == 'capture_white':
self.calibration_white_frame = self.to_grayscale(self.last_video_frame)
self.gui.fill(Color(0, 0, 0))
self.gui.update()
time.sleep(0.2)
self.calibration_state = 'capture_black'
self.post_video_callbacks.append(self.calibrate)
elif self.calibration_state == 'capture_black':
self.calibration_state = None
white_frame = self.calibration_white_frame
black_frame = self.to_grayscale(self.last_video_frame)
self._calibrate(white_frame, black_frame)
def pretty_depth(self, depth):
numpy.clip(depth, 0, 2**10 - 1, depth)
depth >>= 2
return depth
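    # Bit-math for pretty_depth() above: depth values are clipped to the
    # 10-bit range 0..1023, and shifting right by two bits maps that onto
    # 0..255 (e.g. 1023 >> 2 == 255), which fits an 8-bit grayscale image.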
def img_from_depth_frame(self, depth):
depth = depth.astype(numpy.uint8)
image = cv.CreateImageHeader((depth.shape[1], depth.shape[0]), cv.IPL_DEPTH_8U, 1)
cv.SetData(image, depth.tostring(), depth.dtype.itemsize * depth.shape[1])
return image
def img_from_video_frame(self, video):
video = video[:, :, ::-1] # RGB -> BGR
image = cv.CreateImageHeader((video.shape[1], video.shape[0]),
cv.IPL_DEPTH_8U,
3)
cv.SetData(image, video.tostring(),
video.dtype.itemsize * 3 * video.shape[1])
return image
def sync_get_depth_frame(self, as_array=False):
depth, timestamp = freenect.sync_get_depth()
if as_array:
return depth
depth = self.pretty_depth(depth)
image = cv.CreateImageHeader((depth.shape[1], depth.shape[0]),
cv.IPL_DEPTH_8U,
1)
cv.SetData(image, depth.tostring(),
depth.dtype.itemsize * depth.shape[1])
return image
def sync_get_video_frame(self, as_array=False):
video = freenect.sync_get_video()[0]
if as_array:
return video
video = video[:, :, ::-1] # RGB -> BGR
image = cv.CreateImageHeader((video.shape[1], video.shape[0]),
cv.IPL_DEPTH_8U,
3)
cv.SetData(image, video.tostring(),
video.dtype.itemsize * 3 * video.shape[1])
return image
def capture_frame(self, as_array=True):
return self.sync_get_video_frame(as_array=as_array)
def set_led(self, led_state):
if not self.dev:
print "no device set!"
return
freenect.set_led(self.dev, led_state)
def set_tilt(self, tilt):
if not self.dev:
print "no device set!"
return
freenect.set_tilt_degs(self.dev, tilt)
def handle_custom_event(self, event):
if event.key == 'o':
self.overlay_video = not self.overlay_video
def kinect_body_callback(self, dev, ctx):
self.handle_events()
if not self.dev:
self.dev = dev
self.ctx = ctx
if not self.keep_running:
raise freenect.Kill
def handle_frame(self):
""" Synchronous handling of kinect frames, stupidly slow. """
video = self.sync_get_video_frame(as_array=True)
self.handle_video_frame(data=video)
depth = self.sync_get_depth_frame(as_array=True)
self.handle_depth_frame(data=depth)
def handle_video_frame(self, dev=None, data=None, timestamp=None):
self.update_frame_rate()
#video_frame = numpy.asarray(data)
video_frame = self.img_from_video_frame(data)
frame_array = self.array(video_frame)
self.last_video_frame = video_frame
if frame_array.any() and not self.api.video_locked:
self.buffer_frame(frame_array)
self.motion_detector.update(video_frame)
self.debugging_output(frame_array)
callbacks = copy.copy(self.post_video_callbacks)
self.post_video_callbacks = []
for callback in callbacks:
callback()
    def handle_depth_frame(self, dev=None, data=None, timestamp=None):
        # Depth handling is currently disabled; remove this early return to
        # re-enable the touch-layer thresholding below
        return
depth = self.pretty_depth(data)
(low, high, value) = self.layers['touch']
layer = self.threshold(depth, low, high, value=value)
layer = layer.astype(numpy.uint8)
kernel = numpy.ones((3,3), numpy.uint8)
layer = cv2.erode(layer, kernel)
#self.gui.trigger_event_matrix(layer, event_type='touch')
self.buffer_frame(self.array(depth))
for callback in self.post_depth_callbacks:
callback()
self.post_depth_callbacks = []
def loop(self):
""" Freenect has its own looping function, so we have to use that.
Put general things that should happen in every frame into the "body" callback.
"""
freenect.runloop(depth=self.handle_depth_frame, video=self.handle_video_frame, body=self.kinect_body_callback)
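# Entry point: settings.RECORDER selects the capture backend ('cv' for a
# plain OpenCV webcam, 'kinect' for libfreenect); settings.LIMIT_FPS caps
# the frame rate. Run directly with:  python recorder.py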
if __name__ == "__main__":
if settings.RECORDER == 'cv':
recorder = CVCaptureRecorder(limit_fps=settings.LIMIT_FPS)
elif settings.RECORDER == 'kinect':
recorder = KinectRecorder(limit_fps=settings.LIMIT_FPS)
else:
raise Exception("Unknown value %s for settings 'recorder'" % settings.RECORDER)
try:
recorder.loop()
except KeyboardInterrupt:
pass