audition.py

import lxml.etree as ET
import re
import pytimeparse
import pprint

import meta


def _get_markers(filename):
    with open(filename, 'rb') as f:
        o = ET.parse(f)
        xmp_as_xml_string = o.find('.//xmpMetadata').text
        namespaces = {'xmpDM': 'http://ns.adobe.com/xmp/1.0/DynamicMedia/'}
        xmp = ET.fromstring(xmp_as_xml_string)
        frame_rate = int(xmp.find('.//xmpDM:Tracks//xmpDM:frameRate', namespaces).text[1:])  # e.g. f44100
        markers_xpath = xmp.xpath('.//xmpDM:Tracks//xmpDM:trackName[.=\'CuePoint Markers\']/../xmpDM:markers//xmpDM:name/../xmpDM:startTime/..', namespaces=namespaces)
        markers = []
        for marker in markers_xpath:
            time = int(marker.find('xmpDM:startTime', namespaces).text)
            time_sec = time / frame_rate
            name = marker.find('xmpDM:name', namespaces).text
            markers.append([time_sec, name])
        return markers


def _get_clips(filename, track_name):
    clips = {}
    with open(filename, 'rb') as f:
        o = ET.parse(f)
        sample_rate = int(o.xpath('/sesx/session/@sampleRate')[0])
        els = o.xpath('.//audioTrack/trackParameters/name[.=\'' + track_name + '\']/../../audioClip')
        for el in els:
            start_point = int(el.attrib['startPoint'])/sample_rate
            end_point = int(el.attrib['endPoint'])/sample_rate
            source_in_point = int(el.attrib['sourceInPoint'])/sample_rate
            source_out_point = int(el.attrib['sourceOutPoint'])/sample_rate
            name = el.attrib['name']
            clips[name] = [start_point, end_point, source_in_point, source_out_point]
    return clips


def _find_time_in_clip(clip_name, rel_time, clips_translation, skip_time):
    for name, clip in clips_translation.items():
        if name == clip_name:
            return rel_time+clip[0]-clip[2]-skip_time


def _adjust_marker(time, clips_recorded, clips_translation, skip_time):
    for name, clip in clips_recorded.items():
        if clip[0] <= time <= clip[1]:
            rel_time = time - clip[0]
            adj_time = _find_time_in_clip(name, rel_time, clips_translation, skip_time)
            return adj_time


def _seconds_to_time_stamp(seconds):
    sec_round = round(seconds)
    hours = int(sec_round / 3600)
    min = int(sec_round / 60) % 60
    sec = sec_round % 60
    res = ''
    if hours:
        res += str(hours)+':'
    res += '%02d:%02d' % (min, sec)
    return res


def _adjust_markers(markers, clips_recorded, clips_translation, skip_time):
    adjusted_markers = []
    for marker in markers:
        marker_time = marker[0]
        marker_name = marker[1]
        adjusted_marker_time = _adjust_marker(marker_time, clips_recorded, clips_translation, skip_time)
        adjusted_markers.append([adjusted_marker_time, marker_name])
    return adjusted_markers


def timestamps(mp4_filename: str) -> str:
    """
    Return multi-line string with marker timestamps for given mp4 file. e.g.
    07:26 — Marker 37
    24:44 — Marker 38
    30:05 — Marker 39
    :rtype: str
    """
    sesx_filename = re.sub(r'\.mp4$', ' ru.sesx', mp4_filename)
    markers = _get_markers(sesx_filename)
    clips_recorded = _get_clips(sesx_filename, 'Track 1')
    clips_translation = _get_clips(sesx_filename, 'Translation')
    skip_time_str = meta.get_skip_time(mp4_filename)
    if skip_time_str == '':
        skip_time_str = '0:00'
    skip_time = pytimeparse.parse(skip_time_str)
    adjusted_markers = _adjust_markers(markers, clips_recorded, clips_translation, skip_time)

    timestamps_str = ''

    for marker in adjusted_markers:
        marker_time_sec = marker[0]
        marker_name = marker[1]
        if marker_time_sec is not None:
            marker_time = _seconds_to_time_stamp(marker_time_sec)
            timestamps_str += marker_time + ' — ' + marker_name + '\n'
    return timestamps_str


def _main():
    filename = 'D:\\video\\GoswamiMj-videos\\2017-03-12 goswamimj-madhusudanmj ru.sesx'
    mp4_filename = re.sub(r' ru\.sesx$', '.mp4', filename)
    print(timestamps(mp4_filename))


if __name__ == '__main__':
    _main()