hydrus/include/HydrusVideoHandling.py

#import numpy.core.multiarray # important this comes before cv!
import ClientConstants as CC
import cv2
from flvlib import tags as flv_tags
import HydrusConstants as HC
import HydrusExceptions
import HydrusImageHandling
import HydrusThreading
import matroska
import numpy
import os
import re
import subprocess
import traceback
import threading
import time
from wx import wx

if HC.PLATFORM_LINUX: FFMPEG_PATH = '"' + HC.BIN_DIR + os.path.sep + 'ffmpeg"'
elif HC.PLATFORM_OSX: FFMPEG_PATH = '"' + HC.BIN_DIR + os.path.sep + 'ffmpeg"'
elif HC.PLATFORM_WINDOWS: FFMPEG_PATH = '"' + HC.BIN_DIR + os.path.sep + 'ffmpeg.exe"'

def GetCVVideoProperties( path ):

    capture = cv2.VideoCapture( path )

    num_frames = int( capture.get( cv2.cv.CV_CAP_PROP_FRAME_COUNT ) )

    fps = capture.get( cv2.cv.CV_CAP_PROP_FPS )

    length_in_seconds = num_frames / fps

    length_in_ms = int( length_in_seconds * 1000 )

    duration = length_in_ms

    width = int( capture.get( cv2.cv.CV_CAP_PROP_FRAME_WIDTH ) )

    height = int( capture.get( cv2.cv.CV_CAP_PROP_FRAME_HEIGHT ) )

    return ( ( width, height ), duration, num_frames )

def GetFFMPEGVideoProperties( path ):

    info = Hydrusffmpeg_parse_infos( path )

    ( w, h ) = info[ 'video_size' ]

    duration_in_s = info[ 'duration' ]

    duration = int( duration_in_s * 1000 )

    num_frames = info[ 'video_nframes' ]

    return ( ( w, h ), duration, num_frames )

def GetFLVProperties( path ):

    with open( path, 'rb' ) as f:

        flv = flv_tags.FLV( f )

        script_tag = None

        for tag in flv.iter_tags():

            if isinstance( tag, flv_tags.ScriptTag ):

                script_tag = tag

                break


        width = 853
        height = 480
        duration = 0
        num_frames = 0

        if script_tag is not None:

            tag_dict = script_tag.variable

            # tag_dict can sometimes be a float?
            # it is on the broken one I tried!

            if 'width' in tag_dict: width = tag_dict[ 'width' ]
            if 'height' in tag_dict: height = tag_dict[ 'height' ]
            if 'duration' in tag_dict: duration = int( tag_dict[ 'duration' ] * 1000 )
            if 'framerate' in tag_dict: num_frames = int( ( duration / 1000.0 ) * tag_dict[ 'framerate' ] )


        return ( ( width, height ), duration, num_frames )


def GetVideoFrameDuration( path ):

    cv_video = cv2.VideoCapture( path )

    fps = cv_video.get( cv2.cv.CV_CAP_PROP_FPS )

    return 1000.0 / fps

def GetMatroskaOrWebm( path ):

    tags = matroska.parse( path )

    ebml = tags[ 'EBML' ][0]

    if ebml[ 'DocType' ][0] == 'matroska': return HC.VIDEO_MKV
    elif ebml[ 'DocType' ][0] == 'webm': return HC.VIDEO_WEBM

    raise Exception()

def GetMatroskaOrWebMProperties( path ):

    tags = matroska.parse( path )

    segment = tags['Segment'][0]

    info = segment['Info'][0]
    duration = int( ( info['Duration'][0] * info['TimecodeScale'][0] / 1e9 ) * 1000 )

    tracks = segment['Tracks'][0]
    trackentries = tracks['TrackEntry']

    for trackentry in trackentries:

        if 'Video' in trackentry:

            video = trackentry['Video'][0]

            width = video[ 'PixelWidth' ][0]
            height = video[ 'PixelHeight' ][0]

            break


    num_frames = 0

    return ( ( width, height ), duration, num_frames )

# this is cribbed from moviepy
def Hydrusffmpeg_parse_infos(filename, print_infos=False):
    """Get file infos using ffmpeg.

    Returns a dictionnary with the fields:
    "video_found", "video_fps", "duration", "video_nframes",
    "video_duration"
    "audio_found", "audio_fps"

    "video_duration" is slightly smaller than "duration" to avoid
    fetching the uncomplete frames at the end, which raises an error.

    """

    # open the file in a pipe, provoke an error, read output

    cmd = [FFMPEG_PATH, "-i", '"' + filename + '"']

    is_GIF = filename.endswith('.gif')

    if is_GIF:
        if HC.PLATFORM_WINDOWS: cmd += ["-f", "null", "NUL"]
        else: cmd += ["-f", "null", "/dev/null"]

    proc = subprocess.Popen( ' '.join( cmd ), shell = True, bufsize=10**5, stdout=subprocess.PIPE, stderr=subprocess.PIPE )

    infos = proc.stderr.read().decode('utf8')
    proc.terminate()

    del proc

    if print_infos:
        # print the whole info text returned by FFMPEG
        print( infos )

    lines = infos.splitlines()
    if "No such file or directory" in lines[-1]:
        raise IOError("%s not found ! Wrong path ?"%filename)

    result = dict()

    # get duration (in seconds)
    #   Duration: 00:00:02.46, start: 0.033000, bitrate: 1069 kb/s
    try:
        keyword = ('frame=' if is_GIF else 'Duration: ')
        line = [l for l in lines if keyword in l][0]

        if 'start:' in line:

            m = re.search( '(start\\: )' + '[0-9]\\.[0-9]*', line )

            start_offset = float( line[ m.start() + 7 : m.end() ] )

        else: start_offset = 0

        match = re.search("[0-9][0-9]:[0-9][0-9]:[0-9][0-9].[0-9][0-9]", line)
        hms = map(float, line[match.start()+1:match.end()].split(':'))

        if len(hms) == 1:
            result['duration'] = hms[0]
        elif len(hms) == 2:
            result['duration'] = 60*hms[0]+hms[1]
        elif len(hms) ==3:
            result['duration'] = 3600*hms[0]+60*hms[1]+hms[2]

        result[ 'duration' ] -= start_offset

    except:
        raise IOError("Error reading duration in file %s,"%(filename)+
                      "Text parsed: %s"%infos)

    # get the output line that speaks about video
    lines_video = [l for l in lines if ' Video: ' in l]

    result['video_found'] = ( lines_video != [] )

    if result['video_found']:

        line = lines_video[0]

        # get the size, of the form 460x320 (w x h)
        match = re.search(" [0-9]*x[0-9]*(,| )", line)
        s = list(map(int, line[match.start():match.end()-1].split('x')))
        result['video_size'] = s


        # get the frame rate
        try:
            match = re.search("( [0-9]*.| )[0-9]* tbr", line)
            result['video_fps'] = float(line[match.start():match.end()].split(' ')[1])
        except:
            match = re.search("( [0-9]*.| )[0-9]* fps", line)
            result['video_fps'] = float(line[match.start():match.end()].split(' ')[1])

        num_frames = result['duration'] * result['video_fps']

        if num_frames != int( num_frames ): num_frames += 1 # rounding up

        result['video_nframes'] = int( num_frames )

        result['video_duration'] = result['duration']
        # We could have also recomputed the duration from the number
        # of frames, as follows:
        # >>> result['video_duration'] = result['video_nframes'] / result['video_fps']


    lines_audio = [l for l in lines if ' Audio: ' in l]

    result['audio_found'] = lines_audio != []

    if result['audio_found']:
        line = lines_audio[0]
        try:
            match = re.search(" [0-9]* Hz", line)
            result['audio_fps'] = int(line[match.start()+1:match.end()])
        except:
            result['audio_fps'] = 'unknown'

    return result

class VideoContainer( HydrusImageHandling.RasterContainer ):

    BUFFER_SIZE = 1024 * 1024 * 96

    def __init__( self, media, target_resolution = None, init_position = 0 ):

        HydrusImageHandling.RasterContainer.__init__( self, media, target_resolution )

        self._frames = {}
        self._last_index_asked_for = -1
        self._buffer_start_index = -1
        self._buffer_end_index = -1

        ( x, y ) = self._target_resolution

        frame_buffer_length = self.BUFFER_SIZE / ( x * y * 3 )

        self._num_frames_backwards = frame_buffer_length * 2 / 3
        self._num_frames_forwards = frame_buffer_length / 3

        hash = self._media.GetHash()
        mime = self._media.GetMime()

        path = CC.GetFilePath( hash, mime )

        duration = self._media.GetDuration()
        num_frames = self._media.GetNumFrames()

        if self._media.GetMime() == HC.IMAGE_GIF:

            self._durations = HydrusImageHandling.GetGIFFrameDurations( self._path )

            self._renderer = GIFRenderer( path, num_frames, target_resolution )

        else:

            self._frame_duration = GetVideoFrameDuration( self._path )

            self._renderer = VideoRendererFFMPEG( path, mime, duration, num_frames, target_resolution )


        self._render_lock = threading.Lock()

        self._next_render_index = 0
        self._render_to_index = -1
        self._rendered_first_frame = False

        self.SetFramePosition( init_position )


    def _MaintainBuffer( self ):

        deletees = []

        for index in self._frames.keys():

            if self._buffer_start_index < self._buffer_end_index:

                if index < self._buffer_start_index or self._buffer_end_index < index: deletees.append( index )

            else:

                if self._buffer_end_index < index and index < self._buffer_start_index: deletees.append( index )


        for i in deletees: del self._frames[ i ]


    def _RENDERERSetRenderToPosition( self, index ):

        with self._render_lock:

            if self._render_to_index != index:

                self._render_to_index = index

                HydrusThreading.CallToThread( self.THREADRender )


    def _RENDERERSetFramePosition( self, index ):

        with self._render_lock:

            if index == self._next_render_index: return
            else:

                self._renderer.set_position( index )

                self._next_render_index = index
                self._render_to_index = index


    def THREADRender( self ):

        num_frames = self._media.GetNumFrames()

        while True:

            time.sleep( 0.00001 ) # thread yield

            with self._render_lock:

                if not self._rendered_first_frame or self._next_render_index != ( self._render_to_index + 1 ) % num_frames:

                    self._rendered_first_frame = True

                    frame_index = self._next_render_index # keep this before the get call, as it increments in a clock arithmetic way afterwards

                    try: numpy_image = self._renderer.read_frame()
                    except Exception as e:

                        HC.ShowException( e )

                        break

                    finally: self._next_render_index = ( self._next_render_index + 1 ) % num_frames

                    frame = HydrusImageHandling.GenerateHydrusBitmapFromNumPyImage( numpy_image )

                    wx.CallAfter( self.AddFrame, frame_index, frame )

                else: break


    def AddFrame( self, index, frame ): self._frames[ index ] = frame

    def GetDuration( self, index ):

        if self._media.GetMime() == HC.IMAGE_GIF: return self._durations[ index ]
        else: return self._frame_duration


    def GetFrame( self, index ):

        frame = self._frames[ index ]

        self._last_index_asked_for = index

        self._MaintainBuffer()

        return frame


    def GetHash( self ): return self._media.GetHash()

    def GetKey( self ): return ( self._media.GetHash(), self._target_resolution )

    def GetNumFrames( self ): return self._media.GetNumFrames()

    def GetResolution( self ): return self._media.GetResolution()

    def GetSize( self ): return self._target_resolution

    def GetTotalDuration( self ):

        if self._media.GetMime() == HC.IMAGE_GIF: return sum( self._durations )
        else: return self._frame_duration * self.GetNumFrames()


    def GetZoom( self ): return self._zoom

    def HasFrame( self, index ): return index in self._frames

    def IsScaled( self ): return self._zoom != 1.0

    def SetFramePosition( self, index ):

        num_frames = self.GetNumFrames()

        if num_frames > self._num_frames_backwards + 1 + self._num_frames_forwards:

            new_buffer_start_index = max( 0, index - self._num_frames_backwards ) % num_frames

            new_buffer_end_index = ( index + self._num_frames_forwards ) % num_frames

            if index == self._last_index_asked_for: return
            elif index < self._last_index_asked_for:

                if index < self._buffer_start_index:

                    self._buffer_start_index = new_buffer_start_index

                    self._RENDERERSetFramePosition( self._buffer_start_index )

                    self._buffer_end_index = new_buffer_end_index

                    self._RENDERERSetRenderToPosition( self._buffer_end_index )


            else: # index > self._last_index_asked_for

                currently_no_wraparound = self._buffer_start_index < self._buffer_end_index

                self._buffer_start_index = new_buffer_start_index

                if currently_no_wraparound:

                    if index > self._buffer_end_index:

                        self._RENDERERSetFramePosition( self._buffer_start_index )


                self._buffer_end_index = new_buffer_end_index

                self._RENDERERSetRenderToPosition( self._buffer_end_index )


        else:

            if self._buffer_end_index == -1:

                self._buffer_start_index = 0

                self._RENDERERSetFramePosition( 0 )

                self._buffer_end_index = num_frames - 1

                self._RENDERERSetRenderToPosition( self._buffer_end_index )


        self._MaintainBuffer()


# This was built from moviepy's FFMPEG_VideoReader
class VideoRendererFFMPEG( object ):

    def __init__( self, path, mime, duration, num_frames, target_resolution, pix_fmt = "rgb24" ):

        self._path = path
        self._mime = mime
        self._duration = float( duration ) / 1000.0
        self._num_frames = num_frames
        self._target_resolution = target_resolution

        self.fps = float( self._num_frames ) / self._duration

        if self.fps == 0: self.fps = 24

        self.pix_fmt = pix_fmt

        if pix_fmt == 'rgba': self.depth = 4
        else: self.depth = 3

        ( x, y ) = self._target_resolution
        bufsize = self.depth * x * y

        self.process = None

        self.bufsize = bufsize

        self.initialize()


    def __del__( self ):

        self.close()


    def close(self):

        if self.process is not None:

            self.process.terminate()

            self.process.stdout.close()
            self.process.stderr.close()

            self.process = None


    def initialize( self, start_index = 0 ):

        self.close()

        if self._mime == HC.IMAGE_GIF:

            ss = 0
            self.pos = 0
            skip_frames = start_index

        else:

            ss = float( start_index ) / self.fps
            self.pos = start_index
            skip_frames = 0


        ( w, h ) = self._target_resolution

        cmd = ( [ FFMPEG_PATH,
            '-ss', "%.03f" % ss,
            '-i', '"' + self._path + '"',
            '-loglevel', 'quiet',
            '-f', 'image2pipe',
            "-pix_fmt", self.pix_fmt,
            "-s", str( w ) + 'x' + str( h ),
            '-vcodec', 'rawvideo', '-' ] )

        self.process = subprocess.Popen( ' '.join( cmd ), shell = True, bufsize= self.bufsize, stdout=subprocess.PIPE, stderr=subprocess.PIPE )

        self.skip_frames( skip_frames )


    def skip_frames( self, n ):

        ( w, h ) = self._target_resolution

        for i in range( n ):

            self.process.stdout.read( self.depth * w * h )

            self.process.stdout.flush()

            self.pos += 1


    def read_frame( self ):

        if self.pos == self._num_frames: self.initialize()

        if self.process is None: result = self.lastread
        else:

            ( w, h ) = self._target_resolution

            nbytes = self.depth * w * h

            s = self.process.stdout.read(nbytes)

            if len(s) != nbytes:

                print( "Warning: in file %s, "%(self._path)+
                       "%d bytes wanted but %d bytes read,"%(nbytes, len(s))+
                       "at frame %d/%d, at time %.02f/%.02f sec. "%(
                        self.pos,self._num_frames,
                        1.0*self.pos/self.fps,
                        self._duration)+
                       "Using the last valid frame instead.")

                result = self.lastread

                self.close()

            else:

                result = numpy.fromstring( s, dtype = 'uint8' ).reshape( ( h, w, len( s ) // ( w * h ) ) )

                self.lastread = result


        self.pos += 1

        return result


    def set_position( self, pos ):

        rewind = pos < self.pos
        jump_a_long_way_ahead = pos > self.pos + 60

        if rewind or jump_a_long_way_ahead: self.initialize( pos )
        else: self.skip_frames( pos - self.pos )


class GIFRenderer( object ):

    def __init__( self, path, num_frames, target_resolution ):

        self._path = path
        self._num_frames = num_frames
        self._target_resolution = target_resolution

        self._cv_mode = True

        self._InitialiseCV()


    def _GetCurrentFrame( self ):

        if self._cv_mode:

            ( retval, numpy_image ) = self._cv_video.read()

            if not retval:

                self._next_render_index = ( self._next_render_index + 1 ) % self._num_frames

                raise HydrusExceptions.CantRenderWithCVException( 'CV could not render frame ' + HC.u( self._next_render_index - 1 ) + '.' )


        else:

            if self._pil_image.mode == 'P' and 'transparency' in self._pil_image.info:

                # I think gif problems are around here somewhere; the transparency info is not converted to RGBA properly, so it starts drawing colours when it should draw nothing

                current_frame = self._pil_image.convert( 'RGBA' )

                if self._pil_canvas is None: self._pil_canvas = current_frame
                else: self._pil_canvas.paste( current_frame, None, current_frame ) # use the rgba image as its own mask

            else: self._pil_canvas = self._pil_image

            numpy_image = HydrusImageHandling.GenerateNumPyImageFromPILImage( self._pil_canvas )


        self._next_render_index = ( self._next_render_index + 1 ) % self._num_frames

        if self._next_render_index == 0:

            self._RewindGIF()

        else:

            if not self._cv_mode:

                self._pil_image.seek( self._next_render_index )

                if self._pil_image.palette == self._pil_global_palette: # for some reason, when pil falls back from local palette to global palette, a bunch of important variables reset!

                    pil_image.palette.dirty = self._pil_dirty
                    pil_image.palette.mode = self._pil_mode
                    pil_image.palette.rawmode = self._pil_rawmode


        return numpy_image


    def _InitialiseCV( self ):

        self._cv_video = cv2.VideoCapture( self._path )

        self._cv_video.set( cv2.cv.CV_CAP_PROP_CONVERT_RGB, True )

        self._next_render_index = 0
        self._last_frame = None


    def _InitialisePIL( self ):

        self._pil_image = HydrusImageHandling.GeneratePILImage( self._path )

        self._pil_canvas = None

        self._pil_global_palette = self._pil_image.palette

        self._pil_dirty = self._pil_image.palette.dirty
        self._pil_mode = self._pil_image.palette.mode
        self._pil_rawmode = self._pil_image.palette.rawmode

        self._next_render_index = 0
        self._last_frame = None

        # believe it or not, doing this actually fixed a couple of gifs!
        self._pil_image.seek( 1 )
        self._pil_image.seek( 0 )


    def _RenderCurrentFrame( self ):

        if self._cv_mode:

            try:

                numpy_image = self._GetCurrentFrame()

                numpy_image = HydrusImageHandling.EfficientlyResizeNumpyImage( numpy_image, self._target_resolution )

                numpy_image = cv2.cvtColor( numpy_image, cv2.COLOR_BGR2RGB )

                self._last_frame = numpy_image

            except HydrusExceptions.CantRenderWithCVException:

                if self._last_frame is None:

                    self._cv_mode = False

                    self._InitialisePIL()

                    return self._RenderCurrentFrame()

                else: numpy_image = self._last_frame


        else:

            numpy_image = self._GetCurrentFrame()

            numpy_image = HydrusImageHandling.EfficientlyResizeNumpyImage( numpy_image, self._target_resolution )

            self._last_frame = numpy_image


        return numpy_image


    def _RewindGIF( self ):

        if self._cv_mode:

            self._cv_video.release()
            self._cv_video.open( self._path )

            self._next_render_index = 0

            #self._cv_video.set( cv2.cv.CV_CAP_PROP_POS_FRAMES, 0.0 )

        else:

            self._pil_image.seek( 0 )


    def read_frame( self ): return self._RenderCurrentFrame()

    def set_position( self, index ):

        if index == self._next_render_index: return
        elif index < self._next_render_index: self._RewindGIF()

        while self._next_render_index < index: self._GetCurrentFrame()

        #self._cv_video.set( cv2.cv.CV_CAP_PROP_POS_FRAMES, index )