hydrus/hydrus/core/HydrusVideoHandling.py

1322 lines
38 KiB
Python

import numpy
import os
import re
import struct
import subprocess
from hydrus.core import HydrusAudioHandling
from hydrus.core import HydrusConstants as HC
from hydrus.core import HydrusData
from hydrus.core import HydrusExceptions
from hydrus.core import HydrusText
from hydrus.core import HydrusThreading
FFMPEG_MISSING_ERROR_PUBBED = False
FFMPEG_NO_CONTENT_ERROR_PUBBED = False
if HC.PLATFORM_WINDOWS:
FFMPEG_PATH = os.path.join( HC.BIN_DIR, 'ffmpeg.exe' )
else:
FFMPEG_PATH = os.path.join( HC.BIN_DIR, 'ffmpeg' )
if not os.path.exists( FFMPEG_PATH ):
FFMPEG_PATH = os.path.basename( FFMPEG_PATH )
def CheckFFMPEGError( lines ):
if len( lines ) == 0:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Could not parse that file--no FFMPEG output given.' )
if "No such file or directory" in lines[-1]:
raise IOError( "File not found!" )
if 'Invalid data' in lines[-1]:
raise HydrusExceptions.DamagedOrUnusualFileException( 'FFMPEG could not parse.' )
def GetAPNGChunks( file_header_bytes: bytes ):
# https://wiki.mozilla.org/APNG_Specification
# a chunk is:
# 4 bytes of data size, unsigned int
# 4 bytes of chunk name
# n bytes of data
# 4 bytes of CRC
# lop off 8 bytes of 'this is a PNG' at the top
remaining_chunk_bytes = file_header_bytes[8:]
chunks = []
while len( remaining_chunk_bytes ) > 12:
( num_data_bytes, ) = struct.unpack( '>I', remaining_chunk_bytes[ : 4 ] )
chunk_name = remaining_chunk_bytes[ 4 : 8 ]
chunk_data = remaining_chunk_bytes[ 8 : 8 + num_data_bytes ]
chunks.append( ( chunk_name, chunk_data ) )
remaining_chunk_bytes = remaining_chunk_bytes[ 8 + num_data_bytes + 4 : ]
return chunks
def GetAPNGACTLChunkData( file_header_bytes: bytes ):
# the acTL chunk can be in different places, but it has to be near the top
# although it is almost always in fixed position (I think byte 29), we have seen both pHYs and sRGB chunks appear before it
# so to be proper we need to parse chunks and find the right one
apng_actl_chunk_header = b'acTL'
chunks = GetAPNGChunks( file_header_bytes )
chunks = dict( chunks )
if apng_actl_chunk_header in chunks:
return chunks[ apng_actl_chunk_header ]
else:
return None
def GetAPNGDuration( apng_bytes: bytes ):
frame_control_chunk_name = b'fcTL'
chunks = GetAPNGChunks( apng_bytes )
total_duration = 0
for ( chunk_name, chunk_data ) in chunks:
if chunk_name == frame_control_chunk_name and len( chunk_data ) >= 24:
( delay_numerator, ) = struct.unpack( '>H', chunk_data[20:22] )
( delay_denominator, ) = struct.unpack( '>H', chunk_data[22:24] )
if delay_denominator == 0:
duration = 0.1
else:
duration = delay_numerator / delay_denominator
total_duration += duration
return total_duration
def GetAPNGNumFrames( apng_actl_bytes: bytes ):
( num_frames, ) = struct.unpack( '>I', apng_actl_bytes[ : 4 ] )
return num_frames
def GetFFMPEGVersion():
cmd = [ FFMPEG_PATH, '-version' ]
HydrusData.CheckProgramIsNotShuttingDown()
try:
sbp_kwargs = HydrusData.GetSubprocessKWArgs( text = True )
process = subprocess.Popen( cmd, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, **sbp_kwargs )
except FileNotFoundError:
return 'no ffmpeg found at path "{}"'.format( FFMPEG_PATH )
except Exception as e:
HydrusData.ShowException( e )
return 'unable to execute ffmpeg at path "{}"'.format( FFMPEG_PATH )
( stdout, stderr ) = HydrusThreading.SubprocessCommunicate( process )
del process
lines = stdout.splitlines()
if len( lines ) > 0:
# typically 'ffmpeg version [VERSION] Copyright ...
top_line = lines[0]
if top_line.startswith( 'ffmpeg version ' ):
top_line = top_line.replace( 'ffmpeg version ', '' )
if ' ' in top_line:
version_string = top_line.split( ' ' )[0]
return version_string
message = 'FFMPEG was recently contacted to fetch version information. While FFMPEG could be found, the response could not be understood. Significant debug information has been printed to the log, which hydrus_dev would be interested in.'
HydrusData.ShowText( message )
message += os.linesep * 2
message += str( sbp_kwargs )
message += os.linesep * 2
message += str( os.environ )
message += os.linesep * 2
message += 'STDOUT Response: {}'.format( stdout )
message += os.linesep * 2
message += 'STDERR Response: {}'.format( stderr )
HydrusData.Print( message )
global FFMPEG_NO_CONTENT_ERROR_PUBBED
FFMPEG_NO_CONTENT_ERROR_PUBBED = True
return 'unknown'
# bits of this were originally cribbed from moviepy
def GetFFMPEGInfoLines( path, count_frames_manually = False, only_first_second = False ):
# open the file in a pipe, provoke an error, read output
cmd = [ FFMPEG_PATH, "-i", path ]
if only_first_second:
cmd.insert( 1, '-t' )
cmd.insert( 2, '1' )
if count_frames_manually:
# added -an here to remove audio component, which was sometimes causing convert fails on single-frame music webms
if HC.PLATFORM_WINDOWS:
cmd += [ "-vf", "scale=-2:120", "-an", "-f", "null", "NUL" ]
else:
cmd += [ "-vf", "scale=-2:120", "-an", "-f", "null", "/dev/null" ]
sbp_kwargs = HydrusData.GetSubprocessKWArgs()
HydrusData.CheckProgramIsNotShuttingDown()
try:
process = subprocess.Popen( cmd, bufsize = 10**5, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, **sbp_kwargs )
except FileNotFoundError as e:
global FFMPEG_MISSING_ERROR_PUBBED
if not FFMPEG_MISSING_ERROR_PUBBED:
message = 'FFMPEG, which hydrus uses to parse and render video, was not found! This may be due to it not being available on your system, or hydrus being unable to find it.'
message += os.linesep * 2
if HC.PLATFORM_WINDOWS:
message += 'You are on Windows, so there should be a copy of ffmpeg.exe in your install_dir/bin folder. If not, please check if your anti-virus has removed it and restore it through a new install.'
else:
message += 'If you are certain that FFMPEG is installed on your OS and accessible in your PATH, please let hydrus_dev know, as this problem is likely due to an environment problem. You may be able to solve this problem immediately by putting a static build of the ffmpeg executable in your install_dir/bin folder.'
message += os.linesep * 2
message += 'You can check your current FFMPEG status through help->about.'
HydrusData.ShowText( message )
FFMPEG_MISSING_ERROR_PUBBED = True
raise FileNotFoundError( 'Cannot interact with video because FFMPEG not found--are you sure it is installed? Full error: ' + str( e ) )
( stdout, stderr ) = HydrusThreading.SubprocessCommunicate( process )
data_bytes = stderr
if len( data_bytes ) == 0:
global FFMPEG_NO_CONTENT_ERROR_PUBBED
if not FFMPEG_NO_CONTENT_ERROR_PUBBED:
message = 'FFMPEG, which hydrus uses to parse and render video, did not return any data on a recent file metadata check! More debug info has been written to the log.'
message += os.linesep * 2
message += 'You can check this info again through help->about.'
HydrusData.ShowText( message )
message += os.linesep * 2
message += str( sbp_kwargs )
message += os.linesep * 2
message += str( os.environ )
message += os.linesep * 2
message += 'STDOUT Response: {}'.format( stdout )
message += os.linesep * 2
message += 'STDERR Response: {}'.format( stderr )
HydrusData.DebugPrint( message )
FFMPEG_NO_CONTENT_ERROR_PUBBED = True
raise HydrusExceptions.DataMissing( 'Cannot interact with video because FFMPEG did not return any content.' )
del process
( text, encoding ) = HydrusText.NonFailingUnicodeDecode( data_bytes, 'utf-8' )
lines = text.splitlines()
CheckFFMPEGError( lines )
return lines
def GetFFMPEGAPNGProperties( path ):
with open( path, 'rb' ) as f:
file_header_bytes = f.read( 256 )
apng_actl_bytes = GetAPNGACTLChunkData( file_header_bytes )
if apng_actl_bytes is None:
raise HydrusExceptions.DamagedOrUnusualFileException( 'This APNG had an unusual file header!' )
num_frames = GetAPNGNumFrames( apng_actl_bytes )
with open( path, 'rb' ) as f:
file_bytes = f.read()
duration = GetAPNGDuration( file_bytes )
lines = GetFFMPEGInfoLines( path )
resolution = ParseFFMPEGVideoResolution( lines, png_ok = True )
duration_in_ms = int( duration * 1000 )
has_audio = False
return ( resolution, duration_in_ms, num_frames, has_audio )
def GetFFMPEGVideoProperties( path, force_count_frames_manually = False ):
lines_for_first_second = GetFFMPEGInfoLines( path, count_frames_manually = True, only_first_second = True )
( has_video, video_format ) = ParseFFMPEGVideoFormat( lines_for_first_second )
if not has_video:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Wanted to parse video data, but file did not appear to have a video stream!' )
resolution = ParseFFMPEGVideoResolution( lines_for_first_second )
( file_duration_in_s, stream_duration_in_s ) = ParseFFMPEGDuration( lines_for_first_second )
# this will have to be fixed when I add audio, and dynamically accounted for on dual vid/audio rendering
duration = stream_duration_in_s
( fps, confident_fps ) = ParseFFMPEGFPS( lines_for_first_second )
if duration is None and not confident_fps:
# ok default to fall back on
( fps, confident_fps ) = ( 24, True )
if fps is None or fps == 0:
fps = 1
if duration is None:
force_count_frames_manually = True
else:
num_frames_estimate = int( duration * fps )
# if file is big or long, don't try to force a manual count when one not explicitly asked for
# we don't care about a dropped frame on a 10min vid tbh
num_frames_seems_ok_to_count = duration < 15 or num_frames_estimate < 2400
file_is_ok_size = os.path.getsize( path ) < 128 * 1024 * 1024
if num_frames_seems_ok_to_count and file_is_ok_size:
last_frame_has_unusual_duration = num_frames_estimate != duration * fps
unusual_video_start = file_duration_in_s != stream_duration_in_s
if not confident_fps or last_frame_has_unusual_duration or unusual_video_start:
force_count_frames_manually = True
if force_count_frames_manually:
lines = GetFFMPEGInfoLines( path, count_frames_manually = True )
num_frames = ParseFFMPEGNumFramesManually( lines )
if duration is None:
duration = num_frames / fps
else:
num_frames = int( duration * fps )
duration_in_ms = int( duration * 1000 )
has_audio = VideoHasAudio( path, lines_for_first_second )
return ( resolution, duration_in_ms, num_frames, has_audio )
def GetMime( path ):
lines = GetFFMPEGInfoLines( path )
try:
mime_text = ParseFFMPEGMimeText( lines )
except HydrusExceptions.UnsupportedFileException:
return HC.APPLICATION_UNKNOWN
( has_video, video_format ) = ParseFFMPEGVideoFormat( lines )
( has_audio, audio_format ) = HydrusAudioHandling.ParseFFMPEGAudio( lines )
if 'matroska' in mime_text or 'webm' in mime_text:
# a webm has at least vp8/vp9 video and optionally vorbis audio
has_webm_video = False
if has_video:
webm_video_formats = ( 'vp8', 'vp9' )
has_webm_video = True in ( webm_video_format in video_format for webm_video_format in webm_video_formats )
if has_audio:
webm_audio_formats = ( 'vorbis', 'opus' )
has_webm_audio = True in ( webm_audio_format in audio_format for webm_audio_format in webm_audio_formats )
else:
# no audio at all is not a vote against webm
has_webm_audio = True
if has_webm_video and has_webm_audio:
return HC.VIDEO_WEBM
else:
if has_video:
return HC.VIDEO_MKV
elif has_audio:
return HC.AUDIO_MKV
elif mime_text in ( 'mpeg', 'mpegvideo', 'mpegts' ):
return HC.VIDEO_MPEG
elif mime_text == 'flac':
return HC.AUDIO_FLAC
elif mime_text == 'wav':
return HC.AUDIO_WAVE
elif mime_text == 'mp3':
return HC.AUDIO_MP3
elif mime_text == 'tta':
return HC.AUDIO_TRUEAUDIO
elif 'mp4' in mime_text:
container = ParseFFMPEGMetadataContainer( lines )
if container == 'M4A':
return HC.AUDIO_M4A
elif container == 'qt':
return HC.VIDEO_MOV
elif container in ( 'isom', 'mp42' ): # mp42 is version 2 of mp4 standard
if has_video:
return HC.VIDEO_MP4
elif has_audio:
return HC.AUDIO_MP4
if has_audio and 'mjpeg' in video_format:
return HC.AUDIO_M4A
elif has_video:
return HC.VIDEO_MP4
elif has_audio:
return HC.AUDIO_MP4
elif mime_text == 'ogg':
if has_video:
return HC.VIDEO_OGV
else:
return HC.AUDIO_OGG
elif 'rm' in mime_text:
if ParseFFMPEGHasVideo( lines ):
return HC.VIDEO_REALMEDIA
else:
return HC.AUDIO_REALMEDIA
elif mime_text == 'asf':
if ParseFFMPEGHasVideo( lines ):
return HC.VIDEO_WMV
else:
return HC.AUDIO_WMA
return HC.APPLICATION_UNKNOWN
def HasVideoStream( path ):
lines = GetFFMPEGInfoLines( path )
return ParseFFMPEGHasVideo( lines )
def RenderImageToPNGPath( path, temp_png_path ):
# -y to overwrite the temp path
cmd = [ FFMPEG_PATH, '-y', "-i", path, temp_png_path ]
sbp_kwargs = HydrusData.GetSubprocessKWArgs()
HydrusData.CheckProgramIsNotShuttingDown()
try:
process = subprocess.Popen( cmd, bufsize = 10**5, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, **sbp_kwargs )
except FileNotFoundError as e:
global FFMPEG_MISSING_ERROR_PUBBED
if not FFMPEG_MISSING_ERROR_PUBBED:
message = 'FFMPEG, which hydrus uses to parse and render video, was not found! This may be due to it not being available on your system, or hydrus being unable to find it.'
message += os.linesep * 2
if HC.PLATFORM_WINDOWS:
message += 'You are on Windows, so there should be a copy of ffmpeg.exe in your install_dir/bin folder. If not, please check if your anti-virus has removed it and restore it through a new install.'
else:
message += 'If you are certain that FFMPEG is installed on your OS and accessible in your PATH, please let hydrus_dev know, as this problem is likely due to an environment problem. You may be able to solve this problem immediately by putting a static build of the ffmpeg executable in your install_dir/bin folder.'
message += os.linesep * 2
message += 'You can check your current FFMPEG status through help->about.'
HydrusData.ShowText( message )
FFMPEG_MISSING_ERROR_PUBBED = True
raise FileNotFoundError( 'Cannot interact with video because FFMPEG not found--are you sure it is installed? Full error: ' + str( e ) )
( stdout, stderr ) = HydrusThreading.SubprocessCommunicate( process )
def ParseFFMPEGDuration( lines ):
# get duration (in seconds)
# Duration: 00:00:02.46, start: 0.033000, bitrate: 1069 kb/s
try:
# had a vid with 'Duration:' in title, ha ha, so now a regex
line = [ l for l in lines if re.search( r'^\s*Duration:', l ) is not None ][0]
if 'Duration: N/A' in line:
return ( None, None )
if 'start:' in line:
m = re.search( r'(start: )-?[0-9]+\.[0-9]*', line )
start_offset = float( line[ m.start() + 7 : m.end() ] )
else:
start_offset = 0
match = re.search("[0-9]+:[0-9][0-9]:[0-9][0-9].[0-9][0-9]", line)
hms = [ float( float_string ) for float_string in line[match.start():match.end()].split(':') ]
duration = 0
if len( hms ) == 1:
duration = hms[0]
elif len( hms ) == 2:
duration = 60 * hms[0] + hms[1]
elif len( hms ) == 3:
duration = 3600 * hms[0] + 60 * hms[1] + hms[2]
if duration == 0:
return ( None, None )
if start_offset > 0.85 * duration:
# as an example, Duration: 127:57:31.25, start: 460633.291000 lmao
return ( None, None )
# we'll keep this for now I think
if start_offset > 1:
start_offset = 0
file_duration = duration + start_offset
stream_duration = duration
return ( file_duration, stream_duration )
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Error reading duration!' )
def ParseFFMPEGFPS( lines, png_ok = False ):
try:
line = ParseFFMPEGVideoLine( lines, png_ok = png_ok )
( possible_results, confident ) = ParseFFMPEGFPSPossibleResults( line )
if len( possible_results ) == 0:
fps = 1
confident = False
else:
fps = min( possible_results )
return ( fps, confident )
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Error estimating framerate!' )
def ParseFFMPEGFPSFromFirstSecond( lines_for_first_second ):
try:
line = ParseFFMPEGVideoLine( lines_for_first_second )
( possible_results, confident ) = ParseFFMPEGFPSPossibleResults( line )
num_frames_in_first_second = ParseFFMPEGNumFramesManually( lines_for_first_second )
if len( possible_results ) == 0:
fps = num_frames_in_first_second
confident = False
else:
# in some cases, fps is 0.77 and tbr is incorrectly 20. extreme values cause bad results. let's default to slowest, but test our actual first second for most legit-looking
sensible_first_second = 1 <= num_frames_in_first_second <= 288
fps = min( possible_results )
fps_matches_with_first_second = False
for possible_fps in possible_results:
if num_frames_in_first_second - 1 <= possible_fps <= num_frames_in_first_second + 1:
fps = possible_fps
fps_matches_with_first_second = True
break
confident = sensible_first_second and fps_matches_with_first_second
if fps is None or fps == 0:
fps = 1
confident = False
return ( fps, confident )
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Error estimating framerate!' )
def ParseFFMPEGFPSPossibleResults( video_line ):
# get the frame rate
possible_results = set()
match = re.search("( [0-9]*.| )[0-9]* tbr", video_line)
if match is not None:
tbr = video_line[match.start():match.end()].split(' ')[1]
tbr_fps_is_likely_garbage = match is None or tbr.endswith( 'k' ) or float( tbr ) > 144
if not tbr_fps_is_likely_garbage:
possible_results.add( float( tbr ) )
#
match = re.search("( [0-9]*.| )[0-9]* fps", video_line)
if match is not None:
fps = video_line[match.start():match.end()].split(' ')[1]
fps_is_likely_garbage = match is None or fps.endswith( 'k' ) or float( fps ) > 144
if not fps_is_likely_garbage:
possible_results.add( float( fps ) )
possible_results.discard( 0 )
if len( possible_results ) == 0:
confident = False
else:
# if we have 60 and 59.99, that's fine mate
max_fps = max( possible_results )
if False not in ( possible_fps >= max_fps * 0.95 for possible_fps in possible_results ):
confident = True
else:
confident = len( possible_results ) <= 1
return ( possible_results, confident )
def ParseFFMPEGHasVideo( lines ):
try:
ParseFFMPEGVideoLine( lines )
except HydrusExceptions.UnsupportedFileException:
return False
return True
def ParseFFMPEGMetadataContainer( lines ) -> str:
# Metadata:
# major_brand : isom
match_metadata_line_re = r'\s*Metadata:\s*'
metadata_line_index = None
for ( i, line ) in enumerate( lines ):
if re.match( match_metadata_line_re, line ) is not None:
metadata_line_index = i
break
if metadata_line_index is None:
return ''
match_major_brand_re = r'\s*major_brand\s*:.+'
for line in lines[ metadata_line_index : ]:
if re.match( match_major_brand_re, line ) is not None:
container = line.split( ':', 1 )[1].strip()
return container
return ''
def ParseFFMPEGMimeText( lines ):
try:
( input_line, ) = [ l for l in lines if l.startswith( 'Input #0' ) ]
# Input #0, matroska, webm, from 'm.mkv':
text = input_line[10:]
mime_text = text.split( ', from' )[0]
return mime_text
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Error reading file type!' )
def ParseFFMPEGNumFramesManually( lines ):
frame_lines = [ line for line in lines if line.startswith( 'frame=' ) ]
if len( frame_lines ) == 0:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Video appears to be broken and non-renderable--perhaps a damaged single-frame video?' )
final_line = frame_lines[-1] # there will be many progress rows, counting up as the file renders. we hence want the final one
line = final_line
line = line.replace( 'frame=', '' )
while line.startswith( ' ' ):
line = line[1:]
try:
frames_string = line.split( ' ' )[0]
num_frames = int( frames_string )
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Video was unable to render correctly--could not parse ffmpeg output line: "{}"'.format( final_line ) )
return num_frames
def ParseFFMPEGVideoFormat( lines ):
try:
line = ParseFFMPEGVideoLine( lines )
except HydrusExceptions.UnsupportedFileException:
return ( False, 'unknown' )
try:
match = re.search( r'(?<=Video:\s).+?(?=,)', line )
video_format = match.group()
except:
video_format = 'unknown'
return ( True, video_format )
def ParseFFMPEGVideoLine( lines, png_ok = False ):
if png_ok:
bad_video_formats = [ 'jpg' ]
else:
bad_video_formats = [ 'png', 'jpg' ]
# get the output line that speaks about video
# the ^\sStream is to exclude the 'title' line, when it exists, includes the string 'Video: ', ha ha
lines_video = [ l for l in lines if re.search( r'^\s*Stream', l ) is not None and 'Video: ' in l and True not in ( 'Video: {}'.format( bad_video_format ) in l for bad_video_format in bad_video_formats ) ] # mp3 says it has a 'png' video stream
if len( lines_video ) == 0:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Could not find video information!' )
line = lines_video[0]
return line
def ParseFFMPEGVideoResolution( lines, png_ok = False ):
try:
line = ParseFFMPEGVideoLine( lines, png_ok = png_ok )
# get the size, of the form 460x320 (w x h)
match = re.search(" [0-9]*x[0-9]*([, ])", line)
resolution_string = line[match.start():match.end()-1]
( width_string, height_string ) = resolution_string.split( 'x' )
width = int( width_string )
height = int( height_string )
# if a vid has an SAR, this 'sample' aspect ratio basically just stretches it
# when you convert the width using SAR, the resulting resolution should match the DAR, 'display' aspect ratio, which is what we actually want in final product
# MPC-HC seems to agree with this calculation, Firefox does not
# examples:
# ' Stream #0:0: Video: hevc (Main), yuv420p(tv, bt709), 1280x720 [SAR 69:80 DAR 23:15], 30 fps, 30 tbr, 1k tbn (default)'
# ' Stream #0:0: Video: vp9 (Profile 0), yuv420p(tv, progressive), 1120x1080, SAR 10:11 DAR 280:297, 30 fps, 30 tbr, 1k tbn (default)'
sar_match = re.search( "[\\[\\s]SAR [0-9]*:[0-9]*[,\\s]", line )
if sar_match is not None:
# ' SAR 2:3 '
sar_string = line[ sar_match.start() : sar_match.end() ]
# '2:3'
sar_string = sar_string[5:-1]
( sar_width_string, sar_height_string ) = sar_string.split( ':' )
sar_width = int( sar_width_string )
sar_height = int( sar_height_string )
width *= sar_width
width //= sar_height
return ( width, height )
except:
raise HydrusExceptions.DamagedOrUnusualFileException( 'Error parsing resolution!' )
def VideoHasAudio( path, info_lines ):
( audio_found, audio_format ) = HydrusAudioHandling.ParseFFMPEGAudio( info_lines )
if not audio_found:
return False
# just because video metadata has an audio stream doesn't mean it has audio. some vids have silent audio streams lmao
# so, let's read it as PCM and see if there is any noise
# this obviously only works for single audio stream vids, we'll adapt this if someone discovers a multi-stream mkv with a silent channel that doesn't work here
cmd = [ FFMPEG_PATH ]
# this is perhaps not sensible for eventual playback and I should rather go for wav file-like and feed into python 'wave' in order to maintain stereo/mono and so on and have easy chunk-reading
cmd.extend( [ '-i', path,
'-loglevel', 'quiet',
'-f', 's16le',
'-' ] )
sbp_kwargs = HydrusData.GetSubprocessKWArgs()
HydrusData.CheckProgramIsNotShuttingDown()
try:
process = subprocess.Popen( cmd, bufsize = 65536, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, **sbp_kwargs )
except FileNotFoundError as e:
HydrusData.ShowText( 'Cannot render audio--FFMPEG not found!' )
raise
# silent PCM data is just 00 bytes
# every now and then, you'll get a couple ffs for some reason, but this is not legit audio data
try:
chunk_of_pcm_data = process.stdout.read( 65536 )
while len( chunk_of_pcm_data ) > 0:
# iterating over bytes gives you ints, recall
# this used to be 'if not 0 or 255', but I found some that had 1 too, so let's just change the tolerance to reduce false positives
if True in ( 5 <= b <= 250 for b in chunk_of_pcm_data ):
return True
chunk_of_pcm_data = process.stdout.read( 65536 )
return False
finally:
process.terminate()
process.stdout.close()
process.stderr.close()
# This was built from moviepy's FFMPEG_VideoReader
class VideoRendererFFMPEG( object ):
def __init__( self, path, mime, duration, num_frames, target_resolution, pix_fmt = "rgb24", clip_rect = None ):
self._path = path
self._mime = mime
self._duration = duration / 1000.0
self._num_frames = num_frames
self._target_resolution = target_resolution
self._clip_rect = clip_rect
self.lastread = None
self.fps = self._num_frames / self._duration
if self.fps == 0:
self.fps = 24
self.pix_fmt = pix_fmt
if pix_fmt == 'rgba': self.depth = 4
else: self.depth = 3
( x, y ) = self._target_resolution
bufsize = self.depth * x * y
self.process = None
self.bufsize = bufsize
self.initialize()
def close( self ):
if self.process is not None:
self.process.terminate()
self.process.stdout.close()
self.process.stderr.close()
self.process = None
def initialize( self, start_index = 0 ):
self.close()
if self._mime in ( HC.IMAGE_APNG, HC.IMAGE_GIF ):
do_ss = False
ss = 0
self.pos = 0
skip_frames = start_index
else:
if start_index == 0:
do_ss = False
else:
do_ss = True
ss = start_index / self.fps
self.pos = start_index
skip_frames = 0
do_fast_seek = True
( w, h ) = self._target_resolution
cmd = [ FFMPEG_PATH ]
if do_ss and do_fast_seek: # fast seek
cmd.extend( [ '-ss', "%.03f" % ss ] )
cmd.extend( [ '-i', self._path ] )
if do_ss and not do_fast_seek: # slow seek
cmd.extend( [ '-ss', "%.03f" % ss ] )
if self._clip_rect is not None:
( clip_x, clip_y, clip_width, clip_height ) = self._clip_rect
cmd.extend( [ '-vf', 'crop={}:{}:{}:{}'.format( clip_width, clip_height, clip_x, clip_y ) ] )
cmd.extend( [
'-loglevel', 'quiet',
'-f', 'image2pipe',
"-pix_fmt", self.pix_fmt,
"-s", str( w ) + 'x' + str( h ),
'-vsync', '0',
'-vcodec', 'rawvideo',
'-'
] )
sbp_kwargs = HydrusData.GetSubprocessKWArgs()
HydrusData.CheckProgramIsNotShuttingDown()
try:
self.process = subprocess.Popen( cmd, bufsize = self.bufsize, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, **sbp_kwargs )
except FileNotFoundError as e:
HydrusData.ShowText( 'Cannot render video--FFMPEG not found!' )
raise
if skip_frames > 0:
self.skip_frames( skip_frames )
def skip_frames( self, n ):
n = int( n )
( w, h ) = self._target_resolution
for i in range( n ):
if self.process is not None:
self.process.stdout.read( self.depth * w * h )
self.process.stdout.flush()
self.pos += 1
def read_frame( self ):
if self.pos == self._num_frames:
self.initialize()
if self.process is None:
result = self.lastread
else:
( w, h ) = self._target_resolution
nbytes = self.depth * w * h
s = self.process.stdout.read( nbytes )
if len(s) != nbytes:
if self.lastread is None:
if self.pos != 0:
# this renderer was asked to render starting from mid-vid and this was not possible due to broken key frame index whatever
# lets try and render from the vid start before we say the whole vid is broke
# I tried doing 'start from 0 and skip n frames', but this is super laggy so would need updates further up the pipe to display this to the user
# atm this error states does not communicate to the videocontainer that the current frame num has changed, so the frames are henceforth out of phase
#frames_to_jump = self.pos
self.set_position( 0 )
return self.read_frame()
raise Exception( 'Unable to render that video! Please send it to hydrus dev so he can look at it!' )
result = self.lastread
self.close()
else:
result = numpy.fromstring( s, dtype = 'uint8' ).reshape( ( h, w, len( s ) // ( w * h ) ) )
self.lastread = result
self.pos += 1
return result
def set_position( self, pos ):
rewind = pos < self.pos
jump_a_long_way_ahead = pos > self.pos + 60
if rewind or jump_a_long_way_ahead:
self.initialize( pos )
else:
self.skip_frames( pos - self.pos )
def Stop( self ):
self.close()