2003-02-03 10:27:50 +00:00
////////// Codec-specific routines used to interface between "MPlayer"
2005-09-23 22:35:04 +00:00
////////// and the "LIVE555 Streaming Media" libraries:
2003-02-03 10:27:50 +00:00
# include "demux_rtp_internal.h"
extern " C " {
2007-01-15 04:57:43 +00:00
# include <limits.h>
2007-01-23 22:26:13 +00:00
# include <math.h>
2003-02-03 10:27:50 +00:00
# include "stheader.h"
}
2003-03-11 19:08:31 +00:00
static void
needVideoFrameRate ( demuxer_t * demuxer , MediaSubsession * subsession ) ; // forward
2003-02-03 10:27:50 +00:00
static Boolean
parseQTState_video ( QuickTimeGenericRTPSource : : QTState const & qtState ,
unsigned & fourcc ) ; // forward
static Boolean
parseQTState_audio ( QuickTimeGenericRTPSource : : QTState const & qtState ,
unsigned & fourcc , unsigned & numChannels ) ; // forward
2007-02-20 20:21:15 +00:00
static BITMAPINFOHEADER * insertVideoExtradata ( BITMAPINFOHEADER * bih ,
unsigned char * extraData ,
unsigned size )
{
BITMAPINFOHEADER * original = bih ;
if ( ! size | | size > INT_MAX - sizeof ( BITMAPINFOHEADER ) )
return bih ;
bih = ( BITMAPINFOHEADER * ) realloc ( bih , sizeof ( BITMAPINFOHEADER ) + size ) ;
if ( ! bih )
return original ;
bih - > biSize = sizeof ( BITMAPINFOHEADER ) + size ;
memcpy ( bih + 1 , extraData , size ) ;
return bih ;
}
2003-02-03 10:27:50 +00:00
void rtpCodecInitialize_video ( demuxer_t * demuxer ,
MediaSubsession * subsession ,
unsigned & flags ) {
flags = 0 ;
// Create a dummy video stream header
// to make the main MPlayer code happy:
sh_video_t * sh_video = new_sh_video ( demuxer , 0 ) ;
BITMAPINFOHEADER * bih
= ( BITMAPINFOHEADER * ) calloc ( 1 , sizeof ( BITMAPINFOHEADER ) ) ;
bih - > biSize = sizeof ( BITMAPINFOHEADER ) ;
sh_video - > bih = bih ;
demux_stream_t * d_video = demuxer - > video ;
d_video - > sh = sh_video ; sh_video - > ds = d_video ;
// Map known video MIME types to the BITMAPINFOHEADER parameters
// that this program uses. (Note that not all types need all
// of the parameters to be set.)
2003-07-27 10:16:14 +00:00
if ( strcmp ( subsession - > codecName ( ) , " MPV " ) = = 0 ) {
2003-03-11 19:08:31 +00:00
flags | = RTPSTATE_IS_MPEG12_VIDEO ;
2003-07-27 10:16:14 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " MP1S " ) = = 0 | |
strcmp ( subsession - > codecName ( ) , " MP2T " ) = = 0 ) {
flags | = RTPSTATE_IS_MPEG12_VIDEO | RTPSTATE_IS_MULTIPLEXED ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " H263 " ) = = 0 | |
2007-02-16 00:30:05 +00:00
strcmp ( subsession - > codecName ( ) , " H263-2000 " ) = = 0 | |
2003-02-03 10:27:50 +00:00
strcmp ( subsession - > codecName ( ) , " H263-1998 " ) = = 0 ) {
bih - > biCompression = sh_video - > format
= mmioFOURCC ( ' H ' , ' 2 ' , ' 6 ' , ' 3 ' ) ;
2003-03-11 19:08:31 +00:00
needVideoFrameRate ( demuxer , subsession ) ;
2006-08-16 23:40:51 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " H264 " ) = = 0 ) {
bih - > biCompression = sh_video - > format
= mmioFOURCC ( ' H ' , ' 2 ' , ' 6 ' , ' 4 ' ) ;
needVideoFrameRate ( demuxer , subsession ) ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " H261 " ) = = 0 ) {
bih - > biCompression = sh_video - > format
= mmioFOURCC ( ' H ' , ' 2 ' , ' 6 ' , ' 1 ' ) ;
2003-03-11 19:08:31 +00:00
needVideoFrameRate ( demuxer , subsession ) ;
2003-02-09 17:06:38 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " JPEG " ) = = 0 ) {
bih - > biCompression = sh_video - > format
= mmioFOURCC ( ' M ' , ' J ' , ' P ' , ' G ' ) ;
2003-03-11 19:08:31 +00:00
needVideoFrameRate ( demuxer , subsession ) ;
2003-02-09 17:06:38 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " MP4V-ES " ) = = 0 ) {
bih - > biCompression = sh_video - > format
= mmioFOURCC ( ' m ' , ' p ' , ' 4 ' , ' v ' ) ;
2003-03-11 19:08:31 +00:00
// For the codec to work correctly, it may need a 'VOL Header' to be
// inserted at the front of the data stream. Construct this from the
// "config" MIME parameter, which was present (hopefully) in the
// session's SDP description:
unsigned configLen ;
unsigned char * configData
= parseGeneralConfigStr ( subsession - > fmtp_config ( ) , configLen ) ;
2007-02-20 20:21:15 +00:00
sh_video - > bih = bih = insertVideoExtradata ( bih , configData , configLen ) ;
2003-03-11 19:08:31 +00:00
needVideoFrameRate ( demuxer , subsession ) ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " X-QT " ) = = 0 | |
strcmp ( subsession - > codecName ( ) , " X-QUICKTIME " ) = = 0 ) {
// QuickTime generic RTP format, as described in
// http://developer.apple.com/quicktime/icefloe/dispatch026.html
// We can't initialize this stream until we've received the first packet
// that has QuickTime "sdAtom" information in the header. So, keep
// reading packets until we get one:
2003-03-11 19:08:31 +00:00
unsigned char * packetData ; unsigned packetDataLen ; float pts ;
2003-02-03 10:27:50 +00:00
QuickTimeGenericRTPSource * qtRTPSource
= ( QuickTimeGenericRTPSource * ) ( subsession - > rtpSource ( ) ) ;
unsigned fourcc ;
do {
2003-03-11 19:08:31 +00:00
if ( ! awaitRTPPacket ( demuxer , demuxer - > video ,
packetData , packetDataLen , pts ) ) {
2003-02-03 10:27:50 +00:00
return ;
}
} while ( ! parseQTState_video ( qtRTPSource - > qtState , fourcc ) ) ;
bih - > biCompression = sh_video - > format = fourcc ;
2007-01-12 19:59:47 +00:00
bih - > biWidth = qtRTPSource - > qtState . width ;
bih - > biHeight = qtRTPSource - > qtState . height ;
2007-02-04 14:02:35 +00:00
if ( bih - > biCompression = = mmioFOURCC ( ' a ' , ' v ' , ' c ' , ' 1 ' ) | |
2007-02-07 23:41:07 +00:00
bih - > biCompression = = mmioFOURCC ( ' m ' , ' p ' , ' 4 ' , ' v ' ) | |
2007-02-04 14:02:35 +00:00
bih - > biCompression = = mmioFOURCC ( ' S ' , ' V ' , ' Q ' , ' 3 ' ) ) {
2007-01-12 19:59:47 +00:00
uint8_t * pos = ( uint8_t * ) qtRTPSource - > qtState . sdAtom + 86 ;
uint8_t * endpos = ( uint8_t * ) qtRTPSource - > qtState . sdAtom
+ qtRTPSource - > qtState . sdAtomSize ;
while ( pos + 8 < endpos ) {
unsigned atomLength = pos [ 0 ] < < 24 | pos [ 1 ] < < 16 | pos [ 2 ] < < 8 | pos [ 3 ] ;
if ( atomLength = = 0 | | atomLength > endpos - pos ) break ;
2007-02-07 23:41:07 +00:00
if ( ( ! memcmp ( pos + 4 , " avcC " , 4 ) | |
! memcmp ( pos + 4 , " esds " , 4 ) | |
! memcmp ( pos + 4 , " SMI " , 4 ) ) & &
2007-02-20 20:21:15 +00:00
atomLength > 8 ) {
sh_video - > bih = bih =
insertVideoExtradata ( bih , pos + 8 , atomLength - 8 ) ;
2007-01-12 19:59:47 +00:00
break ;
}
pos + = atomLength ;
}
needVideoFrameRate ( demuxer , subsession ) ;
}
2003-02-03 10:27:50 +00:00
} else {
fprintf ( stderr ,
" Unknown MPlayer format code for MIME type \" video/%s \" \n " ,
subsession - > codecName ( ) ) ;
}
}
void rtpCodecInitialize_audio ( demuxer_t * demuxer ,
MediaSubsession * subsession ,
unsigned & flags ) {
flags = 0 ;
// Create a dummy audio stream header
// to make the main MPlayer code happy:
sh_audio_t * sh_audio = new_sh_audio ( demuxer , 0 ) ;
WAVEFORMATEX * wf = ( WAVEFORMATEX * ) calloc ( 1 , sizeof ( WAVEFORMATEX ) ) ;
sh_audio - > wf = wf ;
demux_stream_t * d_audio = demuxer - > audio ;
d_audio - > sh = sh_audio ; sh_audio - > ds = d_audio ;
2003-03-11 19:08:31 +00:00
wf - > nChannels = subsession - > numChannels ( ) ;
2003-02-03 10:27:50 +00:00
// Map known audio MIME types to the WAVEFORMATEX parameters
// that this program uses. (Note that not all types need all
// of the parameters to be set.)
wf - > nSamplesPerSec
= subsession - > rtpSource ( ) - > timestampFrequency ( ) ; // by default
if ( strcmp ( subsession - > codecName ( ) , " MPA " ) = = 0 | |
strcmp ( subsession - > codecName ( ) , " MPA-ROBUST " ) = = 0 | |
strcmp ( subsession - > codecName ( ) , " X-MP3-DRAFT-00 " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x55 ;
// Note: 0x55 is for layer III, but should work for I,II also
wf - > nSamplesPerSec = 0 ; // sample rate is deduced from the data
} else if ( strcmp ( subsession - > codecName ( ) , " AC3 " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x2000 ;
wf - > nSamplesPerSec = 0 ; // sample rate is deduced from the data
2003-07-27 10:16:14 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " L16 " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x736f7774 ; // "twos"
wf - > nBlockAlign = 1 ;
wf - > wBitsPerSample = 16 ;
wf - > cbSize = 0 ;
} else if ( strcmp ( subsession - > codecName ( ) , " L8 " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x20776172 ; // "raw "
wf - > nBlockAlign = 1 ;
wf - > wBitsPerSample = 8 ;
wf - > cbSize = 0 ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " PCMU " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x7 ;
wf - > nAvgBytesPerSec = 8000 ;
wf - > nBlockAlign = 1 ;
wf - > wBitsPerSample = 8 ;
wf - > cbSize = 0 ;
} else if ( strcmp ( subsession - > codecName ( ) , " PCMA " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = 0x6 ;
wf - > nAvgBytesPerSec = 8000 ;
wf - > nBlockAlign = 1 ;
wf - > wBitsPerSample = 8 ;
wf - > cbSize = 0 ;
2007-03-06 22:53:52 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " AMR " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' s ' , ' a ' , ' m ' , ' r ' ) ;
} else if ( strcmp ( subsession - > codecName ( ) , " AMR-WB " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' s ' , ' a ' , ' w ' , ' b ' ) ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " GSM " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' a ' , ' g ' , ' s ' , ' m ' ) ;
wf - > nAvgBytesPerSec = 1650 ;
wf - > nBlockAlign = 33 ;
wf - > wBitsPerSample = 16 ;
wf - > cbSize = 0 ;
} else if ( strcmp ( subsession - > codecName ( ) , " QCELP " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' Q ' , ' c ' , ' l ' , ' p ' ) ;
wf - > nAvgBytesPerSec = 1750 ;
wf - > nBlockAlign = 35 ;
wf - > wBitsPerSample = 16 ;
wf - > cbSize = 0 ;
} else if ( strcmp ( subsession - > codecName ( ) , " MP4A-LATM " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' m ' , ' p ' , ' 4 ' , ' a ' ) ;
// For the codec to work correctly, it needs "AudioSpecificConfig"
// data, which is parsed from the "StreamMuxConfig" string that
// was present (hopefully) in the SDP description:
unsigned codecdata_len ;
sh_audio - > codecdata
= parseStreamMuxConfigStr ( subsession - > fmtp_config ( ) ,
codecdata_len ) ;
sh_audio - > codecdata_len = codecdata_len ;
2007-02-17 21:45:16 +00:00
//faad doesn't understand LATM's data length field, so omit it
( ( MPEG4LATMAudioRTPSource * ) subsession - > rtpSource ( ) ) - > omitLATMDataLengthField ( ) ;
2003-03-11 19:08:31 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " MPEG4-GENERIC " ) = = 0 ) {
wf - > wFormatTag = sh_audio - > format = mmioFOURCC ( ' m ' , ' p ' , ' 4 ' , ' a ' ) ;
// For the codec to work correctly, it needs "AudioSpecificConfig"
// data, which was present (hopefully) in the SDP description:
unsigned codecdata_len ;
sh_audio - > codecdata
= parseGeneralConfigStr ( subsession - > fmtp_config ( ) ,
codecdata_len ) ;
sh_audio - > codecdata_len = codecdata_len ;
2003-02-03 10:27:50 +00:00
} else if ( strcmp ( subsession - > codecName ( ) , " X-QT " ) = = 0 | |
strcmp ( subsession - > codecName ( ) , " X-QUICKTIME " ) = = 0 ) {
// QuickTime generic RTP format, as described in
// http://developer.apple.com/quicktime/icefloe/dispatch026.html
// We can't initialize this stream until we've received the first packet
// that has QuickTime "sdAtom" information in the header. So, keep
// reading packets until we get one:
2003-03-11 19:08:31 +00:00
unsigned char * packetData ; unsigned packetDataLen ; float pts ;
2003-02-03 10:27:50 +00:00
QuickTimeGenericRTPSource * qtRTPSource
= ( QuickTimeGenericRTPSource * ) ( subsession - > rtpSource ( ) ) ;
unsigned fourcc , numChannels ;
do {
2003-03-11 19:08:31 +00:00
if ( ! awaitRTPPacket ( demuxer , demuxer - > audio ,
packetData , packetDataLen , pts ) ) {
2003-02-03 10:27:50 +00:00
return ;
}
} while ( ! parseQTState_audio ( qtRTPSource - > qtState , fourcc , numChannels ) ) ;
wf - > wFormatTag = sh_audio - > format = fourcc ;
wf - > nChannels = numChannels ;
2007-02-26 21:54:52 +00:00
uint8_t * pos = ( uint8_t * ) qtRTPSource - > qtState . sdAtom + 52 ;
uint8_t * endpos = ( uint8_t * ) qtRTPSource - > qtState . sdAtom
+ qtRTPSource - > qtState . sdAtomSize ;
while ( pos + 8 < endpos ) {
unsigned atomLength = pos [ 0 ] < < 24 | pos [ 1 ] < < 16 | pos [ 2 ] < < 8 | pos [ 3 ] ;
if ( atomLength = = 0 | | atomLength > endpos - pos ) break ;
if ( ! memcmp ( pos + 4 , " wave " , 4 ) & & fourcc = = mmioFOURCC ( ' Q ' , ' D ' , ' M ' , ' 2 ' ) & &
atomLength > 8 & &
atomLength < = INT_MAX ) {
sh_audio - > codecdata = ( unsigned char * ) malloc ( atomLength - 8 ) ;
if ( sh_audio - > codecdata ) {
memcpy ( sh_audio - > codecdata , pos + 8 , atomLength - 8 ) ;
sh_audio - > codecdata_len = atomLength - 8 ;
}
break ;
}
pos + = atomLength ;
}
2003-02-03 10:27:50 +00:00
} else {
fprintf ( stderr ,
" Unknown MPlayer format code for MIME type \" audio/%s \" \n " ,
subsession - > codecName ( ) ) ;
}
}
2003-03-11 19:08:31 +00:00
static void needVideoFrameRate ( demuxer_t * demuxer ,
MediaSubsession * subsession ) {
// For some codecs, MPlayer's decoding software can't (or refuses to :-)
// figure out the frame rate by itself, so (unless the user specifies
// it manually, using "-fps") we figure it out ourselves here, using the
// presentation timestamps in successive packets,
extern float force_fps ; if ( force_fps ! = 0.0 ) return ; // user used "-fps"
demux_stream_t * d_video = demuxer - > video ;
2003-04-12 09:29:13 +00:00
sh_video_t * sh_video = ( sh_video_t * ) ( d_video - > sh ) ;
2003-03-11 19:08:31 +00:00
// If we already know the subsession's video frame rate, use it:
int fps = ( int ) ( subsession - > videoFPS ( ) ) ;
if ( fps ! = 0 ) {
sh_video - > fps = fps ;
2007-02-27 21:20:24 +00:00
sh_video - > frametime = 1.0f / fps ;
2003-03-11 19:08:31 +00:00
return ;
}
// Keep looking at incoming frames until we see two with different,
// non-zero "pts" timestamps:
unsigned char * packetData ; unsigned packetDataLen ;
float lastPTS = 0.0 , curPTS ;
2003-11-06 05:53:04 +00:00
unsigned const maxNumFramesToWaitFor = 300 ;
2007-01-23 22:26:13 +00:00
int lastfps = 0 ;
2003-03-11 19:08:31 +00:00
for ( unsigned i = 0 ; i < maxNumFramesToWaitFor ; + + i ) {
2003-04-12 09:29:13 +00:00
if ( ! awaitRTPPacket ( demuxer , d_video , packetData , packetDataLen , curPTS ) ) {
break ;
}
2003-03-11 19:08:31 +00:00
2007-01-23 22:26:13 +00:00
if ( curPTS ! = lastPTS & & lastPTS ! = 0.0 ) {
2003-03-11 19:08:31 +00:00
// Use the difference between these two "pts"s to guess the frame rate.
// (should really check that there were no missing frames inbetween)#####
// Guess the frame rate as an integer. If it's not, use "-fps" instead.
2007-01-23 22:26:13 +00:00
fps = ( int ) ( 1 / fabs ( curPTS - lastPTS ) + 0.5 ) ; // rounding
if ( fps = = lastfps ) {
2003-03-11 19:08:31 +00:00
fprintf ( stderr , " demux_rtp: Guessed the video frame rate as %d frames-per-second. \n \t (If this is wrong, use the \" -fps <frame-rate> \" option instead.) \n " , fps ) ;
sh_video - > fps = fps ;
2007-01-23 22:26:13 +00:00
sh_video - > frametime = 1.0f / fps ;
2003-03-11 19:08:31 +00:00
return ;
2007-01-23 22:26:13 +00:00
}
if ( fps > lastfps ) lastfps = fps ;
2003-03-11 19:08:31 +00:00
}
lastPTS = curPTS ;
}
fprintf ( stderr , " demux_rtp: Failed to guess the video frame rate \n " ) ;
}
2003-02-03 10:27:50 +00:00
static Boolean
parseQTState_video ( QuickTimeGenericRTPSource : : QTState const & qtState ,
unsigned & fourcc ) {
// qtState's "sdAtom" field is supposed to contain a QuickTime video
// 'sample description' atom. This atom's name is the 'fourcc' that we want:
char const * sdAtom = qtState . sdAtom ;
if ( sdAtom = = NULL | | qtState . sdAtomSize < 2 * 4 ) return False ;
fourcc = * ( unsigned * ) ( & sdAtom [ 4 ] ) ; // put in host order
return True ;
}
static Boolean
parseQTState_audio ( QuickTimeGenericRTPSource : : QTState const & qtState ,
unsigned & fourcc , unsigned & numChannels ) {
// qtState's "sdAtom" field is supposed to contain a QuickTime audio
// 'sample description' atom. This atom's name is the 'fourcc' that we want.
// Also, the top half of the 5th word following the atom name should
// contain the number of channels ("numChannels") that we want:
char const * sdAtom = qtState . sdAtom ;
if ( sdAtom = = NULL | | qtState . sdAtomSize < 7 * 4 ) return False ;
fourcc = * ( unsigned * ) ( & sdAtom [ 4 ] ) ; // put in host order
char const * word7Ptr = & sdAtom [ 6 * 4 ] ;
numChannels = ( word7Ptr [ 0 ] < < 8 ) | ( word7Ptr [ 1 ] ) ;
return True ;
}