/* * ISO Media common code * copyright (c) 2001 Fabrice Bellard * copyright (c) 2002 Francois Revol * copyright (c) 2006 Baptiste Coudurier * * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #ifndef AVFORMAT_ISOM_H #define AVFORMAT_ISOM_H #include #include #include "libavutil/encryption_info.h" #include "libavutil/mastering_display_metadata.h" #include "libavutil/ambient_viewing_environment.h" #include "libavutil/spherical.h" #include "libavutil/stereo3d.h" #include "avio.h" #include "internal.h" #include "dv.h" /* isom.c */ extern const AVCodecTag ff_mp4_obj_type[]; extern const AVCodecTag ff_codec_movvideo_tags[]; extern const AVCodecTag ff_codec_movaudio_tags[]; extern const AVCodecTag ff_codec_movsubtitle_tags[]; extern const AVCodecTag ff_codec_movdata_tags[]; int ff_mov_iso639_to_lang(const char lang[4], int mp4); int ff_mov_lang_to_iso639(unsigned code, char to[4]); struct AVAESCTR; /* the QuickTime file format is quite convoluted... * it has lots of index tables, each indexing something in another one... * Here we just use what is needed to read the chunks */ typedef struct MOVStts { unsigned int count; unsigned int duration; } MOVStts; typedef struct MOVCtts { unsigned int count; int duration; } MOVCtts; typedef struct MOVStsc { int first; int count; int id; } MOVStsc; typedef struct MOVElst { int64_t duration; int64_t time; float rate; } MOVElst; typedef struct MOVDref { uint32_t type; char *path; char *dir; char volume[28]; char filename[64]; int16_t nlvl_to, nlvl_from; } MOVDref; typedef struct MOVAtom { uint32_t type; int64_t size; /* total size (excluding the size and type fields) */ } MOVAtom; struct MOVParseTableEntry; typedef struct MOVFragment { int found_tfhd; unsigned track_id; uint64_t base_data_offset; uint64_t moof_offset; uint64_t implicit_offset; unsigned stsd_id; unsigned duration; unsigned size; unsigned flags; } MOVFragment; typedef struct MOVTrackExt { unsigned track_id; unsigned stsd_id; unsigned duration; unsigned size; unsigned flags; } MOVTrackExt; typedef struct MOVSbgp { unsigned int count; unsigned int index; } MOVSbgp; typedef struct MOVEncryptionIndex { // Individual encrypted samples. If there are no elements, then the default // settings will be used. unsigned int nb_encrypted_samples; AVEncryptionInfo **encrypted_samples; uint8_t* auxiliary_info_sizes; size_t auxiliary_info_sample_count; uint8_t auxiliary_info_default_size; uint64_t* auxiliary_offsets; ///< Absolute seek position size_t auxiliary_offsets_count; } MOVEncryptionIndex; typedef struct MOVFragmentStreamInfo { int id; int64_t sidx_pts; int64_t first_tfra_pts; int64_t tfdt_dts; int64_t next_trun_dts; // Index of the first sample/trun in the fragment. int index_base; int index_entry; MOVEncryptionIndex *encryption_index; int stsd_id; // current fragment stsd_id } MOVFragmentStreamInfo; typedef struct MOVFragmentIndexItem { int64_t moof_offset; int headers_read; int current; int nb_stream_info; MOVFragmentStreamInfo * stream_info; } MOVFragmentIndexItem; typedef struct MOVFragmentIndex { int allocated_size; int complete; int current; int nb_items; MOVFragmentIndexItem * item; } MOVFragmentIndex; typedef struct MOVIndexRange { int64_t start; int64_t end; } MOVIndexRange; typedef struct MOVStreamContext { AVIOContext *pb; int refcount; int pb_is_copied; int id; ///< AVStream id int ffindex; ///< AVStream index int next_chunk; unsigned int chunk_count; int64_t *chunk_offsets; unsigned int stts_count; MOVStts *stts_data; unsigned int sdtp_count; uint8_t *sdtp_data; unsigned int ctts_count; unsigned int ctts_allocated_size; MOVCtts *ctts_data; unsigned int stsc_count; MOVStsc *stsc_data; unsigned int stsc_index; int stsc_sample; unsigned int stps_count; unsigned *stps_data; ///< partial sync sample for mpeg-2 open gop MOVElst *elst_data; unsigned int elst_count; int ctts_index; int ctts_sample; unsigned int sample_size; ///< may contain value calculated from stsd or value from stsz atom unsigned int stsz_sample_size; ///< always contains sample size from stsz atom unsigned int sample_count; unsigned int *sample_sizes; int keyframe_absent; unsigned int keyframe_count; int *keyframes; int time_scale; int64_t time_offset; ///< time offset of the edit list entries int64_t min_corrected_pts; ///< minimum Composition time shown by the edits excluding empty edits. int current_sample; int64_t current_index; MOVIndexRange* index_ranges; MOVIndexRange* current_index_range; unsigned int bytes_per_frame; unsigned int samples_per_frame; int dv_audio_container; int pseudo_stream_id; ///< -1 means demux all ids int16_t audio_cid; ///< stsd audio compression id unsigned drefs_count; MOVDref *drefs; int dref_id; unsigned tref_flags; int tref_id; int timecode_track; int width; ///< tkhd width int height; ///< tkhd height int h_spacing; ///< pasp hSpacing int v_spacing; ///< pasp vSpacing int dts_shift; ///< dts shift when ctts is negative uint32_t palette[256]; int has_palette; int64_t data_size; uint32_t tmcd_flags; ///< tmcd track flags uint8_t tmcd_nb_frames; ///< tmcd number of frames per tick / second int64_t track_end; ///< used for dts generation in fragmented movie files int start_pad; ///< amount of samples to skip due to enc-dec delay unsigned int rap_group_count; MOVSbgp *rap_group; unsigned int sync_group_count; MOVSbgp *sync_group; uint8_t *sgpd_sync; uint32_t sgpd_sync_count; int32_t *sample_offsets; int sample_offsets_count; int *open_key_samples; int open_key_samples_count; uint32_t min_sample_duration; int nb_frames_for_fps; int64_t duration_for_fps; /** extradata array (and size) for multiple stsd */ uint8_t **extradata; int *extradata_size; int last_stsd_index; int stsd_count; int stsd_version; int32_t *display_matrix; AVStereo3D *stereo3d; size_t stereo3d_size; AVSphericalMapping *spherical; size_t spherical_size; AVMasteringDisplayMetadata *mastering; size_t mastering_size; AVContentLightMetadata *coll; size_t coll_size; AVAmbientViewingEnvironment *ambient; size_t ambient_size; uint32_t format; int has_sidx; // If there is an sidx entry for this stream. struct { struct AVAESCTR* aes_ctr; struct AVAES *aes_ctx; unsigned int per_sample_iv_size; // Either 0, 8, or 16. AVEncryptionInfo *default_encrypted_sample; MOVEncryptionIndex *encryption_index; } cenc; struct IAMFDemuxContext *iamf; } MOVStreamContext; typedef struct HEIFItem { AVStream *st; char *name; int item_id; int64_t extent_length; int64_t extent_offset; int width; int height; int rotation; int hflip; int vflip; int type; int is_idat_relative; uint8_t *icc_profile; size_t icc_profile_size; } HEIFItem; typedef struct HEIFGrid { HEIFItem *item; HEIFItem **tile_item_list; int16_t *tile_id_list; int nb_tiles; } HEIFGrid; typedef struct MOVContext { const AVClass *class; ///< class for private options AVFormatContext *fc; int time_scale; int64_t duration; ///< duration of the longest track int found_moov; ///< 'moov' atom has been found int found_iloc; ///< 'iloc' atom has been found int found_iinf; ///< 'iinf' atom has been found int found_mdat; ///< 'mdat' atom has been found int found_hdlr_mdta; ///< 'hdlr' atom with type 'mdta' has been found int trak_index; ///< Index of the current 'trak' char **meta_keys; unsigned meta_keys_count; DVDemuxContext *dv_demux; AVFormatContext *dv_fctx; int isom; ///< 1 if file is ISO Media (mp4/3gp) MOVFragment fragment; ///< current fragment in moof atom MOVTrackExt *trex_data; unsigned trex_count; int itunes_metadata; ///< metadata are itunes style int handbrake_version; int *chapter_tracks; unsigned int nb_chapter_tracks; int use_absolute_path; int ignore_editlist; int advanced_editlist; int advanced_editlist_autodisabled; int ignore_chapters; int seek_individually; int64_t next_root_atom; ///< offset of the next root atom int export_all; int export_xmp; int *bitrates; ///< bitrates read before streams creation int bitrates_count; int moov_retry; int use_mfra_for; int has_looked_for_mfra; int use_tfdt; MOVFragmentIndex frag_index; int atom_depth; unsigned int aax_mode; ///< 'aax' file has been detected uint8_t file_key[20]; uint8_t file_iv[20]; void *activation_bytes; int activation_bytes_size; void *audible_fixed_key; int audible_fixed_key_size; void *audible_key; int audible_key_size; void *audible_iv; int audible_iv_size; struct AVAES *aes_decrypt; uint8_t *decryption_key; int decryption_key_len; int enable_drefs; int32_t movie_display_matrix[3][3]; ///< display matrix from mvhd int have_read_mfra_size; uint32_t mfra_size; uint32_t max_stts_delta; int primary_item_id; int cur_item_id; HEIFItem **heif_item; int nb_heif_item; HEIFGrid *heif_grid; int nb_heif_grid; int thmb_item_id; int64_t idat_offset; int interleaved_read; } MOVContext; int ff_mp4_read_descr_len(AVIOContext *pb); int ff_mp4_read_descr(void *logctx, AVIOContext *pb, int *tag); int ff_mp4_read_dec_config_descr(void *logctx, AVStream *st, AVIOContext *pb); void ff_mp4_parse_es_descr(AVIOContext *pb, int *es_id); #define MP4ODescrTag 0x01 #define MP4IODescrTag 0x02 #define MP4ESDescrTag 0x03 #define MP4DecConfigDescrTag 0x04 #define MP4DecSpecificDescrTag 0x05 #define MP4SLDescrTag 0x06 #define MOV_TFHD_BASE_DATA_OFFSET 0x01 #define MOV_TFHD_STSD_ID 0x02 #define MOV_TFHD_DEFAULT_DURATION 0x08 #define MOV_TFHD_DEFAULT_SIZE 0x10 #define MOV_TFHD_DEFAULT_FLAGS 0x20 #define MOV_TFHD_DURATION_IS_EMPTY 0x010000 #define MOV_TFHD_DEFAULT_BASE_IS_MOOF 0x020000 #define MOV_TRUN_DATA_OFFSET 0x01 #define MOV_TRUN_FIRST_SAMPLE_FLAGS 0x04 #define MOV_TRUN_SAMPLE_DURATION 0x100 #define MOV_TRUN_SAMPLE_SIZE 0x200 #define MOV_TRUN_SAMPLE_FLAGS 0x400 #define MOV_TRUN_SAMPLE_CTS 0x800 #define MOV_FRAG_SAMPLE_FLAG_DEGRADATION_PRIORITY_MASK 0x0000ffff #define MOV_FRAG_SAMPLE_FLAG_IS_NON_SYNC 0x00010000 #define MOV_FRAG_SAMPLE_FLAG_PADDING_MASK 0x000e0000 #define MOV_FRAG_SAMPLE_FLAG_REDUNDANCY_MASK 0x00300000 #define MOV_FRAG_SAMPLE_FLAG_DEPENDED_MASK 0x00c00000 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_MASK 0x03000000 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_NO 0x02000000 #define MOV_FRAG_SAMPLE_FLAG_DEPENDS_YES 0x01000000 #define MOV_TKHD_FLAG_ENABLED 0x0001 #define MOV_TKHD_FLAG_IN_MOVIE 0x0002 #define MOV_TKHD_FLAG_IN_PREVIEW 0x0004 #define MOV_TKHD_FLAG_IN_POSTER 0x0008 #define MOV_SAMPLE_DEPENDENCY_UNKNOWN 0x0 #define MOV_SAMPLE_DEPENDENCY_YES 0x1 #define MOV_SAMPLE_DEPENDENCY_NO 0x2 #define MOV_TREF_FLAG_ENHANCEMENT 0x1 #define TAG_IS_AVCI(tag) \ ((tag) == MKTAG('a', 'i', '5', 'p') || \ (tag) == MKTAG('a', 'i', '5', 'q') || \ (tag) == MKTAG('a', 'i', '5', '2') || \ (tag) == MKTAG('a', 'i', '5', '3') || \ (tag) == MKTAG('a', 'i', '5', '5') || \ (tag) == MKTAG('a', 'i', '5', '6') || \ (tag) == MKTAG('a', 'i', '1', 'p') || \ (tag) == MKTAG('a', 'i', '1', 'q') || \ (tag) == MKTAG('a', 'i', '1', '2') || \ (tag) == MKTAG('a', 'i', '1', '3') || \ (tag) == MKTAG('a', 'i', '1', '5') || \ (tag) == MKTAG('a', 'i', '1', '6') || \ (tag) == MKTAG('a', 'i', 'v', 'x') || \ (tag) == MKTAG('A', 'V', 'i', 'n')) int ff_mov_read_esds(AVFormatContext *fc, AVIOContext *pb); int ff_mov_read_stsd_entries(MOVContext *c, AVIOContext *pb, int entries); void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout); #define FF_MOV_FLAG_MFRA_AUTO -1 #define FF_MOV_FLAG_MFRA_DTS 1 #define FF_MOV_FLAG_MFRA_PTS 2 /** * Compute codec id for 'lpcm' tag. * See CoreAudioTypes and AudioStreamBasicDescription at Apple. */ static inline enum AVCodecID ff_mov_get_lpcm_codec_id(int bps, int flags) { /* lpcm flags: * 0x1 = float * 0x2 = big-endian * 0x4 = signed */ return ff_get_pcm_codec_id(bps, flags & 1, flags & 2, flags & 4 ? -1 : 0); } #define MOV_ISMV_TTML_TAG MKTAG('d', 'f', 'x', 'p') #define MOV_MP4_TTML_TAG MKTAG('s', 't', 'p', 'p') #define MOV_MP4_FPCM_TAG MKTAG('f', 'p', 'c', 'm') #define MOV_MP4_IPCM_TAG MKTAG('i', 'p', 'c', 'm') struct MP4TrackKindValueMapping { int disposition; const char *value; }; struct MP4TrackKindMapping { const char *scheme_uri; const struct MP4TrackKindValueMapping *value_maps; }; extern const struct MP4TrackKindMapping ff_mov_track_kind_table[]; #endif /* AVFORMAT_ISOM_H */