mirror of https://git.ffmpeg.org/ffmpeg.git
250 lines
7.3 KiB
C
250 lines
7.3 KiB
C
/*
|
|
* MPEG-4 encoder/decoder internal header.
|
|
* Copyright (c) 2000,2001 Fabrice Bellard
|
|
* Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#ifndef AVCODEC_MPEG4VIDEO_H
|
|
#define AVCODEC_MPEG4VIDEO_H
|
|
|
|
#include <stdint.h>
|
|
|
|
#include "get_bits.h"
|
|
#include "mpegvideo.h"
|
|
|
|
// shapes
|
|
#define RECT_SHAPE 0
|
|
#define BIN_SHAPE 1
|
|
#define BIN_ONLY_SHAPE 2
|
|
#define GRAY_SHAPE 3
|
|
|
|
#define SIMPLE_VO_TYPE 1
|
|
#define CORE_VO_TYPE 3
|
|
#define MAIN_VO_TYPE 4
|
|
#define NBIT_VO_TYPE 5
|
|
#define ARTS_VO_TYPE 10
|
|
#define ACE_VO_TYPE 12
|
|
#define SIMPLE_STUDIO_VO_TYPE 14
|
|
#define CORE_STUDIO_VO_TYPE 15
|
|
#define ADV_SIMPLE_VO_TYPE 17
|
|
|
|
#define VOT_VIDEO_ID 1
|
|
#define VOT_STILL_TEXTURE_ID 2
|
|
|
|
// aspect_ratio_info
|
|
#define EXTENDED_PAR 15
|
|
|
|
//vol_sprite_usage / sprite_enable
|
|
#define STATIC_SPRITE 1
|
|
#define GMC_SPRITE 2
|
|
|
|
#define MOTION_MARKER 0x1F001
|
|
#define DC_MARKER 0x6B001
|
|
|
|
#define VOS_STARTCODE 0x1B0
|
|
#define USER_DATA_STARTCODE 0x1B2
|
|
#define GOP_STARTCODE 0x1B3
|
|
#define VISUAL_OBJ_STARTCODE 0x1B5
|
|
#define VOP_STARTCODE 0x1B6
|
|
#define SLICE_STARTCODE 0x1B7
|
|
#define EXT_STARTCODE 0x1B8
|
|
|
|
#define QUANT_MATRIX_EXT_ID 0x3
|
|
|
|
/* smaller packets likely don't contain a real frame */
|
|
#define MAX_NVOP_SIZE 19
|
|
|
|
typedef struct Mpeg4DecContext {
|
|
MpegEncContext m;
|
|
|
|
/// number of bits to represent the fractional part of time
|
|
int time_increment_bits;
|
|
int shape;
|
|
int vol_sprite_usage;
|
|
int sprite_brightness_change;
|
|
int num_sprite_warping_points;
|
|
/// sprite trajectory points
|
|
uint16_t sprite_traj[4][2];
|
|
/// sprite shift [isChroma]
|
|
int sprite_shift[2];
|
|
|
|
// reversible vlc
|
|
int rvlc;
|
|
/// could this stream contain resync markers
|
|
int resync_marker;
|
|
/// time distance of first I -> B, used for interlaced B-frames
|
|
int t_frame;
|
|
|
|
int new_pred;
|
|
int enhancement_type;
|
|
int scalability;
|
|
|
|
/// QP above which the ac VLC should be used for intra dc
|
|
int intra_dc_threshold;
|
|
|
|
/* bug workarounds */
|
|
int divx_version;
|
|
int divx_build;
|
|
int xvid_build;
|
|
int lavc_build;
|
|
|
|
int vo_type;
|
|
|
|
/// flag for having shown the warning about invalid Divx B-frames
|
|
int showed_packed_warning;
|
|
/** does the stream contain the low_delay flag,
|
|
* used to work around buggy encoders. */
|
|
int vol_control_parameters;
|
|
int cplx_estimation_trash_i;
|
|
int cplx_estimation_trash_p;
|
|
int cplx_estimation_trash_b;
|
|
|
|
int rgb;
|
|
|
|
int32_t block32[12][64];
|
|
// 0 = DCT, 1 = DPCM top to bottom scan, -1 = DPCM bottom to top scan
|
|
int dpcm_direction;
|
|
int16_t dpcm_macroblock[3][256];
|
|
} Mpeg4DecContext;
|
|
|
|
|
|
void ff_mpeg4_decode_studio(MpegEncContext *s, uint8_t *dest_y, uint8_t *dest_cb,
|
|
uint8_t *dest_cr, int block_size, int uvlinesize,
|
|
int dct_linesize, int dct_offset);
|
|
void ff_mpeg4_encode_mb(MpegEncContext *s,
|
|
int16_t block[6][64],
|
|
int motion_x, int motion_y);
|
|
void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n,
|
|
int dir);
|
|
void ff_set_mpeg4_time(MpegEncContext *s);
|
|
int ff_mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
|
|
|
|
int ff_mpeg4_decode_picture_header(Mpeg4DecContext *ctx, GetBitContext *gb,
|
|
int header, int parse_only);
|
|
void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
|
|
void ff_mpeg4_clean_buffers(MpegEncContext *s);
|
|
void ff_mpeg4_stuffing(PutBitContext *pbc);
|
|
void ff_mpeg4_init_partitions(MpegEncContext *s);
|
|
void ff_mpeg4_merge_partitions(MpegEncContext *s);
|
|
void ff_clean_mpeg4_qscales(MpegEncContext *s);
|
|
int ff_mpeg4_decode_partitions(Mpeg4DecContext *ctx);
|
|
int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
|
|
int ff_mpeg4_decode_video_packet_header(Mpeg4DecContext *ctx);
|
|
int ff_mpeg4_decode_studio_slice_header(Mpeg4DecContext *ctx);
|
|
void ff_mpeg4_init_direct_mv(MpegEncContext *s);
|
|
int ff_mpeg4_workaround_bugs(AVCodecContext *avctx);
|
|
int ff_mpeg4_frame_end(AVCodecContext *avctx, const uint8_t *buf, int buf_size);
|
|
|
|
/**
|
|
* @return the mb_type
|
|
*/
|
|
int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
|
|
|
|
#if 0 //3IV1 is quite rare and it slows things down a tiny bit
|
|
#define IS_3IV1 s->codec_tag == AV_RL32("3IV1")
|
|
#else
|
|
#define IS_3IV1 0
|
|
#endif
|
|
|
|
/**
|
|
* Predict the dc.
|
|
* encoding quantized level -> quantized diff
|
|
* decoding quantized diff -> quantized level
|
|
* @param n block index (0-3 are luma, 4-5 are chroma)
|
|
* @param dir_ptr pointer to an integer where the prediction direction will be stored
|
|
*/
|
|
static inline int ff_mpeg4_pred_dc(MpegEncContext *s, int n, int level,
|
|
int *dir_ptr, int encoding)
|
|
{
|
|
int a, b, c, wrap, pred, scale, ret;
|
|
int16_t *dc_val;
|
|
|
|
/* find prediction */
|
|
if (n < 4)
|
|
scale = s->y_dc_scale;
|
|
else
|
|
scale = s->c_dc_scale;
|
|
if (IS_3IV1)
|
|
scale = 8;
|
|
|
|
wrap = s->block_wrap[n];
|
|
dc_val = s->dc_val[0] + s->block_index[n];
|
|
|
|
/* B C
|
|
* A X
|
|
*/
|
|
a = dc_val[-1];
|
|
b = dc_val[-1 - wrap];
|
|
c = dc_val[-wrap];
|
|
|
|
/* outside slice handling (we can't do that by memset as we need the
|
|
* dc for error resilience) */
|
|
if (s->first_slice_line && n != 3) {
|
|
if (n != 2)
|
|
b = c = 1024;
|
|
if (n != 1 && s->mb_x == s->resync_mb_x)
|
|
b = a = 1024;
|
|
}
|
|
if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1) {
|
|
if (n == 0 || n == 4 || n == 5)
|
|
b = 1024;
|
|
}
|
|
|
|
if (abs(a - b) < abs(b - c)) {
|
|
pred = c;
|
|
*dir_ptr = 1; /* top */
|
|
} else {
|
|
pred = a;
|
|
*dir_ptr = 0; /* left */
|
|
}
|
|
/* we assume pred is positive */
|
|
pred = FASTDIV((pred + (scale >> 1)), scale);
|
|
|
|
if (encoding) {
|
|
ret = level - pred;
|
|
} else {
|
|
level += pred;
|
|
ret = level;
|
|
}
|
|
level *= scale;
|
|
if (level & (~2047)) {
|
|
if (!s->encoding && (s->avctx->err_recognition & (AV_EF_BITSTREAM | AV_EF_AGGRESSIVE))) {
|
|
if (level < 0) {
|
|
av_log(s->avctx, AV_LOG_ERROR,
|
|
"dc<0 at %dx%d\n", s->mb_x, s->mb_y);
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
if (level > 2048 + scale) {
|
|
av_log(s->avctx, AV_LOG_ERROR,
|
|
"dc overflow at %dx%d\n", s->mb_x, s->mb_y);
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
}
|
|
if (level < 0)
|
|
level = 0;
|
|
else if (!(s->workaround_bugs & FF_BUG_DC_CLIP))
|
|
level = 2047;
|
|
}
|
|
dc_val[0] = level;
|
|
|
|
return ret;
|
|
}
|
|
|
|
#endif /* AVCODEC_MPEG4VIDEO_H */
|