mirror of https://git.ffmpeg.org/ffmpeg.git
294 lines
9.0 KiB
C
294 lines
9.0 KiB
C
#ifndef AVCODEC_H
|
|
#define AVCODEC_H
|
|
|
|
#include "common.h"
|
|
|
|
/* Identifiers of the codecs known to the library.
   The enumerators carry no explicit values, so they are numbered from 0
   in declaration order: inserting or reordering entries changes the
   numeric value of every entry that follows. */
enum CodecID {
    CODEC_ID_NONE,
    CODEC_ID_MPEG1VIDEO,
    CODEC_ID_H263,
    CODEC_ID_RV10,
    CODEC_ID_MP2,
    CODEC_ID_MP3LAME,
    CODEC_ID_AC3,
    CODEC_ID_MJPEG,
    CODEC_ID_MPEG4,
    CODEC_ID_RAWVIDEO,
    CODEC_ID_MSMPEG4,
    CODEC_ID_H263P,
    CODEC_ID_H263I,

    /* various pcm "codecs" */
    CODEC_ID_PCM_S16LE,
    CODEC_ID_PCM_S16BE,
    CODEC_ID_PCM_U16LE,
    CODEC_ID_PCM_U16BE,
    CODEC_ID_PCM_S8,
    CODEC_ID_PCM_U8,
    CODEC_ID_PCM_MULAW,
    CODEC_ID_PCM_ALAW,
};
|
|
|
|
/* Media kind handled by a codec (values of the CODEC_TYPE_xxx family). */
enum CodecType {
    CODEC_TYPE_VIDEO,
    CODEC_TYPE_AUDIO,
};
|
|
|
|
/* Pixel formats (values of the PIX_FMT_xxx family), numbered from 0 in
   declaration order. */
enum PixelFormat {
    PIX_FMT_YUV420P,
    PIX_FMT_YUV422,
    PIX_FMT_RGB24,
    PIX_FMT_BGR24,
    PIX_FMT_YUV422P,
    PIX_FMT_YUV444P,
};
|
|
|
|
/* Currently unused; may be used if 24/32-bit samples are ever supported. */
enum SampleFormat {
    SAMPLE_FMT_S16 = 0,         /* signed 16 bits */
};
|
|
|
|
/* maximum audio frame size, in bytes */
#define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432
|
|
|
|
/* motion estimation type: global selector, defined outside this header;
   the ME_xxx constants below are its possible values */
extern int motion_estimation_method;
#define ME_ZERO   0
#define ME_FULL   1
#define ME_LOG    2
#define ME_PHODS  3
#define ME_EPZS   4
#define ME_X1     5
|
|
|
|
/* encoding support */

#define CODEC_FLAG_HQ     0x0001 /* high quality (non real time) encoding */
#define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */

/* codec capabilities */

/* decoder can use draw_horiz_band callback */
#define CODEC_CAP_DRAW_HORIZ_BAND 0x0001

/* scale factor applied to frame rates (see AVCodecContext.frame_rate) */
#define FRAME_RATE_BASE 10000
|
|
|
|
typedef struct AVCodecContext {
|
|
int bit_rate;
|
|
int bit_rate_tolerance; /* amount of +- bits (>0)*/
|
|
int flags;
|
|
int sub_id; /* some codecs needs additionnal format info. It is
|
|
stored there */
|
|
/* video only */
|
|
int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */
|
|
int width, height;
|
|
int aspect_ratio_info;
|
|
#define FF_ASPECT_SQUARE 1
|
|
#define FF_ASPECT_4_3_625 2
|
|
#define FF_ASPECT_4_3_525 3
|
|
#define FF_ASPECT_16_9_625 4
|
|
#define FF_ASPECT_16_9_525 5
|
|
int gop_size; /* 0 = intra only */
|
|
int pix_fmt; /* pixel format, see PIX_FMT_xxx */
|
|
|
|
/* if non NULL, 'draw_horiz_band' is called by the libavcodec
|
|
decoder to draw an horizontal band. It improve cache usage. Not
|
|
all codecs can do that. You must check the codec capabilities
|
|
before */
|
|
void (*draw_horiz_band)(struct AVCodecContext *s,
|
|
UINT8 **src_ptr, int linesize,
|
|
int y, int width, int height);
|
|
|
|
/* audio only */
|
|
int sample_rate; /* samples per sec */
|
|
int channels;
|
|
int sample_fmt; /* sample format, currenly unused */
|
|
|
|
/* the following data should not be initialized */
|
|
int frame_size; /* in samples, initialized when calling 'init' */
|
|
int frame_number; /* audio or video frame number */
|
|
int key_frame; /* true if the previous compressed frame was
|
|
a key frame (intra, or seekable) */
|
|
int quality; /* quality of the previous encoded frame
|
|
(between 1 (good) and 31 (bad)) */
|
|
float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
|
|
float qblur; /* amount of qscale smoothing over time (0.0-1.0) */
|
|
int qmin; /* min qscale */
|
|
int qmax; /* max qscale */
|
|
int max_qdiff; /* max qscale difference between frames */
|
|
|
|
struct AVCodec *codec;
|
|
void *priv_data;
|
|
|
|
/* The following data is for RTP friendly coding */
|
|
/* By now only H.263/H.263+ coder honours this */
|
|
int rtp_mode; /* 1 for activate RTP friendly-mode */
|
|
/* highers numbers represent more error-prone */
|
|
/* enviroments, by now just "1" exist */
|
|
|
|
int rtp_payload_size; /* The size of the RTP payload, the coder will */
|
|
/* do it's best to deliver a chunk with size */
|
|
/* below rtp_payload_size, the chunk will start */
|
|
/* with a start code on some codecs like H.263 */
|
|
/* This doesn't take account of any particular */
|
|
/* headers inside the transmited RTP payload */
|
|
|
|
|
|
/* The RTP callcack: This function is called */
|
|
/* every time the encoder as a packet to send */
|
|
/* Depends on the encoder if the data starts */
|
|
/* with a Start Code (it should) H.263 does */
|
|
void (*rtp_callback)(void *data, int size, int packet_number);
|
|
|
|
/* These are for PSNR calculation, if you set get_psnr to 1 */
|
|
/* after encoding you will have the PSNR on psnr_y/cb/cr */
|
|
int get_psnr;
|
|
float psnr_y;
|
|
float psnr_cb;
|
|
float psnr_cr;
|
|
|
|
/* the following fields are ignored */
|
|
void *opaque; /* can be used to carry app specific stuff */
|
|
char codec_name[32];
|
|
int codec_type; /* see CODEC_TYPE_xxx */
|
|
int codec_id; /* see CODEC_ID_xxx */
|
|
unsigned int codec_tag; /* codec tag, only used if unknown codec */
|
|
} AVCodecContext;
|
|
|
|
typedef struct AVCodec {
|
|
char *name;
|
|
int type;
|
|
int id;
|
|
int priv_data_size;
|
|
int (*init)(AVCodecContext *);
|
|
int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
|
|
int (*close)(AVCodecContext *);
|
|
int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
|
|
UINT8 *buf, int buf_size);
|
|
int capabilities;
|
|
struct AVCodec *next;
|
|
} AVCodec;
|
|
|
|
/* three components are given, that's all */
|
|
typedef struct AVPicture {
|
|
UINT8 *data[3];
|
|
int linesize[3];
|
|
} AVPicture;
|
|
|
|
/* encoders (defined outside this header) */
extern AVCodec ac3_encoder;
extern AVCodec mp2_encoder;
extern AVCodec mp3lame_encoder;
extern AVCodec mpeg1video_encoder;
extern AVCodec h263_encoder;
extern AVCodec h263p_encoder;
extern AVCodec rv10_encoder;
extern AVCodec mjpeg_encoder;
extern AVCodec mpeg4_encoder;
extern AVCodec msmpeg4_encoder;

/* decoders (defined outside this header) */
extern AVCodec h263_decoder;
extern AVCodec mpeg4_decoder;
extern AVCodec msmpeg4_decoder;
extern AVCodec mpeg_decoder;
extern AVCodec h263i_decoder;
extern AVCodec rv10_decoder;
extern AVCodec mjpeg_decoder;
extern AVCodec mp3_decoder;
|
|
|
|
/* pcm codecs */
|
|
#define PCM_CODEC(id, name) \
|
|
extern AVCodec name ## _decoder; \
|
|
extern AVCodec name ## _encoder;
|
|
|
|
PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
|
|
PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
|
|
PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
|
|
PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
|
|
PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
|
|
PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
|
|
PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
|
|
PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);
|
|
|
|
#undef PCM_CODEC
|
|
|
|
/* dummy raw video codec */
|
|
extern AVCodec rawvideo_codec;
|
|
|
|
/* the following codecs use external GPL libs */
|
|
extern AVCodec ac3_decoder;
|
|
|
|
/* resample.c */

/* Audio resampling context; the structure is only forward-declared here,
   its layout is defined outside this header. */
struct ReSampleContext;

typedef struct ReSampleContext ReSampleContext;

ReSampleContext *audio_resample_init(int output_channels, int input_channels,
                                     int output_rate, int input_rate);
int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
void audio_resample_close(ReSampleContext *s);
|
|
|
|
/* YUV420 format is assumed ! */
|
|
|
|
struct ImgReSampleContext;
|
|
|
|
typedef struct ImgReSampleContext ImgReSampleContext;
|
|
|
|
ImgReSampleContext *img_resample_init(int output_width, int output_height,
|
|
int input_width, int input_height);
|
|
void img_resample(ImgReSampleContext *s,
|
|
AVPicture *output, AVPicture *input);
|
|
|
|
void img_resample_close(ImgReSampleContext *s);
|
|
|
|
/* AVPicture helpers; pix_fmt arguments take PIX_FMT_xxx values */
void avpicture_fill(AVPicture *picture, UINT8 *ptr,
                    int pix_fmt, int width, int height);
int avpicture_get_size(int pix_fmt, int width, int height);

/* convert among pixel formats */
int img_convert(AVPicture *dst, int dst_pix_fmt,
                AVPicture *src, int pix_fmt,
                int width, int height);

/* deinterlace a picture */
int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
                          int pix_fmt, int width, int height);
|
|
|
|
/* external high level API */
|
|
|
|
extern AVCodec *first_avcodec;
|
|
|
|
void avcodec_init(void);
|
|
|
|
void register_avcodec(AVCodec *format);
|
|
AVCodec *avcodec_find_encoder(enum CodecID id);
|
|
AVCodec *avcodec_find_encoder_by_name(const char *name);
|
|
AVCodec *avcodec_find_decoder(enum CodecID id);
|
|
AVCodec *avcodec_find_decoder_by_name(const char *name);
|
|
void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
|
|
|
|
int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
|
|
int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
|
|
int *frame_size_ptr,
|
|
UINT8 *buf, int buf_size);
|
|
int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture,
|
|
int *got_picture_ptr,
|
|
UINT8 *buf, int buf_size);
|
|
int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
|
|
const short *samples);
|
|
int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
|
|
const AVPicture *pict);
|
|
|
|
int avcodec_close(AVCodecContext *avctx);
|
|
|
|
void avcodec_register_all(void);
|
|
|
|
#ifdef FF_POSTPROCESS
/* Dimensions of quant_store.  MBC and MBR are guarded independently so
   that a translation unit which pre-defines only one of them still gets
   the default for the other instead of an undefined identifier. */
#ifndef MBC
#define MBC 48
#endif
#ifndef MBR
#define MBR 36
#endif
extern int quant_store[MBR+1][MBC+1]; /* [Review] */
#endif
|
|
|
|
#endif /* AVCODEC_H */
|