mirror of
https://git.ffmpeg.org/ffmpeg.git
synced 2024-12-27 09:52:17 +00:00
f52b4a6e69
Reviewed-by: Michael Niedermayer <michael@niedermayer.cc> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
432 lines
14 KiB
C
432 lines
14 KiB
C
/*
|
|
* Copyright (C) 2004 Michael Niedermayer <michaelni@gmx.at>
|
|
* Copyright (C) 2006 Robert Edele <yartrebo@earthlink.net>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#ifndef AVCODEC_SNOW_H
|
|
#define AVCODEC_SNOW_H
|
|
|
|
#include "libavutil/motion_vector.h"
|
|
|
|
#include "avcodec.h"
|
|
#include "hpeldsp.h"
|
|
#include "snow_dwt.h"
|
|
|
|
#include "rangecoder.h"
|
|
#include "mathops.h"
|
|
|
|
#include "h264qpel.h"
|
|
#include "videodsp.h"
|
|
|
|
#define SNOW_MAX_PLANES 4
|
|
|
|
#define MID_STATE 128
|
|
|
|
#define MAX_PLANES 4
|
|
#define QSHIFT 5
|
|
#define QROOT (1<<QSHIFT)
|
|
#define LOSSLESS_QLOG -128
|
|
#define FRAC_BITS 4
|
|
#define MAX_REF_FRAMES 8
|
|
|
|
#define LOG2_OBMC_MAX 8
|
|
#define OBMC_MAX (1<<(LOG2_OBMC_MAX))
|
|
typedef struct BlockNode{
|
|
int16_t mx; ///< Motion vector component X, see mv_scale
|
|
int16_t my; ///< Motion vector component Y, see mv_scale
|
|
uint8_t ref; ///< Reference frame index
|
|
uint8_t color[3]; ///< Color for intra
|
|
uint8_t type; ///< Bitfield of BLOCK_*
|
|
//#define TYPE_SPLIT 1
|
|
#define BLOCK_INTRA 1 ///< Intra block, inter otherwise
|
|
#define BLOCK_OPT 2 ///< Block needs no checks in this round of iterative motion estiation
|
|
//#define TYPE_NOCOLOR 4
|
|
uint8_t level; //FIXME merge into type?
|
|
}BlockNode;
|
|
|
|
static const BlockNode null_block= { //FIXME add border maybe
|
|
.color= {128,128,128},
|
|
.mx= 0,
|
|
.my= 0,
|
|
.ref= 0,
|
|
.type= 0,
|
|
.level= 0,
|
|
};
|
|
|
|
#define LOG2_MB_SIZE 4
|
|
#define MB_SIZE (1<<LOG2_MB_SIZE)
|
|
#define ENCODER_EXTRA_BITS 4
|
|
#define HTAPS_MAX 8
|
|
|
|
typedef struct x_and_coeff{
|
|
int16_t x;
|
|
uint16_t coeff;
|
|
} x_and_coeff;
|
|
|
|
typedef struct SubBand{
|
|
int level;
|
|
int stride;
|
|
int width;
|
|
int height;
|
|
int qlog; ///< log(qscale)/log[2^(1/6)]
|
|
DWTELEM *buf;
|
|
IDWTELEM *ibuf;
|
|
int buf_x_offset;
|
|
int buf_y_offset;
|
|
int stride_line; ///< Stride measured in lines, not pixels.
|
|
x_and_coeff * x_coeff;
|
|
struct SubBand *parent;
|
|
uint8_t state[/*7*2*/ 7 + 512][32];
|
|
}SubBand;
|
|
|
|
typedef struct Plane{
|
|
int width;
|
|
int height;
|
|
SubBand band[MAX_DECOMPOSITIONS][4];
|
|
|
|
int htaps;
|
|
int8_t hcoeff[HTAPS_MAX/2];
|
|
int diag_mc;
|
|
int fast_mc;
|
|
|
|
int last_htaps;
|
|
int8_t last_hcoeff[HTAPS_MAX/2];
|
|
int last_diag_mc;
|
|
}Plane;
|
|
|
|
typedef struct SnowContext{
|
|
AVClass *class;
|
|
AVCodecContext *avctx;
|
|
RangeCoder c;
|
|
HpelDSPContext hdsp;
|
|
VideoDSPContext vdsp;
|
|
H264QpelContext h264qpel;
|
|
SnowDWTContext dwt;
|
|
AVFrame *input_picture; ///< new_picture with the internal linesizes
|
|
AVFrame *current_picture;
|
|
AVFrame *last_picture[MAX_REF_FRAMES];
|
|
AVFrame *mconly_picture;
|
|
// uint8_t q_context[16];
|
|
uint8_t header_state[32];
|
|
uint8_t block_state[128 + 32*128];
|
|
int keyframe;
|
|
int always_reset;
|
|
int version;
|
|
int spatial_decomposition_type;
|
|
int last_spatial_decomposition_type;
|
|
int temporal_decomposition_type;
|
|
int spatial_decomposition_count;
|
|
int last_spatial_decomposition_count;
|
|
int temporal_decomposition_count;
|
|
int max_ref_frames;
|
|
int ref_frames;
|
|
int16_t (*ref_mvs[MAX_REF_FRAMES])[2];
|
|
uint32_t *ref_scores[MAX_REF_FRAMES];
|
|
DWTELEM *spatial_dwt_buffer;
|
|
DWTELEM *temp_dwt_buffer;
|
|
IDWTELEM *spatial_idwt_buffer;
|
|
IDWTELEM *temp_idwt_buffer;
|
|
int *run_buffer;
|
|
int colorspace_type;
|
|
int chroma_h_shift;
|
|
int chroma_v_shift;
|
|
int spatial_scalability;
|
|
int qlog;
|
|
int last_qlog;
|
|
int mv_scale;
|
|
int last_mv_scale;
|
|
int qbias;
|
|
int last_qbias;
|
|
#define QBIAS_SHIFT 3
|
|
int b_width;
|
|
int b_height;
|
|
int block_max_depth;
|
|
int last_block_max_depth;
|
|
int nb_planes;
|
|
Plane plane[MAX_PLANES];
|
|
BlockNode *block;
|
|
slice_buffer sb;
|
|
|
|
uint8_t *scratchbuf;
|
|
uint8_t *emu_edge_buffer;
|
|
|
|
AVMotionVector *avmv;
|
|
unsigned avmv_size;
|
|
int avmv_index;
|
|
}SnowContext;
|
|
|
|
/* Tables */
|
|
extern const uint8_t * const ff_obmc_tab[4];
|
|
extern const uint8_t ff_qexp[QROOT];
|
|
extern int ff_scale_mv_ref[MAX_REF_FRAMES][MAX_REF_FRAMES];
|
|
|
|
/* common code */
|
|
|
|
int ff_snow_common_init(AVCodecContext *avctx);
|
|
int ff_snow_common_init_after_header(AVCodecContext *avctx);
|
|
void ff_snow_common_end(SnowContext *s);
|
|
void ff_snow_release_buffer(AVCodecContext *avctx);
|
|
void ff_snow_reset_contexts(SnowContext *s);
|
|
int ff_snow_alloc_blocks(SnowContext *s);
|
|
int ff_snow_frames_prepare(SnowContext *s);
|
|
void ff_snow_pred_block(SnowContext *s, uint8_t *dst, uint8_t *tmp, ptrdiff_t stride,
|
|
int sx, int sy, int b_w, int b_h, const BlockNode *block,
|
|
int plane_index, int w, int h);
|
|
/* common inline functions */
|
|
//XXX doublecheck all of them should stay inlined
|
|
|
|
static inline void pred_mv(SnowContext *s, int *mx, int *my, int ref,
|
|
const BlockNode *left, const BlockNode *top, const BlockNode *tr){
|
|
if(s->ref_frames == 1){
|
|
*mx = mid_pred(left->mx, top->mx, tr->mx);
|
|
*my = mid_pred(left->my, top->my, tr->my);
|
|
}else{
|
|
const int *scale = ff_scale_mv_ref[ref];
|
|
*mx = mid_pred((left->mx * scale[left->ref] + 128) >>8,
|
|
(top ->mx * scale[top ->ref] + 128) >>8,
|
|
(tr ->mx * scale[tr ->ref] + 128) >>8);
|
|
*my = mid_pred((left->my * scale[left->ref] + 128) >>8,
|
|
(top ->my * scale[top ->ref] + 128) >>8,
|
|
(tr ->my * scale[tr ->ref] + 128) >>8);
|
|
}
|
|
}
|
|
|
|
static av_always_inline int same_block(BlockNode *a, BlockNode *b){
|
|
if((a->type&BLOCK_INTRA) && (b->type&BLOCK_INTRA)){
|
|
return !((a->color[0] - b->color[0]) | (a->color[1] - b->color[1]) | (a->color[2] - b->color[2]));
|
|
}else{
|
|
return !((a->mx - b->mx) | (a->my - b->my) | (a->ref - b->ref) | ((a->type ^ b->type)&BLOCK_INTRA));
|
|
}
|
|
}
|
|
|
|
//FIXME name cleanup (b_w, block_w, b_width stuff)
|
|
//XXX should we really inline it?
|
|
static av_always_inline void add_yblock(SnowContext *s, int sliced, slice_buffer *sb, IDWTELEM *dst, uint8_t *dst8, const uint8_t *obmc, int src_x, int src_y, int b_w, int b_h, int w, int h, int dst_stride, int src_stride, int obmc_stride, int b_x, int b_y, int add, int offset_dst, int plane_index){
|
|
const int b_width = s->b_width << s->block_max_depth;
|
|
const int b_height= s->b_height << s->block_max_depth;
|
|
const int b_stride= b_width;
|
|
BlockNode *lt= &s->block[b_x + b_y*b_stride];
|
|
BlockNode *rt= lt+1;
|
|
BlockNode *lb= lt+b_stride;
|
|
BlockNode *rb= lb+1;
|
|
uint8_t *block[4];
|
|
// When src_stride is large enough, it is possible to interleave the blocks.
|
|
// Otherwise the blocks are written sequentially in the tmp buffer.
|
|
int tmp_step= src_stride >= 7*MB_SIZE ? MB_SIZE : MB_SIZE*src_stride;
|
|
uint8_t *tmp = s->scratchbuf;
|
|
uint8_t *ptmp;
|
|
int x,y;
|
|
|
|
if(b_x<0){
|
|
lt= rt;
|
|
lb= rb;
|
|
}else if(b_x + 1 >= b_width){
|
|
rt= lt;
|
|
rb= lb;
|
|
}
|
|
if(b_y<0){
|
|
lt= lb;
|
|
rt= rb;
|
|
}else if(b_y + 1 >= b_height){
|
|
lb= lt;
|
|
rb= rt;
|
|
}
|
|
|
|
if(src_x<0){ //FIXME merge with prev & always round internal width up to *16
|
|
obmc -= src_x;
|
|
b_w += src_x;
|
|
if(!sliced && !offset_dst)
|
|
dst -= src_x;
|
|
src_x=0;
|
|
}
|
|
if(src_x + b_w > w){
|
|
b_w = w - src_x;
|
|
}
|
|
if(src_y<0){
|
|
obmc -= src_y*obmc_stride;
|
|
b_h += src_y;
|
|
if(!sliced && !offset_dst)
|
|
dst -= src_y*dst_stride;
|
|
src_y=0;
|
|
}
|
|
if(src_y + b_h> h){
|
|
b_h = h - src_y;
|
|
}
|
|
|
|
if(b_w<=0 || b_h<=0) return;
|
|
|
|
if(!sliced && offset_dst)
|
|
dst += src_x + src_y*dst_stride;
|
|
dst8+= src_x + src_y*src_stride;
|
|
// src += src_x + src_y*src_stride;
|
|
|
|
ptmp= tmp + 3*tmp_step;
|
|
block[0]= ptmp;
|
|
ptmp+=tmp_step;
|
|
ff_snow_pred_block(s, block[0], tmp, src_stride, src_x, src_y, b_w, b_h, lt, plane_index, w, h);
|
|
|
|
if(same_block(lt, rt)){
|
|
block[1]= block[0];
|
|
}else{
|
|
block[1]= ptmp;
|
|
ptmp+=tmp_step;
|
|
ff_snow_pred_block(s, block[1], tmp, src_stride, src_x, src_y, b_w, b_h, rt, plane_index, w, h);
|
|
}
|
|
|
|
if(same_block(lt, lb)){
|
|
block[2]= block[0];
|
|
}else if(same_block(rt, lb)){
|
|
block[2]= block[1];
|
|
}else{
|
|
block[2]= ptmp;
|
|
ptmp+=tmp_step;
|
|
ff_snow_pred_block(s, block[2], tmp, src_stride, src_x, src_y, b_w, b_h, lb, plane_index, w, h);
|
|
}
|
|
|
|
if(same_block(lt, rb) ){
|
|
block[3]= block[0];
|
|
}else if(same_block(rt, rb)){
|
|
block[3]= block[1];
|
|
}else if(same_block(lb, rb)){
|
|
block[3]= block[2];
|
|
}else{
|
|
block[3]= ptmp;
|
|
ff_snow_pred_block(s, block[3], tmp, src_stride, src_x, src_y, b_w, b_h, rb, plane_index, w, h);
|
|
}
|
|
if(sliced){
|
|
s->dwt.inner_add_yblock(obmc, obmc_stride, block, b_w, b_h, src_x,src_y, src_stride, sb, add, dst8);
|
|
}else{
|
|
for(y=0; y<b_h; y++){
|
|
//FIXME ugly misuse of obmc_stride
|
|
const uint8_t *obmc1= obmc + y*obmc_stride;
|
|
const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
|
|
const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
|
|
const uint8_t *obmc4= obmc3+ (obmc_stride>>1);
|
|
for(x=0; x<b_w; x++){
|
|
int v= obmc1[x] * block[3][x + y*src_stride]
|
|
+obmc2[x] * block[2][x + y*src_stride]
|
|
+obmc3[x] * block[1][x + y*src_stride]
|
|
+obmc4[x] * block[0][x + y*src_stride];
|
|
|
|
v <<= 8 - LOG2_OBMC_MAX;
|
|
if(FRAC_BITS != 8){
|
|
v >>= 8 - FRAC_BITS;
|
|
}
|
|
if(add){
|
|
v += dst[x + y*dst_stride];
|
|
v = (v + (1<<(FRAC_BITS-1))) >> FRAC_BITS;
|
|
if(v&(~255)) v= ~(v>>31);
|
|
dst8[x + y*src_stride] = v;
|
|
}else{
|
|
dst[x + y*dst_stride] -= v;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
static av_always_inline void predict_slice(SnowContext *s, IDWTELEM *buf, int plane_index, int add, int mb_y){
|
|
Plane *p= &s->plane[plane_index];
|
|
const int mb_w= s->b_width << s->block_max_depth;
|
|
const int mb_h= s->b_height << s->block_max_depth;
|
|
int x, y, mb_x;
|
|
int block_size = MB_SIZE >> s->block_max_depth;
|
|
int block_w = plane_index ? block_size>>s->chroma_h_shift : block_size;
|
|
int block_h = plane_index ? block_size>>s->chroma_v_shift : block_size;
|
|
const uint8_t *obmc = plane_index ? ff_obmc_tab[s->block_max_depth+s->chroma_h_shift] : ff_obmc_tab[s->block_max_depth];
|
|
const int obmc_stride= plane_index ? (2*block_size)>>s->chroma_h_shift : 2*block_size;
|
|
int ref_stride= s->current_picture->linesize[plane_index];
|
|
uint8_t *dst8= s->current_picture->data[plane_index];
|
|
int w= p->width;
|
|
int h= p->height;
|
|
av_assert2(s->chroma_h_shift == s->chroma_v_shift); // obmc params assume squares
|
|
if(s->keyframe || (s->avctx->debug&512)){
|
|
if(mb_y==mb_h)
|
|
return;
|
|
|
|
if(add){
|
|
for(y=block_h*mb_y; y<FFMIN(h,block_h*(mb_y+1)); y++){
|
|
for(x=0; x<w; x++){
|
|
int v= buf[x + y*w] + (128<<FRAC_BITS) + (1<<(FRAC_BITS-1));
|
|
v >>= FRAC_BITS;
|
|
if(v&(~255)) v= ~(v>>31);
|
|
dst8[x + y*ref_stride]= v;
|
|
}
|
|
}
|
|
}else{
|
|
for(y=block_h*mb_y; y<FFMIN(h,block_h*(mb_y+1)); y++){
|
|
for(x=0; x<w; x++){
|
|
buf[x + y*w]-= 128<<FRAC_BITS;
|
|
}
|
|
}
|
|
}
|
|
|
|
return;
|
|
}
|
|
|
|
for(mb_x=0; mb_x<=mb_w; mb_x++){
|
|
add_yblock(s, 0, NULL, buf, dst8, obmc,
|
|
block_w*mb_x - block_w/2,
|
|
block_h*mb_y - block_h/2,
|
|
block_w, block_h,
|
|
w, h,
|
|
w, ref_stride, obmc_stride,
|
|
mb_x - 1, mb_y - 1,
|
|
add, 1, plane_index);
|
|
}
|
|
}
|
|
|
|
static av_always_inline void predict_plane(SnowContext *s, IDWTELEM *buf, int plane_index, int add){
|
|
const int mb_h= s->b_height << s->block_max_depth;
|
|
int mb_y;
|
|
for(mb_y=0; mb_y<=mb_h; mb_y++)
|
|
predict_slice(s, buf, plane_index, add, mb_y);
|
|
}
|
|
|
|
static inline void set_blocks(SnowContext *s, int level, int x, int y, int l, int cb, int cr, int mx, int my, int ref, int type){
|
|
const int w= s->b_width << s->block_max_depth;
|
|
const int rem_depth= s->block_max_depth - level;
|
|
const int index= (x + y*w) << rem_depth;
|
|
const int block_w= 1<<rem_depth;
|
|
const int block_h= 1<<rem_depth; //FIXME "w!=h"
|
|
BlockNode block;
|
|
int i,j;
|
|
|
|
block.color[0]= l;
|
|
block.color[1]= cb;
|
|
block.color[2]= cr;
|
|
block.mx= mx;
|
|
block.my= my;
|
|
block.ref= ref;
|
|
block.type= type;
|
|
block.level= level;
|
|
|
|
for(j=0; j<block_h; j++){
|
|
for(i=0; i<block_w; i++){
|
|
s->block[index + i + j*w]= block;
|
|
}
|
|
}
|
|
}
|
|
|
|
extern const int8_t ff_quant3bA[256];
|
|
|
|
#define QEXPSHIFT (7-FRAC_BITS+8) //FIXME try to change this to 0
|
|
|
|
#endif /* AVCODEC_SNOW_H */
|