mirror of https://github.com/mpv-player/mpv
474 lines
12 KiB
C
474 lines
12 KiB
C
/*
|
|
* Copyright (C) 2002 Michael Niedermayer <michaelni@gmx.at>
|
|
*
|
|
* This file is part of MPlayer.
|
|
*
|
|
* MPlayer is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* MPlayer is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with MPlayer; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <inttypes.h>
|
|
#include <math.h>
|
|
|
|
#include "config.h"
|
|
#include "mp_msg.h"
|
|
#include "cpudetect.h"
|
|
|
|
#if HAVE_MALLOC_H
|
|
#include <malloc.h>
|
|
#endif
|
|
|
|
#include "img_format.h"
|
|
#include "mp_image.h"
|
|
#include "vf.h"
|
|
#include "libvo/fastmemcpy.h"
|
|
|
|
#define MAX_NOISE 4096
|
|
#define MAX_SHIFT 1024
|
|
#define MAX_RES (MAX_NOISE-MAX_SHIFT)
|
|
|
|
//===========================================================================//
|
|
|
|
static inline void lineNoise_C(uint8_t *dst, uint8_t *src, int8_t *noise, int len, int shift);
|
|
static inline void lineNoiseAvg_C(uint8_t *dst, uint8_t *src, int len, int8_t **shift);
|
|
|
|
static void (*lineNoise)(uint8_t *dst, uint8_t *src, int8_t *noise, int len, int shift)= lineNoise_C;
|
|
static void (*lineNoiseAvg)(uint8_t *dst, uint8_t *src, int len, int8_t **shift)= lineNoiseAvg_C;
|
|
|
|
typedef struct FilterParam{
|
|
int strength;
|
|
int uniform;
|
|
int temporal;
|
|
int quality;
|
|
int averaged;
|
|
int pattern;
|
|
int shiftptr;
|
|
int8_t *noise;
|
|
int8_t *prev_shift[MAX_RES][3];
|
|
}FilterParam;
|
|
|
|
struct vf_priv_s {
|
|
FilterParam lumaParam;
|
|
FilterParam chromaParam;
|
|
unsigned int outfmt;
|
|
};
|
|
|
|
static int nonTempRandShift_init;
|
|
static int nonTempRandShift[MAX_RES];
|
|
|
|
static int patt[4] = {
|
|
-1,0,1,0
|
|
};
|
|
|
|
#define RAND_N(range) ((int) ((double)range*rand()/(RAND_MAX+1.0)))
|
|
static int8_t *initNoise(FilterParam *fp){
|
|
int strength= fp->strength;
|
|
int uniform= fp->uniform;
|
|
int averaged= fp->averaged;
|
|
int pattern= fp->pattern;
|
|
int8_t *noise= memalign(16, MAX_NOISE*sizeof(int8_t));
|
|
int i, j;
|
|
|
|
srand(123457);
|
|
|
|
for(i=0,j=0; i<MAX_NOISE; i++,j++)
|
|
{
|
|
if(uniform) {
|
|
if (averaged) {
|
|
if (pattern) {
|
|
noise[i]= (RAND_N(strength) - strength/2)/6
|
|
+patt[j%4]*strength*0.25/3;
|
|
} else {
|
|
noise[i]= (RAND_N(strength) - strength/2)/3;
|
|
}
|
|
} else {
|
|
if (pattern) {
|
|
noise[i]= (RAND_N(strength) - strength/2)/2
|
|
+ patt[j%4]*strength*0.25;
|
|
} else {
|
|
noise[i]= RAND_N(strength) - strength/2;
|
|
}
|
|
}
|
|
} else {
|
|
double x1, x2, w, y1;
|
|
do {
|
|
x1 = 2.0 * rand()/(float)RAND_MAX - 1.0;
|
|
x2 = 2.0 * rand()/(float)RAND_MAX - 1.0;
|
|
w = x1 * x1 + x2 * x2;
|
|
} while ( w >= 1.0 );
|
|
|
|
w = sqrt( (-2.0 * log( w ) ) / w );
|
|
y1= x1 * w;
|
|
y1*= strength / sqrt(3.0);
|
|
if (pattern) {
|
|
y1 /= 2;
|
|
y1 += patt[j%4]*strength*0.35;
|
|
}
|
|
if (y1<-128) y1=-128;
|
|
else if(y1> 127) y1= 127;
|
|
if (averaged) y1 /= 3.0;
|
|
noise[i]= (int)y1;
|
|
}
|
|
if (RAND_N(6) == 0) j--;
|
|
}
|
|
|
|
|
|
for (i = 0; i < MAX_RES; i++)
|
|
for (j = 0; j < 3; j++)
|
|
fp->prev_shift[i][j] = noise + (rand()&(MAX_SHIFT-1));
|
|
|
|
if(!nonTempRandShift_init){
|
|
for(i=0; i<MAX_RES; i++){
|
|
nonTempRandShift[i]= rand()&(MAX_SHIFT-1);
|
|
}
|
|
nonTempRandShift_init = 1;
|
|
}
|
|
|
|
fp->noise= noise;
|
|
fp->shiftptr= 0;
|
|
return noise;
|
|
}
|
|
|
|
/***************************************************************************/
|
|
|
|
#if HAVE_MMX
|
|
static inline void lineNoise_MMX(uint8_t *dst, uint8_t *src, int8_t *noise, int len, int shift){
|
|
x86_reg mmx_len= len&(~7);
|
|
noise+=shift;
|
|
|
|
__asm__ volatile(
|
|
"mov %3, %%"REG_a" \n\t"
|
|
"pcmpeqb %%mm7, %%mm7 \n\t"
|
|
"psllw $15, %%mm7 \n\t"
|
|
"packsswb %%mm7, %%mm7 \n\t"
|
|
ASMALIGN(4)
|
|
"1: \n\t"
|
|
"movq (%0, %%"REG_a"), %%mm0 \n\t"
|
|
"movq (%1, %%"REG_a"), %%mm1 \n\t"
|
|
"pxor %%mm7, %%mm0 \n\t"
|
|
"paddsb %%mm1, %%mm0 \n\t"
|
|
"pxor %%mm7, %%mm0 \n\t"
|
|
"movq %%mm0, (%2, %%"REG_a") \n\t"
|
|
"add $8, %%"REG_a" \n\t"
|
|
" js 1b \n\t"
|
|
:: "r" (src+mmx_len), "r" (noise+mmx_len), "r" (dst+mmx_len), "g" (-mmx_len)
|
|
: "%"REG_a
|
|
);
|
|
if(mmx_len!=len)
|
|
lineNoise_C(dst+mmx_len, src+mmx_len, noise+mmx_len, len-mmx_len, 0);
|
|
}
|
|
#endif
|
|
|
|
//duplicate of previous except movntq
|
|
#if HAVE_MMX2
|
|
static inline void lineNoise_MMX2(uint8_t *dst, uint8_t *src, int8_t *noise, int len, int shift){
|
|
x86_reg mmx_len= len&(~7);
|
|
noise+=shift;
|
|
|
|
__asm__ volatile(
|
|
"mov %3, %%"REG_a" \n\t"
|
|
"pcmpeqb %%mm7, %%mm7 \n\t"
|
|
"psllw $15, %%mm7 \n\t"
|
|
"packsswb %%mm7, %%mm7 \n\t"
|
|
ASMALIGN(4)
|
|
"1: \n\t"
|
|
"movq (%0, %%"REG_a"), %%mm0 \n\t"
|
|
"movq (%1, %%"REG_a"), %%mm1 \n\t"
|
|
"pxor %%mm7, %%mm0 \n\t"
|
|
"paddsb %%mm1, %%mm0 \n\t"
|
|
"pxor %%mm7, %%mm0 \n\t"
|
|
"movntq %%mm0, (%2, %%"REG_a") \n\t"
|
|
"add $8, %%"REG_a" \n\t"
|
|
" js 1b \n\t"
|
|
:: "r" (src+mmx_len), "r" (noise+mmx_len), "r" (dst+mmx_len), "g" (-mmx_len)
|
|
: "%"REG_a
|
|
);
|
|
if(mmx_len!=len)
|
|
lineNoise_C(dst+mmx_len, src+mmx_len, noise+mmx_len, len-mmx_len, 0);
|
|
}
|
|
#endif
|
|
|
|
static inline void lineNoise_C(uint8_t *dst, uint8_t *src, int8_t *noise, int len, int shift){
|
|
int i;
|
|
noise+= shift;
|
|
for(i=0; i<len; i++)
|
|
{
|
|
int v= src[i]+ noise[i];
|
|
if(v>255) dst[i]=255; //FIXME optimize
|
|
else if(v<0) dst[i]=0;
|
|
else dst[i]=v;
|
|
}
|
|
}
|
|
|
|
/***************************************************************************/
|
|
|
|
#if HAVE_MMX
|
|
static inline void lineNoiseAvg_MMX(uint8_t *dst, uint8_t *src, int len, int8_t **shift){
|
|
x86_reg mmx_len= len&(~7);
|
|
|
|
__asm__ volatile(
|
|
"mov %5, %%"REG_a" \n\t"
|
|
ASMALIGN(4)
|
|
"1: \n\t"
|
|
"movq (%1, %%"REG_a"), %%mm1 \n\t"
|
|
"movq (%0, %%"REG_a"), %%mm0 \n\t"
|
|
"paddb (%2, %%"REG_a"), %%mm1 \n\t"
|
|
"paddb (%3, %%"REG_a"), %%mm1 \n\t"
|
|
"movq %%mm0, %%mm2 \n\t"
|
|
"movq %%mm1, %%mm3 \n\t"
|
|
"punpcklbw %%mm0, %%mm0 \n\t"
|
|
"punpckhbw %%mm2, %%mm2 \n\t"
|
|
"punpcklbw %%mm1, %%mm1 \n\t"
|
|
"punpckhbw %%mm3, %%mm3 \n\t"
|
|
"pmulhw %%mm0, %%mm1 \n\t"
|
|
"pmulhw %%mm2, %%mm3 \n\t"
|
|
"paddw %%mm1, %%mm1 \n\t"
|
|
"paddw %%mm3, %%mm3 \n\t"
|
|
"paddw %%mm0, %%mm1 \n\t"
|
|
"paddw %%mm2, %%mm3 \n\t"
|
|
"psrlw $8, %%mm1 \n\t"
|
|
"psrlw $8, %%mm3 \n\t"
|
|
"packuswb %%mm3, %%mm1 \n\t"
|
|
"movq %%mm1, (%4, %%"REG_a") \n\t"
|
|
"add $8, %%"REG_a" \n\t"
|
|
" js 1b \n\t"
|
|
:: "r" (src+mmx_len), "r" (shift[0]+mmx_len), "r" (shift[1]+mmx_len), "r" (shift[2]+mmx_len),
|
|
"r" (dst+mmx_len), "g" (-mmx_len)
|
|
: "%"REG_a
|
|
);
|
|
|
|
if(mmx_len!=len){
|
|
int8_t *shift2[3]={shift[0]+mmx_len, shift[1]+mmx_len, shift[2]+mmx_len};
|
|
lineNoiseAvg_C(dst+mmx_len, src+mmx_len, len-mmx_len, shift2);
|
|
}
|
|
}
|
|
#endif
|
|
|
|
static inline void lineNoiseAvg_C(uint8_t *dst, uint8_t *src, int len, int8_t **shift){
|
|
int i;
|
|
int8_t *src2= (int8_t*)src;
|
|
|
|
for(i=0; i<len; i++)
|
|
{
|
|
const int n= shift[0][i] + shift[1][i] + shift[2][i];
|
|
dst[i]= src2[i]+((n*src2[i])>>7);
|
|
}
|
|
}
|
|
|
|
/***************************************************************************/
|
|
|
|
static void noise(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int width, int height, FilterParam *fp){
|
|
int8_t *noise= fp->noise;
|
|
int y;
|
|
int shift=0;
|
|
|
|
if(!noise)
|
|
{
|
|
if(src==dst) return;
|
|
|
|
if(dstStride==srcStride) fast_memcpy(dst, src, srcStride*height);
|
|
else
|
|
{
|
|
for(y=0; y<height; y++)
|
|
{
|
|
fast_memcpy(dst, src, width);
|
|
dst+= dstStride;
|
|
src+= srcStride;
|
|
}
|
|
}
|
|
return;
|
|
}
|
|
|
|
for(y=0; y<height; y++)
|
|
{
|
|
if(fp->temporal) shift= rand()&(MAX_SHIFT -1);
|
|
else shift= nonTempRandShift[y];
|
|
|
|
if(fp->quality==0) shift&= ~7;
|
|
if (fp->averaged) {
|
|
lineNoiseAvg(dst, src, width, fp->prev_shift[y]);
|
|
fp->prev_shift[y][fp->shiftptr] = noise + shift;
|
|
} else {
|
|
lineNoise(dst, src, noise, width, shift);
|
|
}
|
|
dst+= dstStride;
|
|
src+= srcStride;
|
|
}
|
|
fp->shiftptr++;
|
|
if (fp->shiftptr == 3) fp->shiftptr = 0;
|
|
}
|
|
|
|
static int config(struct vf_instance* vf,
|
|
int width, int height, int d_width, int d_height,
|
|
unsigned int flags, unsigned int outfmt){
|
|
|
|
return vf_next_config(vf,width,height,d_width,d_height,flags,outfmt);
|
|
}
|
|
|
|
static void get_image(struct vf_instance* vf, mp_image_t *mpi){
|
|
if(mpi->flags&MP_IMGFLAG_PRESERVE) return; // don't change
|
|
if(mpi->imgfmt!=vf->priv->outfmt) return; // colorspace differ
|
|
// ok, we can do pp in-place (or pp disabled):
|
|
vf->dmpi=vf_get_image(vf->next,mpi->imgfmt,
|
|
mpi->type, mpi->flags, mpi->w, mpi->h);
|
|
mpi->planes[0]=vf->dmpi->planes[0];
|
|
mpi->stride[0]=vf->dmpi->stride[0];
|
|
mpi->width=vf->dmpi->width;
|
|
if(mpi->flags&MP_IMGFLAG_PLANAR){
|
|
mpi->planes[1]=vf->dmpi->planes[1];
|
|
mpi->planes[2]=vf->dmpi->planes[2];
|
|
mpi->stride[1]=vf->dmpi->stride[1];
|
|
mpi->stride[2]=vf->dmpi->stride[2];
|
|
}
|
|
mpi->flags|=MP_IMGFLAG_DIRECT;
|
|
}
|
|
|
|
static int put_image(struct vf_instance* vf, mp_image_t *mpi, double pts){
|
|
mp_image_t *dmpi;
|
|
|
|
if(!(mpi->flags&MP_IMGFLAG_DIRECT)){
|
|
// no DR, so get a new image! hope we'll get DR buffer:
|
|
vf->dmpi=vf_get_image(vf->next,vf->priv->outfmt,
|
|
MP_IMGTYPE_TEMP, MP_IMGFLAG_ACCEPT_STRIDE,
|
|
mpi->w,mpi->h);
|
|
//printf("nodr\n");
|
|
}
|
|
//else printf("dr\n");
|
|
dmpi= vf->dmpi;
|
|
|
|
noise(dmpi->planes[0], mpi->planes[0], dmpi->stride[0], mpi->stride[0], mpi->w, mpi->h, &vf->priv->lumaParam);
|
|
noise(dmpi->planes[1], mpi->planes[1], dmpi->stride[1], mpi->stride[1], mpi->w/2, mpi->h/2, &vf->priv->chromaParam);
|
|
noise(dmpi->planes[2], mpi->planes[2], dmpi->stride[2], mpi->stride[2], mpi->w/2, mpi->h/2, &vf->priv->chromaParam);
|
|
|
|
vf_clone_mpi_attributes(dmpi, mpi);
|
|
|
|
#if HAVE_MMX
|
|
if(gCpuCaps.hasMMX) __asm__ volatile ("emms\n\t");
|
|
#endif
|
|
#if HAVE_MMX2
|
|
if(gCpuCaps.hasMMX2) __asm__ volatile ("sfence\n\t");
|
|
#endif
|
|
|
|
return vf_next_put_image(vf,dmpi, pts);
|
|
}
|
|
|
|
static void uninit(struct vf_instance* vf){
|
|
if(!vf->priv) return;
|
|
|
|
if(vf->priv->chromaParam.noise) free(vf->priv->chromaParam.noise);
|
|
vf->priv->chromaParam.noise= NULL;
|
|
|
|
if(vf->priv->lumaParam.noise) free(vf->priv->lumaParam.noise);
|
|
vf->priv->lumaParam.noise= NULL;
|
|
|
|
free(vf->priv);
|
|
vf->priv=NULL;
|
|
}
|
|
|
|
//===========================================================================//
|
|
|
|
static int query_format(struct vf_instance* vf, unsigned int fmt){
|
|
switch(fmt)
|
|
{
|
|
case IMGFMT_YV12:
|
|
case IMGFMT_I420:
|
|
case IMGFMT_IYUV:
|
|
return vf_next_query_format(vf,vf->priv->outfmt);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static void parse(FilterParam *fp, char* args){
|
|
char *pos;
|
|
char *max= strchr(args, ':');
|
|
|
|
if(!max) max= args + strlen(args);
|
|
|
|
fp->strength= atoi(args);
|
|
pos= strchr(args, 'u');
|
|
if(pos && pos<max) fp->uniform=1;
|
|
pos= strchr(args, 't');
|
|
if(pos && pos<max) fp->temporal=1;
|
|
pos= strchr(args, 'h');
|
|
if(pos && pos<max) fp->quality=1;
|
|
pos= strchr(args, 'p');
|
|
if(pos && pos<max) fp->pattern=1;
|
|
pos= strchr(args, 'a');
|
|
if(pos && pos<max) {
|
|
fp->temporal=1;
|
|
fp->averaged=1;
|
|
}
|
|
|
|
if(fp->strength) initNoise(fp);
|
|
}
|
|
|
|
static const unsigned int fmt_list[]={
|
|
IMGFMT_YV12,
|
|
IMGFMT_I420,
|
|
IMGFMT_IYUV,
|
|
0
|
|
};
|
|
|
|
static int vf_open(vf_instance_t *vf, char *args){
|
|
vf->config=config;
|
|
vf->put_image=put_image;
|
|
vf->get_image=get_image;
|
|
vf->query_format=query_format;
|
|
vf->uninit=uninit;
|
|
vf->priv=malloc(sizeof(struct vf_priv_s));
|
|
memset(vf->priv, 0, sizeof(struct vf_priv_s));
|
|
if(args)
|
|
{
|
|
char *arg2= strchr(args,':');
|
|
if(arg2) parse(&vf->priv->chromaParam, arg2+1);
|
|
parse(&vf->priv->lumaParam, args);
|
|
}
|
|
|
|
// check csp:
|
|
vf->priv->outfmt=vf_match_csp(&vf->next,fmt_list,IMGFMT_YV12);
|
|
if(!vf->priv->outfmt)
|
|
{
|
|
uninit(vf);
|
|
return 0; // no csp match :(
|
|
}
|
|
|
|
|
|
#if HAVE_MMX
|
|
if(gCpuCaps.hasMMX){
|
|
lineNoise= lineNoise_MMX;
|
|
lineNoiseAvg= lineNoiseAvg_MMX;
|
|
}
|
|
#endif
|
|
#if HAVE_MMX2
|
|
if(gCpuCaps.hasMMX2) lineNoise= lineNoise_MMX2;
|
|
// if(gCpuCaps.hasMMX) lineNoiseAvg= lineNoiseAvg_MMX2;
|
|
#endif
|
|
|
|
return 1;
|
|
}
|
|
|
|
const vf_info_t vf_info_noise = {
|
|
"noise generator",
|
|
"noise",
|
|
"Michael Niedermayer",
|
|
"",
|
|
vf_open,
|
|
NULL
|
|
};
|
|
|
|
//===========================================================================//
|