mirror of https://git.ffmpeg.org/ffmpeg.git
vf_yadif: support slice threading
This commit is contained in:
parent
129bb23843
commit
cb79881b49
|
@ -32,6 +32,14 @@
|
|||
#undef NDEBUG
|
||||
#include <assert.h>
|
||||
|
||||
typedef struct ThreadData {
|
||||
AVFrame *frame;
|
||||
int plane;
|
||||
int w, h;
|
||||
int parity;
|
||||
int tff;
|
||||
} ThreadData;
|
||||
|
||||
#define CHECK(j)\
|
||||
{ int score = FFABS(cur[mrefs - 1 + (j)] - cur[prefs - 1 - (j)])\
|
||||
+ FFABS(cur[mrefs +(j)] - cur[prefs -(j)])\
|
||||
|
@ -173,50 +181,67 @@ static void filter_edges_16bit(void *dst1, void *prev1, void *cur1, void *next1,
|
|||
FILTER(w - 3, w, 0)
|
||||
}
|
||||
|
||||
/**
 * Slice-threading worker: process one horizontal band of a single plane.
 *
 * Rows selected by the parity are rebuilt through the filter_line /
 * filter_edges callbacks of the YADIFContext; all other rows are copied
 * unchanged from the current input frame.
 *
 * @param ctx     filter context; ctx->priv is the YADIFContext holding the
 *                prev/cur/next frames and the line-filter callbacks
 * @param arg     ThreadData describing the destination frame, the plane, its
 *                dimensions and the parity/tff of this pass
 * @param jobnr   index of this job
 * @param nb_jobs number of jobs the plane is split into (must be > 0)
 * @return always 0
 */
static int filter_slice(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
{
    YADIFContext *s = ctx->priv;
    ThreadData *td  = arg;
    int plane        = td->plane;
    int refs         = s->cur->linesize[plane];
    int dst_linesize = td->frame->linesize[plane];
    /* bytes per sample, i.e. the component depth rounded up to whole bytes */
    int df    = (s->csp->comp[plane].depth_minus1 + 8) / 8;
    int pix_3 = 3 * df;
    /* Proportional slice boundaries: every row is covered exactly once and
     * slice heights differ by at most one row, instead of leaving the whole
     * remainder of h / nb_jobs to the last job. The product is computed in
     * 64 bits so it cannot overflow int. */
    int slice_start = (int)((int64_t)td->h *  jobnr      / nb_jobs);
    int slice_end   = (int)((int64_t)td->h * (jobnr + 1) / nb_jobs);
    int y;

    for (y = slice_start; y < slice_end; y++) {
        /* NOTE(review): prev and next are addressed with cur's linesize below,
         * so all three input frames are assumed to share it. */
        uint8_t *cur = &s->cur->data[plane][y * refs];
        uint8_t *dst = &td->frame->data[plane][y * dst_linesize];

        if ((y ^ td->parity) & 1) {
            uint8_t *prev = &s->prev->data[plane][y * refs];
            uint8_t *next = &s->next->data[plane][y * refs];
            /* Byte offsets to the neighbouring rows; on the first and last
             * row the offset is mirrored so it stays inside the plane. */
            int next_row = y + 1 < td->h ? refs : -refs;
            int prev_row = y ? -refs : refs;
            /* Rows one away from the top/bottom border are forced to mode 2
             * (presumably because the other modes look two rows away --
             * confirm against the filter_line implementation). */
            int mode = y == 1 || y + 2 == td->h ? 2 : s->mode;

            /* filtering reads 3 pixels to the left/right; to avoid invalid
             * reads, filter_line only gets the interior of the row and the
             * border pixels are left to filter_edges
             */
            s->filter_line(dst + pix_3, prev + pix_3, cur + pix_3,
                           next + pix_3, td->w - 6,
                           next_row, prev_row,
                           td->parity ^ td->tff, mode);
            s->filter_edges(dst, prev, cur, next, td->w,
                            next_row, prev_row,
                            td->parity ^ td->tff, mode);
        } else {
            /* Row belongs to the field that is kept: copy it verbatim. */
            memcpy(dst, cur, td->w * df);
        }
    }
    return 0;
}
|
||||
|
||||
static void filter(AVFilterContext *ctx, AVFrame *dstpic,
|
||||
int parity, int tff)
|
||||
{
|
||||
YADIFContext *yadif = ctx->priv;
|
||||
int y, i;
|
||||
ThreadData td = { .frame = dstpic, .parity = parity, .tff = tff };
|
||||
int i;
|
||||
|
||||
for (i = 0; i < yadif->csp->nb_components; i++) {
|
||||
int w = dstpic->width;
|
||||
int h = dstpic->height;
|
||||
int refs = yadif->cur->linesize[i];
|
||||
int df = (yadif->csp->comp[i].depth_minus1 + 8) / 8;
|
||||
int pix_3 = 3 * df;
|
||||
|
||||
if (i == 1 || i == 2) {
|
||||
/* Why is this not part of the per-plane description thing? */
|
||||
w >>= yadif->csp->log2_chroma_w;
|
||||
h >>= yadif->csp->log2_chroma_h;
|
||||
}
|
||||
|
||||
/* filtering reads 3 pixels to the left/right; to avoid invalid reads,
|
||||
* we need to call the c variant which avoids this for border pixels
|
||||
*/
|
||||
|
||||
for (y = 0; y < h; y++) {
|
||||
if ((y ^ parity) & 1) {
|
||||
uint8_t *prev = &yadif->prev->data[i][y * refs];
|
||||
uint8_t *cur = &yadif->cur ->data[i][y * refs];
|
||||
uint8_t *next = &yadif->next->data[i][y * refs];
|
||||
uint8_t *dst = &dstpic->data[i][y * dstpic->linesize[i]];
|
||||
int mode = y == 1 || y + 2 == h ? 2 : yadif->mode;
|
||||
yadif->filter_line(dst + pix_3, prev + pix_3, cur + pix_3,
|
||||
next + pix_3, w - 6,
|
||||
y + 1 < h ? refs : -refs,
|
||||
y ? -refs : refs,
|
||||
parity ^ tff, mode);
|
||||
yadif->filter_edges(dst, prev, cur, next, w,
|
||||
y + 1 < h ? refs : -refs,
|
||||
y ? -refs : refs,
|
||||
parity ^ tff, mode);
|
||||
} else {
|
||||
memcpy(&dstpic->data[i][y * dstpic->linesize[i]],
|
||||
&yadif->cur->data[i][y * refs], w * df);
|
||||
}
|
||||
}
|
||||
td.w = w;
|
||||
td.h = h;
|
||||
td.plane = i;
|
||||
|
||||
ctx->internal->execute(ctx, filter_slice, &td, NULL, FFMIN(h, ctx->graph->nb_threads));
|
||||
}
|
||||
|
||||
emms_c();
|
||||
|
@ -504,4 +529,6 @@ AVFilter avfilter_vf_yadif = {
|
|||
.inputs = avfilter_vf_yadif_inputs,
|
||||
|
||||
.outputs = avfilter_vf_yadif_outputs,
|
||||
|
||||
.flags = AVFILTER_FLAG_SLICE_THREADS,
|
||||
};
|
||||
|
|
Loading…
Reference in New Issue