Commit 360bee8c authored by Jun Zhao

lavfi/colorlevels: Add slice threading support

Add slice threading support. It can be exercised with a command like:

./ffmpeg -i input -vf colorlevels -f null /dev/null

With a 1080p H.264 clip, throughput rises from 39 fps to 79 fps
on a local machine (Intel(R) Core(TM) i5-8265U CPU @ 1.60GHz).
Reviewed-by: Paul B Mahol <onemda@gmail.com>
Signed-off-by: Jun Zhao <barryjzhao@tencent.com>
parent 468f0038
...@@ -105,6 +105,68 @@ static int config_input(AVFilterLink *inlink) ...@@ -105,6 +105,68 @@ static int config_input(AVFilterLink *inlink)
return 0; return 0;
} }
/*
 * Per-pass parameters handed to the slice workers through the `arg` pointer
 * of the execute callback. filter_frame() fills one instance per processed
 * component and every job reads it.
 */
struct thread_data {
const uint8_t *srcrow; /* start of the input plane (in->data[0]) */
uint8_t *dstrow; /* start of the output plane */
int dst_linesize; /* output row stride (out->linesize[0]) */
int src_linesize; /* input row stride (in->linesize[0]) */
double coeff; /* scale factor: (omax - omin) / (double)(imax - imin) */
uint8_t offset; /* index of the processed component, added to x in each row */
int h; /* number of rows to split across jobs (inlink->h) */
int imin; /* input minimum, subtracted from each sample before scaling */
int omin; /* output minimum, added to each sample after scaling */
};
/*
 * Declarations shared by the slice workers.
 *
 * Expand this at the top of a function body that has `ctx`, `arg`, `jobnr`
 * and `nb_jobs` in scope. It declares:
 *   s, td                    - the filter private context and the thread_data
 *   process_h                - number of rows being split (td->h)
 *   slice_start, slice_end   - half-open row range owned by job `jobnr`
 *   x, y                     - loop counters (left uninitialized)
 *   srcrow, dstrow           - plane base pointers copied from td
 *   step, offset             - sample stride (s->step) and component index
 *   imin, omin, coeff        - level-mapping parameters copied from td
 *
 * The final line deliberately carries no line continuation, so the macro
 * ends here and cannot absorb whatever line follows it in the file.
 */
#define LOAD_COMMON\
    ColorLevelsContext *s = ctx->priv;\
    const struct thread_data *td = arg;\
\
    int process_h = td->h;\
    const int slice_start = (process_h *  jobnr   ) / nb_jobs;\
    const int slice_end   = (process_h * (jobnr+1)) / nb_jobs;\
    int x, y;\
    const uint8_t *srcrow = td->srcrow;\
    uint8_t *dstrow = td->dstrow;\
    const int step = s->step;\
    const uint8_t offset = td->offset;\
\
    int imin = td->imin;\
    int omin = td->omin;\
    double coeff = td->coeff;
/**
 * Slice worker for samples stored as 8-bit values.
 *
 * Processes rows [slice_start, slice_end) as computed by LOAD_COMMON. Within
 * each row, every step-th sample starting at index `offset` is remapped as
 * (sample - imin) * coeff + omin and clipped with av_clip_uint8(); the other
 * samples of the row are not written by this call.
 *
 * @param ctx     filter context; its private data supplies step and linesize
 * @param arg     pointer to the struct thread_data describing this pass
 * @param jobnr   index of this job
 * @param nb_jobs total number of jobs the rows are divided among
 * @return always 0
 */
static int colorlevel_slice_8(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
{
    LOAD_COMMON

    for (y = slice_start; y < slice_end; y++) {
        /* Fold the component offset into the row pointers once per row. */
        const uint8_t *in_px  = srcrow + y * td->src_linesize + offset;
        uint8_t       *out_px = dstrow + y * td->dst_linesize + offset;

        for (x = 0; x < s->linesize; x += step)
            out_px[x] = av_clip_uint8((in_px[x] - imin) * coeff + omin);
    }

    return 0;
}
/**
 * Slice worker for samples stored as 16-bit values.
 *
 * Processes rows [slice_start, slice_end) as computed by LOAD_COMMON. Row
 * addresses are computed on the byte pointers (so the linesizes are byte
 * strides) and then viewed as uint16_t; `x` and `offset` index 16-bit
 * samples. Every step-th sample starting at index `offset` is remapped as
 * (sample - imin) * coeff + omin and clipped with av_clip_uint16(); the
 * other samples of the row are not written by this call.
 *
 * @param ctx     filter context; its private data supplies step and linesize
 * @param arg     pointer to the struct thread_data describing this pass
 * @param jobnr   index of this job
 * @param nb_jobs total number of jobs the rows are divided among
 * @return always 0
 */
static int colorlevel_slice_16(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
{
    LOAD_COMMON

    for (y = slice_start; y < slice_end; y++) {
        /* Fold the component offset into the row pointers once per row. */
        const uint16_t *in_px  = (const uint16_t *)(srcrow + y * td->src_linesize) + offset;
        uint16_t       *out_px = (uint16_t *)(dstrow + y * td->dst_linesize) + offset;

        for (x = 0; x < s->linesize; x += step)
            out_px[x] = av_clip_uint16((in_px[x] - imin) * coeff + omin);
    }

    return 0;
}
static int filter_frame(AVFilterLink *inlink, AVFrame *in) static int filter_frame(AVFilterLink *inlink, AVFrame *in)
{ {
AVFilterContext *ctx = inlink->dst; AVFilterContext *ctx = inlink->dst;
...@@ -137,6 +199,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in) ...@@ -137,6 +199,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
int omin = lrint(r->out_min * UINT8_MAX); int omin = lrint(r->out_min * UINT8_MAX);
int omax = lrint(r->out_max * UINT8_MAX); int omax = lrint(r->out_max * UINT8_MAX);
double coeff; double coeff;
struct thread_data td;
if (imin < 0) { if (imin < 0) {
imin = UINT8_MAX; imin = UINT8_MAX;
...@@ -162,15 +225,19 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in) ...@@ -162,15 +225,19 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
srcrow = in->data[0]; srcrow = in->data[0];
coeff = (omax - omin) / (double)(imax - imin); coeff = (omax - omin) / (double)(imax - imin);
for (y = 0; y < inlink->h; y++) {
const uint8_t *src = srcrow; td.srcrow = srcrow;
uint8_t *dst = dstrow; td.dstrow = dstrow;
td.dst_linesize = out->linesize[0];
for (x = 0; x < s->linesize; x += step) td.src_linesize = in->linesize[0];
dst[x + offset] = av_clip_uint8((src[x + offset] - imin) * coeff + omin); td.coeff = coeff;
dstrow += out->linesize[0]; td.offset = offset;
srcrow += in->linesize[0]; td.h = inlink->h;
} td.imin = imin;
td.omin = omin;
ctx->internal->execute(ctx, colorlevel_slice_8, &td, NULL,
FFMIN(inlink->h, ff_filter_get_nb_threads(ctx)));
} }
break; break;
case 2: case 2:
...@@ -184,6 +251,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in) ...@@ -184,6 +251,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
int omin = lrint(r->out_min * UINT16_MAX); int omin = lrint(r->out_min * UINT16_MAX);
int omax = lrint(r->out_max * UINT16_MAX); int omax = lrint(r->out_max * UINT16_MAX);
double coeff; double coeff;
struct thread_data td;
if (imin < 0) { if (imin < 0) {
imin = UINT16_MAX; imin = UINT16_MAX;
...@@ -209,15 +277,19 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in) ...@@ -209,15 +277,19 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
srcrow = in->data[0]; srcrow = in->data[0];
coeff = (omax - omin) / (double)(imax - imin); coeff = (omax - omin) / (double)(imax - imin);
for (y = 0; y < inlink->h; y++) {
const uint16_t *src = (const uint16_t*)srcrow; td.srcrow = srcrow;
uint16_t *dst = (uint16_t *)dstrow; td.dstrow = dstrow;
td.dst_linesize = out->linesize[0];
for (x = 0; x < s->linesize; x += step) td.src_linesize = in->linesize[0];
dst[x + offset] = av_clip_uint16((src[x + offset] - imin) * coeff + omin); td.coeff = coeff;
dstrow += out->linesize[0]; td.offset = offset;
srcrow += in->linesize[0]; td.h = inlink->h;
} td.imin = imin;
td.omin = omin;
ctx->internal->execute(ctx, colorlevel_slice_16, &td, NULL,
FFMIN(inlink->h, ff_filter_get_nb_threads(ctx)));
} }
} }
...@@ -252,5 +324,5 @@ AVFilter ff_vf_colorlevels = { ...@@ -252,5 +324,5 @@ AVFilter ff_vf_colorlevels = {
.query_formats = query_formats, .query_formats = query_formats,
.inputs = colorlevels_inputs, .inputs = colorlevels_inputs,
.outputs = colorlevels_outputs, .outputs = colorlevels_outputs,
.flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS,
}; };
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment