Commit 4f589d66 authored by Ting Fu, committed by Ruiling Song

avfilter/x86/vf_eq: add SSE2 version

Signed-off-by: Ting Fu <ting.fu@intel.com>
parent 6aff2042
...@@ -24,7 +24,7 @@ ...@@ -24,7 +24,7 @@
SECTION .text SECTION .text
INIT_MMX mmxext %macro PROCESS_ONE_LINE 1
cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
movd m3, contrastd movd m3, contrastd
movd m4, brightnessd movd m4, brightnessd
...@@ -39,7 +39,7 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w ...@@ -39,7 +39,7 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
pxor m1, m1 pxor m1, m1
mov scalard, wd mov scalard, wd
and scalard, mmsize-1 and scalard, mmsize-1
sar wd, 3 sar wd, %1
cmp wd, 1 cmp wd, 1
jl .loop1 jl .loop1
...@@ -80,3 +80,11 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w ...@@ -80,3 +80,11 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
.end: .end:
RET RET
%endmacro
; Instantiate the process_one_line kernel once per instruction set.
; The macro argument is the shift count consumed by `sar wd, %1` inside
; PROCESS_ONE_LINE: the width is shifted right by that amount before the
; vector loop, while `and scalard, mmsize-1` keeps the leftover count.
; NOTE(review): 3 and 4 presumably correspond to log2(mmsize) for MMX (8)
; and XMM (16) registers -- confirm against the x86inc definition of mmsize.
INIT_MMX mmxext
PROCESS_ONE_LINE 3
INIT_XMM sse2
PROCESS_ONE_LINE 4
...@@ -28,6 +28,8 @@ ...@@ -28,6 +28,8 @@
extern void ff_process_one_line_mmxext(const uint8_t *src, uint8_t *dst, short contrast, extern void ff_process_one_line_mmxext(const uint8_t *src, uint8_t *dst, short contrast,
short brightness, int w); short brightness, int w);
/* SSE2 variant of the per-line kernel; it takes the same arguments as
 * ff_process_one_line_mmxext. process_sse2() calls it once per row with
 * the precomputed contrast and brightness values and the row width w. */
extern void ff_process_one_line_sse2(const uint8_t *src, uint8_t *dst, short contrast,
short brightness, int w);
static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride, static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride,
const uint8_t *src, int src_stride, int w, int h) const uint8_t *src, int src_stride, int w, int h)
...@@ -44,6 +46,20 @@ static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride, ...@@ -44,6 +46,20 @@ static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride,
emms_c(); emms_c();
} }
/**
 * Run the SSE2 line kernel over every row of a plane.
 *
 * The contrast and brightness terms are derived once from param and then
 * handed unchanged to ff_process_one_line_sse2() for each of the h rows.
 *
 * @param param       source of the contrast and brightness settings
 * @param dst         first destination row
 * @param dst_stride  distance added to dst after each row
 * @param src         first source row
 * @param src_stride  distance added to src after each row
 * @param w           width forwarded to the line kernel
 * @param h           number of rows to process
 */
static void process_sse2(EQParameters *param, uint8_t *dst, int dst_stride,
                         const uint8_t *src, int src_stride, int w, int h)
{
    /* param->contrast scaled by 256 * 16 and truncated to a short. */
    const short contrast = (short) (param->contrast * 256 * 16);

    /* Brightness is first mapped through 100 * b + 100 and truncated to a
     * short; the remaining arithmetic is carried out on integers. */
    const short scaled     = (short) (100.0 * param->brightness + 100.0);
    const short brightness = (scaled * 511) / 200 - 128 - contrast / 32;

    /* One kernel call per row, stepping both pointers by their strides. */
    for (; h != 0; h--) {
        ff_process_one_line_sse2(src, dst, contrast, brightness, w);
        dst += dst_stride;
        src += src_stride;
    }
}
av_cold void ff_eq_init_x86(EQContext *eq) av_cold void ff_eq_init_x86(EQContext *eq)
{ {
int cpu_flags = av_get_cpu_flags(); int cpu_flags = av_get_cpu_flags();
...@@ -51,4 +67,7 @@ av_cold void ff_eq_init_x86(EQContext *eq) ...@@ -51,4 +67,7 @@ av_cold void ff_eq_init_x86(EQContext *eq)
if (cpu_flags & AV_CPU_FLAG_MMXEXT) { if (cpu_flags & AV_CPU_FLAG_MMXEXT) {
eq->process = process_mmxext; eq->process = process_mmxext;
} }
if (cpu_flags & AV_CPU_FLAG_SSE2) {
eq->process = process_sse2;
}
} }
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment