Commit 48576887 authored by James Almer

x86/vf_v360: use a faster horizontal add in remap4_8bit_line_avx2

Signed-off-by: James Almer <jamrial@gmail.com>
parent 2200cf1a
...@@ -130,14 +130,11 @@ cglobal remap4_8bit_line, 7, 9, 11, dst, width, src, in_linesize, u, v, ker, x, ...@@ -130,14 +130,11 @@ cglobal remap4_8bit_line, 7, 9, 11, dst, width, src, in_linesize, u, v, ker, x,
pmulld m4, m5 pmulld m4, m5
paddd m2, m4 paddd m2, m4
vextracti128 xm1, m2, 1 HADDD m2, m1
paddd m1, m2 psrld m2, m2, 0xe
phaddd m1, m1 packuswb m2, m2
phaddd m1, m1
psrld m1, m1, 0xe
packuswb m1, m1
pextrb [dstq+xq], xm1, 0 pextrb [dstq+xq], xm2, 0
add xq, 1 add xq, 1
add yq, 32 add yq, 32
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment