Commit 82dbfcca authored by James Almer

x86/aacdec: use HADDPS macro

Signed-off-by: James Almer <jamrial@gmail.com>
parent 99b89948
......@@ -38,17 +38,7 @@ cglobal ps_add_squares, 3, 3, %1, dst, src, n
movaps m1, [srcq+mmsize]
mulps m0, m0
mulps m1, m1
%if cpuflag(sse3)
haddps m0, m1
%else
movaps m3, m0
movaps m4, m1
shufps m3, m3, q0301
shufps m4, m4, q0301
addps m0, m3
addps m1, m4
shufps m0, m1, q2020
%endif
HADDPS m0, m1, m2
addps m0, [dstq]
movaps [dstq], m0
add dstq, mmsize
......@@ -59,9 +49,9 @@ cglobal ps_add_squares, 3, 3, %1, dst, src, n
%endmacro
INIT_XMM sse
PS_ADD_SQUARES 3
PS_ADD_SQUARES 2
INIT_XMM sse3
PS_ADD_SQUARES 5
PS_ADD_SQUARES 3
;*******************************************************************
;void ff_ps_mul_pair_single_sse(float (*dst)[2], float (*src0)[2],
......
......@@ -526,31 +526,15 @@ align 16
xorps m2, [ps_mask3]
xorps m5, [ps_mask3]
xorps m6, [ps_mask3]
HADDPS m2, m5, m3
HADDPS m7, m6, m4
%if cpuflag(sse3)
movshdup m0, m1
haddps m2, m5
haddps m7, m6
addss m1, m0
%else
movaps m3, m2
movaps m0, m5
movaps m4, m6
shufps m3, m3, q0301
shufps m0, m0, q0301
shufps m4, m4, q0301
addps m2, m3
addps m5, m0
addps m6, m4
movss m0, m7
movss m3, m1
shufps m7, m7, q0001
movss m0, m1
shufps m1, m1, q0001
addss m7, m0
addss m1, m3
shufps m2, m5, q2020
shufps m7, m6, q2020
%endif
addss m1, m0
movaps [phiq ], m2
movhps [phiq+0x18], m7
movss [phiq+0x28], m7
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment