Commit 95057b19 authored by Michael Niedermayer's avatar Michael Niedermayer

swr: int16->int32: use the old index negate trick to avoid 2 adds

Signed-off-by: 's avatarMichael Niedermayer <michaelni@gmx.at>
parent 113738d6
...@@ -35,18 +35,20 @@ cglobal int16_to_int32_%1, 3, 3, 3, dst, src, len ...@@ -35,18 +35,20 @@ cglobal int16_to_int32_%1, 3, 3, 3, dst, src, len
%else %else
int16_to_int32_u_int %+ SUFFIX int16_to_int32_u_int %+ SUFFIX
%endif %endif
add dstq, lenq
shr lenq, 1
add srcq, lenq
neg lenq
.next .next
mov%1 m4, [srcq] mov%1 m2, [srcq+lenq]
pxor m0, m0 pxor m0, m0
pxor m1, m1 pxor m1, m1
punpcklwd m0, m4 punpcklwd m0, m2
punpckhwd m1, m4 punpckhwd m1, m2
mov%1 [ dstq], m0 mov%1 [ dstq+2*lenq], m0
mov%1 [mmsize + dstq], m1 mov%1 [mmsize + dstq+2*lenq], m1
add srcq, mmsize add lenq, mmsize
add dstq, 2*mmsize jl .next
sub lenq, 2*mmsize
jg .next
%if mmsize == 8 %if mmsize == 8
emms emms
%endif %endif
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment