Commit dab5f65b authored by James Almer

x86/takdsp: use arithmetic shift instructions

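p1 and p2 are int32_t, so right shifts on their values must be arithmetic (psrad, sign-preserving) rather than logical (psrld).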
Reviewed-by: Ronald S. Bultje <rsbultje@gmail.com>
Signed-off-by: James Almer <jamrial@gmail.com>
parent 4ab56667
...@@ -75,8 +75,8 @@ cglobal tak_decorrelate_sm, 3, 3, 6, p1, p2, length ...@@ -75,8 +75,8 @@ cglobal tak_decorrelate_sm, 3, 3, 6, p1, p2, length
mova m4, [p2q+lengthq+mmsize] mova m4, [p2q+lengthq+mmsize]
mova m2, m1 mova m2, m1
mova m5, m4 mova m5, m4
psrld m2, 1 psrad m2, 1
psrld m5, 1 psrad m5, 1
psubd m0, m2 psubd m0, m2
psubd m3, m5 psubd m3, m5
paddd m1, m0 paddd m1, m0
...@@ -104,10 +104,10 @@ cglobal tak_decorrelate_sf, 3, 3, 5, p1, p2, length, dshift, dfactor ...@@ -104,10 +104,10 @@ cglobal tak_decorrelate_sf, 3, 3, 5, p1, p2, length, dshift, dfactor
.loop: .loop:
mova m0, [p1q+lengthq] mova m0, [p1q+lengthq]
mova m1, [p2q+lengthq] mova m1, [p2q+lengthq]
psrld m1, m2 psrad m1, m2
pmulld m1, m3 pmulld m1, m3
paddd m1, m4 paddd m1, m4
psrld m1, 8 psrad m1, 8
pslld m1, m2 pslld m1, m2
psubd m1, m0 psubd m1, m0
mova [p1q+lengthq], m1 mova [p1q+lengthq], m1
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment