Commit 664e9e43 authored by James Almer, committed by Michael Niedermayer

x86/hevc_deblock: load less data in hevc_h_loop_filter_luma_8

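Reading 8 bytes per row is enough: each loaded register is immediately widened with punpcklbw against a zeroed register, which only uses the low 8 bytes.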
Signed-off-by: James Almer <jamrial@gmail.com>
Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
parent f1378761
...@@ -799,14 +799,14 @@ cglobal hevc_h_loop_filter_luma_8, 4, 15, 16, pix, stride, beta, tc, count, pix0 ...@@ -799,14 +799,14 @@ cglobal hevc_h_loop_filter_luma_8, 4, 15, 16, pix, stride, beta, tc, count, pix0
mov pix0q, pixq mov pix0q, pixq
sub pix0q, src3strideq sub pix0q, src3strideq
sub pix0q, strideq sub pix0q, strideq
movdqu m0, [pix0q]; p3 movq m0, [pix0q]; p3
movdqu m1, [pix0q + strideq]; p2 movq m1, [pix0q + strideq]; p2
movdqu m2, [pix0q + 2 * strideq]; p1 movq m2, [pix0q + 2 * strideq]; p1
movdqu m3, [pix0q + src3strideq]; p0 movq m3, [pix0q + src3strideq]; p0
movdqu m4, [pixq]; q0 movq m4, [pixq]; q0
movdqu m5, [pixq + strideq]; q1 movq m5, [pixq + strideq]; q1
movdqu m6, [pixq + 2 * strideq]; q2 movq m6, [pixq + 2 * strideq]; q2
movdqu m7, [pixq + src3strideq]; q3 movq m7, [pixq + src3strideq]; q3
pxor m8, m8 pxor m8, m8
punpcklbw m0, m8 punpcklbw m0, m8
punpcklbw m1, m8 punpcklbw m1, m8
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment