Commit a4f876a1 authored by James Almer

x86/vf_fspp: move pxor in store slice functions out of the loop

m7 is not overwritten, so we only need to clear it once.
Found by Christophe Gisquet.
Signed-off-by: James Almer <jamrial@gmail.com>
parent 466e32bf
...@@ -77,11 +77,11 @@ cglobal store_slice, 2, 7, 0, dst, src, width, dither_height, dither, tmp, tmp2 ...@@ -77,11 +77,11 @@ cglobal store_slice, 2, 7, 0, dst, src, width, dither_height, dither, tmp, tmp2
mov src_strideq, tmp2q mov src_strideq, tmp2q
shl tmpq, 4 shl tmpq, 4
lea dither_heightq, [ditherq+dither_heightq*8] lea dither_heightq, [ditherq+dither_heightq*8]
pxor m7, m7
.loop_height: .loop_height:
movq m3, [ditherq] movq m3, [ditherq]
movq m4, m3 movq m4, m3
pxor m7, m7
punpcklbw m3, m7 punpcklbw m3, m7
punpckhbw m4, m7 punpckhbw m4, m7
mov tmp2q, widthq mov tmp2q, widthq
...@@ -143,11 +143,11 @@ cglobal store_slice2, 0, 7, 0, dst, src, width, dither_height, dither, tmp, tmp2 ...@@ -143,11 +143,11 @@ cglobal store_slice2, 0, 7, 0, dst, src, width, dither_height, dither, tmp, tmp2
mov src_strideq, tmp2q mov src_strideq, tmp2q
shl tmpq, 5 shl tmpq, 5
lea dither_heightq, [ditherq+dither_heightq*8] lea dither_heightq, [ditherq+dither_heightq*8]
pxor m7, m7
.loop_height: .loop_height:
movq m3, [ditherq] movq m3, [ditherq]
movq m4, m3 movq m4, m3
pxor m7, m7
punpcklbw m3, m7 punpcklbw m3, m7
punpckhbw m4, m7 punpckhbw m4, m7
mov tmp2q,widthq mov tmp2q,widthq
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment