From: Fiona Glaser
Date: Sat, 7 Feb 2009 09:57:43 +0000 (-0800)
Subject: Faster coeff_last64 on 32-bit
X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=5a7a1d14e461c431370d9111f3e6eb4efc15737f;p=libx264

Faster coeff_last64 on 32-bit
---

diff --git a/common/x86/quant-a.asm b/common/x86/quant-a.asm
index d1b39919..a013e538 100644
--- a/common/x86/quant-a.asm
+++ b/common/x86/quant-a.asm
@@ -820,17 +820,17 @@ cglobal x264_coeff_last16_%1, 1,3
 %ifndef ARCH_X86_64
 cglobal x264_coeff_last64_%1, 1, 5-mmsize/16
     pxor m2, m2
-    LAST_MASK r1d, r0, r4d
-    LAST_MASK r2d, r0+32, r4d
-    shl r2d, 16
-    or r1d, r2d
     LAST_MASK r2d, r0+64, r4d
     LAST_MASK r3d, r0+96, r4d
     shl r3d, 16
     or r2d, r3d
-    not r1d
     xor r2d, -1
     jne .secondhalf
+    LAST_MASK r1d, r0, r4d
+    LAST_MASK r3d, r0+32, r4d
+    shl r3d, 16
+    or r1d, r3d
+    not r1d
     LAST eax, r1d, 0x1f
     RET
 .secondhalf: