granicus.if.org Git - libx264/commitdiff
Faster coeff_last64 on 32-bit
author Fiona Glaser <fiona@x264.com>
Sat, 7 Feb 2009 09:57:43 +0000 (01:57 -0800)
committer Fiona Glaser <fiona@x264.com>
Mon, 9 Feb 2009 10:32:28 +0000 (02:32 -0800)
common/x86/quant-a.asm

index d1b39919abc4b0f60f69f89cacb6e5b8296ec188..a013e538817e2027320fe3e52606a617b5a1a546 100644 (file)
@@ -820,17 +820,17 @@ cglobal x264_coeff_last16_%1, 1,3
 %ifndef ARCH_X86_64
 cglobal x264_coeff_last64_%1, 1, 5-mmsize/16
     pxor m2, m2
-    LAST_MASK r1d, r0, r4d
-    LAST_MASK r2d, r0+32, r4d
-    shl r2d, 16
-    or  r1d, r2d
     LAST_MASK r2d, r0+64, r4d
     LAST_MASK r3d, r0+96, r4d
     shl r3d, 16
     or  r2d, r3d
-    not r1d
     xor r2d, -1
     jne .secondhalf
+    LAST_MASK r1d, r0, r4d
+    LAST_MASK r3d, r0+32, r4d
+    shl r3d, 16
+    or  r1d, r3d
+    not r1d
     LAST eax, r1d, 0x1f
     RET
 .secondhalf: