From: Martin Storsjö
Date: Thu, 13 Aug 2015 20:59:25 +0000 (+0300)
Subject: arm: Use aligned loads in x264_coeff_last15_neon
X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=d2b04a26b26d02c41ffb05cf1a605dafe9e6fa59;p=libx264

arm: Use aligned loads in x264_coeff_last15_neon

After subtracting 2, the pointer will be aligned.

checkasm timing     Cortex-A7   A8    A9
coeff_last15_c         423      375   230
coeff_last15_neon      350      420   404   (before)
coeff_last15_neon      350      400   394   (after)
---

diff --git a/common/arm/quant-a.S b/common/arm/quant-a.S
index 4b2129ab..ad8d8f84 100644
--- a/common/arm/quant-a.S
+++ b/common/arm/quant-a.S
@@ -337,10 +337,8 @@ endfunc
 function x264_coeff_last\size\()_neon
 .if \size == 15
     sub r0, r0, #2
-    vld1.64 {d0-d3}, [r0]
-.else
-    vld1.64 {d0-d3}, [r0,:128]
 .endif
+    vld1.64 {d0-d3}, [r0,:128]
     vtst.16 q0, q0
     vtst.16 q1, q1
     vshrn.u16 d0, q0, #8