From 264f13aeaf52c7c8c38a35ab781561c4692e251e Mon Sep 17 00:00:00 2001 From: Loren Merritt Date: Sun, 2 Mar 2008 02:27:45 +0000 Subject: [PATCH] remove x86_64 predict_8x8_ddl_mmxext because sse2 is faster even on amd git-svn-id: svn://svn.videolan.org/x264/trunk@744 df754926-b1dd-0310-bc7b-ec298dee348c --- common/amd64/predict-a.asm | 32 -------------------------------- common/i386/predict-c.c | 2 +- 2 files changed, 1 insertion(+), 33 deletions(-) diff --git a/common/amd64/predict-a.asm b/common/amd64/predict-a.asm index caecde3a..bdbbedce 100644 --- a/common/amd64/predict-a.asm +++ b/common/amd64/predict-a.asm @@ -204,38 +204,6 @@ cglobal predict_8x8_dc_left_mmxext STORE8x8 mm0, mm0 ret -;----------------------------------------------------------------------------- -; void predict_8x8_ddl_mmxext( uint8_t *src, uint8_t *edge ) -;----------------------------------------------------------------------------- -cglobal predict_8x8_ddl_mmxext - movq mm5, [parm2q+16] - movq mm2, [parm2q+17] - movq mm3, [parm2q+23] - movq mm4, [parm2q+25] - movq mm1, mm5 - psllq mm1, 8 - PRED8x8_LOWPASS mm0, mm1, mm2, mm5, mm7 - PRED8x8_LOWPASS mm1, mm3, mm4, [parm2q+24], mm6 - -%assign Y 7 -%rep 6 - movq [parm1q+Y*FDEC_STRIDE], mm1 - movq mm2, mm0 - psllq mm1, 8 - psrlq mm2, 56 - psllq mm0, 8 - por mm1, mm2 -%assign Y (Y-1) -%endrep - movq [parm1q+Y*FDEC_STRIDE], mm1 - psllq mm1, 8 - psrlq mm0, 56 - por mm1, mm0 -%assign Y (Y-1) - movq [parm1q+Y*FDEC_STRIDE], mm1 - - ret - ;----------------------------------------------------------------------------- ; void predict_8x8_ddl_sse2( uint8_t *src, uint8_t *edge ) ;----------------------------------------------------------------------------- diff --git a/common/i386/predict-c.c b/common/i386/predict-c.c index 63f48307..8ff531a2 100644 --- a/common/i386/predict-c.c +++ b/common/i386/predict-c.c @@ -538,9 +538,9 @@ void x264_predict_8x8_init_mmx( int cpu, x264_predict8x8_t pf[12] ) pf[I_PRED_8x8_DC] = predict_8x8_dc_mmxext; pf[I_PRED_8x8_DC_TOP] = predict_8x8_dc_top_mmxext; pf[I_PRED_8x8_DC_LEFT]= predict_8x8_dc_left_mmxext; - pf[I_PRED_8x8_DDL] = predict_8x8_ddl_mmxext; pf[I_PRED_8x8_VR] = predict_8x8_vr_mmxext; #ifdef ARCH_X86 + pf[I_PRED_8x8_DDL] = predict_8x8_ddl_mmxext; pf[I_PRED_8x8_DDR] = predict_8x8_ddr_mmxext; #endif if( !(cpu&X264_CPU_SSE2) ) -- 2.40.0