From: Simon Pilgrim Date: Thu, 28 Feb 2019 10:53:58 +0000 (+0000) Subject: [X86][AVX] Fold vf64 concat_vectors(movddup(x),movddup(x)) -> broadcast(x) X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=e6ae1b850432c6b7f9e740b2612e9272bea0fd19;p=llvm [X86][AVX] Fold vf64 concat_vectors(movddup(x),movddup(x)) -> broadcast(x) git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@355078 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp index 460c95a25ed..76f65782907 100644 --- a/lib/Target/X86/X86ISelLowering.cpp +++ b/lib/Target/X86/X86ISelLowering.cpp @@ -41777,6 +41777,8 @@ static SDValue combineConcatVectorOps(const SDLoc &DL, MVT VT, ArrayRef Ops, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const X86Subtarget &Subtarget) { + assert(Subtarget.hasAVX() && "AVX assumed for concat_vectors"); + if (llvm::all_of(Ops, [](SDValue Op) { return Op.isUndef(); })) return DAG.getUNDEF(VT); @@ -41811,8 +41813,16 @@ static SDValue combineConcatVectorOps(const SDLoc &DL, MVT VT, Op0.getOpcode() == X86ISD::SUBV_BROADCAST) return DAG.getNode(Op0.getOpcode(), DL, VT, Op0.getOperand(0)); + // concat_vectors(movddup(x),movddup(x)) -> broadcast(x) + if (Op0.getOpcode() == X86ISD::MOVDDUP && VT == MVT::v4f64 && + (Subtarget.hasAVX2() || MayFoldLoad(Op0.getOperand(0)))) + return DAG.getNode(X86ISD::VBROADCAST, DL, VT, + DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, MVT::f64, + Op0.getOperand(0), + DAG.getIntPtrConstant(0, DL))); + // concat_vectors(scalar_to_vector(x),scalar_to_vector(x)) -> broadcast(x) - if (Op0.getOpcode() == ISD::SCALAR_TO_VECTOR && Subtarget.hasAVX() && + if (Op0.getOpcode() == ISD::SCALAR_TO_VECTOR && (Subtarget.hasAVX2() || (VT.getScalarSizeInBits() >= 32 && MayFoldLoad(Op0.getOperand(0)))) && Op0.getOperand(0).getValueType() == VT.getScalarType()) diff --git a/test/CodeGen/X86/widened-broadcast.ll b/test/CodeGen/X86/widened-broadcast.ll index ae4f901b157..b43c8a4649f 100644 --- a/test/CodeGen/X86/widened-broadcast.ll +++ b/test/CodeGen/X86/widened-broadcast.ll @@ -43,21 +43,10 @@ define <8 x float> @load_splat_8f32_4f32_01010101(<4 x float>* %ptr) nounwind uw ; SSE42-NEXT: movapd %xmm0, %xmm1 ; SSE42-NEXT: retq ; -; AVX1-LABEL: load_splat_8f32_4f32_01010101: -; AVX1: # %bb.0: # %entry -; AVX1-NEXT: vmovddup {{.*#+}} xmm0 = mem[0,0] -; AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 -; AVX1-NEXT: retq -; -; AVX2-LABEL: load_splat_8f32_4f32_01010101: -; AVX2: # %bb.0: # %entry -; AVX2-NEXT: vbroadcastsd (%rdi), %ymm0 -; AVX2-NEXT: retq -; -; AVX512-LABEL: load_splat_8f32_4f32_01010101: -; AVX512: # %bb.0: # %entry -; AVX512-NEXT: vbroadcastsd (%rdi), %ymm0 -; AVX512-NEXT: retq +; AVX-LABEL: load_splat_8f32_4f32_01010101: +; AVX: # %bb.0: # %entry +; AVX-NEXT: vbroadcastsd (%rdi), %ymm0 +; AVX-NEXT: retq entry: %ld = load <4 x float>, <4 x float>* %ptr %ret = shufflevector <4 x float> %ld, <4 x float> undef, <8 x i32>