From: Mikael Holmen Date: Mon, 1 Apr 2019 13:48:56 +0000 (+0000) Subject: [InstCombine] Handle vector gep with scalar argument in evaluateInDifferentElementOrder X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=75216a6dbcfe5fb55039ef06a07e419fa875f4a5;p=llvm [InstCombine] Handle vector gep with scalar argument in evaluateInDifferentElementOrder This fixes PR41270. The recursive function evaluateInDifferentElementOrder expects to be called on a vector Value, so when we call it on a vector GEP's arguments, we must first check that the argument is indeed a vector. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@357385 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/Transforms/InstCombine/InstCombineVectorOps.cpp b/lib/Transforms/InstCombine/InstCombineVectorOps.cpp index 49c29fe651b..665064c4c8d 100644 --- a/lib/Transforms/InstCombine/InstCombineVectorOps.cpp +++ b/lib/Transforms/InstCombine/InstCombineVectorOps.cpp @@ -1171,7 +1171,14 @@ static Value *evaluateInDifferentElementOrder(Value *V, ArrayRef Mask) { SmallVector NewOps; bool NeedsRebuild = (Mask.size() != I->getType()->getVectorNumElements()); for (int i = 0, e = I->getNumOperands(); i != e; ++i) { - Value *V = evaluateInDifferentElementOrder(I->getOperand(i), Mask); + Value *V; + // Recursively call evaluateInDifferentElementOrder on vector arguments + // as well. E.g. GetElementPtr may have scalar operands even if the + // return value is a vector, so we need to examine the operand type. + if (I->getOperand(i)->getType()->isVectorTy()) + V = evaluateInDifferentElementOrder(I->getOperand(i), Mask); + else + V = I->getOperand(i); NewOps.push_back(V); NeedsRebuild |= (V != I->getOperand(i)); } diff --git a/test/Transforms/InstCombine/vec_gep_scalar_arg.ll b/test/Transforms/InstCombine/vec_gep_scalar_arg.ll new file mode 100644 index 00000000000..33ed7cb6a7f --- /dev/null +++ b/test/Transforms/InstCombine/vec_gep_scalar_arg.ll @@ -0,0 +1,16 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; RUN: opt -instcombine -S < %s | FileCheck %s + +define <4 x i16*> @PR41270([4 x i16]* %x) { +; CHECK-LABEL: @PR41270( +; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x [4 x i16]*> undef, [4 x i16]* [[X:%.*]], i32 0 +; CHECK-NEXT: [[TMP2:%.*]] = getelementptr inbounds [4 x i16], <4 x [4 x i16]*> [[TMP1]], i64 0, i64 3 +; CHECK-NEXT: ret <4 x i16*> [[TMP2]] +; + %ins = insertelement <4 x [4 x i16]*> undef, [4 x i16]* %x, i32 0 + %splat = shufflevector <4 x [4 x i16]*> %ins, <4 x [4 x i16]*> undef, <4 x i32> zeroinitializer + %t2 = getelementptr inbounds [4 x i16], <4 x [4 x i16]*> %splat, i32 0, i32 3 + %t3 = extractelement <4 x i16*> %t2, i32 3 + %ins2 = insertelement <4 x i16*> undef, i16* %t3, i32 0 + ret <4 x i16*> %ins2 +}