[X86] EltsFromConsecutiveLoads - early out for non-byte sized memory (PR42909)
authorSimon Pilgrim <llvm-dev@redking.me.uk>
Wed, 7 Aug 2019 12:41:59 +0000 (12:41 +0000)
committerSimon Pilgrim <llvm-dev@redking.me.uk>
Wed, 7 Aug 2019 12:41:59 +0000 (12:41 +0000)
Don't attempt to merge loads for types that aren't modulo 8-bits.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@368165 91177308-0d34-0410-b5e6-96231b3b80d8

lib/Target/X86/X86ISelLowering.cpp
test/CodeGen/X86/pr42909.ll [new file with mode: 0644]

index 3a2fca7de7138c696e1f4305936b8bbb0e34f6ce..d85d6bc2020b245879ccded6c66d5ce3701475c3 100644 (file)
@@ -7631,6 +7631,9 @@ static SDValue EltsFromConsecutiveLoads(EVT VT, ArrayRef<SDValue> Elts,
                                         const SDLoc &DL, SelectionDAG &DAG,
                                         const X86Subtarget &Subtarget,
                                         bool isAfterLegalize) {
+  if ((VT.getScalarSizeInBits() % 8) != 0)
+    return SDValue();
+
   unsigned NumElems = Elts.size();
 
   int LastLoadedElt = -1;
diff --git a/test/CodeGen/X86/pr42909.ll b/test/CodeGen/X86/pr42909.ll
new file mode 100644 (file)
index 0000000..afa9fe9
--- /dev/null
@@ -0,0 +1,21 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=corei7 -x86-experimental-vector-widening-legalization=1 | FileCheck %s
+
+define void @autogen_SD31033(i16* %a0) {
+; CHECK-LABEL: autogen_SD31033:
+; CHECK:       # %bb.0: # %BB
+; CHECK-NEXT:    .p2align 4, 0x90
+; CHECK-NEXT:  .LBB0_1: # %CF
+; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
+; CHECK-NEXT:    jmp .LBB0_1
+BB:
+  %L5 = load i16, i16* %a0
+  %I8 = insertelement <4 x i16> zeroinitializer, i16 %L5, i32 1
+  %Tr = trunc <4 x i16> %I8 to <4 x i1>
+  %Shuff28 = shufflevector <4 x i1> zeroinitializer, <4 x i1> %Tr, <4 x i32> <i32 undef, i32 3, i32 5, i32 undef>
+  br label %CF
+
+CF:                                               ; preds = %CF, %BB
+  %E42 = extractelement <4 x i1> %Shuff28, i32 3
+  br label %CF
+}