Merging r322106:

author Hans Wennborg <hans@hanshq.net>

Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)

committer Hans Wennborg <hans@hanshq.net>

Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)
author Hans Wennborg <hans@hanshq.net>
Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)
committer Hans Wennborg <hans@hanshq.net>
Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)
diff --git a/lib/Target/X86/X86TargetTransformInfo.cpp b/lib/Target/X86/X86TargetTransformInfo.cpp

index 223eed3048db68526b941b6d4897f1295d8c9547..967d67a84bc0294307e9afbc02880dfb6b9d9f37 100644 (file)
--- a/lib/Target/X86/X86TargetTransformInfo.cpp
+++ b/lib/Target/X86/X86TargetTransformInfo.cpp
@@ -754,7 +754,8 @@ int X86TTIImpl::getShuffleCost(TTI::ShuffleKind Kind, Type *Tp, int Index,
    // type remains the same.
    if (Kind == TTI::SK_PermuteSingleSrc && LT.first != 1) {
      MVT LegalVT = LT.second;
-    if (LegalVT.getVectorElementType().getSizeInBits() ==
+    if (LegalVT.isVector() &&
+        LegalVT.getVectorElementType().getSizeInBits() ==
              Tp->getVectorElementType()->getPrimitiveSizeInBits() &&
          LegalVT.getVectorNumElements() < Tp->getVectorNumElements()) {
  
diff --git a/test/Transforms/SLPVectorizer/X86/PR35865.ll b/test/Transforms/SLPVectorizer/X86/PR35865.ll

new file mode 100644 (file)

index 0000000..b022dd7
--- /dev/null
+++ b/test/Transforms/SLPVectorizer/X86/PR35865.ll
@@ -0,0 +1,27 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -slp-vectorizer < %s -S -o - -mtriple=x86_64-apple-macosx10.10.0 -mcpu=core2 | FileCheck %s
+
+define void @_Z10fooConvertPDv4_xS0_S0_PKS_() {
+; CHECK-LABEL: @_Z10fooConvertPDv4_xS0_S0_PKS_(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[TMP0:%.*]] = extractelement <16 x half> undef, i32 4
+; CHECK-NEXT:    [[CONV_I_4_I:%.*]] = fpext half [[TMP0]] to float
+; CHECK-NEXT:    [[TMP1:%.*]] = bitcast float [[CONV_I_4_I]] to i32
+; CHECK-NEXT:    [[VECINS_I_4_I:%.*]] = insertelement <8 x i32> undef, i32 [[TMP1]], i32 4
+; CHECK-NEXT:    [[TMP2:%.*]] = extractelement <16 x half> undef, i32 5
+; CHECK-NEXT:    [[CONV_I_5_I:%.*]] = fpext half [[TMP2]] to float
+; CHECK-NEXT:    [[TMP3:%.*]] = bitcast float [[CONV_I_5_I]] to i32
+; CHECK-NEXT:    [[VECINS_I_5_I:%.*]] = insertelement <8 x i32> [[VECINS_I_4_I]], i32 [[TMP3]], i32 5
+; CHECK-NEXT:    ret void
+;
+entry:
+  %0 = extractelement <16 x half> undef, i32 4
+  %conv.i.4.i = fpext half %0 to float
+  %1 = bitcast float %conv.i.4.i to i32
+  %vecins.i.4.i = insertelement <8 x i32> undef, i32 %1, i32 4
+  %2 = extractelement <16 x half> undef, i32 5
+  %conv.i.5.i = fpext half %2 to float
+  %3 = bitcast float %conv.i.5.i to i32
+  %vecins.i.5.i = insertelement <8 x i32> %vecins.i.4.i, i32 %3, i32 5
+  ret void
+}
author	Hans Wennborg <hans@hanshq.net>
	Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)
committer	Hans Wennborg <hans@hanshq.net>
	Wed, 17 Jan 2018 16:20:48 +0000 (16:20 +0000)
lib/Target/X86/X86TargetTransformInfo.cpp		patch | blob | history
test/Transforms/SLPVectorizer/X86/PR35865.ll	[new file with mode: 0644]	patch | blob