[TargetLowering] add tests to show effect of setcc sub->shift; NFC

author Sanjay Patel <spatel@rotateright.com>

Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)

committer Sanjay Patel <spatel@rotateright.com>

Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)
author Sanjay Patel <spatel@rotateright.com>
Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)
committer Sanjay Patel <spatel@rotateright.com>
Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index b933f0324097e0057dc07d90f265bbc1bdc77abc..eae5a45906f1668beb1907934260b70fa67ae3c1 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -3075,7 +3075,6 @@ SDValue TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                                  DAG.getConstant(0, dl, N0.getValueType()),
                                  Cond);
            // The shift is not valid if this is a bool (i1).
-          // TODO: This transform needs evidence to justify its existence.
            if (N0.getNode()->hasOneUse() && OpVT.getScalarSizeInBits() != 1) {
              assert(N0.getOpcode() == ISD::SUB && "Unexpected operation!");
              auto &DL = DAG.getDataLayout();
diff --git a/test/CodeGen/X86/setcc-combine.ll b/test/CodeGen/X86/setcc-combine.ll

index c13d2f114cf9b3f08933780335e6d69c1445b51a..ed3dfcdd7b1d6c0f8b054403575c9ae56e0545ab 100644 (file)
--- a/test/CodeGen/X86/setcc-combine.ll
+++ b/test/CodeGen/X86/setcc-combine.ll
@@ -297,3 +297,41 @@ define i64 @sub_to_shift_to_add(i32 %x, i32 %y, i64 %s1, i64 %s2) {
    ret i64 %r
  }
  
+define <4 x float> @sub_to_shift_to_add_vec(<4 x i32> %x, <4 x i32> %y, <4 x float> %s1, <4 x float> %s2) {
+; SSE2-LABEL: sub_to_shift_to_add_vec:
+; SSE2:       # %bb.0:
+; SSE2-NEXT:    paddd %xmm1, %xmm1
+; SSE2-NEXT:    pcmpeqd %xmm0, %xmm1
+; SSE2-NEXT:    pand %xmm1, %xmm2
+; SSE2-NEXT:    pandn %xmm3, %xmm1
+; SSE2-NEXT:    por %xmm2, %xmm1
+; SSE2-NEXT:    movdqa %xmm1, %xmm0
+; SSE2-NEXT:    retq
+;
+; SSE41-LABEL: sub_to_shift_to_add_vec:
+; SSE41:       # %bb.0:
+; SSE41-NEXT:    paddd %xmm1, %xmm1
+; SSE41-NEXT:    pcmpeqd %xmm1, %xmm0
+; SSE41-NEXT:    blendvps %xmm0, %xmm2, %xmm3
+; SSE41-NEXT:    movaps %xmm3, %xmm0
+; SSE41-NEXT:    retq
+  %sub = sub <4 x i32> %x, %y
+  %cmp = icmp eq <4 x i32> %sub, %y
+  %r = select <4 x i1> %cmp, <4 x float> %s1, <4 x float> %s2
+  ret <4 x float> %r
+}
+
+define i64 @sub_constant_to_shift_to_add(i32 %x, i64 %s1, i64 %s2) {
+; CHECK-LABEL: sub_constant_to_shift_to_add:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    movq %rsi, %rax
+; CHECK-NEXT:    addl %edi, %edi
+; CHECK-NEXT:    cmpl $42, %edi
+; CHECK-NEXT:    cmovneq %rdx, %rax
+; CHECK-NEXT:    retq
+  %sub = sub i32 42, %x
+  %cmp = icmp eq i32 %sub, %x
+  %r = select i1 %cmp, i64 %s1, i64 %s2
+  ret i64 %r
+}
+
author	Sanjay Patel <spatel@rotateright.com>
	Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)
committer	Sanjay Patel <spatel@rotateright.com>
	Sat, 9 Feb 2019 17:03:59 +0000 (17:03 +0000)
lib/CodeGen/SelectionDAG/TargetLowering.cpp		patch | blob | history
test/CodeGen/X86/setcc-combine.ll		patch | blob | history