[SelectionDAG][X86] Enable iX SimplifyDemandedBits to vXi1 SimplifyDemandedVectorElts...

author Craig Topper <craig.topper@intel.com>

Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)

committer Craig Topper <craig.topper@intel.com>

Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)
author Craig Topper <craig.topper@intel.com>
Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)
committer Craig Topper <craig.topper@intel.com>
Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index 8b66cc471af353169ab9768f792979b879b945bf..f4438d41f65355f5d90515b606dde22345ff0af4 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -1819,9 +1819,7 @@ bool TargetLowering::SimplifyDemandedBits(
      // Bitcast from a vector using SimplifyDemanded Bits/VectorElts.
      // Demand the elt/bit if any of the original elts/bits are demanded.
      // TODO - bigendian once we have test coverage.
-    // TODO - bool vectors once SimplifyDemandedVectorElts has SETCC support.
-    if (SrcVT.isVector() && NumSrcEltBits > 1 &&
-        (BitWidth % NumSrcEltBits) == 0 &&
+    if (SrcVT.isVector() && (BitWidth % NumSrcEltBits) == 0 &&
          TLO.DAG.getDataLayout().isLittleEndian()) {
        unsigned Scale = BitWidth / NumSrcEltBits;
        unsigned NumSrcElts = SrcVT.getVectorNumElements();
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 1a986bc8ce7bf7301209a9ae1b976db81cfb431b..306b8bc1f6ac9363015a70cb535e1684039370fe 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -35380,6 +35380,26 @@ static SDValue combineBitcast(SDNode *N, SelectionDAG &DAG,
      // type, widen both sides to avoid a trip through memory.
      if ((SrcVT == MVT::v4i1 || SrcVT == MVT::v2i1) && VT.isScalarInteger() &&
          Subtarget.hasAVX512()) {
+      // Use zeros for the widening if we already have some zeroes. This can
+      // allow SimplifyDemandedBits to remove scalar ANDs that may be down
+      // stream of this.
+      // FIXME: It might make sense to detect a concat_vectors with a mix of
+      // zeroes and undef and turn it into insert_subvector for i1 vectors as
+      // a separate combine. What we can't do is canonicalize the operands of
+      // such a concat or we'll get into a loop with SimplifyDemandedBits.
+      if (N0.getOpcode() == ISD::CONCAT_VECTORS) {
+        SDValue LastOp = N0.getOperand(N0.getNumOperands() - 1);
+        if (ISD::isBuildVectorAllZeros(LastOp.getNode())) {
+          SrcVT = LastOp.getValueType();
+          unsigned NumConcats = 8 / SrcVT.getVectorNumElements();
+          SmallVector<SDValue, 4> Ops(N0->op_begin(), N0->op_end());
+          Ops.resize(NumConcats, DAG.getConstant(0, dl, SrcVT));
+          N0 = DAG.getNode(ISD::CONCAT_VECTORS, dl, MVT::v8i1, Ops);
+          N0 = DAG.getBitcast(MVT::i8, N0);
+          return DAG.getNode(ISD::TRUNCATE, dl, VT, N0);
+        }
+      }
+
        unsigned NumConcats = 8 / SrcVT.getVectorNumElements();
        SmallVector<SDValue, 4> Ops(NumConcats, DAG.getUNDEF(SrcVT));
        Ops[0] = N0;
author	Craig Topper <craig.topper@intel.com>
	Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)
committer	Craig Topper <craig.topper@intel.com>
	Fri, 23 Aug 2019 17:14:58 +0000 (17:14 +0000)
lib/CodeGen/SelectionDAG/TargetLowering.cpp		patch | blob | history
lib/Target/X86/X86ISelLowering.cpp		patch | blob | history