[Alignment][NFC] Instructions::getLoadStoreAlignment

author Guillaume Chatelet <gchatelet@google.com>

Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)

committer Guillaume Chatelet <gchatelet@google.com>

Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)
author Guillaume Chatelet <gchatelet@google.com>
Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)
committer Guillaume Chatelet <gchatelet@google.com>
Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)
diff --git a/include/llvm/IR/Instructions.h b/include/llvm/IR/Instructions.h

index eaaf50646462086bf7c4ddd439e3899d5a677930..1e29d2cd361d1dee6eba63fa32b8b978fde0865d 100644 (file)
--- a/include/llvm/IR/Instructions.h
+++ b/include/llvm/IR/Instructions.h
@@ -5283,12 +5283,12 @@ inline Value *getPointerOperand(Value *V) {
  }
  
  /// A helper function that returns the alignment of load or store instruction.
-inline unsigned getLoadStoreAlignment(Value *I) {
+inline MaybeAlign getLoadStoreAlignment(Value *I) {
    assert((isa<LoadInst>(I) || isa<StoreInst>(I)) &&
           "Expected Load or Store instruction");
    if (auto *LI = dyn_cast<LoadInst>(I))
-    return LI->getAlignment();
-  return cast<StoreInst>(I)->getAlignment();
+    return MaybeAlign(LI->getAlignment());
+  return MaybeAlign(cast<StoreInst>(I)->getAlignment());
  }
  
  /// A helper function that returns the address space of the pointer operand of
diff --git a/lib/Transforms/Vectorize/LoopVectorizationLegality.cpp b/lib/Transforms/Vectorize/LoopVectorizationLegality.cpp

index 0a20ab71dfaaa917fd6d72f7f0bd98e8ee3dad9f..f43842be535744a70e38a9beb3d79a4b077019ca 100644 (file)
--- a/lib/Transforms/Vectorize/LoopVectorizationLegality.cpp
+++ b/lib/Transforms/Vectorize/LoopVectorizationLegality.cpp
@@ -741,9 +741,9 @@ bool LoopVectorizationLegality::canVectorizeInstrs() {
            // Arbitrarily try a vector of 2 elements.
            Type *VecTy = VectorType::get(T, /*NumElements=*/2);
            assert(VecTy && "did not find vectorized version of stored type");
-          unsigned Alignment = getLoadStoreAlignment(ST);
+          const MaybeAlign Alignment = getLoadStoreAlignment(ST);
            assert(Alignment && "Alignment should be set");
-          if (!TTI->isLegalNTStore(VecTy, Align(Alignment))) {
+          if (!TTI->isLegalNTStore(VecTy, *Alignment)) {
              reportVectorizationFailure(
                  "nontemporal store instruction cannot be vectorized",
                  "nontemporal store instruction cannot be vectorized",
@@ -758,9 +758,9 @@ bool LoopVectorizationLegality::canVectorizeInstrs() {
            // supported on the target (arbitrarily try a vector of 2 elements).
            Type *VecTy = VectorType::get(I.getType(), /*NumElements=*/2);
            assert(VecTy && "did not find vectorized version of load type");
-          unsigned Alignment = getLoadStoreAlignment(LD);
+          const MaybeAlign Alignment = getLoadStoreAlignment(LD);
            assert(Alignment && "Alignment should be set");
-          if (!TTI->isLegalNTLoad(VecTy, Align(Alignment))) {
+          if (!TTI->isLegalNTLoad(VecTy, *Alignment)) {
              reportVectorizationFailure(
                  "nontemporal load instruction cannot be vectorized",
                  "nontemporal load instruction cannot be vectorized",
diff --git a/lib/Transforms/Vectorize/LoopVectorize.cpp b/lib/Transforms/Vectorize/LoopVectorize.cpp

index 51d0b47714407f495d5d5386318c29e3fa3ec085..8f0bf70f873cf5264f5ca6e51ab08c8b06d3064c 100644 (file)
--- a/lib/Transforms/Vectorize/LoopVectorize.cpp
+++ b/lib/Transforms/Vectorize/LoopVectorize.cpp
@@ -1190,16 +1190,16 @@ public:
  
    /// Returns true if the target machine supports masked store operation
    /// for the given \p DataType and kind of access to \p Ptr.
-  bool isLegalMaskedStore(Type *DataType, Value *Ptr, unsigned Alignment) {
+  bool isLegalMaskedStore(Type *DataType, Value *Ptr, MaybeAlign Alignment) {
      return Legal->isConsecutivePtr(Ptr) &&
-           TTI.isLegalMaskedStore(DataType, MaybeAlign(Alignment));
+           TTI.isLegalMaskedStore(DataType, Alignment);
    }
  
    /// Returns true if the target machine supports masked load operation
    /// for the given \p DataType and kind of access to \p Ptr.
-  bool isLegalMaskedLoad(Type *DataType, Value *Ptr, unsigned Alignment) {
+  bool isLegalMaskedLoad(Type *DataType, Value *Ptr, MaybeAlign Alignment) {
      return Legal->isConsecutivePtr(Ptr) &&
-           TTI.isLegalMaskedLoad(DataType, MaybeAlign(Alignment));
+           TTI.isLegalMaskedLoad(DataType, Alignment);
    }
  
    /// Returns true if the target machine supports masked scatter operation
@@ -2359,12 +2359,11 @@ void InnerLoopVectorizer::vectorizeMemoryInstruction(Instruction *Instr,
    Type *ScalarDataTy = getMemInstValueType(Instr);
    Type *DataTy = VectorType::get(ScalarDataTy, VF);
    Value *Ptr = getLoadStorePointerOperand(Instr);
-  unsigned Alignment = getLoadStoreAlignment(Instr);
    // An alignment of 0 means target abi alignment. We need to use the scalar's
    // target abi alignment in such a case.
    const DataLayout &DL = Instr->getModule()->getDataLayout();
-  if (!Alignment)
-    Alignment = DL.getABITypeAlignment(ScalarDataTy);
+  const Align Alignment =
+      DL.getValueOrABITypeAlignment(getLoadStoreAlignment(Instr), ScalarDataTy);
    unsigned AddressSpace = getLoadStoreAddressSpace(Instr);
  
    // Determine if the pointer operand of the access is either consecutive or
@@ -2428,8 +2427,8 @@ void InnerLoopVectorizer::vectorizeMemoryInstruction(Instruction *Instr,
        if (CreateGatherScatter) {
          Value *MaskPart = isMaskRequired ? Mask[Part] : nullptr;
          Value *VectorGep = getOrCreateVectorValue(Ptr, Part);
-        NewSI = Builder.CreateMaskedScatter(StoredVal, VectorGep, Alignment,
-                                            MaskPart);
+        NewSI = Builder.CreateMaskedScatter(StoredVal, VectorGep,
+                                            Alignment.value(), MaskPart);
        } else {
          if (Reverse) {
            // If we store to reverse consecutive memory locations, then we need
@@ -2440,10 +2439,11 @@ void InnerLoopVectorizer::vectorizeMemoryInstruction(Instruction *Instr,
          }
          auto *VecPtr = CreateVecPtr(Part, Ptr);
          if (isMaskRequired)
-          NewSI = Builder.CreateMaskedStore(StoredVal, VecPtr, Alignment,
-                                            Mask[Part]);
+          NewSI = Builder.CreateMaskedStore(StoredVal, VecPtr,
+                                            Alignment.value(), Mask[Part]);
          else
-          NewSI = Builder.CreateAlignedStore(StoredVal, VecPtr, Alignment);
+          NewSI =
+              Builder.CreateAlignedStore(StoredVal, VecPtr, Alignment.value());
        }
        addMetadata(NewSI, SI);
      }
@@ -2458,18 +2458,18 @@ void InnerLoopVectorizer::vectorizeMemoryInstruction(Instruction *Instr,
      if (CreateGatherScatter) {
        Value *MaskPart = isMaskRequired ? Mask[Part] : nullptr;
        Value *VectorGep = getOrCreateVectorValue(Ptr, Part);
-      NewLI = Builder.CreateMaskedGather(VectorGep, Alignment, MaskPart,
+      NewLI = Builder.CreateMaskedGather(VectorGep, Alignment.value(), MaskPart,
                                           nullptr, "wide.masked.gather");
        addMetadata(NewLI, LI);
      } else {
        auto *VecPtr = CreateVecPtr(Part, Ptr);
        if (isMaskRequired)
-        NewLI = Builder.CreateMaskedLoad(VecPtr, Alignment, Mask[Part],
+        NewLI = Builder.CreateMaskedLoad(VecPtr, Alignment.value(), Mask[Part],
                                           UndefValue::get(DataTy),
                                           "wide.masked.load");
        else
-        NewLI =
-            Builder.CreateAlignedLoad(DataTy, VecPtr, Alignment, "wide.load");
+        NewLI = Builder.CreateAlignedLoad(DataTy, VecPtr, Alignment.value(),
+                                          "wide.load");
  
        // Add metadata to the load, but setVectorValue to the reverse shuffle.
        addMetadata(NewLI, LI);
@@ -4553,7 +4553,6 @@ bool LoopVectorizationCostModel::isScalarWithPredication(Instruction *I, unsigne
        return false;
      auto *Ptr = getLoadStorePointerOperand(I);
      auto *Ty = getMemInstValueType(I);
-    unsigned Alignment = getLoadStoreAlignment(I);
      // We have already decided how to vectorize this instruction, get that
      // result.
      if (VF > 1) {
@@ -4562,6 +4561,7 @@ bool LoopVectorizationCostModel::isScalarWithPredication(Instruction *I, unsigne
               "Widening decision should be ready at this moment");
        return WideningDecision == CM_Scalarize;
      }
+    const MaybeAlign Alignment = getLoadStoreAlignment(I);
      return isa<LoadInst>(I) ?
          !(isLegalMaskedLoad(Ty, Ptr, Alignment) || isLegalMaskedGather(Ty))
        : !(isLegalMaskedStore(Ty, Ptr, Alignment) || isLegalMaskedScatter(Ty));
@@ -4607,9 +4607,9 @@ bool LoopVectorizationCostModel::interleavedAccessCanBeWidened(Instruction *I,
           "Masked interleave-groups for predicated accesses are not enabled.");
  
    auto *Ty = getMemInstValueType(I);
-  unsigned Alignment = getLoadStoreAlignment(I);
-  return isa<LoadInst>(I) ? TTI.isLegalMaskedLoad(Ty, MaybeAlign(Alignment))
-                          : TTI.isLegalMaskedStore(Ty, MaybeAlign(Alignment));
+  const MaybeAlign Alignment = getLoadStoreAlignment(I);
+  return isa<LoadInst>(I) ? TTI.isLegalMaskedLoad(Ty, Alignment)
+                          : TTI.isLegalMaskedStore(Ty, Alignment);
  }
  
  bool LoopVectorizationCostModel::memoryInstructionCanBeWidened(Instruction *I,
@@ -5731,7 +5731,6 @@ unsigned LoopVectorizationCostModel::getMemInstScalarizationCost(Instruction *I,
    Type *ValTy = getMemInstValueType(I);
    auto SE = PSE.getSE();
  
-  unsigned Alignment = getLoadStoreAlignment(I);
    unsigned AS = getLoadStoreAddressSpace(I);
    Value *Ptr = getLoadStorePointerOperand(I);
    Type *PtrTy = ToVectorTy(Ptr->getType(), VF);
@@ -5745,9 +5744,9 @@ unsigned LoopVectorizationCostModel::getMemInstScalarizationCost(Instruction *I,
  
    // Don't pass *I here, since it is scalar but will actually be part of a
    // vectorized loop where the user of it is a vectorized instruction.
-  Cost += VF *
-          TTI.getMemoryOpCost(I->getOpcode(), ValTy->getScalarType(), Alignment,
-                              AS);
+  const MaybeAlign Alignment = getLoadStoreAlignment(I);
+  Cost += VF * TTI.getMemoryOpCost(I->getOpcode(), ValTy->getScalarType(),
+                                   Alignment ? Alignment->value() : 0, AS);
  
    // Get the overhead of the extractelement and insertelement instructions
    // we might create due to scalarization.
@@ -5772,18 +5771,20 @@ unsigned LoopVectorizationCostModel::getConsecutiveMemOpCost(Instruction *I,
                                                               unsigned VF) {
    Type *ValTy = getMemInstValueType(I);
    Type *VectorTy = ToVectorTy(ValTy, VF);
-  unsigned Alignment = getLoadStoreAlignment(I);
    Value *Ptr = getLoadStorePointerOperand(I);
    unsigned AS = getLoadStoreAddressSpace(I);
    int ConsecutiveStride = Legal->isConsecutivePtr(Ptr);
  
    assert((ConsecutiveStride == 1 || ConsecutiveStride == -1) &&
           "Stride should be 1 or -1 for consecutive memory access");
+  const MaybeAlign Alignment = getLoadStoreAlignment(I);
    unsigned Cost = 0;
    if (Legal->isMaskRequired(I))
-    Cost += TTI.getMaskedMemoryOpCost(I->getOpcode(), VectorTy, Alignment, AS);
+    Cost += TTI.getMaskedMemoryOpCost(I->getOpcode(), VectorTy,
+                                      Alignment ? Alignment->value() : 0, AS);
    else
-    Cost += TTI.getMemoryOpCost(I->getOpcode(), VectorTy, Alignment, AS, I);
+    Cost += TTI.getMemoryOpCost(I->getOpcode(), VectorTy,
+                                Alignment ? Alignment->value() : 0, AS, I);
  
    bool Reverse = ConsecutiveStride < 0;
    if (Reverse)
@@ -5795,33 +5796,37 @@ unsigned LoopVectorizationCostModel::getUniformMemOpCost(Instruction *I,
                                                           unsigned VF) {
    Type *ValTy = getMemInstValueType(I);
    Type *VectorTy = ToVectorTy(ValTy, VF);
-  unsigned Alignment = getLoadStoreAlignment(I);
+  const MaybeAlign Alignment = getLoadStoreAlignment(I);
    unsigned AS = getLoadStoreAddressSpace(I);
    if (isa<LoadInst>(I)) {
      return TTI.getAddressComputationCost(ValTy) +
-           TTI.getMemoryOpCost(Instruction::Load, ValTy, Alignment, AS) +
+           TTI.getMemoryOpCost(Instruction::Load, ValTy,
+                               Alignment ? Alignment->value() : 0, AS) +
             TTI.getShuffleCost(TargetTransformInfo::SK_Broadcast, VectorTy);
    }
    StoreInst *SI = cast<StoreInst>(I);
  
    bool isLoopInvariantStoreValue = Legal->isUniform(SI->getValueOperand());
    return TTI.getAddressComputationCost(ValTy) +
-         TTI.getMemoryOpCost(Instruction::Store, ValTy, Alignment, AS) +
-         (isLoopInvariantStoreValue ? 0 : TTI.getVectorInstrCost(
-                                               Instruction::ExtractElement,
-                                               VectorTy, VF - 1));
+         TTI.getMemoryOpCost(Instruction::Store, ValTy,
+                             Alignment ? Alignment->value() : 0, AS) +
+         (isLoopInvariantStoreValue
+              ? 0
+              : TTI.getVectorInstrCost(Instruction::ExtractElement, VectorTy,
+                                       VF - 1));
  }
  
  unsigned LoopVectorizationCostModel::getGatherScatterCost(Instruction *I,
                                                            unsigned VF) {
    Type *ValTy = getMemInstValueType(I);
    Type *VectorTy = ToVectorTy(ValTy, VF);
-  unsigned Alignment = getLoadStoreAlignment(I);
+  const MaybeAlign Alignment = getLoadStoreAlignment(I);
    Value *Ptr = getLoadStorePointerOperand(I);
  
    return TTI.getAddressComputationCost(VectorTy) +
           TTI.getGatherScatterOpCost(I->getOpcode(), VectorTy, Ptr,
-                                    Legal->isMaskRequired(I), Alignment);
+                                    Legal->isMaskRequired(I),
+                                    Alignment ? Alignment->value() : 0);
  }
  
  unsigned LoopVectorizationCostModel::getInterleaveGroupCost(Instruction *I,
@@ -5868,11 +5873,12 @@ unsigned LoopVectorizationCostModel::getMemoryInstructionCost(Instruction *I,
    // moment.
    if (VF == 1) {
      Type *ValTy = getMemInstValueType(I);
-    unsigned Alignment = getLoadStoreAlignment(I);
+    const MaybeAlign Alignment = getLoadStoreAlignment(I);
      unsigned AS = getLoadStoreAddressSpace(I);
  
      return TTI.getAddressComputationCost(ValTy) +
-           TTI.getMemoryOpCost(I->getOpcode(), ValTy, Alignment, AS, I);
+           TTI.getMemoryOpCost(I->getOpcode(), ValTy,
+                               Alignment ? Alignment->value() : 0, AS, I);
    }
    return getWideningCost(I, VF);
  }
author	Guillaume Chatelet <gchatelet@google.com>
	Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)
committer	Guillaume Chatelet <gchatelet@google.com>
	Mon, 21 Oct 2019 14:49:28 +0000 (14:49 +0000)
include/llvm/IR/Instructions.h		patch \| blob \| history
lib/Transforms/Vectorize/LoopVectorizationLegality.cpp		patch \| blob \| history
lib/Transforms/Vectorize/LoopVectorize.cpp		patch \| blob \| history