[LICM] Infer proper alignment from loads during scalar promotion

author Philip Reames <listmail@philipreames.com>

Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)

committer Philip Reames <listmail@philipreames.com>

Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)
author Philip Reames <listmail@philipreames.com>
Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)
committer Philip Reames <listmail@philipreames.com>
Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)
diff --git a/lib/Transforms/Scalar/LICM.cpp b/lib/Transforms/Scalar/LICM.cpp

index 1be0d053b7b6a45eb827922a30bf1bf789b443b4..93ee25cbfb8a45a42427c8d45b72b35a44e34ce6 100644 (file)
--- a/lib/Transforms/Scalar/LICM.cpp
+++ b/lib/Transforms/Scalar/LICM.cpp
@@ -1924,9 +1924,21 @@ bool llvm::promoteLoopAccessesToScalars(
          SawUnorderedAtomic |= Load->isAtomic();
          SawNotAtomic |= !Load->isAtomic();
  
-        if (!DereferenceableInPH)
-          DereferenceableInPH = isSafeToExecuteUnconditionally(
-              *Load, DT, CurLoop, SafetyInfo, ORE, Preheader->getTerminator());
+        unsigned InstAlignment = Load->getAlignment();
+        if (!InstAlignment)
+          InstAlignment =
+              MDL.getABITypeAlignment(Load->getType());
+
+        // Note that proving a load safe to speculate requires proving
+        // sufficient alignment at the target location.  Proving it guaranteed
+        // to execute does as well.  Thus we can increase our guaranteed
+        // alignment as well. 
+        if (!DereferenceableInPH || (InstAlignment > Alignment))
+          if (isSafeToExecuteUnconditionally(*Load, DT, CurLoop, SafetyInfo,
+                                             ORE, Preheader->getTerminator())) {
+            DereferenceableInPH = true;
+            Alignment = std::max(Alignment, InstAlignment);
+          }
        } else if (const StoreInst *Store = dyn_cast<StoreInst>(UI)) {
          // Stores *of* the pointer are not interesting, only stores *to* the
          // pointer.
@@ -1997,6 +2009,14 @@ bool llvm::promoteLoopAccessesToScalars(
    if (SawUnorderedAtomic && SawNotAtomic)
      return false;
  
+  // If we're inserting an atomic load in the preheader, we must be able to
+  // lower it.  We're only guaranteed to be able to lower naturally aligned
+  // atomics.
+  auto *SomePtrElemType = SomePtr->getType()->getPointerElementType();
+  if (SawUnorderedAtomic &&
+      Alignment < MDL.getTypeStoreSize(SomePtrElemType))
+    return false;
+
    // If we couldn't prove we can hoist the load, bail.
    if (!DereferenceableInPH)
      return false;
diff --git a/test/Transforms/LICM/promote-tls.ll b/test/Transforms/LICM/promote-tls.ll

index 3fe46e81ed9778b51819d2d39303aa0e8d09f615..db4d4c312012205ee164afb08ccd9cabfb564526 100644 (file)
--- a/test/Transforms/LICM/promote-tls.ll
+++ b/test/Transforms/LICM/promote-tls.ll
@@ -22,7 +22,7 @@ entry:
  
  for.body.lr.ph:                                   ; preds = %entry
  ; CHECK-LABEL: for.body.lr.ph:
-; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 1
+; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 4
    br label %for.header
  
  for.header:
@@ -35,7 +35,7 @@ for.header:
  
  early-exit:
  ; CHECK-LABEL: early-exit:
-; CHECK: store i32 %new1.lcssa, i32* %addr, align 1
+; CHECK: store i32 %new1.lcssa, i32* %addr, align 4
    ret i32* null
  
  for.body:
@@ -47,7 +47,7 @@ for.body:
  
  for.cond.for.end_crit_edge:                       ; preds = %for.body
  ; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK: store i32 %new.lcssa, i32* %addr, align 1
+; CHECK: store i32 %new.lcssa, i32* %addr, align 4
    %split = phi i32* [ %addr, %for.body ]
    ret i32* null
  }
@@ -62,7 +62,7 @@ entry:
  
  for.body.lr.ph:                                   ; preds = %entry
  ; CHECK-LABEL: for.body.lr.ph:
-; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 1
+; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 4
    br label %for.header
  
  for.header:
@@ -75,7 +75,7 @@ for.header:
  
  early-exit:
  ; CHECK-LABEL: early-exit:
-; CHECK: store i32 %new1.lcssa, i32* %addr, align 1
+; CHECK: store i32 %new1.lcssa, i32* %addr, align 4
    ret i32* null
  
  for.body:
@@ -87,7 +87,7 @@ for.body:
  
  for.cond.for.end_crit_edge:                       ; preds = %for.body
  ; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK: store i32 %new.lcssa, i32* %addr, align 1
+; CHECK: store i32 %new.lcssa, i32* %addr, align 4
    %split = phi i32* [ %addr, %for.body ]
    ret i32* null
  }
diff --git a/test/Transforms/LICM/scalar-promote-unwind.ll b/test/Transforms/LICM/scalar-promote-unwind.ll

index 697222d4394d0b4300670d610ceb9a90abdb9b80..5de6ae9c277707ee2a809d7beedf420d6ca781a5 100644 (file)
--- a/test/Transforms/LICM/scalar-promote-unwind.ll
+++ b/test/Transforms/LICM/scalar-promote-unwind.ll
@@ -74,7 +74,7 @@ define void @test3(i1 zeroext %y) uwtable {
  entry:
  ; CHECK-LABEL: entry:
  ; CHECK-NEXT:  %a = alloca i32
-; CHECK-NEXT:  %a.promoted = load i32, i32* %a, align 1
+; CHECK-NEXT:  %a.promoted = load i32, i32* %a, align 4
    %a = alloca i32
    br label %for.body
  
@@ -90,20 +90,18 @@ for.body:
  
  for.cond.cleanup:
  ; CHECK-LABEL: for.cond.cleanup:
-; CHECK: store i32 %add.lcssa, i32* %a, align 1
+; CHECK: store i32 %add.lcssa, i32* %a, align 4
  ; CHECK-NEXT: ret void
    ret void
  }
  
  ;; Same as test3, but with unordered atomics
-;; FIXME: doing the transform w/o alignment here is wrong since we're
-;; creating an unaligned atomic which we may not be able to lower.
  define void @test3b(i1 zeroext %y) uwtable {
  ; CHECK-LABEL: @test3
  entry:
  ; CHECK-LABEL: entry:
  ; CHECK-NEXT:  %a = alloca i32
-; CHECK-NEXT:  %a.promoted = load atomic i32, i32* %a unordered, align 1
+; CHECK-NEXT:  %a.promoted = load atomic i32, i32* %a unordered, align 4
    %a = alloca i32
    br label %for.body
  
@@ -119,7 +117,7 @@ for.body:
  
  for.cond.cleanup:
  ; CHECK-LABEL: for.cond.cleanup:
-; CHECK: store atomic i32 %add.lcssa, i32* %a unordered, align 1
+; CHECK: store atomic i32 %add.lcssa, i32* %a unordered, align 4
  ; CHECK-NEXT: ret void
    ret void
  }
author	Philip Reames <listmail@philipreames.com>
	Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)
committer	Philip Reames <listmail@philipreames.com>
	Fri, 1 Mar 2019 18:45:05 +0000 (18:45 +0000)
lib/Transforms/Scalar/LICM.cpp		patch \| blob \| history
test/Transforms/LICM/promote-tls.ll		patch \| blob \| history
test/Transforms/LICM/scalar-promote-unwind.ll		patch \| blob \| history