[NVPTX] Only lower sin/cos to approximate instructions if unsafe math is allowed.

author Artem Belevich <tra@google.com>

Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)

committer Artem Belevich <tra@google.com>

Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)
author Artem Belevich <tra@google.com>
Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)
committer Artem Belevich <tra@google.com>
Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)
diff --git a/lib/Target/NVPTX/NVPTXISelDAGToDAG.cpp b/lib/Target/NVPTX/NVPTXISelDAGToDAG.cpp

index 43c478f4212f784bf4cf694bd88bda68bc5a1095..4f3129c0774e47b9e1b7e4a3b4c54843645d3d00 100644 (file)
--- a/lib/Target/NVPTX/NVPTXISelDAGToDAG.cpp
+++ b/lib/Target/NVPTX/NVPTXISelDAGToDAG.cpp
@@ -103,6 +103,11 @@ bool NVPTXDAGToDAGISel::allowFMA() const {
    return TL->allowFMA(*MF, OptLevel);
  }
  
+bool NVPTXDAGToDAGISel::allowUnsafeFPMath() const {
+  const NVPTXTargetLowering *TL = Subtarget->getTargetLowering();
+  return TL->allowUnsafeFPMath(*MF);
+}
+
  /// Select - Select instructions not customized! Used for
  /// expanded, promoted and normal instructions.
  void NVPTXDAGToDAGISel::Select(SDNode *N) {
diff --git a/lib/Target/NVPTX/NVPTXISelDAGToDAG.h b/lib/Target/NVPTX/NVPTXISelDAGToDAG.h

index 0591035a6aa83ad15fb74499f79af7223f00cad9..b4cbc8a3f448d357583dcf20237978b31bb841cd 100644 (file)
--- a/lib/Target/NVPTX/NVPTXISelDAGToDAG.h
+++ b/lib/Target/NVPTX/NVPTXISelDAGToDAG.h
@@ -34,6 +34,7 @@ class LLVM_LIBRARY_VISIBILITY NVPTXDAGToDAGISel : public SelectionDAGISel {
    bool usePrecSqrtF32() const;
    bool useF32FTZ() const;
    bool allowFMA() const;
+  bool allowUnsafeFPMath() const;
  
  public:
    explicit NVPTXDAGToDAGISel(NVPTXTargetMachine &tm,
diff --git a/lib/Target/NVPTX/NVPTXISelLowering.cpp b/lib/Target/NVPTX/NVPTXISelLowering.cpp

index 7a760fd38d0f6f6f2fee0c702ed68b3c79777b88..30870c6ee5949636768b573384779b013b8de26b 100644 (file)
--- a/lib/Target/NVPTX/NVPTXISelLowering.cpp
+++ b/lib/Target/NVPTX/NVPTXISelLowering.cpp
@@ -3863,27 +3863,35 @@ NVPTXTargetLowering::getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
  
  bool NVPTXTargetLowering::allowFMA(MachineFunction &MF,
                                     CodeGenOpt::Level OptLevel) const {
-  const Function *F = MF.getFunction();
-  const TargetOptions &TO = MF.getTarget().Options;
-
    // Always honor command-line argument
-  if (FMAContractLevelOpt.getNumOccurrences() > 0) {
+  if (FMAContractLevelOpt.getNumOccurrences() > 0)
      return FMAContractLevelOpt > 0;
-  } else if (OptLevel == 0) {
-    // Do not contract if we're not optimizing the code
+
+  // Do not contract if we're not optimizing the code.
+  if (OptLevel == 0)
      return false;
-  } else if (TO.AllowFPOpFusion == FPOpFusion::Fast || TO.UnsafeFPMath) {
-    // Honor TargetOptions flags that explicitly say fusion is okay
+
+  // Honor TargetOptions flags that explicitly say fusion is okay.
+  if (MF.getTarget().Options.AllowFPOpFusion == FPOpFusion::Fast)
+    return true;
+
+  return allowUnsafeFPMath(MF);
+}
+
+bool NVPTXTargetLowering::allowUnsafeFPMath(MachineFunction &MF) const {
+  // Honor TargetOptions flags that explicitly say unsafe math is okay.
+  if (MF.getTarget().Options.UnsafeFPMath)
      return true;
-  } else if (F->hasFnAttribute("unsafe-fp-math")) {
-    // Check for unsafe-fp-math=true coming from Clang
+
+  // Allow unsafe math if unsafe-fp-math attribute explicitly says so.
+  const Function *F = MF.getFunction();
+  if (F->hasFnAttribute("unsafe-fp-math")) {
      Attribute Attr = F->getFnAttribute("unsafe-fp-math");
      StringRef Val = Attr.getValueAsString();
      if (Val == "true")
        return true;
    }
  
-  // We did not have a clear indication that fusion is allowed, so assume not
    return false;
  }
  
diff --git a/lib/Target/NVPTX/NVPTXISelLowering.h b/lib/Target/NVPTX/NVPTXISelLowering.h

index e433aed7781b7d57eee1f45f103c339fab26884d..fa25fe1264a0892826316ec942ce2e6dd14ddb5f 100644 (file)
--- a/lib/Target/NVPTX/NVPTXISelLowering.h
+++ b/lib/Target/NVPTX/NVPTXISelLowering.h
@@ -511,6 +511,7 @@ public:
    getPreferredVectorAction(EVT VT) const override;
  
    bool allowFMA(MachineFunction &MF, CodeGenOpt::Level OptLevel) const;
+  bool allowUnsafeFPMath(MachineFunction &MF) const;
  
    bool isFMAFasterThanFMulAndFAdd(EVT) const override { return true; }
  
diff --git a/lib/Target/NVPTX/NVPTXInstrInfo.td b/lib/Target/NVPTX/NVPTXInstrInfo.td

index 0fbb0448e4c46089d9b2c19bdc938359f3619276..c276f177fab8b98d5f23986c21936fdeeaf5c4a2 100644 (file)
--- a/lib/Target/NVPTX/NVPTXInstrInfo.td
+++ b/lib/Target/NVPTX/NVPTXInstrInfo.td
@@ -134,6 +134,7 @@ def doMulWide      : Predicate<"doMulWide">;
  
  def allowFMA : Predicate<"allowFMA()">;
  def noFMA : Predicate<"!allowFMA()">;
+def allowUnsafeFPMath : Predicate<"allowUnsafeFPMath()">;
  
  def do_DIVF32_APPROX : Predicate<"getDivF32Level()==0">;
  def do_DIVF32_FULL : Predicate<"getDivF32Level()==1">;
@@ -949,10 +950,12 @@ defm FMA64     : FMA<"fma.rn.f64", Float64Regs, f64imm, true>;
  // sin/cos
  def SINF:  NVPTXInst<(outs Float32Regs:$dst), (ins Float32Regs:$src),
                        "sin.approx.f32 \t$dst, $src;",
-                      [(set Float32Regs:$dst, (fsin Float32Regs:$src))]>;
+                      [(set Float32Regs:$dst, (fsin Float32Regs:$src))]>,
+                      Requires<[allowUnsafeFPMath]>;
  def COSF:  NVPTXInst<(outs Float32Regs:$dst), (ins Float32Regs:$src),
                        "cos.approx.f32 \t$dst, $src;",
-                      [(set Float32Regs:$dst, (fcos Float32Regs:$src))]>;
+                      [(set Float32Regs:$dst, (fcos Float32Regs:$src))]>,
+                      Requires<[allowUnsafeFPMath]>;
  
  // Lower (frem x, y) into (sub x, (mul (floor (div x, y)) y)),
  // i.e. "poor man's fmod()"
diff --git a/test/CodeGen/NVPTX/fast-math.ll b/test/CodeGen/NVPTX/fast-math.ll

index d0a333d369ca45173e7c4586d31777c949a19c62..08b435b993f5a5a0cd6616d9fb84efe50a4b4d85 100644 (file)
--- a/test/CodeGen/NVPTX/fast-math.ll
+++ b/test/CodeGen/NVPTX/fast-math.ll
@@ -34,5 +34,22 @@ define float @fadd_ftz(float %a, float %b) #1 {
    ret float %t1
  }
  
+declare float @llvm.sin.f32(float)
+declare float @llvm.cos.f32(float)
+
+; CHECK-LABEL: fsin_approx
+; CHECK:       sin.approx.f32
+define float @fsin_approx(float %a) #0 {
+  %r = tail call float @llvm.sin.f32(float %a)
+  ret float %r
+}
+
+; CHECK-LABEL: fcos_approx
+; CHECK:       cos.approx.f32
+define float @fcos_approx(float %a) #0 {
+  %r = tail call float @llvm.cos.f32(float %a)
+  ret float %r
+}
+
  attributes #0 = { "unsafe-fp-math" = "true" }
  attributes #1 = { "nvptx-f32ftz" = "true" }
diff --git a/test/CodeGen/NVPTX/fcos-no-fast-math.ll b/test/CodeGen/NVPTX/fcos-no-fast-math.ll

new file mode 100644 (file)

index 0000000..d435c1d
--- /dev/null
+++ b/test/CodeGen/NVPTX/fcos-no-fast-math.ll
@@ -0,0 +1,14 @@
+; RUN: not llc < %s -march=nvptx -mcpu=sm_20 2>&1 | FileCheck %s
+
+; Check that we fail to select fcos without fast-math enabled
+
+declare float @llvm.cos.f32(float)
+
+; CHECK: LLVM ERROR: Cannot select: {{.*}}: f32 = fcos
+; CHECK: In function: test_fcos_safe
+define float @test_fcos_safe(float %a) #0 {
+  %r = tail call float @llvm.cos.f32(float %a)
+  ret float %r
+}
+
+attributes #0 = { "unsafe-fp-math" = "false" }
diff --git a/test/CodeGen/NVPTX/fsin-no-fast-math.ll b/test/CodeGen/NVPTX/fsin-no-fast-math.ll

new file mode 100644 (file)

index 0000000..56396b8
--- /dev/null
+++ b/test/CodeGen/NVPTX/fsin-no-fast-math.ll
@@ -0,0 +1,14 @@
+; RUN: not llc < %s -march=nvptx -mcpu=sm_20 2>&1 | FileCheck %s
+
+; Check that we fail to select fsin without fast-math enabled
+
+declare float @llvm.sin.f32(float)
+
+; CHECK: LLVM ERROR: Cannot select: {{.*}}: f32 = fsin
+; CHECK: In function: test_fsin_safe
+define float @test_fsin_safe(float %a) #0 {
+  %r = tail call float @llvm.sin.f32(float %a)
+  ret float %r
+}
+
+attributes #0 = { "unsafe-fp-math" = "false" }
author	Artem Belevich <tra@google.com>
	Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)
committer	Artem Belevich <tra@google.com>
	Fri, 13 Jan 2017 18:48:13 +0000 (18:48 +0000)
lib/Target/NVPTX/NVPTXISelDAGToDAG.cpp		patch | blob | history
lib/Target/NVPTX/NVPTXISelDAGToDAG.h		patch | blob | history
lib/Target/NVPTX/NVPTXISelLowering.cpp		patch | blob | history
lib/Target/NVPTX/NVPTXISelLowering.h		patch | blob | history
lib/Target/NVPTX/NVPTXInstrInfo.td		patch | blob | history
test/CodeGen/NVPTX/fast-math.ll		patch | blob | history
test/CodeGen/NVPTX/fcos-no-fast-math.ll	[new file with mode: 0644]	patch | blob
test/CodeGen/NVPTX/fsin-no-fast-math.ll	[new file with mode: 0644]	patch | blob