[CUDA] Conservatively mark inline asm as convergent.

author Justin Lebar <jlebar@google.com>

Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)

committer Justin Lebar <jlebar@google.com>

Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)
author Justin Lebar <jlebar@google.com>
Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)
committer Justin Lebar <jlebar@google.com>
Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)
diff --git a/lib/CodeGen/CGStmt.cpp b/lib/CodeGen/CGStmt.cpp

index 6945ec9ef6d0897b71c50dc2a02c78077325c2a9..ff70bbc866f478cf889f6b638d8a38279008054e 100644 (file)
--- a/lib/CodeGen/CGStmt.cpp
+++ b/lib/CodeGen/CGStmt.cpp
@@ -2054,6 +2054,14 @@ void CodeGenFunction::EmitAsmStmt(const AsmStmt &S) {
                                            llvm::ConstantAsMetadata::get(Loc)));
    }
  
+  if (getLangOpts().CUDA && getLangOpts().CUDAIsDevice) {
+    // Conservatively, mark all inline asm blocks in CUDA as convergent
+    // (meaning, they may call an intrinsically convergent op, such as bar.sync,
+    // and so can't have certain optimizations applied around them).
+    Result->addAttribute(llvm::AttributeSet::FunctionIndex,
+                         llvm::Attribute::Convergent);
+  }
+
    // Extract all of the register value results from the asm.
    std::vector<llvm::Value*> RegResults;
    if (ResultRegTypes.size() == 1) {
diff --git a/test/CodeGenCUDA/convergent.cu b/test/CodeGenCUDA/convergent.cu

index d2e75f7e2fa56e7815ae48560e40f099214fd012..6827c57d29fbe7fdc962b264893a6d4a44b252ec 100644 (file)
--- a/test/CodeGenCUDA/convergent.cu
+++ b/test/CodeGenCUDA/convergent.cu
@@ -25,6 +25,11 @@ __host__ __device__ void baz();
  __host__ __device__ void bar() {
    // DEVICE: call void @_Z3bazv() [[CALL_ATTR:#[0-9]+]]
    baz();
+  // DEVICE: call i32 asm "trap;", "=l"() [[ASM_ATTR:#[0-9]+]]
+  int x;
+  asm ("trap;" : "=l"(x));
+  // DEVICE: call void asm sideeffect "trap;", ""() [[ASM_ATTR:#[0-9]+]]
+  asm volatile ("trap;");
  }
  
  // DEVICE: declare void @_Z3bazv() [[BAZ_ATTR:#[0-9]+]]
@@ -32,6 +37,7 @@ __host__ __device__ void bar() {
  // DEVICE-SAME: convergent
  // DEVICE-SAME: }
  // DEVICE: attributes [[CALL_ATTR]] = { convergent }
+// DEVICE: attributes [[ASM_ATTR]] = { convergent
  
  // HOST: declare void @_Z3bazv() [[BAZ_ATTR:#[0-9]+]]
  // HOST: attributes [[BAZ_ATTR]] = {
author	Justin Lebar <jlebar@google.com>
	Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)
committer	Justin Lebar <jlebar@google.com>
	Tue, 31 May 2016 21:27:13 +0000 (21:27 +0000)
lib/CodeGen/CGStmt.cpp		patch | blob | history
test/CodeGenCUDA/convergent.cu		patch | blob | history