granicus.if.org Git - llvm/commitdiff
[XRay][CodeGen][PowerPC] Fix tail exit codegen for XRay in PPC
author Dean Michael Berris <dberris@google.com>
Fri, 8 Sep 2017 01:47:56 +0000 (01:47 +0000)
committer Dean Michael Berris <dberris@google.com>
Fri, 8 Sep 2017 01:47:56 +0000 (01:47 +0000)
Summary:
This fixes code-gen for XRay in PPC. The regression wasn't caught by
codegen tests, which we add in this change.

What happened was the following:

- For tail exits, we used to unconditionally prepend the returns/exits
  with a pseudo-instruction that gets lowered to the instrumentation
  sled (and leave the actual return/exit instruction as-is).
- Changes to the XRay instrumentation pass caused the tail exits to
  suddenly also emit the tail exit pseudo-instruction, because a return
  instruction that was also a call instruction was treated as a tail
  exit instruction.
- None of the tests caught the regression either due to non-existent
  tests, or the tests being disabled/removed for continuous breakage.

This change re-introduces some of the basic tests and verifies that
we're back to a state that allows the back-end to generate appropriate
XRay instrumented binaries for PPC in the presence of tail exits.

Reviewers: echristo, timshen

Subscribers: nemanjai, kbarton, llvm-commits

Differential Revision: https://reviews.llvm.org/D37570

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@312772 91177308-0d34-0410-b5e6-96231b3b80d8

lib/CodeGen/XRayInstrumentation.cpp
lib/Target/PowerPC/PPCAsmPrinter.cpp
test/CodeGen/PowerPC/xray-attribute-instrumentation.ll [new file with mode: 0644]
test/CodeGen/PowerPC/xray-tail-call-hidden.ll [new file with mode: 0644]
test/CodeGen/PowerPC/xray-tail-call-sled.ll [new file with mode: 0644]

index 0b4c6e551667b4e9149589f917aee4f537d9118a..e6b65825f5b5dc1d197928000b733660747c7d58 100644 (file)
@@ -14,8 +14,8 @@
 //
 //===---------------------------------------------------------------------===//
 
-#include "llvm/ADT/SmallVector.h"
 #include "llvm/ADT/STLExtras.h"
+#include "llvm/ADT/SmallVector.h"
 #include "llvm/ADT/Triple.h"
 #include "llvm/CodeGen/MachineBasicBlock.h"
 #include "llvm/CodeGen/MachineDominators.h"
@@ -109,22 +109,13 @@ void XRayInstrumentation::replaceRetWithPatchableRet(
 
 void XRayInstrumentation::prependRetWithPatchableExit(
     MachineFunction &MF, const TargetInstrInfo *TII) {
-  for (auto &MBB : MF) {
-    for (auto &T : MBB.terminators()) {
-      unsigned Opc = 0;
+  for (auto &MBB : MF)
+    for (auto &T : MBB.terminators())
       if (T.isReturn()) {
-        Opc = TargetOpcode::PATCHABLE_FUNCTION_EXIT;
-      }
-      if (TII->isTailCall(T)) {
-        Opc = TargetOpcode::PATCHABLE_TAIL_CALL;
-      }
-      if (Opc != 0) {
-        // Prepend the return instruction with PATCHABLE_FUNCTION_EXIT or
-        //   PATCHABLE_TAIL_CALL .
-        BuildMI(MBB, T, T.getDebugLoc(), TII->get(Opc));
+        // Prepend the return instruction with PATCHABLE_FUNCTION_EXIT.
+        BuildMI(MBB, T, T.getDebugLoc(),
+                TII->get(TargetOpcode::PATCHABLE_FUNCTION_EXIT));
       }
-    }
-  }
 }
 
 bool XRayInstrumentation::runOnMachineFunction(MachineFunction &MF) {
@@ -143,7 +134,7 @@ bool XRayInstrumentation::runOnMachineFunction(MachineFunction &MF) {
 
     // Count the number of MachineInstr`s in MachineFunction
     int64_t MICount = 0;
-    for (const auto& MBB : MF)
+    for (const auto &MBB : MF)
       MICount += MBB.size();
 
     // Check if we have a loop.
index 841b8c51446417fd9d54f5392075c9f81bd0da64..67c849b37bd8e1b10c5f999516e7ec0f3a900e10 100644 (file)
@@ -1131,6 +1131,8 @@ void PPCLinuxAsmPrinter::EmitInstruction(const MachineInstr *MI) {
     break;
   }
   case TargetOpcode::PATCHABLE_TAIL_CALL:
+    // TODO: Define a trampoline `__xray_FunctionTailExit` and differentiate a
+    // normal function exit from a tail exit.
   case TargetOpcode::PATCHABLE_RET:
     // PPC's tail call instruction, e.g. PPC::TCRETURNdi8, doesn't really
     // lower to a PPC::B instruction. The PPC::B instruction is generated
diff --git a/test/CodeGen/PowerPC/xray-attribute-instrumentation.ll b/test/CodeGen/PowerPC/xray-attribute-instrumentation.ll
new file mode 100644 (file)
index 0000000..3592499
--- /dev/null
@@ -0,0 +1,44 @@
+; RUN: llc -filetype=asm -o - -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s
+; RUN: llc -filetype=asm -o - -mtriple=powerpc64le-unknown-linux-gnu \
+; RUN:    -relocation-model=pic < %s | FileCheck %s
+
+define i32 @foo() nounwind noinline uwtable "function-instrument"="xray-always" {
+; CHECK-LABEL: .Ltmp0:
+; CHECK:              b .Ltmp1
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionEntry
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+; CHECK-LABEL: .Ltmp1:
+  ret i32 0
+; CHECK-LABEL: .Ltmp2:
+; CHECK:              blr
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionExit
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+}
+; CHECK-LABEL: xray_instr_map,"awo",@progbits,.text,unique,1
+; CHECK:      .Lxray_sleds_start0:
+; CHECK-NEXT:         .quad   .Ltmp0
+; CHECK-NEXT:         .quad   foo
+; CHECK-NEXT:         .byte   0x00
+; CHECK-NEXT:         .byte   0x01
+; CHECK-NEXT:         .byte   0x00
+; CHECK-NEXT:         .space  13
+; CHECK-NEXT:         .quad   .Ltmp2
+; CHECK-NEXT:         .quad   foo
+; CHECK-NEXT:         .byte   0x01
+; CHECK-NEXT:         .byte   0x01
+; CHECK-NEXT:         .byte   0x00
+; CHECK-NEXT:         .space  13
+; CHECK-NEXT: .Lxray_sleds_end0:
+; CHECK-LABEL: xray_fn_idx,"awo",@progbits,.text,unique,1
+; CHECK:              .p2align        4
+; CHECK-NEXT:         .quad   .Lxray_sleds_start0
+; CHECK-NEXT:         .quad   .Lxray_sleds_end0
+; CHECK-NEXT:         .text
diff --git a/test/CodeGen/PowerPC/xray-tail-call-hidden.ll b/test/CodeGen/PowerPC/xray-tail-call-hidden.ll
new file mode 100644 (file)
index 0000000..3b1cd5f
--- /dev/null
@@ -0,0 +1,26 @@
+; RUN: llc -filetype=asm -o - -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s
+
+declare hidden i32 @callee() nounwind noinline uwtable "function-instrument"="xray-always"
+
+define i32 @caller() nounwind noinline uwtable "function-instrument"="xray-always" {
+; CHECK-LABEL: .Ltmp0:
+; CHECK:              b .Ltmp1
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionEntry
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+; CHECK-LABEL: .Ltmp1:
+  %retval = tail call i32 @callee()
+  ret i32 %retval
+; CHECK-LABEL: .Ltmp2:
+; CHECK:              b callee
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionExit
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+}
+
diff --git a/test/CodeGen/PowerPC/xray-tail-call-sled.ll b/test/CodeGen/PowerPC/xray-tail-call-sled.ll
new file mode 100644 (file)
index 0000000..e8fe9db
--- /dev/null
@@ -0,0 +1,44 @@
+; RUN: llc -filetype=asm -o - -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s
+
+define i32 @callee() nounwind noinline uwtable "function-instrument"="xray-always" {
+; CHECK-LABEL: .Ltmp0:
+; CHECK:              b .Ltmp1
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionEntry
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+; CHECK-LABEL: .Ltmp1:
+  ret i32 0
+; CHECK-LABEL: .Ltmp2:
+; CHECK:              blr
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionExit
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+}
+
+define i32 @caller() nounwind noinline uwtable "function-instrument"="xray-always" {
+; CHECK-LABEL: .Ltmp3:
+; CHECK:              b .Ltmp4
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionEntry
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+; CHECK-LABEL: .Ltmp4:
+  %retval = tail call i32 @callee()
+  ret i32 %retval
+; CHECK-LABEL: .Ltmp5:
+; CHECK:              blr
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         std 0, -8(1)
+; CHECK-NEXT:         mflr 0
+; CHECK-NEXT:         bl __xray_FunctionExit
+; CHECK-NEXT:         nop
+; CHECK-NEXT:         mtlr 0
+}