From 1b09aae82aba335d1ff48b93da8f3cf5c783b72e Mon Sep 17 00:00:00 2001 From: Dean Michael Berris Date: Thu, 13 Oct 2016 23:56:54 +0000 Subject: [PATCH] [compiler-rt][XRay] Support tail call sleds Summary: This change depends on D23986 which adds tail call-specific sleds. For now we treat them first as normal exits, and in the future leave room for implementing this as a different kind of log entry. The reason for deferring the change is so that we can keep the naive logging implementation more accurate without additional complexity for reading the log. The accuracy is gained in effectively interpreting call stacks like: A() B() C() Which when tail-call merged will end up not having any exit entries for A() nor B(), but effectively in turn can be reasoned about as: A() B() C() Although we lose the fact that A() had called B() then had called C() with the naive approach, a later iteration that adds the explicit tail call entries would be a change in the log format and thus necessitate a version change for the header. We can do this later to have a chance at releasing some tools (in D21987) that are able to handle the naive log format, then support higher version numbers of the log format too. Reviewers: echristo, kcc, rSerge, majnemer Subscribers: mehdi_amini, llvm-commits, dberris Differential Revision: https://reviews.llvm.org/D23988 llvm-svn: 284178 --- compiler-rt/include/xray/xray_interface.h | 2 +- compiler-rt/lib/xray/xray_arm.cc | 7 ++++++ compiler-rt/lib/xray/xray_interface.cc | 3 +++ compiler-rt/lib/xray/xray_interface_internal.h | 7 +++--- compiler-rt/lib/xray/xray_x86_64.cc | 33 ++++++++++++++++++++++++++ 5 files changed, 48 insertions(+), 4 deletions(-) diff --git a/compiler-rt/include/xray/xray_interface.h b/compiler-rt/include/xray/xray_interface.h index 22f137d..680fcfd 100644 --- a/compiler-rt/include/xray/xray_interface.h +++ b/compiler-rt/include/xray/xray_interface.h @@ -18,7 +18,7 @@ extern "C" { -enum XRayEntryType { ENTRY = 0, EXIT = 1 }; +enum XRayEntryType { ENTRY = 0, EXIT = 1, TAIL = 2 }; // Provide a function to invoke for when instrumentation points are hit. This is // a user-visible control surface that overrides the default implementation. The diff --git a/compiler-rt/lib/xray/xray_arm.cc b/compiler-rt/lib/xray/xray_arm.cc index d1b953e..4c19803 100644 --- a/compiler-rt/lib/xray/xray_arm.cc +++ b/compiler-rt/lib/xray/xray_arm.cc @@ -127,4 +127,11 @@ bool patchFunctionExit(const bool Enable, const uint32_t FuncId, return patchSled(Enable, FuncId, Sled, __xray_FunctionExit); } +bool patchFunctionTailExit(const bool Enable, const uint32_t FuncId, + const XRaySledEntry &Sled) { + // FIXME: In the future we'd need to distinguish between non-tail exits and + // tail exits for better information preservation. + return patchSled(Enable, FuncId, Sled, __xray_FunctionExit); +} + } // namespace __xray diff --git a/compiler-rt/lib/xray/xray_interface.cc b/compiler-rt/lib/xray/xray_interface.cc index ec393b9..fb49ff3 100644 --- a/compiler-rt/lib/xray/xray_interface.cc +++ b/compiler-rt/lib/xray/xray_interface.cc @@ -174,6 +174,9 @@ XRayPatchingStatus ControlPatching(bool Enable) { case XRayEntryType::EXIT: Success = patchFunctionExit(Enable, FuncId, Sled); break; + case XRayEntryType::TAIL: + Success = patchFunctionTailExit(Enable, FuncId, Sled); + break; default: Report("Unsupported sled kind: %d", int(Sled.Kind)); continue; diff --git a/compiler-rt/lib/xray/xray_interface_internal.h b/compiler-rt/lib/xray/xray_interface_internal.h index fe58f8a..24a5acc 100644 --- a/compiler-rt/lib/xray/xray_interface_internal.h +++ b/compiler-rt/lib/xray/xray_interface_internal.h @@ -48,10 +48,11 @@ struct XRaySledMap { size_t Entries; }; -bool patchFunctionEntry(const bool Enable, const uint32_t FuncId, +bool patchFunctionEntry(bool Enable, uint32_t FuncId, const XRaySledEntry &Sled); -bool patchFunctionExit(const bool Enable, const uint32_t FuncId, - const XRaySledEntry &Sled); +bool patchFunctionExit(bool Enable, uint32_t FuncId, const XRaySledEntry &Sled); +bool patchFunctionTailExit(bool Enable, uint32_t FuncId, + const XRaySledEntry &Sled); } // namespace __xray diff --git a/compiler-rt/lib/xray/xray_x86_64.cc b/compiler-rt/lib/xray/xray_x86_64.cc index 0443c5e..c4fead9 100644 --- a/compiler-rt/lib/xray/xray_x86_64.cc +++ b/compiler-rt/lib/xray/xray_x86_64.cc @@ -111,4 +111,37 @@ bool patchFunctionExit(const bool Enable, const uint32_t FuncId, return true; } +bool patchFunctionTailExit(const bool Enable, const uint32_t FuncId, + const XRaySledEntry &Sled) { + // Here we do the dance of replacing the tail call sled with a similar + // sequence as the entry sled, but calls the exit sled instead, so we can + // treat tail call exits as if they were normal exits. + // + // FIXME: In the future we'd need to distinguish between non-tail exits and + // tail exits for better information preservation. + int64_t TrampolineOffset = reinterpret_cast(__xray_FunctionExit) - + (static_cast(Sled.Address) + 11); + if (TrampolineOffset < MinOffset || TrampolineOffset > MaxOffset) { + Report("XRay Exit trampoline (%p) too far from sled (%p); distance = " + "%ld\n", + __xray_FunctionExit, reinterpret_cast(Sled.Address), + TrampolineOffset); + return false; + } + if (Enable) { + *reinterpret_cast(Sled.Address + 2) = FuncId; + *reinterpret_cast(Sled.Address + 6) = CallOpCode; + *reinterpret_cast(Sled.Address + 7) = TrampolineOffset; + std::atomic_store_explicit( + reinterpret_cast *>(Sled.Address), MovR10Seq, + std::memory_order_release); + } else { + std::atomic_store_explicit( + reinterpret_cast *>(Sled.Address), Jmp9Seq, + std::memory_order_release); + // FIXME: Write out the nops still? + } + return true; +} + } // namespace __xray -- 2.7.4