[Pytorch Profiler] Introduce scopes to enableProfiler (#62417)

author Kimish Patel <kimishpatel@fb.com>

Sat, 14 Aug 2021 04:37:57 +0000 (21:37 -0700)

committer Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>

Sat, 14 Aug 2021 04:40:15 +0000 (21:40 -0700)
author Kimish Patel <kimishpatel@fb.com>
Sat, 14 Aug 2021 04:37:57 +0000 (21:37 -0700)
committer Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>
Sat, 14 Aug 2021 04:40:15 +0000 (21:40 -0700)
diff --git a/test/cpp/jit/test_misc.cpp b/test/cpp/jit/test_misc.cpp

index 5ee8816..8ecedd3 100644 (file)
--- a/test/cpp/jit/test_misc.cpp
+++ b/test/cpp/jit/test_misc.cpp
@@ -2505,6 +2505,76 @@ TEST(RecordDebugHandles, Basic) {
    ASSERT_EQ(my_events, 2);
  }
  
+TEST(RecordDebugHandles, ScopedCallbacks) {
+  // Baseline, no scope filter: profiling tensor ops must record events.
+  torch::autograd::profiler::prepareProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU});
+  torch::autograd::profiler::enableProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU});
+
+  {
+    auto a = torch::rand({128, 128});
+    auto b = torch::rand({128, 128});
+    auto c = a + b;
+  }
+  auto profiler_results_ptr = torch::autograd::profiler::disableProfiler();
+  ASSERT_TRUE(profiler_results_ptr->events().size() > 0);
+
+  // USER_SCOPE filter only: the same tensor ops must record no events.
+  torch::autograd::profiler::prepareProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU});
+  torch::autograd::profiler::enableProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU},
+      {at::RecordScope::USER_SCOPE});
+  {
+    auto a = torch::rand({128, 128});
+    auto b = torch::rand({128, 128});
+    auto c = a + b;
+  }
+  profiler_results_ptr = torch::autograd::profiler::disableProfiler();
+  ASSERT_TRUE(profiler_results_ptr->events().size() == 0);
+
+  torch::autograd::profiler::prepareProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU});
+  torch::autograd::profiler::enableProfiler(
+      torch::autograd::profiler::ProfilerConfig(
+          torch::autograd::profiler::ProfilerState::KINETO, false, false),
+      {torch::autograd::profiler::ActivityType::CPU},
+      {at::RecordScope::USER_SCOPE});
+  {
+    RECORD_USER_SCOPE_WITH_DEBUG_HANDLE_AND_INPUTS("my_function", 42, {});
+    auto a = torch::rand({128, 128});
+    auto b = torch::rand({128, 128});
+    auto c = a + b;
+  }
+  {
+    RECORD_USER_SCOPE_WITH_INPUTS("not_my_function", {});
+    auto a = torch::rand({128, 128});
+    auto b = torch::rand({128, 128});
+    auto c = a + b;
+  }
+  profiler_results_ptr = torch::autograd::profiler::disableProfiler();
+  const auto& kineto_events = profiler_results_ptr->events();
+  for (const auto& e : kineto_events) {
+    if (e.name() == "my_function") {
+      ASSERT_EQ(e.debugHandle(), 42); // handle given to the macro above
+    } else if (e.name() == "not_my_function") {
+      ASSERT_EQ(e.debugHandle(), -1); // scope recorded without a handle
+    }
+  }
+  ASSERT_TRUE(profiler_results_ptr->events().size() == 2);
+}
+
  TEST(IValueKWargsTest, Basic) {
    const auto text = R"(
      def foo(a : int, b : int, c : int = 4):
diff --git a/torch/csrc/autograd/init.cpp b/torch/csrc/autograd/init.cpp

index dc51241..2eacbf1 100644 (file)
--- a/torch/csrc/autograd/init.cpp
+++ b/torch/csrc/autograd/init.cpp
@@ -18,6 +18,7 @@
  #include <c10/core/ScalarType.h>
  
  #include <set>
+#include <unordered_set>
  
  struct DisableTorchDispatch {
    DisableTorchDispatch() : guard_(c10::DispatchKey::Python) {
@@ -223,7 +224,11 @@ PyObject* THPAutograd_initExtension(PyObject* _unused, PyObject *unused) {
  #endif // USE_KINETO
      ;
  
-  m.def("_enable_profiler", enableProfiler);
+  m.def("_enable_profiler",
+        &enableProfiler,
+        py::arg("config"),
+        py::arg("activities"),
+        py::arg("scopes") = std::unordered_set<at::RecordScope>());
    m.def("_disable_profiler", disableProfiler);
    m.def("_prepare_profiler", prepareProfiler);
  
diff --git a/torch/csrc/autograd/profiler_kineto.cpp b/torch/csrc/autograd/profiler_kineto.cpp

index e92461a..526813d 100644 (file)
--- a/torch/csrc/autograd/profiler_kineto.cpp
+++ b/torch/csrc/autograd/profiler_kineto.cpp
@@ -287,7 +287,7 @@ KinetoThreadLocalState* getProfilerTLSState() {
    return static_cast<KinetoThreadLocalState*>(state);
  }
  
-void pushProfilingCallbacks() {
+void pushProfilingCallbacks(const std::unordered_set<at::RecordScope>& scopes) {
    auto state_ptr = getProfilerTLSState();
    TORCH_INTERNAL_ASSERT(state_ptr, "Expected profiler state set");
    auto handle = at::addThreadLocalCallback(at::RecordFunctionCallback(
@@ -388,7 +388,8 @@ void pushProfilingCallbacks() {
          }
        })
      .needsInputs(state_ptr->config().report_input_shapes)
-    .needsIds(true));
+    .needsIds(true)
+    .scopes(scopes));
    state_ptr->setCallbackHandle(handle);
  }
  
@@ -497,7 +498,8 @@ void prepareProfiler(
  
  void enableProfiler(
      const ProfilerConfig& config,
-    const std::set<ActivityType>& activities) {
+    const std::set<ActivityType>& activities,
+    const std::unordered_set<at::RecordScope>& scopes) {
    if (config.state != ProfilerState::NVTX) {
      TORCH_CHECK(
          config.state == ProfilerState::KINETO ||
@@ -514,7 +516,7 @@ void enableProfiler(
    c10::ThreadLocalDebugInfo::_push(c10::DebugInfoKind::PROFILER_STATE, state);
  
    if (activities.count(ActivityType::CPU) || config.state == ProfilerState::NVTX) {
-    pushProfilingCallbacks();
+    pushProfilingCallbacks(scopes);
    }
  
  #ifdef USE_KINETO
diff --git a/torch/csrc/autograd/profiler_kineto.h b/torch/csrc/autograd/profiler_kineto.h

index 8a878a0..310554a 100644 (file)
--- a/torch/csrc/autograd/profiler_kineto.h
+++ b/torch/csrc/autograd/profiler_kineto.h
@@ -331,7 +331,8 @@ struct TORCH_API ProfilerResult {
  
  TORCH_API void enableProfiler(
      const ProfilerConfig& config,
-    const std::set<ActivityType>& activities);
+    const std::set<ActivityType>& activities,
+    const std::unordered_set<at::RecordScope>& scopes = {});
  
  TORCH_API std::unique_ptr<ProfilerResult> disableProfiler();
author	Kimish Patel <kimishpatel@fb.com>
	Sat, 14 Aug 2021 04:37:57 +0000 (21:37 -0700)
committer	Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>
	Sat, 14 Aug 2021 04:40:15 +0000 (21:40 -0700)
test/cpp/jit/test_misc.cpp		patch \| blob \| history
torch/csrc/autograd/init.cpp		patch \| blob \| history
torch/csrc/autograd/profiler_kineto.cpp		patch \| blob \| history
torch/csrc/autograd/profiler_kineto.h		patch \| blob \| history