perf/x86: Track pmu in per-CPU cpu_hw_events
author Kan Liang <kan.liang@linux.intel.com>
Mon, 12 Apr 2021 14:30:43 +0000 (07:30 -0700)
committer Peter Zijlstra <peterz@infradead.org>
Mon, 19 Apr 2021 18:03:24 +0000 (20:03 +0200)
Some platforms, e.g. Alder Lake, have a hybrid architecture: a single
package may contain more than one type of CPU, and the PMU capabilities
differ between the CPU types. Perf will register a dedicated PMU for
each type of CPU.

Add a 'pmu' pointer to struct cpu_hw_events to track the dedicated PMU
of the current CPU.

The current x86_get_pmu() uses the global 'pmu', which is broken on a
hybrid platform. Modify it to return the 'pmu' of the specified CPU.
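
As a hedged illustration (not part of the patch): with the new
signature, a caller running in a per-CPU context resolves its own PMU
via smp_processor_id(), e.g.

	/*
	 * Illustrative sketch only: set a capability on the PMU that
	 * owns the current CPU rather than on a single global PMU.
	 */
	struct pmu *cpu_pmu = x86_get_pmu(smp_processor_id());

	cpu_pmu->capabilities |= PERF_PMU_CAP_EXTENDED_REGS;

while code that walks CPUs, such as release_lbr_buffers() below, passes
the CPU number explicitly.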

Initialize the per-CPU 'pmu' pointer with the global 'pmu', so nothing
changes for non-hybrid platforms.
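
To make the "nothing changes" claim concrete, a hedged sketch (the
helper name is made up and assumes it lives in core.c next to the
static 'pmu'; it is not in the patch): on a non-hybrid system the
per-CPU field is never rewritten after the static initialization, so
every CPU still resolves to the one global 'pmu'.

	/*
	 * Illustrative only: on non-hybrid systems each CPU's
	 * cpu_hw_events.pmu still points at the single global pmu,
	 * so x86_get_pmu(cpu) returns what x86_get_pmu() used to.
	 */
	static void example_check_single_pmu(void)
	{
		int cpu;

		for_each_possible_cpu(cpu)
			WARN_ON(x86_get_pmu(cpu) != &pmu);
	}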

is_x86_event() will be updated for hybrid platforms in the later patch
("perf/x86: Register hybrid PMUs"); for non-hybrid platforms, nothing
is changed here.

Suggested-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Kan Liang <kan.liang@linux.intel.com>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Link: https://lkml.kernel.org/r/1618237865-33448-4-git-send-email-kan.liang@linux.intel.com
arch/x86/events/core.c
arch/x86/events/intel/core.c
arch/x86/events/intel/ds.c
arch/x86/events/intel/lbr.c
arch/x86/events/perf_event.h

arch/x86/events/core.c
index dd9f3c2f7d058d87f8b07785d26553049417a2b0..a49a8bd6267cde659deeacca51f2484e595d8695 100644
 #include "perf_event.h"
 
 struct x86_pmu x86_pmu __read_mostly;
+static struct pmu pmu;
 
 DEFINE_PER_CPU(struct cpu_hw_events, cpu_hw_events) = {
        .enabled = 1,
+       .pmu = &pmu,
 };
 
 DEFINE_STATIC_KEY_FALSE(rdpmc_never_available_key);
@@ -724,16 +726,23 @@ void x86_pmu_enable_all(int added)
        }
 }
 
-static struct pmu pmu;
-
 static inline int is_x86_event(struct perf_event *event)
 {
        return event->pmu == &pmu;
 }
 
-struct pmu *x86_get_pmu(void)
+struct pmu *x86_get_pmu(unsigned int cpu)
 {
-       return &pmu;
+       struct cpu_hw_events *cpuc = &per_cpu(cpu_hw_events, cpu);
+
+       /*
+        * All CPUs of this hybrid type have been offlined.
+        * x86_get_pmu() should not be invoked.
+        */
+       if (WARN_ON_ONCE(!cpuc->pmu))
+               return &pmu;
+
+       return cpuc->pmu;
 }
 /*
  * Event scheduler state:
arch/x86/events/intel/core.c
index 7bbb5bb98d8cd327efdccaf7308209b7cb35de62..f116c63c723ce71a7ef5b4bdf9ac6487fd398cd9 100644
@@ -4876,7 +4876,7 @@ static void update_tfa_sched(void *ignored)
         * and if so force schedule out for all event types all contexts
         */
        if (test_bit(3, cpuc->active_mask))
-               perf_pmu_resched(x86_get_pmu());
+               perf_pmu_resched(x86_get_pmu(smp_processor_id()));
 }
 
 static ssize_t show_sysctl_tfa(struct device *cdev,
arch/x86/events/intel/ds.c
index 7ebae18264033c73293d0293504fd3439303c83e..1bfea8c7c679ab291b7a5b3fbdbcb05c7285abce 100644
@@ -2192,7 +2192,7 @@ void __init intel_ds_init(void)
                                        PERF_SAMPLE_TIME;
                                x86_pmu.flags |= PMU_FL_PEBS_ALL;
                                pebs_qual = "-baseline";
-                               x86_get_pmu()->capabilities |= PERF_PMU_CAP_EXTENDED_REGS;
+                               x86_get_pmu(smp_processor_id())->capabilities |= PERF_PMU_CAP_EXTENDED_REGS;
                        } else {
                                /* Only basic record supported */
                                x86_pmu.large_pebs_flags &=
@@ -2207,7 +2207,7 @@ void __init intel_ds_init(void)
 
                        if (x86_pmu.intel_cap.pebs_output_pt_available) {
                                pr_cont("PEBS-via-PT, ");
-                               x86_get_pmu()->capabilities |= PERF_PMU_CAP_AUX_OUTPUT;
+                               x86_get_pmu(smp_processor_id())->capabilities |= PERF_PMU_CAP_AUX_OUTPUT;
                        }
 
                        break;
arch/x86/events/intel/lbr.c
index 21890dacfcfee5f7406e5ac5b72980188ccb3997..bb4486c4155a9685e28435b828e8140c58aabf2e 100644
@@ -705,7 +705,7 @@ void intel_pmu_lbr_add(struct perf_event *event)
 
 void release_lbr_buffers(void)
 {
-       struct kmem_cache *kmem_cache = x86_get_pmu()->task_ctx_cache;
+       struct kmem_cache *kmem_cache;
        struct cpu_hw_events *cpuc;
        int cpu;
 
@@ -714,6 +714,7 @@ void release_lbr_buffers(void)
 
        for_each_possible_cpu(cpu) {
                cpuc = per_cpu_ptr(&cpu_hw_events, cpu);
+               kmem_cache = x86_get_pmu(cpu)->task_ctx_cache;
                if (kmem_cache && cpuc->lbr_xsave) {
                        kmem_cache_free(kmem_cache, cpuc->lbr_xsave);
                        cpuc->lbr_xsave = NULL;
@@ -1609,7 +1610,7 @@ void intel_pmu_lbr_init_hsw(void)
        x86_pmu.lbr_sel_mask = LBR_SEL_MASK;
        x86_pmu.lbr_sel_map  = hsw_lbr_sel_map;
 
-       x86_get_pmu()->task_ctx_cache = create_lbr_kmem_cache(size, 0);
+       x86_get_pmu(smp_processor_id())->task_ctx_cache = create_lbr_kmem_cache(size, 0);
 
        if (lbr_from_signext_quirk_needed())
                static_branch_enable(&lbr_from_quirk_key);
@@ -1629,7 +1630,7 @@ __init void intel_pmu_lbr_init_skl(void)
        x86_pmu.lbr_sel_mask = LBR_SEL_MASK;
        x86_pmu.lbr_sel_map  = hsw_lbr_sel_map;
 
-       x86_get_pmu()->task_ctx_cache = create_lbr_kmem_cache(size, 0);
+       x86_get_pmu(smp_processor_id())->task_ctx_cache = create_lbr_kmem_cache(size, 0);
 
        /*
         * SW branch filter usage:
@@ -1726,7 +1727,7 @@ static bool is_arch_lbr_xsave_available(void)
 
 void __init intel_pmu_arch_lbr_init(void)
 {
-       struct pmu *pmu = x86_get_pmu();
+       struct pmu *pmu = x86_get_pmu(smp_processor_id());
        union cpuid28_eax eax;
        union cpuid28_ebx ebx;
        union cpuid28_ecx ecx;
arch/x86/events/perf_event.h
index 54a340e42a22214b4f4db9af7fb2f167ca929131..da947d3d14a527ba1a49a2f89026df1a8f733986 100644
@@ -326,6 +326,8 @@ struct cpu_hw_events {
        int                             n_pair; /* Large increment events */
 
        void                            *kfree_on_online[X86_PERF_KFREE_MAX];
+
+       struct pmu                      *pmu;
 };
 
 #define __EVENT_CONSTRAINT_RANGE(c, e, n, m, w, o, f) {        \
@@ -904,7 +906,7 @@ static struct perf_pmu_events_ht_attr event_attr_##v = {            \
        .event_str_ht   = ht,                                           \
 }
 
-struct pmu *x86_get_pmu(void);
+struct pmu *x86_get_pmu(unsigned int cpu);
 extern struct x86_pmu x86_pmu __read_mostly;
 
 static __always_inline struct x86_perf_task_context_opt *task_context_opt(void *ctx)