sched: add throttled time stat for throttled children

author Josh Don <joshdon@google.com>

Tue, 20 Jun 2023 18:32:47 +0000 (11:32 -0700)

committer Peter Zijlstra <peterz@infradead.org>

Thu, 13 Jul 2023 13:21:49 +0000 (15:21 +0200)
author Josh Don <joshdon@google.com>
Tue, 20 Jun 2023 18:32:47 +0000 (11:32 -0700)
committer Peter Zijlstra <peterz@infradead.org>
Thu, 13 Jul 2023 13:21:49 +0000 (15:21 +0200)
diff --git a/include/linux/cgroup-defs.h b/include/linux/cgroup-defs.h

index 8a0d546..ae20dbb 100644 (file)
--- a/include/linux/cgroup-defs.h
+++ b/include/linux/cgroup-defs.h
@@ -661,6 +661,8 @@ struct cgroup_subsys {
         void (*css_rstat_flush)(struct cgroup_subsys_state *css, int cpu);
         int (*css_extra_stat_show)(struct seq_file *seq,
                                    struct cgroup_subsys_state *css);
+       int (*css_local_stat_show)(struct seq_file *seq,
+                                  struct cgroup_subsys_state *css);
  
         int (*can_attach)(struct cgroup_taskset *tset);
         void (*cancel_attach)(struct cgroup_taskset *tset);
diff --git a/kernel/cgroup/cgroup.c b/kernel/cgroup/cgroup.c

index bfe3cd8..4e3ee13 100644 (file)
--- a/kernel/cgroup/cgroup.c
+++ b/kernel/cgroup/cgroup.c
@@ -3685,6 +3685,36 @@ static int cpu_stat_show(struct seq_file *seq, void *v)
         return ret;
  }
  
+/*
+ * Print the local stats of subsystem @ssid for @cgrp into @seq.
+ *
+ * Nothing is printed and 0 is returned when the subsystem provides no
+ * ->css_local_stat_show() callback, or when cgroup_tryget_css() returns
+ * NULL for @cgrp.  Otherwise the callback's return value is passed through.
+ */
+static int __maybe_unused cgroup_local_stat_show(struct seq_file *seq,
+                                                struct cgroup *cgrp, int ssid)
+{
+       struct cgroup_subsys *subsys = cgroup_subsys[ssid];
+       struct cgroup_subsys_state *css = NULL;
+       int rc;
+
+       /* Only look the css up if there is a callback to hand it to. */
+       if (subsys->css_local_stat_show)
+               css = cgroup_tryget_css(cgrp, subsys);
+       if (!css)
+               return 0;
+
+       rc = subsys->css_local_stat_show(seq, css);
+       /* Pairs with the cgroup_tryget_css() above. */
+       css_put(css);
+
+       return rc;
+}
+
+/*
+ * seq_show handler for the "cpu.stat.local" base file.
+ *
+ * With CONFIG_CGROUP_SCHED the cpu controller's local stats for the cgroup
+ * behind @seq are printed via cgroup_local_stat_show(); without it the file
+ * shows nothing and 0 is returned.  @v is unused.
+ */
+static int cpu_local_stat_show(struct seq_file *seq, void *v)
+{
+       struct cgroup __maybe_unused *cg = seq_css(seq)->cgroup;
+
+#ifdef CONFIG_CGROUP_SCHED
+       return cgroup_local_stat_show(seq, cg, cpu_cgrp_id);
+#else
+       return 0;
+#endif
+}
+
  #ifdef CONFIG_PSI
  static int cgroup_io_pressure_show(struct seq_file *seq, void *v)
  {
@@ -5235,6 +5265,10 @@ static struct cftype cgroup_base_files[] = {
                 .name = "cpu.stat",
                 .seq_show = cpu_stat_show,
         },
+       {
+               .name = "cpu.stat.local",
+               .seq_show = cpu_local_stat_show,
+       },
         { }     /* terminate */
  };
  
diff --git a/kernel/sched/core.c b/kernel/sched/core.c

index c52c2eb..2291f9d 100644 (file)
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -11139,6 +11139,27 @@ static int cpu_cfs_stat_show(struct seq_file *sf, void *v)
  
         return 0;
  }
+
+/*
+ * Sum throttled_clock_self_time over the cfs_rq of @tg on every possible
+ * CPU and return the total.  Each per-CPU counter is sampled once with
+ * READ_ONCE().
+ */
+static u64 throttled_time_self(struct task_group *tg)
+{
+       u64 sum = 0;
+       int cpu;
+
+       for_each_possible_cpu(cpu) {
+               struct cfs_rq *cfs_rq = tg->cfs_rq[cpu];
+
+               sum += READ_ONCE(cfs_rq->throttled_clock_self_time);
+       }
+
+       return sum;
+}
+
+/*
+ * seq_show handler for the legacy "stat.local" file.
+ *
+ * Prints a single "throttled_time" line holding the unscaled total from
+ * throttled_time_self() for the task group behind @sf.  @v is unused.
+ * Always returns 0.
+ */
+static int cpu_cfs_local_stat_show(struct seq_file *sf, void *v)
+{
+       struct cgroup_subsys_state *css = seq_css(sf);
+       u64 self_time = throttled_time_self(css_tg(css));
+
+       seq_printf(sf, "throttled_time %llu\n", self_time);
+
+       return 0;
+}
  #endif /* CONFIG_CFS_BANDWIDTH */
  #endif /* CONFIG_FAIR_GROUP_SCHED */
  
@@ -11215,6 +11236,10 @@ static struct cftype cpu_legacy_files[] = {
                 .name = "stat",
                 .seq_show = cpu_cfs_stat_show,
         },
+       {
+               .name = "stat.local",
+               .seq_show = cpu_cfs_local_stat_show,
+       },
  #endif
  #ifdef CONFIG_RT_GROUP_SCHED
         {
@@ -11271,6 +11296,24 @@ static int cpu_extra_stat_show(struct seq_file *sf,
         return 0;
  }
  
+/*
+ * ->css_local_stat_show() callback of the cpu controller.
+ *
+ * With CONFIG_CFS_BANDWIDTH, prints one "throttled_usec" line for the task
+ * group of @css: the total from throttled_time_self() divided by
+ * NSEC_PER_USEC.  Without it nothing is printed.  Always returns 0.
+ */
+static int cpu_local_stat_show(struct seq_file *sf,
+                              struct cgroup_subsys_state *css)
+{
+#ifdef CONFIG_CFS_BANDWIDTH
+       u64 self_usec = throttled_time_self(css_tg(css));
+
+       /* do_div() leaves the quotient in its first argument. */
+       do_div(self_usec, NSEC_PER_USEC);
+       seq_printf(sf, "throttled_usec %llu\n", self_usec);
+#endif
+       return 0;
+}
+
  #ifdef CONFIG_FAIR_GROUP_SCHED
  static u64 cpu_weight_read_u64(struct cgroup_subsys_state *css,
                                struct cftype *cft)
@@ -11449,6 +11492,7 @@ struct cgroup_subsys cpu_cgrp_subsys = {
         .css_released   = cpu_cgroup_css_released,
         .css_free       = cpu_cgroup_css_free,
         .css_extra_stat_show = cpu_extra_stat_show,
+       .css_local_stat_show = cpu_local_stat_show,
  #ifdef CONFIG_RT_GROUP_SCHED
         .can_attach     = cpu_cgroup_can_attach,
  #endif
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index 51ccae7..159b202 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -4878,8 +4878,12 @@ enqueue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
                         list_add_leaf_cfs_rq(cfs_rq);
                 } else {
  #ifdef CONFIG_CFS_BANDWIDTH
+                       struct rq *rq = rq_of(cfs_rq);
+
                         if (cfs_rq_throttled(cfs_rq) && !cfs_rq->throttled_clock)
-                               cfs_rq->throttled_clock = rq_clock(rq_of(cfs_rq));
+                               cfs_rq->throttled_clock = rq_clock(rq);
+                       if (!cfs_rq->throttled_clock_self)
+                               cfs_rq->throttled_clock_self = rq_clock(rq);
  #endif
                 }
         }
@@ -5384,6 +5388,17 @@ static int tg_unthrottle_up(struct task_group *tg, void *data)
                 /* Add cfs_rq with load or one or more already running entities to the list */
                 if (!cfs_rq_is_decayed(cfs_rq))
                         list_add_leaf_cfs_rq(cfs_rq);
+
+               if (cfs_rq->throttled_clock_self) {
+                       u64 delta = rq_clock(rq) - cfs_rq->throttled_clock_self;
+
+                       cfs_rq->throttled_clock_self = 0;
+
+                       if (SCHED_WARN_ON((s64)delta < 0))
+                               delta = 0;
+
+                       cfs_rq->throttled_clock_self_time += delta;
+               }
         }
  
         return 0;
@@ -5398,6 +5413,10 @@ static int tg_throttle_down(struct task_group *tg, void *data)
         if (!cfs_rq->throttle_count) {
                 cfs_rq->throttled_clock_pelt = rq_clock_pelt(rq);
                 list_del_leaf_cfs_rq(cfs_rq);
+
+               SCHED_WARN_ON(cfs_rq->throttled_clock_self);
+               if (cfs_rq->nr_running)
+                       cfs_rq->throttled_clock_self = rq_clock(rq);
         }
         cfs_rq->throttle_count++;
  
diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h

index e93e006..1dcea9b 100644 (file)
--- a/kernel/sched/sched.h
+++ b/kernel/sched/sched.h
@@ -636,6 +636,8 @@ struct cfs_rq {
         u64                     throttled_clock;
         u64                     throttled_clock_pelt;
         u64                     throttled_clock_pelt_time;
+       u64                     throttled_clock_self;
+       u64                     throttled_clock_self_time;
         int                     throttled;
         int                     throttle_count;
         struct list_head        throttled_list;
author	Josh Don <joshdon@google.com>
	Tue, 20 Jun 2023 18:32:47 +0000 (11:32 -0700)
committer	Peter Zijlstra <peterz@infradead.org>
	Thu, 13 Jul 2023 13:21:49 +0000 (15:21 +0200)
include/linux/cgroup-defs.h		patch | blob | history
kernel/cgroup/cgroup.c		patch | blob | history
kernel/sched/core.c		patch | blob | history
kernel/sched/fair.c		patch | blob | history
kernel/sched/sched.h		patch | blob | history