sched/fair: Move idle_balance()
author Peter Zijlstra <peterz@infradead.org>
Tue, 20 Feb 2018 10:45:47 +0000 (11:45 +0100)
committer Ingo Molnar <mingo@kernel.org>
Fri, 9 Mar 2018 06:59:25 +0000 (07:59 +0100)
We're going to want to call nohz_idle_balance() or parts thereof from
idle_balance(). Since we already have a forward declaration of
idle_balance(), move it down below nohz_idle_balance(), avoiding the
need for a forward declaration of nohz_idle_balance() itself.

Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: linux-kernel@vger.kernel.org
Signed-off-by: Ingo Molnar <mingo@kernel.org>
kernel/sched/fair.c

index d6767f5..058badc 100644
@@ -8917,120 +8917,6 @@ update_next_balance(struct sched_domain *sd, unsigned long *next_balance)
 }
 
 /*
- * idle_balance is called by schedule() if this_cpu is about to become
- * idle. Attempts to pull tasks from other CPUs.
- */
-static int idle_balance(struct rq *this_rq, struct rq_flags *rf)
-{
-       unsigned long next_balance = jiffies + HZ;
-       int this_cpu = this_rq->cpu;
-       struct sched_domain *sd;
-       int pulled_task = 0;
-       u64 curr_cost = 0;
-
-       /*
-        * We must set idle_stamp _before_ calling idle_balance(), such that we
-        * measure the duration of idle_balance() as idle time.
-        */
-       this_rq->idle_stamp = rq_clock(this_rq);
-
-       /*
-        * Do not pull tasks towards !active CPUs...
-        */
-       if (!cpu_active(this_cpu))
-               return 0;
-
-       /*
-        * This is OK, because current is on_cpu, which avoids it being picked
-        * for load-balance and preemption/IRQs are still disabled avoiding
-        * further scheduler activity on it and we're being very careful to
-        * re-start the picking loop.
-        */
-       rq_unpin_lock(this_rq, rf);
-
-       if (this_rq->avg_idle < sysctl_sched_migration_cost ||
-           !this_rq->rd->overload) {
-               rcu_read_lock();
-               sd = rcu_dereference_check_sched_domain(this_rq->sd);
-               if (sd)
-                       update_next_balance(sd, &next_balance);
-               rcu_read_unlock();
-
-               goto out;
-       }
-
-       raw_spin_unlock(&this_rq->lock);
-
-       update_blocked_averages(this_cpu);
-       rcu_read_lock();
-       for_each_domain(this_cpu, sd) {
-               int continue_balancing = 1;
-               u64 t0, domain_cost;
-
-               if (!(sd->flags & SD_LOAD_BALANCE))
-                       continue;
-
-               if (this_rq->avg_idle < curr_cost + sd->max_newidle_lb_cost) {
-                       update_next_balance(sd, &next_balance);
-                       break;
-               }
-
-               if (sd->flags & SD_BALANCE_NEWIDLE) {
-                       t0 = sched_clock_cpu(this_cpu);
-
-                       pulled_task = load_balance(this_cpu, this_rq,
-                                                  sd, CPU_NEWLY_IDLE,
-                                                  &continue_balancing);
-
-                       domain_cost = sched_clock_cpu(this_cpu) - t0;
-                       if (domain_cost > sd->max_newidle_lb_cost)
-                               sd->max_newidle_lb_cost = domain_cost;
-
-                       curr_cost += domain_cost;
-               }
-
-               update_next_balance(sd, &next_balance);
-
-               /*
-                * Stop searching for tasks to pull if there are
-                * now runnable tasks on this rq.
-                */
-               if (pulled_task || this_rq->nr_running > 0)
-                       break;
-       }
-       rcu_read_unlock();
-
-       raw_spin_lock(&this_rq->lock);
-
-       if (curr_cost > this_rq->max_idle_balance_cost)
-               this_rq->max_idle_balance_cost = curr_cost;
-
-       /*
-        * While browsing the domains, we released the rq lock, a task could
-        * have been enqueued in the meantime. Since we're not going idle,
-        * pretend we pulled a task.
-        */
-       if (this_rq->cfs.h_nr_running && !pulled_task)
-               pulled_task = 1;
-
-out:
-       /* Move the next balance forward */
-       if (time_after(this_rq->next_balance, next_balance))
-               this_rq->next_balance = next_balance;
-
-       /* Is there a task of a high priority class? */
-       if (this_rq->nr_running != this_rq->cfs.h_nr_running)
-               pulled_task = -1;
-
-       if (pulled_task)
-               this_rq->idle_stamp = 0;
-
-       rq_repin_lock(this_rq, rf);
-
-       return pulled_task;
-}
-
-/*
  * active_load_balance_cpu_stop is run by the CPU stopper. It pushes
  * running tasks off the busiest CPU onto idle CPUs. It requires at
  * least 1 task to be running on each physical CPU where possible, and
@@ -9604,6 +9490,120 @@ static bool nohz_idle_balance(struct rq *this_rq, enum cpu_idle_type idle)
 #endif /* CONFIG_NO_HZ_COMMON */
 
 /*
+ * idle_balance is called by schedule() if this_cpu is about to become
+ * idle. Attempts to pull tasks from other CPUs.
+ */
+static int idle_balance(struct rq *this_rq, struct rq_flags *rf)
+{
+       unsigned long next_balance = jiffies + HZ;
+       int this_cpu = this_rq->cpu;
+       struct sched_domain *sd;
+       int pulled_task = 0;
+       u64 curr_cost = 0;
+
+       /*
+        * We must set idle_stamp _before_ calling idle_balance(), such that we
+        * measure the duration of idle_balance() as idle time.
+        */
+       this_rq->idle_stamp = rq_clock(this_rq);
+
+       /*
+        * Do not pull tasks towards !active CPUs...
+        */
+       if (!cpu_active(this_cpu))
+               return 0;
+
+       /*
+        * This is OK, because current is on_cpu, which avoids it being picked
+        * for load-balance and preemption/IRQs are still disabled avoiding
+        * further scheduler activity on it and we're being very careful to
+        * re-start the picking loop.
+        */
+       rq_unpin_lock(this_rq, rf);
+
+       if (this_rq->avg_idle < sysctl_sched_migration_cost ||
+           !this_rq->rd->overload) {
+               rcu_read_lock();
+               sd = rcu_dereference_check_sched_domain(this_rq->sd);
+               if (sd)
+                       update_next_balance(sd, &next_balance);
+               rcu_read_unlock();
+
+               goto out;
+       }
+
+       raw_spin_unlock(&this_rq->lock);
+
+       update_blocked_averages(this_cpu);
+       rcu_read_lock();
+       for_each_domain(this_cpu, sd) {
+               int continue_balancing = 1;
+               u64 t0, domain_cost;
+
+               if (!(sd->flags & SD_LOAD_BALANCE))
+                       continue;
+
+               if (this_rq->avg_idle < curr_cost + sd->max_newidle_lb_cost) {
+                       update_next_balance(sd, &next_balance);
+                       break;
+               }
+
+               if (sd->flags & SD_BALANCE_NEWIDLE) {
+                       t0 = sched_clock_cpu(this_cpu);
+
+                       pulled_task = load_balance(this_cpu, this_rq,
+                                                  sd, CPU_NEWLY_IDLE,
+                                                  &continue_balancing);
+
+                       domain_cost = sched_clock_cpu(this_cpu) - t0;
+                       if (domain_cost > sd->max_newidle_lb_cost)
+                               sd->max_newidle_lb_cost = domain_cost;
+
+                       curr_cost += domain_cost;
+               }
+
+               update_next_balance(sd, &next_balance);
+
+               /*
+                * Stop searching for tasks to pull if there are
+                * now runnable tasks on this rq.
+                */
+               if (pulled_task || this_rq->nr_running > 0)
+                       break;
+       }
+       rcu_read_unlock();
+
+       raw_spin_lock(&this_rq->lock);
+
+       if (curr_cost > this_rq->max_idle_balance_cost)
+               this_rq->max_idle_balance_cost = curr_cost;
+
+       /*
+        * While browsing the domains, we released the rq lock, a task could
+        * have been enqueued in the meantime. Since we're not going idle,
+        * pretend we pulled a task.
+        */
+       if (this_rq->cfs.h_nr_running && !pulled_task)
+               pulled_task = 1;
+
+out:
+       /* Move the next balance forward */
+       if (time_after(this_rq->next_balance, next_balance))
+               this_rq->next_balance = next_balance;
+
+       /* Is there a task of a high priority class? */
+       if (this_rq->nr_running != this_rq->cfs.h_nr_running)
+               pulled_task = -1;
+
+       if (pulled_task)
+               this_rq->idle_stamp = 0;
+
+       rq_repin_lock(this_rq, rf);
+
+       return pulled_task;
+}
+
+/*
  * run_rebalance_domains is triggered when needed from the scheduler tick.
  * Also triggered for nohz idle balancing (with nohz_balancing_kick set).
  */