sched/{fair,tune}: track RUNNABLE tasks impact on per CPU boost value

author Patrick Bellasi <patrick.bellasi@arm.com>

Tue, 7 Jul 2015 14:33:20 +0000 (15:33 +0100)

committer Leo Yan <leo.yan@linaro.org>

Tue, 10 May 2016 08:53:24 +0000 (16:53 +0800)
author Patrick Bellasi <patrick.bellasi@arm.com>
Tue, 7 Jul 2015 14:33:20 +0000 (15:33 +0100)
committer Leo Yan <leo.yan@linaro.org>
Tue, 10 May 2016 08:53:24 +0000 (16:53 +0800)
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index eff548fae43ef7d219f3bb5b7a134c685514510f..2dbe1ff0a90b43fd398de97a8e8a608346a5fbcc 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -34,6 +34,7 @@
  #include <trace/events/sched.h>
  
  #include "sched.h"
+#include "tune.h"
  
  /*
   * Targeted preemption latency for CPU-bound tasks:
@@ -4210,6 +4211,8 @@ enqueue_task_fair(struct rq *rq, struct task_struct *p, int flags)
                     cpu_overutilized(rq->cpu))
                         rq->rd->overutilized = true;
  
+               schedtune_enqueue_task(p, cpu_of(rq));
+
                 /*
                  * We want to potentially trigger a freq switch
                  * request only for tasks that are waking up; this is
@@ -4279,6 +4282,7 @@ static void dequeue_task_fair(struct rq *rq, struct task_struct *p, int flags)
  
         if (!se) {
                 sub_nr_running(rq, 1);
+               schedtune_dequeue_task(p, cpu_of(rq));
  
                 /*
                  * We want to potentially trigger a freq switch
@@ -5114,10 +5118,15 @@ schedtune_margin(unsigned long signal, unsigned long boost)
  }
  
  static inline unsigned int
-schedtune_cpu_margin(unsigned long util)
+schedtune_cpu_margin(unsigned long util, int cpu)
  {
-       unsigned int boost = get_sysctl_sched_cfs_boost();
+       unsigned int boost;
  
+#ifdef CONFIG_CGROUP_SCHEDTUNE
+       boost = schedtune_cpu_boost(cpu);
+#else
+       boost = get_sysctl_sched_cfs_boost();
+#endif
         if (boost == 0)
                 return 0;
  
@@ -5127,7 +5136,7 @@ schedtune_cpu_margin(unsigned long util)
  #else /* CONFIG_SCHED_TUNE */
  
  static inline unsigned int
-schedtune_cpu_margin(unsigned long util)
+schedtune_cpu_margin(unsigned long util, int cpu)
  {
         return 0;
  }
@@ -5138,7 +5147,7 @@ static inline unsigned long
  boosted_cpu_util(int cpu)
  {
         unsigned long util = cpu_util(cpu);
-       unsigned long margin = schedtune_cpu_margin(util);
+       unsigned long margin = schedtune_cpu_margin(util, cpu);
  
         return util + margin;
  }
diff --git a/kernel/sched/tune.c b/kernel/sched/tune.c

index f623868937253c9454074708f666e140d09f5733..540b945a01ce4c8cb834c7a14ddafa35bccaefa0 100644 (file)
--- a/kernel/sched/tune.c
+++ b/kernel/sched/tune.c
@@ -2,6 +2,7 @@
  #include <linux/err.h>
  #include <linux/percpu.h>
  #include <linux/printk.h>
+#include <linux/rcupdate.h>
  #include <linux/slab.h>
  
  #include "sched.h"
@@ -158,6 +159,87 @@ schedtune_boostgroup_update(int idx, int boost)
         return 0;
  }
  
+static inline void
+schedtune_tasks_update(struct task_struct *p, int cpu, int idx, int task_count)
+{
+       struct boost_groups *bg;
+       int tasks;
+
+       bg = &per_cpu(cpu_boost_groups, cpu);
+
+       /* Update boosted tasks count while avoiding to make it negative */
+       if (task_count < 0 && bg->group[idx].tasks <= -task_count)
+               bg->group[idx].tasks = 0;
+       else
+               bg->group[idx].tasks += task_count;
+
+       /* Boost group activation or deactivation on that RQ */
+       tasks = bg->group[idx].tasks;
+       if (tasks == 1 || tasks == 0)
+               schedtune_cpu_update(cpu);
+}
+
+/*
+ * NOTE: This function must be called while holding the lock on the CPU RQ
+ */
+void schedtune_enqueue_task(struct task_struct *p, int cpu)
+{
+       struct schedtune *st;
+       int idx;
+
+       /*
+        * When a task is marked PF_EXITING by do_exit() it's going to be
+        * dequeued and enqueued multiple times in the exit path.
+        * Thus we avoid any further update, since we do not want to change
+        * CPU boosting while the task is exiting.
+        */
+       if (p->flags & PF_EXITING)
+               return;
+
+       /* Get task boost group */
+       rcu_read_lock();
+       st = task_schedtune(p);
+       idx = st->idx;
+       rcu_read_unlock();
+
+       schedtune_tasks_update(p, cpu, idx, 1);
+}
+
+/*
+ * NOTE: This function must be called while holding the lock on the CPU RQ
+ */
+void schedtune_dequeue_task(struct task_struct *p, int cpu)
+{
+       struct schedtune *st;
+       int idx;
+
+       /*
+        * When a task is marked PF_EXITING by do_exit() it's going to be
+        * dequeued and enqueued multiple times in the exit path.
+        * Thus we avoid any further update, since we do not want to change
+        * CPU boosting while the task is exiting.
+        * The last dequeue will be done by cgroup exit() callback.
+        */
+       if (p->flags & PF_EXITING)
+               return;
+
+       /* Get task boost group */
+       rcu_read_lock();
+       st = task_schedtune(p);
+       idx = st->idx;
+       rcu_read_unlock();
+
+       schedtune_tasks_update(p, cpu, idx, -1);
+}
+
+int schedtune_cpu_boost(int cpu)
+{
+       struct boost_groups *bg;
+
+       bg = &per_cpu(cpu_boost_groups, cpu);
+       return bg->boost_max;
+}
+
  static u64
  boost_read(struct cgroup_subsys_state *css, struct cftype *cft)
  {
diff --git a/kernel/sched/tune.h b/kernel/sched/tune.h

new file mode 100644 (file)

index 0000000..561b517
--- /dev/null
+++ b/kernel/sched/tune.h
@@ -0,0 +1,23 @@
+
+#ifdef CONFIG_SCHED_TUNE
+
+#ifdef CONFIG_CGROUP_SCHEDTUNE
+
+int schedtune_cpu_boost(int cpu);
+
+void schedtune_enqueue_task(struct task_struct *p, int cpu);
+void schedtune_dequeue_task(struct task_struct *p, int cpu);
+
+#else /* CONFIG_CGROUP_SCHEDTUNE */
+
+#define schedtune_enqueue_task(task, cpu) do { } while (0)
+#define schedtune_dequeue_task(task, cpu) do { } while (0)
+
+#endif /* CONFIG_CGROUP_SCHEDTUNE */
+
+#else /* CONFIG_SCHED_TUNE */
+
+#define schedtune_enqueue_task(task, cpu) do { } while (0)
+#define schedtune_dequeue_task(task, cpu) do { } while (0)
+
+#endif /* CONFIG_SCHED_TUNE */
author	Patrick Bellasi <patrick.bellasi@arm.com>
	Tue, 7 Jul 2015 14:33:20 +0000 (15:33 +0100)
committer	Leo Yan <leo.yan@linaro.org>
	Tue, 10 May 2016 08:53:24 +0000 (16:53 +0800)
kernel/sched/fair.c		patch \| blob \| blame \| history
kernel/sched/tune.c		patch \| blob \| blame \| history
kernel/sched/tune.h	[new file with mode: 0644]	patch \| blob