From: Park Bumgyu
Date: Wed, 21 Mar 2018 06:25:47 +0000 (+0900)
Subject: sched: ems: build skeleton for EMS
X-Git-Url: https://git.stricted.de/?a=commitdiff_plain;h=8c63fb8e9fb4e47c7eac06b922c85d4e63ad8724;p=GitHub%2FLineageOS%2Fandroid_kernel_motorola_exynos9610.git

sched: ems: build skeleton for EMS

Change-Id: I0e79d33aa1e5f64a9621773916d0546c1b0c8d20
Signed-off-by: Park Bumgyu
---

diff --git a/kernel/sched/Makefile b/kernel/sched/Makefile
index 7c7516a21020..f8b8b5152868 100644
--- a/kernel/sched/Makefile
+++ b/kernel/sched/Makefile
@@ -20,7 +20,6 @@ obj-y += core.o loadavg.o clock.o cputime.o
 obj-y += idle_task.o fair.o rt.o deadline.o
 obj-y += wait.o wait_bit.o swait.o completion.o idle.o
 obj-$(CONFIG_SMP) += cpupri.o cpudeadline.o topology.o stop_task.o
-obj-$(CONFIG_SCHED_EHMP) += ehmp.o
 obj-$(CONFIG_GENERIC_ARCH_TOPOLOGY) += energy.o
 obj-$(CONFIG_SCHED_WALT) += walt.o
 obj-$(CONFIG_SCHED_AUTOGROUP) += autogroup.o
@@ -31,4 +30,4 @@ obj-$(CONFIG_CGROUP_CPUACCT) += cpuacct.o
 obj-$(CONFIG_CPU_FREQ) += cpufreq.o
 obj-$(CONFIG_CPU_FREQ_GOV_SCHEDUTIL) += cpufreq_schedutil.o
 obj-$(CONFIG_MEMBARRIER) += membarrier.o
-obj-$(CONFIG_FREQVAR_TUNE) += freqvar_tune.o
+obj-$(CONFIG_SCHED_EHMP) += ems/
diff --git a/kernel/sched/ehmp.c b/kernel/sched/ehmp.c
deleted file mode 100644
index baa223815b69..000000000000
--- a/kernel/sched/ehmp.c
+++ /dev/null
@@ -1,2064 +0,0 @@
-/*
- * Exynos scheduler for Heterogeneous Multi-Processing (HMP)
- *
- * Copyright (C) 2017 Samsung Electronics Co., Ltd
- * Park Bumgyu
- */
-
-#include
-#include
-#include
-#include
-#include
-
-#define CREATE_TRACE_POINTS
-#include
-
-#include "sched.h"
-#include "tune.h"
-
-/**********************************************************************
- *                          extern functions                          *
- **********************************************************************/
-extern struct sched_entity *__pick_next_entity(struct sched_entity *se);
-extern unsigned long boosted_task_util(struct task_struct *task);
-extern unsigned long capacity_curr_of(int cpu);
-extern int find_best_target(struct task_struct *p, int *backup_cpu,
-				bool boosted, bool prefer_idle);
-extern u64 decay_load(u64 val, u64 n);
-extern int start_cpu(bool boosted);
-
-unsigned long task_util(struct task_struct *p)
-{
-	if (rt_task(p))
-		return p->rt.avg.util_avg;
-	else
-		return p->se.avg.util_avg;
-}
-
-static inline struct task_struct *task_of(struct sched_entity *se)
-{
-	return container_of(se, struct task_struct, se);
-}
-
-static inline struct sched_entity *se_of(struct sched_avg *sa)
-{
-	return container_of(sa, struct sched_entity, avg);
-}
-
-static inline int task_fits(struct task_struct *p, long capacity)
-{
-	return capacity * 1024 > boosted_task_util(p) * 1248;
-}
-
-#define entity_is_cfs_rq(se)	(se->my_q)
-#define entity_is_task(se)	(!se->my_q)
-#define LOAD_AVG_MAX		47742
-
-static unsigned long maxcap_val = 1024;
-static int maxcap_cpu = 7;
-
-void ehmp_update_max_cpu_capacity(int cpu, unsigned long val)
-{
-	maxcap_cpu = cpu;
-	maxcap_val = val;
-}
-
-static inline struct device_node *get_ehmp_node(void)
-{
-	return of_find_node_by_path("/cpus/ehmp");
-}
-
-static inline struct cpumask *sched_group_cpus(struct sched_group *sg)
-{
-	return to_cpumask(sg->cpumask);
-}
-
-#define tsk_cpus_allowed(tsk) (&(tsk)->cpus_allowed)
-
-/**********************************************************************
- *                            Energy diff                             *
- **********************************************************************/
-#define EAS_CPU_PRV	0
-#define EAS_CPU_NXT	1
-#define EAS_CPU_BKP	2
-
-int
exynos_estimate_idle_state(int cpu_idx, struct cpumask *mask, - int state, int cpus) -{ - unsigned int deepest_state_residency = 0; - unsigned int next_timer_us = 0; - int grp_nr_running = 0; - int deepest_state = 0; - int i; - int estimate_state = 0; - - if (cpu_idx == EAS_CPU_PRV) - grp_nr_running++; - - for_each_cpu(i, mask) { - grp_nr_running += cpu_rq(i)->nr_running; - - next_timer_us = ktime_to_us(tick_nohz_get_sleep_length_cpu(i)); - deepest_state_residency = cpuidle_get_target_residency(i, state); - - if (next_timer_us > deepest_state_residency) - deepest_state++; - } - - if (!grp_nr_running && deepest_state == cpus) - estimate_state = state + 1; - - return estimate_state; -} - -/********************************************************************** - * task initialization * - **********************************************************************/ -enum { - TYPE_BASE_CFS_RQ_UTIL = 0, - TYPE_BASE_INHERIT_PARENT_UTIL, - TYPE_MAX_NUM, -}; - -static unsigned long init_util_type = TYPE_BASE_CFS_RQ_UTIL; -static unsigned long init_util_ratio = 25; /* 25% */ - -static ssize_t show_initial_util_type(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - return snprintf(buf, 10, "%ld\n", init_util_type); -} - -static ssize_t store_initial_util_type(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - long input; - - if (!sscanf(buf, "%ld", &input)) - return -EINVAL; - - input = input < 0 ? 0 : input; - input = input >= TYPE_MAX_NUM ? TYPE_MAX_NUM - 1 : input; - - init_util_type = input; - - return count; -} - -static ssize_t show_initial_util_ratio(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - return snprintf(buf, 10, "%ld\n", init_util_ratio); -} - -static ssize_t store_initial_util_ratio(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - long input; - - if (!sscanf(buf, "%ld", &input)) - return -EINVAL; - - init_util_ratio = !!input; - - return count; -} - -static struct kobj_attribute initial_util_type = -__ATTR(initial_util_type, 0644, show_initial_util_type, store_initial_util_type); - -static struct kobj_attribute initial_util_ratio = -__ATTR(initial_util_ratio, 0644, show_initial_util_ratio, store_initial_util_ratio); - -void base_cfs_rq_util(struct sched_entity *se) -{ - struct cfs_rq *cfs_rq = se->cfs_rq; - struct sched_avg *sa = &se->avg; - int cpu = cpu_of(cfs_rq->rq); - unsigned long cap_org = capacity_orig_of(cpu); - long cap = (long)(cap_org - cfs_rq->avg.util_avg) / 2; - - if (cap > 0) { - if (cfs_rq->avg.util_avg != 0) { - sa->util_avg = cfs_rq->avg.util_avg * se->load.weight; - sa->util_avg /= (cfs_rq->avg.load_avg + 1); - - if (sa->util_avg > cap) - sa->util_avg = cap; - } else { - sa->util_avg = cap_org * init_util_ratio / 100; - } - /* - * If we wish to restore tuning via setting initial util, - * this is where we should do it. 
- */ - sa->util_sum = sa->util_avg * LOAD_AVG_MAX; - } -} - -void base_inherit_parent_util(struct sched_entity *se) -{ - struct sched_avg *sa = &se->avg; - struct task_struct *p = current; - - sa->util_avg = p->se.avg.util_avg; - sa->util_sum = p->se.avg.util_sum; -} - -void exynos_init_entity_util_avg(struct sched_entity *se) -{ - int type = init_util_type; - - switch(type) { - case TYPE_BASE_CFS_RQ_UTIL: - base_cfs_rq_util(se); - break; - case TYPE_BASE_INHERIT_PARENT_UTIL: - base_inherit_parent_util(se); - break; - default: - pr_info("%s: Not support initial util type %ld\n", - __func__, init_util_type); - } -} - -/********************************************************************** - * load balance * - **********************************************************************/ -#define lb_sd_parent(sd) \ - (sd->parent && sd->parent->groups != sd->parent->groups->next) - -struct sched_group * -exynos_fit_idlest_group(struct sched_domain *sd, struct task_struct *p) -{ - struct sched_group *group = sd->groups; - struct sched_group *fit_group = NULL; - unsigned long fit_capacity = ULONG_MAX; - - do { - int i; - - /* Skip over this group if it has no CPUs allowed */ - if (!cpumask_intersects(sched_group_span(group), - &p->cpus_allowed)) - continue; - - for_each_cpu(i, sched_group_span(group)) { - if (capacity_of(i) < fit_capacity && task_fits(p, capacity_of(i))) { - fit_capacity = capacity_of(i); - fit_group = group; - } - } - } while (group = group->next, group != sd->groups); - - return fit_group; -} - -static inline int -check_cpu_capacity(struct rq *rq, struct sched_domain *sd) -{ - return ((rq->cpu_capacity * sd->imbalance_pct) < - (rq->cpu_capacity_orig * 100)); -} - -unsigned long global_boost(void); -int exynos_need_active_balance(enum cpu_idle_type idle, struct sched_domain *sd, - int src_cpu, int dst_cpu) -{ - unsigned int src_imb_pct = lb_sd_parent(sd) ? sd->imbalance_pct : 1; - unsigned int dst_imb_pct = lb_sd_parent(sd) ? 
100 : 1; - unsigned long src_cap = capacity_of(src_cpu); - unsigned long dst_cap = capacity_of(dst_cpu); - int level = sd->level; - - /* dst_cpu is idle */ - if ((idle != CPU_NOT_IDLE) && - (cpu_rq(src_cpu)->cfs.h_nr_running == 1)) { - if ((check_cpu_capacity(cpu_rq(src_cpu), sd)) && - (src_cap * sd->imbalance_pct < dst_cap * 100)) { - return 1; - } - - /* This domain is top and dst_cpu is bigger than src_cpu*/ - if (!lb_sd_parent(sd) && src_cap < dst_cap) - if (lbt_overutilized(src_cpu, level) || global_boost()) - return 1; - } - - if ((src_cap * src_imb_pct < dst_cap * dst_imb_pct) && - cpu_rq(src_cpu)->cfs.h_nr_running == 1 && - lbt_overutilized(src_cpu, level) && - !lbt_overutilized(dst_cpu, level)) { - return 1; - } - - return unlikely(sd->nr_balance_failed > sd->cache_nice_tries + 2); -} - -/****************************************************************/ -/* Load Balance Trigger */ -/****************************************************************/ -#define DISABLE_OU -1 -#define DEFAULT_OU_RATIO 80 - -struct lbt_overutil { - bool top; - struct cpumask cpus; - unsigned long capacity; - int ratio; -}; -DEFINE_PER_CPU(struct lbt_overutil *, lbt_overutil); - -static inline int get_topology_depth(void) -{ - struct sched_domain *sd; - - for_each_domain(0, sd) { - if (sd->parent == NULL) - return sd->level; - } - - return -1; -} - -static inline int get_last_level(struct lbt_overutil *ou) -{ - int level; - - for (level = 0; &ou[level] != NULL; level++) { - if (ou[level].top == true) - return level; - } - - return -1; -} - -/****************************************************************/ -/* External APIs */ -/****************************************************************/ -bool lbt_overutilized(int cpu, int level) -{ - struct lbt_overutil *ou = per_cpu(lbt_overutil, cpu); - bool overutilized; - - if (!ou) - return false; - - overutilized = (cpu_util(cpu) > ou[level].capacity) ? 
true : false; - - if (overutilized) - trace_ehmp_lbt_overutilized(cpu, level, cpu_util(cpu), - ou[level].capacity, overutilized); - - return overutilized; -} - -void update_lbt_overutil(int cpu, unsigned long capacity) -{ - struct lbt_overutil *ou = per_cpu(lbt_overutil, cpu); - int level, last = get_last_level(ou); - - for (level = 0; level <= last; level++) { - if (ou[level].ratio == DISABLE_OU) - continue; - - ou[level].capacity = (capacity * ou[level].ratio) / 100; - } -} - -/****************************************************************/ -/* SYSFS */ -/****************************************************************/ -static ssize_t show_overutil_ratio(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - struct lbt_overutil *ou = per_cpu(lbt_overutil, 0); - int level, last = get_last_level(ou); - int cpu, ret = 0; - - for (level = 0; level <= last; level++) { - ret += sprintf(buf + ret, "[level%d]\n", level); - - for_each_possible_cpu(cpu) { - ou = per_cpu(lbt_overutil, cpu); - - if (ou[level].ratio == DISABLE_OU) - continue; - - ret += sprintf(buf + ret, "cpu%d ratio:%3d capacity:%4lu\n", - cpu, ou[level].ratio, ou[level].capacity); - } - } - - return ret; -} - -static ssize_t store_overutil_ratio(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - struct lbt_overutil *ou; - unsigned long capacity; - int cpu, level, ratio; - int last; - - if (sscanf(buf, "%d %d %d", &cpu, &level, &ratio) != 3) - return -EINVAL; - - /* Check cpu is possible */ - if (!cpumask_test_cpu(cpu, cpu_possible_mask)) - return -EINVAL; - ou = per_cpu(lbt_overutil, cpu); - - /* Check level range */ - last = get_last_level(ou); - if (last < 0 || level < 0 || level > last) - return -EINVAL; - - /* If ratio is outrage, disable overutil */ - if (ratio < 0 || ratio > 100) - ratio = DEFAULT_OU_RATIO; - - for_each_cpu(cpu, &ou[level].cpus) { - ou = per_cpu(lbt_overutil, cpu); - if (ou[level].ratio == DISABLE_OU) - continue; - - ou[level].ratio = ratio; - capacity = capacity_orig_of(cpu); - update_lbt_overutil(cpu, capacity); - } - - return count; -} - -static struct kobj_attribute overutil_ratio_attr = -__ATTR(overutil_ratio, 0644, show_overutil_ratio, store_overutil_ratio); - -/****************************************************************/ -/* Initialization */ -/****************************************************************/ -static void free_lbt_overutil(void) -{ - int cpu; - - for_each_possible_cpu(cpu) { - if (per_cpu(lbt_overutil, cpu)) - kfree(per_cpu(lbt_overutil, cpu)); - } -} - -static int alloc_lbt_overutil(void) -{ - int cpu, depth = get_topology_depth(); - - for_each_possible_cpu(cpu) { - struct lbt_overutil *ou = kzalloc(sizeof(struct lbt_overutil) * - (depth + 1), GFP_KERNEL); - if (!ou) - goto fail_alloc; - - per_cpu(lbt_overutil, cpu) = ou; - } - return 0; - -fail_alloc: - free_lbt_overutil(); - return -ENOMEM; -} - -static int set_lbt_overutil(int level, const char *mask, int ratio) -{ - struct lbt_overutil *ou; - struct cpumask cpus; - bool top, overlap = false; - int cpu; - - cpulist_parse(mask, &cpus); - cpumask_and(&cpus, &cpus, cpu_possible_mask); - if (!cpumask_weight(&cpus)) - return -ENODEV; - - /* If sibling cpus is same with possible cpus, it is top level */ - top = cpumask_equal(&cpus, cpu_possible_mask); - - /* If this level is overlapped with prev level, disable this level */ - if (level > 0) { - ou = per_cpu(lbt_overutil, cpumask_first(&cpus)); - overlap = cpumask_equal(&cpus, &ou[level-1].cpus); - } - - for_each_cpu(cpu, 
&cpus) { - ou = per_cpu(lbt_overutil, cpu); - cpumask_copy(&ou[level].cpus, &cpus); - ou[level].ratio = overlap ? DISABLE_OU : ratio; - ou[level].top = top; - } - - return 0; -} - -static int parse_lbt_overutil(struct device_node *dn) -{ - struct device_node *lbt, *ou; - int level, depth = get_topology_depth(); - int ret = 0; - - lbt = of_get_child_by_name(dn, "lbt"); - if (!lbt) - return -ENODEV; - - for (level = 0; level <= depth; level++) { - char name[20]; - const char *mask[NR_CPUS]; - int ratio[NR_CPUS]; - int i, proplen; - - snprintf(name, sizeof(name), "overutil-level%d", level); - ou = of_get_child_by_name(lbt, name); - if (!ou) { - ret = -ENODEV; - goto out; - } - - proplen = of_property_count_strings(ou, "cpus"); - if ((proplen < 0) || (proplen != of_property_count_u32_elems(ou, "ratio"))) { - of_node_put(ou); - ret = -ENODEV; - goto out; - } - - of_property_read_string_array(ou, "cpus", mask, proplen); - of_property_read_u32_array(ou, "ratio", ratio, proplen); - of_node_put(ou); - - for (i = 0; i < proplen; i++) { - ret = set_lbt_overutil(level, mask[i], ratio[i]); - if (ret) - goto out; - } - } - -out: - of_node_put(lbt); - return ret; -} - -static int __init init_lbt(void) -{ - struct device_node *dn; - int ret; - - dn = of_find_node_by_path("/cpus/ehmp"); - if (!dn) - return 0; - - ret = alloc_lbt_overutil(); - if (ret) { - pr_err("Failed to allocate lbt_overutil\n"); - goto out; - } - - ret = parse_lbt_overutil(dn); - if (ret) { - pr_err("Failed to parse lbt_overutil\n"); - free_lbt_overutil(); - goto out; - } - -out: - of_node_put(dn); - return ret; -} -pure_initcall(init_lbt); -/********************************************************************** - * Global boost * - **********************************************************************/ -static unsigned long gb_value = 0; -static unsigned long gb_max_value = 0; -static struct gb_qos_request gb_req_user = -{ - .name = "ehmp_gb_req_user", -}; - -static struct plist_head gb_list = PLIST_HEAD_INIT(gb_list); - -static DEFINE_SPINLOCK(gb_lock); - -static int gb_qos_max_value(void) -{ - return plist_last(&gb_list)->prio; -} - -static int gb_qos_req_value(struct gb_qos_request *req) -{ - return req->node.prio; -} - -void gb_qos_update_request(struct gb_qos_request *req, u32 new_value) -{ - unsigned long flags; - - if (req->node.prio == new_value) - return; - - spin_lock_irqsave(&gb_lock, flags); - - if (req->active) - plist_del(&req->node, &gb_list); - else - req->active = 1; - - plist_node_init(&req->node, new_value); - plist_add(&req->node, &gb_list); - - gb_value = gb_max_value * gb_qos_max_value() / 100; - trace_ehmp_global_boost(req->name, new_value); - - spin_unlock_irqrestore(&gb_lock, flags); -} - -static ssize_t show_global_boost(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - struct gb_qos_request *req; - int ret = 0; - - plist_for_each_entry(req, &gb_list, node) - ret += snprintf(buf + ret, 30, "%s : %d\n", - req->name, gb_qos_req_value(req)); - - return ret; -} - -static ssize_t store_global_boost(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - unsigned int input; - - if (!sscanf(buf, "%d", &input)) - return -EINVAL; - - gb_qos_update_request(&gb_req_user, input); - - return count; -} - -static struct kobj_attribute global_boost_attr = -__ATTR(global_boost, 0644, show_global_boost, store_global_boost); - -#define BOOT_BOOST_DURATION 40000000 /* microseconds */ -unsigned long global_boost(void) -{ - u64 now = ktime_to_us(ktime_get()); - - if (now < 
BOOT_BOOST_DURATION) - return gb_max_value; - - return gb_value; -} - -int find_second_max_cap(void) -{ - struct sched_domain *sd = rcu_dereference(per_cpu(sd_ea, 0)); - struct sched_group *sg; - int max_cap = 0, second_max_cap = 0; - - if (!sd) - return 0; - - sg = sd->groups; - do { - int i; - - for_each_cpu(i, sched_group_cpus(sg)) { - if (max_cap < cpu_rq(i)->cpu_capacity_orig) { - second_max_cap = max_cap; - max_cap = cpu_rq(i)->cpu_capacity_orig; - } - } - } while (sg = sg->next, sg != sd->groups); - - return second_max_cap; -} - -static int __init init_global_boost(void) -{ - gb_max_value = find_second_max_cap() + 1; - - return 0; -} -pure_initcall(init_global_boost); - -/********************************************************************** - * Boost cpu selection (global boost, schedtune.prefer_perf) * - **********************************************************************/ -#define cpu_selected(cpu) (cpu >= 0) - -int kernel_prefer_perf(int grp_idx); -static ssize_t show_prefer_perf(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - int i, ret = 0; - - for (i = 0; i < STUNE_GROUP_COUNT; i++) - ret += snprintf(buf + ret, 10, "%d ", kernel_prefer_perf(i)); - - ret += snprintf(buf + ret, 10, "\n"); - - return ret; -} - -static struct kobj_attribute prefer_perf_attr = -__ATTR(kernel_prefer_perf, 0444, show_prefer_perf, NULL); - -enum { - BT_PREFER_PERF = 0, - BT_GROUP_BALANCE, - BT_GLOBAL_BOOST, -}; - -struct boost_trigger { - int trigger; - int boost_val; -}; - -static int check_boost_trigger(struct task_struct *p, struct boost_trigger *bt) -{ - int gb; - -#ifdef CONFIG_SCHED_TUNE - if (schedtune_prefer_perf(p) > 0) { - bt->trigger = BT_PREFER_PERF; - bt->boost_val = schedtune_perf_threshold(); - return 1; - } - - if (schedtune_need_group_balance(p) > 0) { - bt->trigger = BT_GROUP_BALANCE; - bt->boost_val = schedtune_perf_threshold(); - return 1; - } -#endif - - gb = global_boost(); - if (gb) { - bt->trigger = BT_GLOBAL_BOOST; - bt->boost_val = gb; - return 1; - } - - /* not boost state */ - return 0; -} - -static int boost_select_cpu(struct task_struct *p, struct cpumask *target_cpus) -{ - int i, cpu = 0; - - if (cpumask_empty(target_cpus)) - return -1; - - if (cpumask_test_cpu(task_cpu(p), target_cpus)) - return task_cpu(p); - - /* Return last cpu in target_cpus */ - for_each_cpu(i, target_cpus) - cpu = i; - - return cpu; -} - -static void mark_shallowest_cpu(int cpu, unsigned int *min_exit_latency, - struct cpumask *shallowest_cpus) -{ - struct rq *rq = cpu_rq(cpu); - struct cpuidle_state *idle = idle_get_state(rq); - - /* Before enabling cpuidle, all idle cpus are marked */ - if (!idle) { - cpumask_set_cpu(cpu, shallowest_cpus); - return; - } - - /* Deeper idle cpu is ignored */ - if (idle->exit_latency > *min_exit_latency) - return; - - /* if shallower idle cpu is found, previsouly founded cpu is ignored */ - if (idle->exit_latency < *min_exit_latency) { - cpumask_clear(shallowest_cpus); - *min_exit_latency = idle->exit_latency; - } - - cpumask_set_cpu(cpu, shallowest_cpus); -} -static int check_migration_task(struct task_struct *p) -{ - return !p->se.avg.last_update_time; -} - -unsigned long cpu_util_wake(int cpu, struct task_struct *p) -{ - unsigned long util, capacity; - - /* Task has no contribution or is new */ - if (cpu != task_cpu(p) || check_migration_task(p)) - return cpu_util(cpu); - - capacity = capacity_orig_of(cpu); - util = max_t(long, cpu_util(cpu) - task_util(p), 0); - - return (util >= capacity) ? 
capacity : util; -} - -static int find_group_boost_target(struct task_struct *p) -{ - struct sched_domain *sd; - int shallowest_cpu = -1; - int lowest_cpu = -1; - unsigned int min_exit_latency = UINT_MAX; - unsigned long lowest_util = ULONG_MAX; - int target_cpu = -1; - int cpu; - char state[30] = "fail"; - - sd = rcu_dereference(per_cpu(sd_ea, maxcap_cpu)); - if (!sd) - return target_cpu; - - if (cpumask_test_cpu(task_cpu(p), sched_group_cpus(sd->groups))) { - if (idle_cpu(task_cpu(p))) { - target_cpu = task_cpu(p); - strcpy(state, "current idle"); - goto find_target; - } - } - - for_each_cpu_and(cpu, tsk_cpus_allowed(p), sched_group_cpus(sd->groups)) { - unsigned long util = cpu_util_wake(cpu, p); - - if (idle_cpu(cpu)) { - struct cpuidle_state *idle; - - idle = idle_get_state(cpu_rq(cpu)); - if (!idle) { - target_cpu = cpu; - strcpy(state, "idle wakeup"); - goto find_target; - } - - if (idle->exit_latency < min_exit_latency) { - min_exit_latency = idle->exit_latency; - shallowest_cpu = cpu; - continue; - } - } - - if (cpu_selected(shallowest_cpu)) - continue; - - if (util < lowest_util) { - lowest_cpu = cpu; - lowest_util = util; - } - } - - if (cpu_selected(shallowest_cpu)) { - target_cpu = shallowest_cpu; - strcpy(state, "shallowest idle"); - goto find_target; - } - - if (cpu_selected(lowest_cpu)) { - target_cpu = lowest_cpu; - strcpy(state, "lowest util"); - } - -find_target: - trace_ehmp_select_group_boost(p, target_cpu, state); - - return target_cpu; -} - -static int -find_boost_target(struct sched_domain *sd, struct task_struct *p, - unsigned long min_util, struct boost_trigger *bt) -{ - struct sched_group *sg; - int boost = bt->boost_val; - unsigned long max_capacity; - struct cpumask boost_candidates; - struct cpumask backup_boost_candidates; - unsigned int min_exit_latency = UINT_MAX; - unsigned int backup_min_exit_latency = UINT_MAX; - int target_cpu; - bool go_up = false; - unsigned long lowest_util = ULONG_MAX; - int lowest_cpu = -1; - char state[30] = "fail"; - - if (bt->trigger == BT_GROUP_BALANCE) - return find_group_boost_target(p); - - cpumask_setall(&boost_candidates); - cpumask_clear(&backup_boost_candidates); - - max_capacity = maxcap_val; - - sg = sd->groups; - - do { - int i; - - for_each_cpu_and(i, tsk_cpus_allowed(p), sched_group_cpus(sg)) { - unsigned long new_util, wake_util; - - if (!cpu_online(i)) - continue; - - wake_util = cpu_util_wake(i, p); - new_util = wake_util + task_util(p); - new_util = max(min_util, new_util); - - if (min(new_util + boost, max_capacity) > capacity_orig_of(i)) { - if (!cpu_rq(i)->nr_running) - mark_shallowest_cpu(i, &backup_min_exit_latency, - &backup_boost_candidates); - else if (cpumask_test_cpu(task_cpu(p), sched_group_cpus(sg))) - go_up = true; - - continue; - } - - if (cpumask_weight(&boost_candidates) >= nr_cpu_ids) - cpumask_clear(&boost_candidates); - - if (!cpu_rq(i)->nr_running) { - mark_shallowest_cpu(i, &min_exit_latency, &boost_candidates); - continue; - } - - if (wake_util < lowest_util) { - lowest_util = wake_util; - lowest_cpu = i; - } - } - - if (cpumask_weight(&boost_candidates) >= nr_cpu_ids) - continue; - - target_cpu = boost_select_cpu(p, &boost_candidates); - if (cpu_selected(target_cpu)) { - strcpy(state, "big idle"); - goto out; - } - - target_cpu = boost_select_cpu(p, &backup_boost_candidates); - if (cpu_selected(target_cpu)) { - strcpy(state, "little idle"); - goto out; - } - } while (sg = sg->next, sg != sd->groups); - - if (go_up) { - strcpy(state, "lowest big cpu"); - target_cpu = lowest_cpu; - goto out; 
- } - - strcpy(state, "current cpu"); - target_cpu = task_cpu(p); - -out: - trace_ehmp_select_boost_cpu(p, target_cpu, bt->trigger, state); - return target_cpu; -} - -/********************************************************************** - * schedtune.prefer_idle * - **********************************************************************/ -static void mark_lowest_cpu(int cpu, unsigned long new_util, - int *lowest_cpu, unsigned long *lowest_util) -{ - if (new_util >= *lowest_util) - return; - - *lowest_util = new_util; - *lowest_cpu = cpu; -} - -static int find_prefer_idle_target(struct sched_domain *sd, - struct task_struct *p, unsigned long min_util) -{ - struct sched_group *sg; - int target_cpu = -1; - int lowest_cpu = -1; - int lowest_idle_cpu = -1; - int overcap_cpu = -1; - unsigned long lowest_util = ULONG_MAX; - unsigned long lowest_idle_util = ULONG_MAX; - unsigned long overcap_util = ULONG_MAX; - struct cpumask idle_candidates; - struct cpumask overcap_idle_candidates; - - cpumask_clear(&idle_candidates); - cpumask_clear(&overcap_idle_candidates); - - sg = sd->groups; - - do { - int i; - - for_each_cpu_and(i, tsk_cpus_allowed(p), sched_group_cpus(sg)) { - unsigned long new_util, wake_util; - - if (!cpu_online(i)) - continue; - - wake_util = cpu_util_wake(i, p); - new_util = wake_util + task_util(p); - new_util = max(min_util, new_util); - - trace_ehmp_prefer_idle(p, task_cpu(p), i, task_util(p), - new_util, idle_cpu(i)); - - if (new_util > capacity_orig_of(i)) { - if (idle_cpu(i)) { - cpumask_set_cpu(i, &overcap_idle_candidates); - mark_lowest_cpu(i, new_util, - &overcap_cpu, &overcap_util); - } - - continue; - } - - if (idle_cpu(i)) { - if (task_cpu(p) == i) { - target_cpu = i; - break; - } - - cpumask_set_cpu(i, &idle_candidates); - mark_lowest_cpu(i, new_util, - &lowest_idle_cpu, &lowest_idle_util); - - continue; - } - - mark_lowest_cpu(i, new_util, &lowest_cpu, &lowest_util); - } - - if (cpu_selected(target_cpu)) - break; - - if (cpumask_weight(&idle_candidates)) { - target_cpu = lowest_idle_cpu; - break; - } - - if (cpu_selected(lowest_cpu)) { - target_cpu = lowest_cpu; - break; - } - - } while (sg = sg->next, sg != sd->groups); - - if (cpu_selected(target_cpu)) - goto out; - - if (cpumask_weight(&overcap_idle_candidates)) { - if (cpumask_test_cpu(task_cpu(p), &overcap_idle_candidates)) - target_cpu = task_cpu(p); - else - target_cpu = overcap_cpu; - - goto out; - } - -out: - trace_ehmp_prefer_idle_cpu_select(p, target_cpu); - - return target_cpu; -} - -/****************************************************************/ -/* On-time migration */ -/****************************************************************/ -#define TASK_TRACK_COUNT 5 - -#define ontime_task_cpu(p) (ontime_of(p)->cpu) -#define ontime_flag(p) (ontime_of(p)->flags) -#define ontime_migration_time(p) (ontime_of(p)->avg.ontime_migration_time) -#define ontime_load_avg(p) (ontime_of(p)->avg.load_avg) - -#define cap_scale(v, s) ((v)*(s) >> SCHED_CAPACITY_SHIFT) -#define mincap_of(__cpu) (sge_array[__cpu][SD_LEVEL0]->cap_states[0].cap) - -/* Structure of ontime migration condition */ -struct ontime_cond { - unsigned long up_threshold; - unsigned long down_threshold; - unsigned int min_residency_us; - - struct cpumask src_cpus; - struct cpumask dst_cpus; - - struct ontime_cond *next; -}; -static struct ontime_cond *ontime_cond; - -/* Structure of ontime migration environment */ -struct ontime_env { - struct rq *dst_rq; - int dst_cpu; - struct rq *src_rq; - int src_cpu; - struct task_struct *target_task; - int 
boost_migration; -}; -DEFINE_PER_CPU(struct ontime_env, ontime_env); - -static unsigned long get_up_threshold(int cpu) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->src_cpus)) - return cond->up_threshold; - - cond = cond->next; - } - - return -EINVAL; -} - -static int set_up_threshold(int cpu, unsigned long val) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->src_cpus)) { - cond->up_threshold = val; - return 0; - } - - cond = cond->next; - } - - return -EINVAL; -} - -static unsigned long get_down_threshold(int cpu) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->dst_cpus)) - return cond->down_threshold; - - cond = cond->next; - } - - return -EINVAL; -} - -static int set_down_threshold(int cpu, unsigned long val) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->dst_cpus)) { - cond->down_threshold = val; - return 0; - } - - cond = cond->next; - } - - return -EINVAL; -} - -static unsigned int get_min_residency(int cpu) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->dst_cpus)) - return cond->min_residency_us; - - cond = cond->next; - } - - return -EINVAL; -} - -static int set_min_residency(int cpu, int val) -{ - struct ontime_cond *cond = ontime_cond; - - while (cond) { - if (cpumask_test_cpu(cpu, &cond->dst_cpus)) { - cond->min_residency_us = val; - return 0; - } - - cond = cond->next; - } - - return -EINVAL; -} - -static inline void include_ontime_task(struct task_struct *p, int dst_cpu) -{ - ontime_flag(p) = ONTIME; - ontime_task_cpu(p) = dst_cpu; - - /* Manage time based on clock task of boot cpu(cpu0) */ - ontime_migration_time(p) = cpu_rq(0)->clock_task; -} - -static inline void exclude_ontime_task(struct task_struct *p) -{ - ontime_task_cpu(p) = 0; - ontime_migration_time(p) = 0; - ontime_flag(p) = NOT_ONTIME; -} - -static int -ontime_select_target_cpu(struct cpumask *dst_cpus, const struct cpumask *mask) -{ - int cpu; - int dest_cpu = -1; - unsigned int min_exit_latency = UINT_MAX; - struct cpuidle_state *idle; - - rcu_read_lock(); - for_each_cpu_and(cpu, dst_cpus, mask) { - if (!idle_cpu(cpu)) - continue; - - if (cpu_rq(cpu)->ontime_migrating) - continue; - - idle = idle_get_state(cpu_rq(cpu)); - if (!idle) { - rcu_read_unlock(); - return cpu; - } - - if (idle && idle->exit_latency < min_exit_latency) { - min_exit_latency = idle->exit_latency; - dest_cpu = cpu; - } - } - - rcu_read_unlock(); - return dest_cpu; -} - -extern struct sched_entity *__pick_next_entity(struct sched_entity *se); -static struct task_struct * -ontime_pick_heavy_task(struct sched_entity *se, struct cpumask *dst_cpus, - int *boost_migration) -{ - struct task_struct *heaviest_task = NULL; - struct task_struct *p; - unsigned int max_util_avg = 0; - int task_count = 0; - int boosted = !!global_boost(); - - /* - * Since current task does not exist in entity list of cfs_rq, - * check first that current task is heavy. 
- */ - p = task_of(se); - if (boosted || ontime_load_avg(p) >= get_up_threshold(task_cpu(p))) { - heaviest_task = task_of(se); - max_util_avg = ontime_load_avg(task_of(se)); - if (boosted) - *boost_migration = 1; - } - - se = __pick_first_entity(se->cfs_rq); - while (se && task_count < TASK_TRACK_COUNT) { - /* Skip non-task entity */ - if (entity_is_cfs_rq(se)) - goto next_entity; - - p = task_of(se); - if (schedtune_prefer_perf(p)) { - heaviest_task = p; - *boost_migration = 1; - break; - } - - if (!boosted && ontime_load_avg(p) < - get_up_threshold(task_cpu(p))) - goto next_entity; - - if (ontime_load_avg(p) > max_util_avg && - cpumask_intersects(dst_cpus, tsk_cpus_allowed(p))) { - heaviest_task = p; - max_util_avg = ontime_load_avg(p); - *boost_migration = boosted; - } - -next_entity: - se = __pick_next_entity(se); - task_count++; - } - - return heaviest_task; -} - -static int can_migrate(struct task_struct *p, struct ontime_env *env) -{ - if (!cpumask_test_cpu(env->dst_cpu, tsk_cpus_allowed(p))) - return 0; - - if (task_running(env->src_rq, p)) - return 0; - - return 1; -} - -static void move_task(struct task_struct *p, struct ontime_env *env) -{ - p->on_rq = TASK_ON_RQ_MIGRATING; - deactivate_task(env->src_rq, p, 0); - set_task_cpu(p, env->dst_cpu); - - activate_task(env->dst_rq, p, 0); - p->on_rq = TASK_ON_RQ_QUEUED; - check_preempt_curr(env->dst_rq, p, 0); -} - -static int move_specific_task(struct task_struct *target, struct ontime_env *env) -{ - struct task_struct *p, *n; - - list_for_each_entry_safe(p, n, &env->src_rq->cfs_tasks, se.group_node) { - if (!can_migrate(p, env)) - continue; - - if (p != target) - continue; - - move_task(p, env); - return 1; - } - - return 0; -} - -static int ontime_migration_cpu_stop(void *data) -{ - struct ontime_env *env = data; - struct rq *src_rq, *dst_rq; - int src_cpu, dst_cpu; - struct task_struct *p; - struct sched_domain *sd; - int boost_migration; - - /* Initialize environment data */ - src_rq = env->src_rq; - dst_rq = env->dst_rq = cpu_rq(env->dst_cpu); - src_cpu = env->src_cpu = env->src_rq->cpu; - dst_cpu = env->dst_cpu; - p = env->target_task; - boost_migration = env->boost_migration; - - raw_spin_lock_irq(&src_rq->lock); - - if (!(ontime_flag(p) & ONTIME_MIGRATING)) - goto out_unlock; - - if (p->exit_state) - goto out_unlock; - - if (unlikely(src_cpu != smp_processor_id())) - goto out_unlock; - - if (src_rq->nr_running <= 1) - goto out_unlock; - - if (src_rq != task_rq(p)) - goto out_unlock; - - BUG_ON(src_rq == dst_rq); - - double_lock_balance(src_rq, dst_rq); - - rcu_read_lock(); - for_each_domain(dst_cpu, sd) - if (cpumask_test_cpu(src_cpu, sched_domain_span(sd))) - break; - - if (likely(sd) && move_specific_task(p, env)) { - if (boost_migration) { - /* boost task is not classified as ontime task */ - exclude_ontime_task(p); - } else { - include_ontime_task(p, dst_cpu); - } - - rcu_read_unlock(); - double_unlock_balance(src_rq, dst_rq); - - trace_ehmp_ontime_migration(p, ontime_of(p)->avg.load_avg, - src_cpu, dst_cpu, boost_migration); - goto success_unlock; - } - - rcu_read_unlock(); - double_unlock_balance(src_rq, dst_rq); - -out_unlock: - exclude_ontime_task(p); - -success_unlock: - src_rq->active_balance = 0; - dst_rq->ontime_migrating = 0; - - raw_spin_unlock_irq(&src_rq->lock); - put_task_struct(p); - - return 0; -} - -static int ontime_task_wakeup(struct task_struct *p) -{ - struct ontime_cond *cond; - struct cpumask target_mask; - u64 delta; - int target_cpu = -1; - - /* When wakeup task is on ontime migrating, do not ontime 
wakeup */ - if (ontime_flag(p) == ONTIME_MIGRATING) - return -1; - - /* - * When wakeup task satisfies ontime condition to up migration, - * check there is a possible target cpu. - */ - if (ontime_load_avg(p) >= get_up_threshold(task_cpu(p))) { - cpumask_clear(&target_mask); - - for (cond = ontime_cond; cond != NULL; cond = cond->next) - if (cpumask_test_cpu(task_cpu(p), &cond->src_cpus)) { - cpumask_copy(&target_mask, &cond->dst_cpus); - break; - } - - target_cpu = ontime_select_target_cpu(&target_mask, tsk_cpus_allowed(p)); - - if (cpu_selected(target_cpu)) { - trace_ehmp_ontime_task_wakeup(p, task_cpu(p), - target_cpu, "up ontime"); - goto ontime_up; - } - } - - /* - * If wakeup task is not ontime and doesn't satisfy ontime condition, - * it cannot be ontime task. - */ - if (ontime_flag(p) == NOT_ONTIME) - goto ontime_out; - - if (ontime_flag(p) == ONTIME) { - /* - * If wakeup task is ontime but doesn't keep ontime condition, - * exclude this task from ontime. - */ - delta = cpu_rq(0)->clock_task - ontime_migration_time(p); - delta = delta >> 10; - - if (delta > get_min_residency(ontime_task_cpu(p)) && - ontime_load_avg(p) < get_down_threshold(ontime_task_cpu(p))) { - trace_ehmp_ontime_task_wakeup(p, task_cpu(p), -1, - "release ontime"); - goto ontime_out; - } - - /* - * If there is a possible cpu to stay ontime, task will wake up at this cpu. - */ - cpumask_copy(&target_mask, cpu_coregroup_mask(ontime_task_cpu(p))); - target_cpu = ontime_select_target_cpu(&target_mask, tsk_cpus_allowed(p)); - - if (cpu_selected(target_cpu)) { - trace_ehmp_ontime_task_wakeup(p, task_cpu(p), - target_cpu, "stay ontime"); - goto ontime_stay; - } - - trace_ehmp_ontime_task_wakeup(p, task_cpu(p), -1, "banished"); - goto ontime_out; - } - - if (!cpu_selected(target_cpu)) - goto ontime_out; - -ontime_up: - include_ontime_task(p, target_cpu); - -ontime_stay: - return target_cpu; - -ontime_out: - exclude_ontime_task(p); - return -1; -} - -static void ontime_update_next_balance(int cpu, struct ontime_avg *oa) -{ - if (cpumask_test_cpu(cpu, cpu_coregroup_mask(maxcap_cpu))) - return; - - if (oa->load_avg < get_up_threshold(cpu)) - return; - - /* - * Update the next_balance of this cpu because tick is most likely - * to occur first in currently running cpu. 
- */ - cpu_rq(smp_processor_id())->next_balance = jiffies; -} - -extern u64 decay_load(u64 val, u64 n); -static u32 __accumulate_pelt_segments(u64 periods, u32 d1, u32 d3) -{ - u32 c1, c2, c3 = d3; - - c1 = decay_load((u64)d1, periods); - c2 = LOAD_AVG_MAX - decay_load(LOAD_AVG_MAX, periods) - 1024; - - return c1 + c2 + c3; -} - -/****************************************************************/ -/* External APIs */ -/****************************************************************/ -void ontime_trace_task_info(struct task_struct *p) -{ - trace_ehmp_ontime_load_avg_task(p, &ontime_of(p)->avg, ontime_flag(p)); -} - -DEFINE_PER_CPU(struct cpu_stop_work, ontime_migration_work); -static DEFINE_SPINLOCK(om_lock); - -void ontime_migration(void) -{ - struct ontime_cond *cond; - int cpu; - - if (!spin_trylock(&om_lock)) - return; - - for (cond = ontime_cond; cond != NULL; cond = cond->next) { - for_each_cpu_and(cpu, &cond->src_cpus, cpu_active_mask) { - unsigned long flags; - struct rq *rq; - struct sched_entity *se; - struct task_struct *p; - int dst_cpu; - struct ontime_env *env = &per_cpu(ontime_env, cpu); - int boost_migration = 0; - - rq = cpu_rq(cpu); - raw_spin_lock_irqsave(&rq->lock, flags); - - /* - * Ontime migration is not performed when active balance - * is in progress. - */ - if (rq->active_balance) { - raw_spin_unlock_irqrestore(&rq->lock, flags); - continue; - } - - /* - * No need to migration if source cpu does not have cfs - * tasks. - */ - if (!rq->cfs.curr) { - raw_spin_unlock_irqrestore(&rq->lock, flags); - continue; - } - - se = rq->cfs.curr; - - /* Find task entity if entity is cfs_rq. */ - if (entity_is_cfs_rq(se)) { - struct cfs_rq *cfs_rq; - - cfs_rq = se->my_q; - while (cfs_rq) { - se = cfs_rq->curr; - cfs_rq = se->my_q; - } - } - - /* - * Select cpu to migrate the task to. Return negative number - * if there is no idle cpu in sg. - */ - dst_cpu = ontime_select_target_cpu(&cond->dst_cpus, cpu_active_mask); - if (dst_cpu < 0) { - raw_spin_unlock_irqrestore(&rq->lock, flags); - continue; - } - - /* - * Pick task to be migrated. Return NULL if there is no - * heavy task in rq. 
- */ - p = ontime_pick_heavy_task(se, &cond->dst_cpus, - &boost_migration); - if (!p) { - raw_spin_unlock_irqrestore(&rq->lock, flags); - continue; - } - - ontime_flag(p) = ONTIME_MIGRATING; - get_task_struct(p); - - /* Set environment data */ - env->dst_cpu = dst_cpu; - env->src_rq = rq; - env->target_task = p; - env->boost_migration = boost_migration; - - /* Prevent active balance to use stopper for migration */ - rq->active_balance = 1; - - cpu_rq(dst_cpu)->ontime_migrating = 1; - - raw_spin_unlock_irqrestore(&rq->lock, flags); - - /* Migrate task through stopper */ - stop_one_cpu_nowait(cpu, - ontime_migration_cpu_stop, env, - &per_cpu(ontime_migration_work, cpu)); - } - } - - spin_unlock(&om_lock); -} - -int ontime_can_migration(struct task_struct *p, int dst_cpu) -{ - u64 delta; - - if (ontime_flag(p) & NOT_ONTIME) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "not ontime"); - return true; - } - - if (ontime_flag(p) & ONTIME_MIGRATING) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "migrating"); - return false; - } - - if (cpumask_test_cpu(dst_cpu, cpu_coregroup_mask(ontime_task_cpu(p)))) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "same coregroup"); - return true; - } - - if (capacity_orig_of(dst_cpu) > capacity_orig_of(ontime_task_cpu(p))) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "bigger cpu"); - return true; - } - - /* - * At this point, task is "ontime task" and running on big - * and load balancer is trying to migrate task to LITTLE. - */ - delta = cpu_rq(0)->clock_task - ontime_migration_time(p); - delta = delta >> 10; - if (delta <= get_min_residency(ontime_task_cpu(p))) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "min residency"); - return false; - } - - if (cpu_rq(task_cpu(p))->nr_running > 1) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "big is busy"); - goto release; - } - - if (ontime_load_avg(p) >= get_down_threshold(ontime_task_cpu(p))) { - trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "heavy task"); - return false; - } - - trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "ontime_release"); -release: - exclude_ontime_task(p); - - return true; -} - -/* - * ontime_update_load_avg : load tracking for ontime-migration - * - * @sa : sched_avg to be updated - * @delta : elapsed time since last update - * @period_contrib : amount already accumulated against our next period - * @scale_freq : scale vector of cpu frequency - * @scale_cpu : scale vector of cpu capacity - */ -void ontime_update_load_avg(u64 delta, int cpu, unsigned long weight, struct sched_avg *sa) -{ - struct ontime_avg *oa = &se_of(sa)->ontime.avg; - unsigned long scale_freq, scale_cpu; - u32 contrib = (u32)delta; /* p == 0 -> delta < 1024 */ - u64 periods; - - scale_freq = arch_scale_freq_capacity(NULL, cpu); - scale_cpu = arch_scale_cpu_capacity(NULL, cpu); - - delta += oa->period_contrib; - periods = delta / 1024; /* A period is 1024us (~1ms) */ - - if (periods) { - oa->load_sum = decay_load(oa->load_sum, periods); - - delta %= 1024; - contrib = __accumulate_pelt_segments(periods, - 1024 - oa->period_contrib, delta); - } - oa->period_contrib = delta; - - if (weight) { - contrib = cap_scale(contrib, scale_freq); - oa->load_sum += contrib * scale_cpu; - } - - if (!periods) - return; - - oa->load_avg = div_u64(oa->load_sum, LOAD_AVG_MAX - 1024 + oa->period_contrib); - ontime_update_next_balance(cpu, oa); -} - -void ontime_new_entity_load(struct task_struct *parent, struct sched_entity *se) -{ - struct ontime_entity *ontime; - - if 
(entity_is_cfs_rq(se)) - return; - - ontime = &se->ontime; - - ontime->avg.load_sum = ontime_of(parent)->avg.load_sum; - ontime->avg.load_avg = ontime_of(parent)->avg.load_avg; - ontime->avg.ontime_migration_time = 0; - ontime->avg.period_contrib = 1023; - ontime->flags = NOT_ONTIME; - - trace_ehmp_ontime_new_entity_load(task_of(se), &ontime->avg); -} - -/****************************************************************/ -/* SYSFS */ -/****************************************************************/ -static ssize_t show_up_threshold(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - struct ontime_cond *cond = ontime_cond; - int ret = 0; - - while (cond) { - ret += sprintf(buf + ret, "cpu%*pbl: %ld\n", - cpumask_pr_args(&cond->src_cpus), - cond->up_threshold); - - cond = cond->next; - } - - return ret; -} - -static ssize_t store_up_threshold(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - unsigned long val; - int cpu; - - if (sscanf(buf, "%d %lu", &cpu, &val) != 2) - return -EINVAL; - - if (!cpumask_test_cpu(cpu, cpu_possible_mask)) - return -EINVAL; - - val = val > 1024 ? 1024 : val; - - if (set_up_threshold(cpu, val)) - return -EINVAL; - - return count; -} - -static struct kobj_attribute up_threshold_attr = -__ATTR(up_threshold, 0644, show_up_threshold, store_up_threshold); - -static ssize_t show_down_threshold(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - struct ontime_cond *cond = ontime_cond; - int ret = 0; - - while (cond) { - ret += sprintf(buf + ret, "cpu%*pbl: %ld\n", - cpumask_pr_args(&cond->dst_cpus), - cond->down_threshold); - - cond = cond->next; - } - - return ret; -} - -static ssize_t store_down_threshold(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - unsigned long val; - int cpu; - - if (sscanf(buf, "%d %lu", &cpu, &val) != 2) - return -EINVAL; - - if (!cpumask_test_cpu(cpu, cpu_possible_mask)) - return -EINVAL; - - val = val > 1024 ? 1024 : val; - - if (set_down_threshold(cpu, val)) - return -EINVAL; - - return count; -} - -static struct kobj_attribute down_threshold_attr = -__ATTR(down_threshold, 0644, show_down_threshold, store_down_threshold); - -static ssize_t show_min_residency(struct kobject *kobj, - struct kobj_attribute *attr, char *buf) -{ - struct ontime_cond *cond = ontime_cond; - int ret = 0; - - while (cond) { - ret += sprintf(buf + ret, "cpu%*pbl: %d\n", - cpumask_pr_args(&cond->dst_cpus), - cond->min_residency_us); - - cond = cond->next; - } - - return ret; -} - -static ssize_t store_min_residency(struct kobject *kobj, - struct kobj_attribute *attr, const char *buf, - size_t count) -{ - int val; - int cpu; - - if (sscanf(buf, "%d %d", &cpu, &val) != 2) - return -EINVAL; - - if (!cpumask_test_cpu(cpu, cpu_possible_mask)) - return -EINVAL; - - val = val < 0 ? 
0 : val; - - if (set_min_residency(cpu, val)) - return -EINVAL; - - return count; -} - -static struct kobj_attribute min_residency_attr = -__ATTR(min_residency, 0644, show_min_residency, store_min_residency); - -/****************************************************************/ -/* initialization */ -/****************************************************************/ -static void -parse_ontime(struct device_node *dn, struct ontime_cond *cond, int step) -{ - struct device_node *ontime, *on_step; - char name[10]; - int prop; - - /* - * Initilize default values: - * up_threshold = 40% of Source CPU's maximum capacity - * down_threshold = 50% of Destination CPU's minimum capacity - * min_residency = 8ms - */ - cond->up_threshold = - capacity_orig_of(cpumask_first(&cond->src_cpus)) * 40 / 100; - cond->down_threshold = - mincap_of(cpumask_first(&cond->dst_cpus)) * 50 / 100; - cond->min_residency_us = 8192; - - ontime = of_get_child_by_name(dn, "ontime"); - if (!ontime) - return; - - snprintf(name, sizeof(name), "step%d", step); - on_step = of_get_child_by_name(ontime, name); - if (!on_step) - return; - - of_property_read_u32(on_step, "up-threshold", &prop); - cond->up_threshold = prop; - - of_property_read_u32(on_step, "down-threshold", &prop); - cond->down_threshold = prop; - - of_property_read_u32(on_step, "min-residency-us", &prop); - cond->min_residency_us = prop; -} - -static int __init init_ontime(void) -{ - struct cpumask prev_cpus; - struct ontime_cond *cond, *last; - struct device_node *dn; - int cpu, step = 0; - - dn = of_find_node_by_path("/cpus/ehmp"); - if (!dn) - return 0; - - cpumask_clear(&prev_cpus); - - for_each_possible_cpu(cpu) { - if (cpu != cpumask_first(cpu_coregroup_mask(cpu))) - continue; - - if (cpumask_empty(&prev_cpus)) { - cpumask_copy(&prev_cpus, cpu_coregroup_mask(cpu)); - continue; - } - - cond = kzalloc(sizeof(struct ontime_cond), GFP_KERNEL); - - cpumask_copy(&cond->dst_cpus, cpu_coregroup_mask(cpu)); - cpumask_copy(&cond->src_cpus, &prev_cpus); - - parse_ontime(dn, cond, step++); - - cpumask_copy(&prev_cpus, cpu_coregroup_mask(cpu)); - - /* Add linked list of ontime_cond at last */ - cond->next = NULL; - if (ontime_cond) - last->next = cond; - else - ontime_cond = cond; - last = cond; - } - - of_node_put(dn); - return 0; -} -pure_initcall(init_ontime); - -/********************************************************************** - * cpu selection * - **********************************************************************/ -#define EAS_CPU_PRV 0 -#define EAS_CPU_NXT 1 -#define EAS_CPU_BKP 2 - -int exynos_select_cpu(struct task_struct *p, int *backup_cpu, - bool boosted, bool prefer_idle) -{ - struct sched_domain *sd; - int target_cpu = -1; - int cpu; - unsigned long min_util; - struct boost_trigger trigger = { - .trigger = 0, - .boost_val = 0 - }; - - target_cpu = ontime_task_wakeup(p); - if (cpu_selected(target_cpu)) - goto exit; - - /* Find target cpu from lowest capacity domain */ - cpu = start_cpu(boosted); - if (cpu < 0) - goto exit; - - /* Find SD for the start CPU */ - sd = rcu_dereference(per_cpu(sd_ea, cpu)); - if (!sd) - goto exit; - - min_util = boosted_task_util(p); - - if (check_boost_trigger(p, &trigger)) { - target_cpu = find_boost_target(sd, p, min_util, &trigger); - if (cpu_selected(target_cpu)) - goto exit; - } - - if (prefer_idle) { - target_cpu = find_prefer_idle_target(sd, p, min_util); - if (cpu_selected(target_cpu)) - goto exit; - } - - target_cpu = find_best_target(p, backup_cpu, 0, 0); - -exit: - - return target_cpu; -} - 
-/**********************************************************************
- *                               Sysfs                                *
- **********************************************************************/
-static struct attribute *ehmp_attrs[] = {
-	&global_boost_attr.attr,
-	&min_residency_attr.attr,
-	&up_threshold_attr.attr,
-	&down_threshold_attr.attr,
-	&overutil_ratio_attr.attr,
-	&prefer_perf_attr.attr,
-	&initial_util_type.attr,
-	&initial_util_ratio.attr,
-	NULL,
-};
-
-static const struct attribute_group ehmp_group = {
-	.attrs = ehmp_attrs,
-};
-
-static struct kobject *ehmp_kobj;
-
-static int __init init_sysfs(void)
-{
-	int ret;
-
-	ehmp_kobj = kobject_create_and_add("ehmp", kernel_kobj);
-	ret = sysfs_create_group(ehmp_kobj, &ehmp_group);
-
-	return 0;
-}
-late_initcall(init_sysfs);
diff --git a/kernel/sched/ems/Makefile b/kernel/sched/ems/Makefile
new file mode 100644
index 000000000000..f2b1f7be7905
--- /dev/null
+++ b/kernel/sched/ems/Makefile
@@ -0,0 +1,2 @@
+obj-$(CONFIG_SCHED_EHMP) += ehmp.o
+obj-$(CONFIG_FREQVAR_TUNE) += freqvar_tune.o
diff --git a/kernel/sched/ems/ehmp.c b/kernel/sched/ems/ehmp.c
new file mode 100644
index 000000000000..01f64b0628a6
--- /dev/null
+++ b/kernel/sched/ems/ehmp.c
@@ -0,0 +1,2064 @@
+/*
+ * Exynos scheduler for Heterogeneous Multi-Processing (HMP)
+ *
+ * Copyright (C) 2017 Samsung Electronics Co., Ltd
+ * Park Bumgyu
+ */
+
+#include
+#include
+#include
+#include
+#include
+
+#define CREATE_TRACE_POINTS
+#include
+
+#include "../sched.h"
+#include "../tune.h"
+
+/**********************************************************************
+ *                          extern functions                          *
+ **********************************************************************/
+extern struct sched_entity *__pick_next_entity(struct sched_entity *se);
+extern unsigned long boosted_task_util(struct task_struct *task);
+extern unsigned long capacity_curr_of(int cpu);
+extern int find_best_target(struct task_struct *p, int *backup_cpu,
+				bool boosted, bool prefer_idle);
+extern u64 decay_load(u64 val, u64 n);
+extern int start_cpu(bool boosted);
+
+unsigned long task_util(struct task_struct *p)
+{
+	if (rt_task(p))
+		return p->rt.avg.util_avg;
+	else
+		return p->se.avg.util_avg;
+}
+
+static inline struct task_struct *task_of(struct sched_entity *se)
+{
+	return container_of(se, struct task_struct, se);
+}
+
+static inline struct sched_entity *se_of(struct sched_avg *sa)
+{
+	return container_of(sa, struct sched_entity, avg);
+}
+
+static inline int task_fits(struct task_struct *p, long capacity)
+{
+	return capacity * 1024 > boosted_task_util(p) * 1248;
+}
+
+#define entity_is_cfs_rq(se)	(se->my_q)
+#define entity_is_task(se)	(!se->my_q)
+#define LOAD_AVG_MAX		47742
+
+static unsigned long maxcap_val = 1024;
+static int maxcap_cpu = 7;
+
+void ehmp_update_max_cpu_capacity(int cpu, unsigned long val)
+{
+	maxcap_cpu = cpu;
+	maxcap_val = val;
+}
+
+static inline struct device_node *get_ehmp_node(void)
+{
+	return of_find_node_by_path("/cpus/ehmp");
+}
+
+static inline struct cpumask *sched_group_cpus(struct sched_group *sg)
+{
+	return to_cpumask(sg->cpumask);
+}
+
+#define tsk_cpus_allowed(tsk) (&(tsk)->cpus_allowed)
+
+/**********************************************************************
+ *                            Energy diff                             *
+ **********************************************************************/
+#define EAS_CPU_PRV	0
+#define EAS_CPU_NXT	1
+#define EAS_CPU_BKP	2
+
+int exynos_estimate_idle_state(int cpu_idx, struct cpumask *mask,
+				int state, int cpus)
+{
+	unsigned int deepest_state_residency = 0;
+	unsigned int next_timer_us = 0;
+	int
grp_nr_running = 0; + int deepest_state = 0; + int i; + int estimate_state = 0; + + if (cpu_idx == EAS_CPU_PRV) + grp_nr_running++; + + for_each_cpu(i, mask) { + grp_nr_running += cpu_rq(i)->nr_running; + + next_timer_us = ktime_to_us(tick_nohz_get_sleep_length_cpu(i)); + deepest_state_residency = cpuidle_get_target_residency(i, state); + + if (next_timer_us > deepest_state_residency) + deepest_state++; + } + + if (!grp_nr_running && deepest_state == cpus) + estimate_state = state + 1; + + return estimate_state; +} + +/********************************************************************** + * task initialization * + **********************************************************************/ +enum { + TYPE_BASE_CFS_RQ_UTIL = 0, + TYPE_BASE_INHERIT_PARENT_UTIL, + TYPE_MAX_NUM, +}; + +static unsigned long init_util_type = TYPE_BASE_CFS_RQ_UTIL; +static unsigned long init_util_ratio = 25; /* 25% */ + +static ssize_t show_initial_util_type(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + return snprintf(buf, 10, "%ld\n", init_util_type); +} + +static ssize_t store_initial_util_type(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + long input; + + if (!sscanf(buf, "%ld", &input)) + return -EINVAL; + + input = input < 0 ? 0 : input; + input = input >= TYPE_MAX_NUM ? TYPE_MAX_NUM - 1 : input; + + init_util_type = input; + + return count; +} + +static ssize_t show_initial_util_ratio(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + return snprintf(buf, 10, "%ld\n", init_util_ratio); +} + +static ssize_t store_initial_util_ratio(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + long input; + + if (!sscanf(buf, "%ld", &input)) + return -EINVAL; + + init_util_ratio = !!input; + + return count; +} + +static struct kobj_attribute initial_util_type = +__ATTR(initial_util_type, 0644, show_initial_util_type, store_initial_util_type); + +static struct kobj_attribute initial_util_ratio = +__ATTR(initial_util_ratio, 0644, show_initial_util_ratio, store_initial_util_ratio); + +void base_cfs_rq_util(struct sched_entity *se) +{ + struct cfs_rq *cfs_rq = se->cfs_rq; + struct sched_avg *sa = &se->avg; + int cpu = cpu_of(cfs_rq->rq); + unsigned long cap_org = capacity_orig_of(cpu); + long cap = (long)(cap_org - cfs_rq->avg.util_avg) / 2; + + if (cap > 0) { + if (cfs_rq->avg.util_avg != 0) { + sa->util_avg = cfs_rq->avg.util_avg * se->load.weight; + sa->util_avg /= (cfs_rq->avg.load_avg + 1); + + if (sa->util_avg > cap) + sa->util_avg = cap; + } else { + sa->util_avg = cap_org * init_util_ratio / 100; + } + /* + * If we wish to restore tuning via setting initial util, + * this is where we should do it. 
+ */ + sa->util_sum = sa->util_avg * LOAD_AVG_MAX; + } +} + +void base_inherit_parent_util(struct sched_entity *se) +{ + struct sched_avg *sa = &se->avg; + struct task_struct *p = current; + + sa->util_avg = p->se.avg.util_avg; + sa->util_sum = p->se.avg.util_sum; +} + +void exynos_init_entity_util_avg(struct sched_entity *se) +{ + int type = init_util_type; + + switch(type) { + case TYPE_BASE_CFS_RQ_UTIL: + base_cfs_rq_util(se); + break; + case TYPE_BASE_INHERIT_PARENT_UTIL: + base_inherit_parent_util(se); + break; + default: + pr_info("%s: Not support initial util type %ld\n", + __func__, init_util_type); + } +} + +/********************************************************************** + * load balance * + **********************************************************************/ +#define lb_sd_parent(sd) \ + (sd->parent && sd->parent->groups != sd->parent->groups->next) + +struct sched_group * +exynos_fit_idlest_group(struct sched_domain *sd, struct task_struct *p) +{ + struct sched_group *group = sd->groups; + struct sched_group *fit_group = NULL; + unsigned long fit_capacity = ULONG_MAX; + + do { + int i; + + /* Skip over this group if it has no CPUs allowed */ + if (!cpumask_intersects(sched_group_span(group), + &p->cpus_allowed)) + continue; + + for_each_cpu(i, sched_group_span(group)) { + if (capacity_of(i) < fit_capacity && task_fits(p, capacity_of(i))) { + fit_capacity = capacity_of(i); + fit_group = group; + } + } + } while (group = group->next, group != sd->groups); + + return fit_group; +} + +static inline int +check_cpu_capacity(struct rq *rq, struct sched_domain *sd) +{ + return ((rq->cpu_capacity * sd->imbalance_pct) < + (rq->cpu_capacity_orig * 100)); +} + +unsigned long global_boost(void); +int exynos_need_active_balance(enum cpu_idle_type idle, struct sched_domain *sd, + int src_cpu, int dst_cpu) +{ + unsigned int src_imb_pct = lb_sd_parent(sd) ? sd->imbalance_pct : 1; + unsigned int dst_imb_pct = lb_sd_parent(sd) ? 
100 : 1; + unsigned long src_cap = capacity_of(src_cpu); + unsigned long dst_cap = capacity_of(dst_cpu); + int level = sd->level; + + /* dst_cpu is idle */ + if ((idle != CPU_NOT_IDLE) && + (cpu_rq(src_cpu)->cfs.h_nr_running == 1)) { + if ((check_cpu_capacity(cpu_rq(src_cpu), sd)) && + (src_cap * sd->imbalance_pct < dst_cap * 100)) { + return 1; + } + + /* This domain is top and dst_cpu is bigger than src_cpu*/ + if (!lb_sd_parent(sd) && src_cap < dst_cap) + if (lbt_overutilized(src_cpu, level) || global_boost()) + return 1; + } + + if ((src_cap * src_imb_pct < dst_cap * dst_imb_pct) && + cpu_rq(src_cpu)->cfs.h_nr_running == 1 && + lbt_overutilized(src_cpu, level) && + !lbt_overutilized(dst_cpu, level)) { + return 1; + } + + return unlikely(sd->nr_balance_failed > sd->cache_nice_tries + 2); +} + +/****************************************************************/ +/* Load Balance Trigger */ +/****************************************************************/ +#define DISABLE_OU -1 +#define DEFAULT_OU_RATIO 80 + +struct lbt_overutil { + bool top; + struct cpumask cpus; + unsigned long capacity; + int ratio; +}; +DEFINE_PER_CPU(struct lbt_overutil *, lbt_overutil); + +static inline int get_topology_depth(void) +{ + struct sched_domain *sd; + + for_each_domain(0, sd) { + if (sd->parent == NULL) + return sd->level; + } + + return -1; +} + +static inline int get_last_level(struct lbt_overutil *ou) +{ + int level; + + for (level = 0; &ou[level] != NULL; level++) { + if (ou[level].top == true) + return level; + } + + return -1; +} + +/****************************************************************/ +/* External APIs */ +/****************************************************************/ +bool lbt_overutilized(int cpu, int level) +{ + struct lbt_overutil *ou = per_cpu(lbt_overutil, cpu); + bool overutilized; + + if (!ou) + return false; + + overutilized = (cpu_util(cpu) > ou[level].capacity) ? 
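/*
 * Aside (worked example, values assumed): taking a ratio of 80 -- the
 * DEFAULT_OU_RATIO fallback defined above -- update_lbt_overutil() below
 * derives the per-level threshold as
 *
 *	ou[level].capacity = capacity * 80 / 100;	e.g. 1024 * 80 / 100 = 819
 *
 * so a CPU whose utilization climbs past 819 reports as overutilized at
 * that topology level, which is one of the conditions
 * exynos_need_active_balance() above uses to fire an active balance.
 */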
true : false; + + if (overutilized) + trace_ehmp_lbt_overutilized(cpu, level, cpu_util(cpu), + ou[level].capacity, overutilized); + + return overutilized; +} + +void update_lbt_overutil(int cpu, unsigned long capacity) +{ + struct lbt_overutil *ou = per_cpu(lbt_overutil, cpu); + int level, last = get_last_level(ou); + + for (level = 0; level <= last; level++) { + if (ou[level].ratio == DISABLE_OU) + continue; + + ou[level].capacity = (capacity * ou[level].ratio) / 100; + } +} + +/****************************************************************/ +/* SYSFS */ +/****************************************************************/ +static ssize_t show_overutil_ratio(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + struct lbt_overutil *ou = per_cpu(lbt_overutil, 0); + int level, last = get_last_level(ou); + int cpu, ret = 0; + + for (level = 0; level <= last; level++) { + ret += sprintf(buf + ret, "[level%d]\n", level); + + for_each_possible_cpu(cpu) { + ou = per_cpu(lbt_overutil, cpu); + + if (ou[level].ratio == DISABLE_OU) + continue; + + ret += sprintf(buf + ret, "cpu%d ratio:%3d capacity:%4lu\n", + cpu, ou[level].ratio, ou[level].capacity); + } + } + + return ret; +} + +static ssize_t store_overutil_ratio(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + struct lbt_overutil *ou; + unsigned long capacity; + int cpu, level, ratio; + int last; + + if (sscanf(buf, "%d %d %d", &cpu, &level, &ratio) != 3) + return -EINVAL; + + /* Check cpu is possible */ + if (!cpumask_test_cpu(cpu, cpu_possible_mask)) + return -EINVAL; + ou = per_cpu(lbt_overutil, cpu); + + /* Check level range */ + last = get_last_level(ou); + if (last < 0 || level < 0 || level > last) + return -EINVAL; + + /* If ratio is outrage, disable overutil */ + if (ratio < 0 || ratio > 100) + ratio = DEFAULT_OU_RATIO; + + for_each_cpu(cpu, &ou[level].cpus) { + ou = per_cpu(lbt_overutil, cpu); + if (ou[level].ratio == DISABLE_OU) + continue; + + ou[level].ratio = ratio; + capacity = capacity_orig_of(cpu); + update_lbt_overutil(cpu, capacity); + } + + return count; +} + +static struct kobj_attribute overutil_ratio_attr = +__ATTR(overutil_ratio, 0644, show_overutil_ratio, store_overutil_ratio); + +/****************************************************************/ +/* Initialization */ +/****************************************************************/ +static void free_lbt_overutil(void) +{ + int cpu; + + for_each_possible_cpu(cpu) { + if (per_cpu(lbt_overutil, cpu)) + kfree(per_cpu(lbt_overutil, cpu)); + } +} + +static int alloc_lbt_overutil(void) +{ + int cpu, depth = get_topology_depth(); + + for_each_possible_cpu(cpu) { + struct lbt_overutil *ou = kzalloc(sizeof(struct lbt_overutil) * + (depth + 1), GFP_KERNEL); + if (!ou) + goto fail_alloc; + + per_cpu(lbt_overutil, cpu) = ou; + } + return 0; + +fail_alloc: + free_lbt_overutil(); + return -ENOMEM; +} + +static int set_lbt_overutil(int level, const char *mask, int ratio) +{ + struct lbt_overutil *ou; + struct cpumask cpus; + bool top, overlap = false; + int cpu; + + cpulist_parse(mask, &cpus); + cpumask_and(&cpus, &cpus, cpu_possible_mask); + if (!cpumask_weight(&cpus)) + return -ENODEV; + + /* If sibling cpus is same with possible cpus, it is top level */ + top = cpumask_equal(&cpus, cpu_possible_mask); + + /* If this level is overlapped with prev level, disable this level */ + if (level > 0) { + ou = per_cpu(lbt_overutil, cpumask_first(&cpus)); + overlap = cpumask_equal(&cpus, &ou[level-1].cpus); + } + + for_each_cpu(cpu, 
&cpus) { + ou = per_cpu(lbt_overutil, cpu); + cpumask_copy(&ou[level].cpus, &cpus); + ou[level].ratio = overlap ? DISABLE_OU : ratio; + ou[level].top = top; + } + + return 0; +} + +static int parse_lbt_overutil(struct device_node *dn) +{ + struct device_node *lbt, *ou; + int level, depth = get_topology_depth(); + int ret = 0; + + lbt = of_get_child_by_name(dn, "lbt"); + if (!lbt) + return -ENODEV; + + for (level = 0; level <= depth; level++) { + char name[20]; + const char *mask[NR_CPUS]; + int ratio[NR_CPUS]; + int i, proplen; + + snprintf(name, sizeof(name), "overutil-level%d", level); + ou = of_get_child_by_name(lbt, name); + if (!ou) { + ret = -ENODEV; + goto out; + } + + proplen = of_property_count_strings(ou, "cpus"); + if ((proplen < 0) || (proplen != of_property_count_u32_elems(ou, "ratio"))) { + of_node_put(ou); + ret = -ENODEV; + goto out; + } + + of_property_read_string_array(ou, "cpus", mask, proplen); + of_property_read_u32_array(ou, "ratio", ratio, proplen); + of_node_put(ou); + + for (i = 0; i < proplen; i++) { + ret = set_lbt_overutil(level, mask[i], ratio[i]); + if (ret) + goto out; + } + } + +out: + of_node_put(lbt); + return ret; +} + +static int __init init_lbt(void) +{ + struct device_node *dn; + int ret; + + dn = of_find_node_by_path("/cpus/ehmp"); + if (!dn) + return 0; + + ret = alloc_lbt_overutil(); + if (ret) { + pr_err("Failed to allocate lbt_overutil\n"); + goto out; + } + + ret = parse_lbt_overutil(dn); + if (ret) { + pr_err("Failed to parse lbt_overutil\n"); + free_lbt_overutil(); + goto out; + } + +out: + of_node_put(dn); + return ret; +} +pure_initcall(init_lbt); +/********************************************************************** + * Global boost * + **********************************************************************/ +static unsigned long gb_value = 0; +static unsigned long gb_max_value = 0; +static struct gb_qos_request gb_req_user = +{ + .name = "ehmp_gb_req_user", +}; + +static struct plist_head gb_list = PLIST_HEAD_INIT(gb_list); + +static DEFINE_SPINLOCK(gb_lock); + +static int gb_qos_max_value(void) +{ + return plist_last(&gb_list)->prio; +} + +static int gb_qos_req_value(struct gb_qos_request *req) +{ + return req->node.prio; +} + +void gb_qos_update_request(struct gb_qos_request *req, u32 new_value) +{ + unsigned long flags; + + if (req->node.prio == new_value) + return; + + spin_lock_irqsave(&gb_lock, flags); + + if (req->active) + plist_del(&req->node, &gb_list); + else + req->active = 1; + + plist_node_init(&req->node, new_value); + plist_add(&req->node, &gb_list); + + gb_value = gb_max_value * gb_qos_max_value() / 100; + trace_ehmp_global_boost(req->name, new_value); + + spin_unlock_irqrestore(&gb_lock, flags); +} + +static ssize_t show_global_boost(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + struct gb_qos_request *req; + int ret = 0; + + plist_for_each_entry(req, &gb_list, node) + ret += snprintf(buf + ret, 30, "%s : %d\n", + req->name, gb_qos_req_value(req)); + + return ret; +} + +static ssize_t store_global_boost(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + unsigned int input; + + if (!sscanf(buf, "%d", &input)) + return -EINVAL; + + gb_qos_update_request(&gb_req_user, input); + + return count; +} + +static struct kobj_attribute global_boost_attr = +__ATTR(global_boost, 0644, show_global_boost, store_global_boost); + +#define BOOT_BOOST_DURATION 40000000 /* microseconds */ +unsigned long global_boost(void) +{ + u64 now = ktime_to_us(ktime_get()); + + if (now < 
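/*
 * Aside (sketch): global_boost() here returns the full boost value,
 * gb_max_value, for the first BOOT_BOOST_DURATION (40000000 us = 40 s) of
 * uptime; afterwards it returns gb_value, which gb_qos_update_request()
 * above recomputes as
 *
 *	gb_value = gb_max_value * (largest active QoS request) / 100;
 *
 * so a single request of 50 yields roughly half of gb_max_value, and
 * gb_max_value itself is seeded below from the second-largest CPU
 * capacity in the system plus one.
 */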
BOOT_BOOST_DURATION) + return gb_max_value; + + return gb_value; +} + +int find_second_max_cap(void) +{ + struct sched_domain *sd = rcu_dereference(per_cpu(sd_ea, 0)); + struct sched_group *sg; + int max_cap = 0, second_max_cap = 0; + + if (!sd) + return 0; + + sg = sd->groups; + do { + int i; + + for_each_cpu(i, sched_group_cpus(sg)) { + if (max_cap < cpu_rq(i)->cpu_capacity_orig) { + second_max_cap = max_cap; + max_cap = cpu_rq(i)->cpu_capacity_orig; + } + } + } while (sg = sg->next, sg != sd->groups); + + return second_max_cap; +} + +static int __init init_global_boost(void) +{ + gb_max_value = find_second_max_cap() + 1; + + return 0; +} +pure_initcall(init_global_boost); + +/********************************************************************** + * Boost cpu selection (global boost, schedtune.prefer_perf) * + **********************************************************************/ +#define cpu_selected(cpu) (cpu >= 0) + +int kernel_prefer_perf(int grp_idx); +static ssize_t show_prefer_perf(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + int i, ret = 0; + + for (i = 0; i < STUNE_GROUP_COUNT; i++) + ret += snprintf(buf + ret, 10, "%d ", kernel_prefer_perf(i)); + + ret += snprintf(buf + ret, 10, "\n"); + + return ret; +} + +static struct kobj_attribute prefer_perf_attr = +__ATTR(kernel_prefer_perf, 0444, show_prefer_perf, NULL); + +enum { + BT_PREFER_PERF = 0, + BT_GROUP_BALANCE, + BT_GLOBAL_BOOST, +}; + +struct boost_trigger { + int trigger; + int boost_val; +}; + +static int check_boost_trigger(struct task_struct *p, struct boost_trigger *bt) +{ + int gb; + +#ifdef CONFIG_SCHED_TUNE + if (schedtune_prefer_perf(p) > 0) { + bt->trigger = BT_PREFER_PERF; + bt->boost_val = schedtune_perf_threshold(); + return 1; + } + + if (schedtune_need_group_balance(p) > 0) { + bt->trigger = BT_GROUP_BALANCE; + bt->boost_val = schedtune_perf_threshold(); + return 1; + } +#endif + + gb = global_boost(); + if (gb) { + bt->trigger = BT_GLOBAL_BOOST; + bt->boost_val = gb; + return 1; + } + + /* not boost state */ + return 0; +} + +static int boost_select_cpu(struct task_struct *p, struct cpumask *target_cpus) +{ + int i, cpu = 0; + + if (cpumask_empty(target_cpus)) + return -1; + + if (cpumask_test_cpu(task_cpu(p), target_cpus)) + return task_cpu(p); + + /* Return last cpu in target_cpus */ + for_each_cpu(i, target_cpus) + cpu = i; + + return cpu; +} + +static void mark_shallowest_cpu(int cpu, unsigned int *min_exit_latency, + struct cpumask *shallowest_cpus) +{ + struct rq *rq = cpu_rq(cpu); + struct cpuidle_state *idle = idle_get_state(rq); + + /* Before enabling cpuidle, all idle cpus are marked */ + if (!idle) { + cpumask_set_cpu(cpu, shallowest_cpus); + return; + } + + /* Deeper idle cpu is ignored */ + if (idle->exit_latency > *min_exit_latency) + return; + + /* if shallower idle cpu is found, previsouly founded cpu is ignored */ + if (idle->exit_latency < *min_exit_latency) { + cpumask_clear(shallowest_cpus); + *min_exit_latency = idle->exit_latency; + } + + cpumask_set_cpu(cpu, shallowest_cpus); +} +static int check_migration_task(struct task_struct *p) +{ + return !p->se.avg.last_update_time; +} + +unsigned long cpu_util_wake(int cpu, struct task_struct *p) +{ + unsigned long util, capacity; + + /* Task has no contribution or is new */ + if (cpu != task_cpu(p) || check_migration_task(p)) + return cpu_util(cpu); + + capacity = capacity_orig_of(cpu); + util = max_t(long, cpu_util(cpu) - task_util(p), 0); + + return (util >= capacity) ? 
capacity : util; +} + +static int find_group_boost_target(struct task_struct *p) +{ + struct sched_domain *sd; + int shallowest_cpu = -1; + int lowest_cpu = -1; + unsigned int min_exit_latency = UINT_MAX; + unsigned long lowest_util = ULONG_MAX; + int target_cpu = -1; + int cpu; + char state[30] = "fail"; + + sd = rcu_dereference(per_cpu(sd_ea, maxcap_cpu)); + if (!sd) + return target_cpu; + + if (cpumask_test_cpu(task_cpu(p), sched_group_cpus(sd->groups))) { + if (idle_cpu(task_cpu(p))) { + target_cpu = task_cpu(p); + strcpy(state, "current idle"); + goto find_target; + } + } + + for_each_cpu_and(cpu, tsk_cpus_allowed(p), sched_group_cpus(sd->groups)) { + unsigned long util = cpu_util_wake(cpu, p); + + if (idle_cpu(cpu)) { + struct cpuidle_state *idle; + + idle = idle_get_state(cpu_rq(cpu)); + if (!idle) { + target_cpu = cpu; + strcpy(state, "idle wakeup"); + goto find_target; + } + + if (idle->exit_latency < min_exit_latency) { + min_exit_latency = idle->exit_latency; + shallowest_cpu = cpu; + continue; + } + } + + if (cpu_selected(shallowest_cpu)) + continue; + + if (util < lowest_util) { + lowest_cpu = cpu; + lowest_util = util; + } + } + + if (cpu_selected(shallowest_cpu)) { + target_cpu = shallowest_cpu; + strcpy(state, "shallowest idle"); + goto find_target; + } + + if (cpu_selected(lowest_cpu)) { + target_cpu = lowest_cpu; + strcpy(state, "lowest util"); + } + +find_target: + trace_ehmp_select_group_boost(p, target_cpu, state); + + return target_cpu; +} + +static int +find_boost_target(struct sched_domain *sd, struct task_struct *p, + unsigned long min_util, struct boost_trigger *bt) +{ + struct sched_group *sg; + int boost = bt->boost_val; + unsigned long max_capacity; + struct cpumask boost_candidates; + struct cpumask backup_boost_candidates; + unsigned int min_exit_latency = UINT_MAX; + unsigned int backup_min_exit_latency = UINT_MAX; + int target_cpu; + bool go_up = false; + unsigned long lowest_util = ULONG_MAX; + int lowest_cpu = -1; + char state[30] = "fail"; + + if (bt->trigger == BT_GROUP_BALANCE) + return find_group_boost_target(p); + + cpumask_setall(&boost_candidates); + cpumask_clear(&backup_boost_candidates); + + max_capacity = maxcap_val; + + sg = sd->groups; + + do { + int i; + + for_each_cpu_and(i, tsk_cpus_allowed(p), sched_group_cpus(sg)) { + unsigned long new_util, wake_util; + + if (!cpu_online(i)) + continue; + + wake_util = cpu_util_wake(i, p); + new_util = wake_util + task_util(p); + new_util = max(min_util, new_util); + + if (min(new_util + boost, max_capacity) > capacity_orig_of(i)) { + if (!cpu_rq(i)->nr_running) + mark_shallowest_cpu(i, &backup_min_exit_latency, + &backup_boost_candidates); + else if (cpumask_test_cpu(task_cpu(p), sched_group_cpus(sg))) + go_up = true; + + continue; + } + + if (cpumask_weight(&boost_candidates) >= nr_cpu_ids) + cpumask_clear(&boost_candidates); + + if (!cpu_rq(i)->nr_running) { + mark_shallowest_cpu(i, &min_exit_latency, &boost_candidates); + continue; + } + + if (wake_util < lowest_util) { + lowest_util = wake_util; + lowest_cpu = i; + } + } + + if (cpumask_weight(&boost_candidates) >= nr_cpu_ids) + continue; + + target_cpu = boost_select_cpu(p, &boost_candidates); + if (cpu_selected(target_cpu)) { + strcpy(state, "big idle"); + goto out; + } + + target_cpu = boost_select_cpu(p, &backup_boost_candidates); + if (cpu_selected(target_cpu)) { + strcpy(state, "little idle"); + goto out; + } + } while (sg = sg->next, sg != sd->groups); + + if (go_up) { + strcpy(state, "lowest big cpu"); + target_cpu = lowest_cpu; + goto out; 
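/*
 * Aside: the per-CPU admission test applied in the loop above, reduced to
 * a standalone sketch (hypothetical helper, plain parameters).  A candidate
 * CPU is kept only if its original capacity can absorb the task's boosted
 * demand, with the demand clamped to the largest capacity in the system.
 */
static bool cpu_fits_boosted_util(unsigned long wake_util, unsigned long task_util,
				  unsigned long min_util, unsigned long boost,
				  unsigned long max_capacity, unsigned long cpu_cap_orig)
{
	unsigned long new_util = wake_util + task_util;

	if (new_util < min_util)
		new_util = min_util;		/* respect the boosted minimum */

	new_util += boost;
	if (new_util > max_capacity)
		new_util = max_capacity;	/* min(new_util + boost, max_capacity) */

	return new_util <= cpu_cap_orig;
}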
+ } + + strcpy(state, "current cpu"); + target_cpu = task_cpu(p); + +out: + trace_ehmp_select_boost_cpu(p, target_cpu, bt->trigger, state); + return target_cpu; +} + +/********************************************************************** + * schedtune.prefer_idle * + **********************************************************************/ +static void mark_lowest_cpu(int cpu, unsigned long new_util, + int *lowest_cpu, unsigned long *lowest_util) +{ + if (new_util >= *lowest_util) + return; + + *lowest_util = new_util; + *lowest_cpu = cpu; +} + +static int find_prefer_idle_target(struct sched_domain *sd, + struct task_struct *p, unsigned long min_util) +{ + struct sched_group *sg; + int target_cpu = -1; + int lowest_cpu = -1; + int lowest_idle_cpu = -1; + int overcap_cpu = -1; + unsigned long lowest_util = ULONG_MAX; + unsigned long lowest_idle_util = ULONG_MAX; + unsigned long overcap_util = ULONG_MAX; + struct cpumask idle_candidates; + struct cpumask overcap_idle_candidates; + + cpumask_clear(&idle_candidates); + cpumask_clear(&overcap_idle_candidates); + + sg = sd->groups; + + do { + int i; + + for_each_cpu_and(i, tsk_cpus_allowed(p), sched_group_cpus(sg)) { + unsigned long new_util, wake_util; + + if (!cpu_online(i)) + continue; + + wake_util = cpu_util_wake(i, p); + new_util = wake_util + task_util(p); + new_util = max(min_util, new_util); + + trace_ehmp_prefer_idle(p, task_cpu(p), i, task_util(p), + new_util, idle_cpu(i)); + + if (new_util > capacity_orig_of(i)) { + if (idle_cpu(i)) { + cpumask_set_cpu(i, &overcap_idle_candidates); + mark_lowest_cpu(i, new_util, + &overcap_cpu, &overcap_util); + } + + continue; + } + + if (idle_cpu(i)) { + if (task_cpu(p) == i) { + target_cpu = i; + break; + } + + cpumask_set_cpu(i, &idle_candidates); + mark_lowest_cpu(i, new_util, + &lowest_idle_cpu, &lowest_idle_util); + + continue; + } + + mark_lowest_cpu(i, new_util, &lowest_cpu, &lowest_util); + } + + if (cpu_selected(target_cpu)) + break; + + if (cpumask_weight(&idle_candidates)) { + target_cpu = lowest_idle_cpu; + break; + } + + if (cpu_selected(lowest_cpu)) { + target_cpu = lowest_cpu; + break; + } + + } while (sg = sg->next, sg != sd->groups); + + if (cpu_selected(target_cpu)) + goto out; + + if (cpumask_weight(&overcap_idle_candidates)) { + if (cpumask_test_cpu(task_cpu(p), &overcap_idle_candidates)) + target_cpu = task_cpu(p); + else + target_cpu = overcap_cpu; + + goto out; + } + +out: + trace_ehmp_prefer_idle_cpu_select(p, target_cpu); + + return target_cpu; +} + +/****************************************************************/ +/* On-time migration */ +/****************************************************************/ +#define TASK_TRACK_COUNT 5 + +#define ontime_task_cpu(p) (ontime_of(p)->cpu) +#define ontime_flag(p) (ontime_of(p)->flags) +#define ontime_migration_time(p) (ontime_of(p)->avg.ontime_migration_time) +#define ontime_load_avg(p) (ontime_of(p)->avg.load_avg) + +#define cap_scale(v, s) ((v)*(s) >> SCHED_CAPACITY_SHIFT) +#define mincap_of(__cpu) (sge_array[__cpu][SD_LEVEL0]->cap_states[0].cap) + +/* Structure of ontime migration condition */ +struct ontime_cond { + unsigned long up_threshold; + unsigned long down_threshold; + unsigned int min_residency_us; + + struct cpumask src_cpus; + struct cpumask dst_cpus; + + struct ontime_cond *next; +}; +static struct ontime_cond *ontime_cond; + +/* Structure of ontime migration environment */ +struct ontime_env { + struct rq *dst_rq; + int dst_cpu; + struct rq *src_rq; + int src_cpu; + struct task_struct *target_task; + int 
boost_migration; +}; +DEFINE_PER_CPU(struct ontime_env, ontime_env); + +static unsigned long get_up_threshold(int cpu) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->src_cpus)) + return cond->up_threshold; + + cond = cond->next; + } + + return -EINVAL; +} + +static int set_up_threshold(int cpu, unsigned long val) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->src_cpus)) { + cond->up_threshold = val; + return 0; + } + + cond = cond->next; + } + + return -EINVAL; +} + +static unsigned long get_down_threshold(int cpu) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->dst_cpus)) + return cond->down_threshold; + + cond = cond->next; + } + + return -EINVAL; +} + +static int set_down_threshold(int cpu, unsigned long val) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->dst_cpus)) { + cond->down_threshold = val; + return 0; + } + + cond = cond->next; + } + + return -EINVAL; +} + +static unsigned int get_min_residency(int cpu) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->dst_cpus)) + return cond->min_residency_us; + + cond = cond->next; + } + + return -EINVAL; +} + +static int set_min_residency(int cpu, int val) +{ + struct ontime_cond *cond = ontime_cond; + + while (cond) { + if (cpumask_test_cpu(cpu, &cond->dst_cpus)) { + cond->min_residency_us = val; + return 0; + } + + cond = cond->next; + } + + return -EINVAL; +} + +static inline void include_ontime_task(struct task_struct *p, int dst_cpu) +{ + ontime_flag(p) = ONTIME; + ontime_task_cpu(p) = dst_cpu; + + /* Manage time based on clock task of boot cpu(cpu0) */ + ontime_migration_time(p) = cpu_rq(0)->clock_task; +} + +static inline void exclude_ontime_task(struct task_struct *p) +{ + ontime_task_cpu(p) = 0; + ontime_migration_time(p) = 0; + ontime_flag(p) = NOT_ONTIME; +} + +static int +ontime_select_target_cpu(struct cpumask *dst_cpus, const struct cpumask *mask) +{ + int cpu; + int dest_cpu = -1; + unsigned int min_exit_latency = UINT_MAX; + struct cpuidle_state *idle; + + rcu_read_lock(); + for_each_cpu_and(cpu, dst_cpus, mask) { + if (!idle_cpu(cpu)) + continue; + + if (cpu_rq(cpu)->ontime_migrating) + continue; + + idle = idle_get_state(cpu_rq(cpu)); + if (!idle) { + rcu_read_unlock(); + return cpu; + } + + if (idle && idle->exit_latency < min_exit_latency) { + min_exit_latency = idle->exit_latency; + dest_cpu = cpu; + } + } + + rcu_read_unlock(); + return dest_cpu; +} + +extern struct sched_entity *__pick_next_entity(struct sched_entity *se); +static struct task_struct * +ontime_pick_heavy_task(struct sched_entity *se, struct cpumask *dst_cpus, + int *boost_migration) +{ + struct task_struct *heaviest_task = NULL; + struct task_struct *p; + unsigned int max_util_avg = 0; + int task_count = 0; + int boosted = !!global_boost(); + + /* + * Since current task does not exist in entity list of cfs_rq, + * check first that current task is heavy. 
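/*
 * Aside: the residency check used later by ontime_task_wakeup() and
 * ontime_can_migration(), as a standalone sketch (hypothetical helper).
 * Timestamps are taken from cpu0's clock_task, and the >> 10 turns
 * nanoseconds into approximate microseconds, so the default
 * min_residency_us of 8192 corresponds to roughly 8.4 ms on the big side
 * before a task may be released back.
 */
static bool ontime_residency_expired(u64 now_ns, u64 migrated_ns,
				     unsigned int min_residency_us)
{
	u64 delta_us = (now_ns - migrated_ns) >> 10;	/* ns -> ~us */

	return delta_us > min_residency_us;
}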
+ */ + p = task_of(se); + if (boosted || ontime_load_avg(p) >= get_up_threshold(task_cpu(p))) { + heaviest_task = task_of(se); + max_util_avg = ontime_load_avg(task_of(se)); + if (boosted) + *boost_migration = 1; + } + + se = __pick_first_entity(se->cfs_rq); + while (se && task_count < TASK_TRACK_COUNT) { + /* Skip non-task entity */ + if (entity_is_cfs_rq(se)) + goto next_entity; + + p = task_of(se); + if (schedtune_prefer_perf(p)) { + heaviest_task = p; + *boost_migration = 1; + break; + } + + if (!boosted && ontime_load_avg(p) < + get_up_threshold(task_cpu(p))) + goto next_entity; + + if (ontime_load_avg(p) > max_util_avg && + cpumask_intersects(dst_cpus, tsk_cpus_allowed(p))) { + heaviest_task = p; + max_util_avg = ontime_load_avg(p); + *boost_migration = boosted; + } + +next_entity: + se = __pick_next_entity(se); + task_count++; + } + + return heaviest_task; +} + +static int can_migrate(struct task_struct *p, struct ontime_env *env) +{ + if (!cpumask_test_cpu(env->dst_cpu, tsk_cpus_allowed(p))) + return 0; + + if (task_running(env->src_rq, p)) + return 0; + + return 1; +} + +static void move_task(struct task_struct *p, struct ontime_env *env) +{ + p->on_rq = TASK_ON_RQ_MIGRATING; + deactivate_task(env->src_rq, p, 0); + set_task_cpu(p, env->dst_cpu); + + activate_task(env->dst_rq, p, 0); + p->on_rq = TASK_ON_RQ_QUEUED; + check_preempt_curr(env->dst_rq, p, 0); +} + +static int move_specific_task(struct task_struct *target, struct ontime_env *env) +{ + struct task_struct *p, *n; + + list_for_each_entry_safe(p, n, &env->src_rq->cfs_tasks, se.group_node) { + if (!can_migrate(p, env)) + continue; + + if (p != target) + continue; + + move_task(p, env); + return 1; + } + + return 0; +} + +static int ontime_migration_cpu_stop(void *data) +{ + struct ontime_env *env = data; + struct rq *src_rq, *dst_rq; + int src_cpu, dst_cpu; + struct task_struct *p; + struct sched_domain *sd; + int boost_migration; + + /* Initialize environment data */ + src_rq = env->src_rq; + dst_rq = env->dst_rq = cpu_rq(env->dst_cpu); + src_cpu = env->src_cpu = env->src_rq->cpu; + dst_cpu = env->dst_cpu; + p = env->target_task; + boost_migration = env->boost_migration; + + raw_spin_lock_irq(&src_rq->lock); + + if (!(ontime_flag(p) & ONTIME_MIGRATING)) + goto out_unlock; + + if (p->exit_state) + goto out_unlock; + + if (unlikely(src_cpu != smp_processor_id())) + goto out_unlock; + + if (src_rq->nr_running <= 1) + goto out_unlock; + + if (src_rq != task_rq(p)) + goto out_unlock; + + BUG_ON(src_rq == dst_rq); + + double_lock_balance(src_rq, dst_rq); + + rcu_read_lock(); + for_each_domain(dst_cpu, sd) + if (cpumask_test_cpu(src_cpu, sched_domain_span(sd))) + break; + + if (likely(sd) && move_specific_task(p, env)) { + if (boost_migration) { + /* boost task is not classified as ontime task */ + exclude_ontime_task(p); + } else { + include_ontime_task(p, dst_cpu); + } + + rcu_read_unlock(); + double_unlock_balance(src_rq, dst_rq); + + trace_ehmp_ontime_migration(p, ontime_of(p)->avg.load_avg, + src_cpu, dst_cpu, boost_migration); + goto success_unlock; + } + + rcu_read_unlock(); + double_unlock_balance(src_rq, dst_rq); + +out_unlock: + exclude_ontime_task(p); + +success_unlock: + src_rq->active_balance = 0; + dst_rq->ontime_migrating = 0; + + raw_spin_unlock_irq(&src_rq->lock); + put_task_struct(p); + + return 0; +} + +static int ontime_task_wakeup(struct task_struct *p) +{ + struct ontime_cond *cond; + struct cpumask target_mask; + u64 delta; + int target_cpu = -1; + + /* When wakeup task is on ontime migrating, do not ontime 
wakeup */ + if (ontime_flag(p) == ONTIME_MIGRATING) + return -1; + + /* + * When wakeup task satisfies ontime condition to up migration, + * check there is a possible target cpu. + */ + if (ontime_load_avg(p) >= get_up_threshold(task_cpu(p))) { + cpumask_clear(&target_mask); + + for (cond = ontime_cond; cond != NULL; cond = cond->next) + if (cpumask_test_cpu(task_cpu(p), &cond->src_cpus)) { + cpumask_copy(&target_mask, &cond->dst_cpus); + break; + } + + target_cpu = ontime_select_target_cpu(&target_mask, tsk_cpus_allowed(p)); + + if (cpu_selected(target_cpu)) { + trace_ehmp_ontime_task_wakeup(p, task_cpu(p), + target_cpu, "up ontime"); + goto ontime_up; + } + } + + /* + * If wakeup task is not ontime and doesn't satisfy ontime condition, + * it cannot be ontime task. + */ + if (ontime_flag(p) == NOT_ONTIME) + goto ontime_out; + + if (ontime_flag(p) == ONTIME) { + /* + * If wakeup task is ontime but doesn't keep ontime condition, + * exclude this task from ontime. + */ + delta = cpu_rq(0)->clock_task - ontime_migration_time(p); + delta = delta >> 10; + + if (delta > get_min_residency(ontime_task_cpu(p)) && + ontime_load_avg(p) < get_down_threshold(ontime_task_cpu(p))) { + trace_ehmp_ontime_task_wakeup(p, task_cpu(p), -1, + "release ontime"); + goto ontime_out; + } + + /* + * If there is a possible cpu to stay ontime, task will wake up at this cpu. + */ + cpumask_copy(&target_mask, cpu_coregroup_mask(ontime_task_cpu(p))); + target_cpu = ontime_select_target_cpu(&target_mask, tsk_cpus_allowed(p)); + + if (cpu_selected(target_cpu)) { + trace_ehmp_ontime_task_wakeup(p, task_cpu(p), + target_cpu, "stay ontime"); + goto ontime_stay; + } + + trace_ehmp_ontime_task_wakeup(p, task_cpu(p), -1, "banished"); + goto ontime_out; + } + + if (!cpu_selected(target_cpu)) + goto ontime_out; + +ontime_up: + include_ontime_task(p, target_cpu); + +ontime_stay: + return target_cpu; + +ontime_out: + exclude_ontime_task(p); + return -1; +} + +static void ontime_update_next_balance(int cpu, struct ontime_avg *oa) +{ + if (cpumask_test_cpu(cpu, cpu_coregroup_mask(maxcap_cpu))) + return; + + if (oa->load_avg < get_up_threshold(cpu)) + return; + + /* + * Update the next_balance of this cpu because tick is most likely + * to occur first in currently running cpu. 
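/*
 * Aside: the decision order implemented by ontime_task_wakeup() above,
 * condensed for reference (sketch):
 *
 *   1. already ONTIME_MIGRATING             -> leave the wakeup path alone
 *   2. load >= up_threshold(src)            -> up-migrate if an idle dst CPU exists
 *   3. flag == NOT_ONTIME                   -> stay out of ontime
 *   4. flag == ONTIME:
 *        residency expired && load < down_threshold  -> release
 *        idle CPU within the ontime coregroup        -> stay there
 *        otherwise                                   -> release ("banished")
 */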
+ */ + cpu_rq(smp_processor_id())->next_balance = jiffies; +} + +extern u64 decay_load(u64 val, u64 n); +static u32 __accumulate_pelt_segments(u64 periods, u32 d1, u32 d3) +{ + u32 c1, c2, c3 = d3; + + c1 = decay_load((u64)d1, periods); + c2 = LOAD_AVG_MAX - decay_load(LOAD_AVG_MAX, periods) - 1024; + + return c1 + c2 + c3; +} + +/****************************************************************/ +/* External APIs */ +/****************************************************************/ +void ontime_trace_task_info(struct task_struct *p) +{ + trace_ehmp_ontime_load_avg_task(p, &ontime_of(p)->avg, ontime_flag(p)); +} + +DEFINE_PER_CPU(struct cpu_stop_work, ontime_migration_work); +static DEFINE_SPINLOCK(om_lock); + +void ontime_migration(void) +{ + struct ontime_cond *cond; + int cpu; + + if (!spin_trylock(&om_lock)) + return; + + for (cond = ontime_cond; cond != NULL; cond = cond->next) { + for_each_cpu_and(cpu, &cond->src_cpus, cpu_active_mask) { + unsigned long flags; + struct rq *rq; + struct sched_entity *se; + struct task_struct *p; + int dst_cpu; + struct ontime_env *env = &per_cpu(ontime_env, cpu); + int boost_migration = 0; + + rq = cpu_rq(cpu); + raw_spin_lock_irqsave(&rq->lock, flags); + + /* + * Ontime migration is not performed when active balance + * is in progress. + */ + if (rq->active_balance) { + raw_spin_unlock_irqrestore(&rq->lock, flags); + continue; + } + + /* + * No need to migration if source cpu does not have cfs + * tasks. + */ + if (!rq->cfs.curr) { + raw_spin_unlock_irqrestore(&rq->lock, flags); + continue; + } + + se = rq->cfs.curr; + + /* Find task entity if entity is cfs_rq. */ + if (entity_is_cfs_rq(se)) { + struct cfs_rq *cfs_rq; + + cfs_rq = se->my_q; + while (cfs_rq) { + se = cfs_rq->curr; + cfs_rq = se->my_q; + } + } + + /* + * Select cpu to migrate the task to. Return negative number + * if there is no idle cpu in sg. + */ + dst_cpu = ontime_select_target_cpu(&cond->dst_cpus, cpu_active_mask); + if (dst_cpu < 0) { + raw_spin_unlock_irqrestore(&rq->lock, flags); + continue; + } + + /* + * Pick task to be migrated. Return NULL if there is no + * heavy task in rq. 
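/*
 * Aside (worked equation): with y^32 = 1/2 and
 * LOAD_AVG_MAX = 47742 ~= sum_{n>=0} 1024 * y^n, crossing p whole periods
 * accumulates
 *
 *	contrib = d1 * y^p                        (c1, tail of the old period)
 *	        + 1024 * (y^1 + ... + y^(p-1))    (c2, the full periods in between)
 *	        + d3                              (c3, head of the new period)
 *
 * where c2 = LOAD_AVG_MAX - decay_load(LOAD_AVG_MAX, p) - 1024 is the
 * closed form used by __accumulate_pelt_segments() above for the ontime
 * load signal updated in ontime_update_load_avg() below.
 */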
+ */ + p = ontime_pick_heavy_task(se, &cond->dst_cpus, + &boost_migration); + if (!p) { + raw_spin_unlock_irqrestore(&rq->lock, flags); + continue; + } + + ontime_flag(p) = ONTIME_MIGRATING; + get_task_struct(p); + + /* Set environment data */ + env->dst_cpu = dst_cpu; + env->src_rq = rq; + env->target_task = p; + env->boost_migration = boost_migration; + + /* Prevent active balance to use stopper for migration */ + rq->active_balance = 1; + + cpu_rq(dst_cpu)->ontime_migrating = 1; + + raw_spin_unlock_irqrestore(&rq->lock, flags); + + /* Migrate task through stopper */ + stop_one_cpu_nowait(cpu, + ontime_migration_cpu_stop, env, + &per_cpu(ontime_migration_work, cpu)); + } + } + + spin_unlock(&om_lock); +} + +int ontime_can_migration(struct task_struct *p, int dst_cpu) +{ + u64 delta; + + if (ontime_flag(p) & NOT_ONTIME) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "not ontime"); + return true; + } + + if (ontime_flag(p) & ONTIME_MIGRATING) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "migrating"); + return false; + } + + if (cpumask_test_cpu(dst_cpu, cpu_coregroup_mask(ontime_task_cpu(p)))) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "same coregroup"); + return true; + } + + if (capacity_orig_of(dst_cpu) > capacity_orig_of(ontime_task_cpu(p))) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "bigger cpu"); + return true; + } + + /* + * At this point, task is "ontime task" and running on big + * and load balancer is trying to migrate task to LITTLE. + */ + delta = cpu_rq(0)->clock_task - ontime_migration_time(p); + delta = delta >> 10; + if (delta <= get_min_residency(ontime_task_cpu(p))) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "min residency"); + return false; + } + + if (cpu_rq(task_cpu(p))->nr_running > 1) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "big is busy"); + goto release; + } + + if (ontime_load_avg(p) >= get_down_threshold(ontime_task_cpu(p))) { + trace_ehmp_ontime_check_migrate(p, dst_cpu, false, "heavy task"); + return false; + } + + trace_ehmp_ontime_check_migrate(p, dst_cpu, true, "ontime_release"); +release: + exclude_ontime_task(p); + + return true; +} + +/* + * ontime_update_load_avg : load tracking for ontime-migration + * + * @sa : sched_avg to be updated + * @delta : elapsed time since last update + * @period_contrib : amount already accumulated against our next period + * @scale_freq : scale vector of cpu frequency + * @scale_cpu : scale vector of cpu capacity + */ +void ontime_update_load_avg(u64 delta, int cpu, unsigned long weight, struct sched_avg *sa) +{ + struct ontime_avg *oa = &se_of(sa)->ontime.avg; + unsigned long scale_freq, scale_cpu; + u32 contrib = (u32)delta; /* p == 0 -> delta < 1024 */ + u64 periods; + + scale_freq = arch_scale_freq_capacity(NULL, cpu); + scale_cpu = arch_scale_cpu_capacity(NULL, cpu); + + delta += oa->period_contrib; + periods = delta / 1024; /* A period is 1024us (~1ms) */ + + if (periods) { + oa->load_sum = decay_load(oa->load_sum, periods); + + delta %= 1024; + contrib = __accumulate_pelt_segments(periods, + 1024 - oa->period_contrib, delta); + } + oa->period_contrib = delta; + + if (weight) { + contrib = cap_scale(contrib, scale_freq); + oa->load_sum += contrib * scale_cpu; + } + + if (!periods) + return; + + oa->load_avg = div_u64(oa->load_sum, LOAD_AVG_MAX - 1024 + oa->period_contrib); + ontime_update_next_balance(cpu, oa); +} + +void ontime_new_entity_load(struct task_struct *parent, struct sched_entity *se) +{ + struct ontime_entity *ontime; + + if 
(entity_is_cfs_rq(se)) + return; + + ontime = &se->ontime; + + ontime->avg.load_sum = ontime_of(parent)->avg.load_sum; + ontime->avg.load_avg = ontime_of(parent)->avg.load_avg; + ontime->avg.ontime_migration_time = 0; + ontime->avg.period_contrib = 1023; + ontime->flags = NOT_ONTIME; + + trace_ehmp_ontime_new_entity_load(task_of(se), &ontime->avg); +} + +/****************************************************************/ +/* SYSFS */ +/****************************************************************/ +static ssize_t show_up_threshold(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + struct ontime_cond *cond = ontime_cond; + int ret = 0; + + while (cond) { + ret += sprintf(buf + ret, "cpu%*pbl: %ld\n", + cpumask_pr_args(&cond->src_cpus), + cond->up_threshold); + + cond = cond->next; + } + + return ret; +} + +static ssize_t store_up_threshold(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + unsigned long val; + int cpu; + + if (sscanf(buf, "%d %lu", &cpu, &val) != 2) + return -EINVAL; + + if (!cpumask_test_cpu(cpu, cpu_possible_mask)) + return -EINVAL; + + val = val > 1024 ? 1024 : val; + + if (set_up_threshold(cpu, val)) + return -EINVAL; + + return count; +} + +static struct kobj_attribute up_threshold_attr = +__ATTR(up_threshold, 0644, show_up_threshold, store_up_threshold); + +static ssize_t show_down_threshold(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + struct ontime_cond *cond = ontime_cond; + int ret = 0; + + while (cond) { + ret += sprintf(buf + ret, "cpu%*pbl: %ld\n", + cpumask_pr_args(&cond->dst_cpus), + cond->down_threshold); + + cond = cond->next; + } + + return ret; +} + +static ssize_t store_down_threshold(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + unsigned long val; + int cpu; + + if (sscanf(buf, "%d %lu", &cpu, &val) != 2) + return -EINVAL; + + if (!cpumask_test_cpu(cpu, cpu_possible_mask)) + return -EINVAL; + + val = val > 1024 ? 1024 : val; + + if (set_down_threshold(cpu, val)) + return -EINVAL; + + return count; +} + +static struct kobj_attribute down_threshold_attr = +__ATTR(down_threshold, 0644, show_down_threshold, store_down_threshold); + +static ssize_t show_min_residency(struct kobject *kobj, + struct kobj_attribute *attr, char *buf) +{ + struct ontime_cond *cond = ontime_cond; + int ret = 0; + + while (cond) { + ret += sprintf(buf + ret, "cpu%*pbl: %d\n", + cpumask_pr_args(&cond->dst_cpus), + cond->min_residency_us); + + cond = cond->next; + } + + return ret; +} + +static ssize_t store_min_residency(struct kobject *kobj, + struct kobj_attribute *attr, const char *buf, + size_t count) +{ + int val; + int cpu; + + if (sscanf(buf, "%d %d", &cpu, &val) != 2) + return -EINVAL; + + if (!cpumask_test_cpu(cpu, cpu_possible_mask)) + return -EINVAL; + + val = val < 0 ? 
0 : val; + + if (set_min_residency(cpu, val)) + return -EINVAL; + + return count; +} + +static struct kobj_attribute min_residency_attr = +__ATTR(min_residency, 0644, show_min_residency, store_min_residency); + +/****************************************************************/ +/* initialization */ +/****************************************************************/ +static void +parse_ontime(struct device_node *dn, struct ontime_cond *cond, int step) +{ + struct device_node *ontime, *on_step; + char name[10]; + int prop; + + /* + * Initilize default values: + * up_threshold = 40% of Source CPU's maximum capacity + * down_threshold = 50% of Destination CPU's minimum capacity + * min_residency = 8ms + */ + cond->up_threshold = + capacity_orig_of(cpumask_first(&cond->src_cpus)) * 40 / 100; + cond->down_threshold = + mincap_of(cpumask_first(&cond->dst_cpus)) * 50 / 100; + cond->min_residency_us = 8192; + + ontime = of_get_child_by_name(dn, "ontime"); + if (!ontime) + return; + + snprintf(name, sizeof(name), "step%d", step); + on_step = of_get_child_by_name(ontime, name); + if (!on_step) + return; + + of_property_read_u32(on_step, "up-threshold", &prop); + cond->up_threshold = prop; + + of_property_read_u32(on_step, "down-threshold", &prop); + cond->down_threshold = prop; + + of_property_read_u32(on_step, "min-residency-us", &prop); + cond->min_residency_us = prop; +} + +static int __init init_ontime(void) +{ + struct cpumask prev_cpus; + struct ontime_cond *cond, *last; + struct device_node *dn; + int cpu, step = 0; + + dn = of_find_node_by_path("/cpus/ehmp"); + if (!dn) + return 0; + + cpumask_clear(&prev_cpus); + + for_each_possible_cpu(cpu) { + if (cpu != cpumask_first(cpu_coregroup_mask(cpu))) + continue; + + if (cpumask_empty(&prev_cpus)) { + cpumask_copy(&prev_cpus, cpu_coregroup_mask(cpu)); + continue; + } + + cond = kzalloc(sizeof(struct ontime_cond), GFP_KERNEL); + + cpumask_copy(&cond->dst_cpus, cpu_coregroup_mask(cpu)); + cpumask_copy(&cond->src_cpus, &prev_cpus); + + parse_ontime(dn, cond, step++); + + cpumask_copy(&prev_cpus, cpu_coregroup_mask(cpu)); + + /* Add linked list of ontime_cond at last */ + cond->next = NULL; + if (ontime_cond) + last->next = cond; + else + ontime_cond = cond; + last = cond; + } + + of_node_put(dn); + return 0; +} +pure_initcall(init_ontime); + +/********************************************************************** + * cpu selection * + **********************************************************************/ +#define EAS_CPU_PRV 0 +#define EAS_CPU_NXT 1 +#define EAS_CPU_BKP 2 + +int exynos_select_cpu(struct task_struct *p, int *backup_cpu, + bool boosted, bool prefer_idle) +{ + struct sched_domain *sd; + int target_cpu = -1; + int cpu; + unsigned long min_util; + struct boost_trigger trigger = { + .trigger = 0, + .boost_val = 0 + }; + + target_cpu = ontime_task_wakeup(p); + if (cpu_selected(target_cpu)) + goto exit; + + /* Find target cpu from lowest capacity domain */ + cpu = start_cpu(boosted); + if (cpu < 0) + goto exit; + + /* Find SD for the start CPU */ + sd = rcu_dereference(per_cpu(sd_ea, cpu)); + if (!sd) + goto exit; + + min_util = boosted_task_util(p); + + if (check_boost_trigger(p, &trigger)) { + target_cpu = find_boost_target(sd, p, min_util, &trigger); + if (cpu_selected(target_cpu)) + goto exit; + } + + if (prefer_idle) { + target_cpu = find_prefer_idle_target(sd, p, min_util); + if (cpu_selected(target_cpu)) + goto exit; + } + + target_cpu = find_best_target(p, backup_cpu, 0, 0); + +exit: + + return target_cpu; +} + 
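/*
 * Aside: a user-space usage sketch (not part of this patch) for the ontime
 * threshold knobs above.  The store handlers parse "<cpu> <value>" and the
 * attributes are registered under /sys/kernel/ehmp/ by the sysfs section
 * that follows; values above 1024 are clamped and writes require root.
 */
#include <stdio.h>

int main(void)
{
	FILE *f = fopen("/sys/kernel/ehmp/up_threshold", "w");

	if (!f)
		return 1;

	/* raise the up-migration threshold for cpu0's coregroup to 512 */
	fprintf(f, "0 512\n");
	fclose(f);

	return 0;
}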
+/********************************************************************** + * Sysfs * + **********************************************************************/ +static struct attribute *ehmp_attrs[] = { + &global_boost_attr.attr, + &min_residency_attr.attr, + &up_threshold_attr.attr, + &down_threshold_attr.attr, + &overutil_ratio_attr.attr, + &prefer_perf_attr.attr, + &initial_util_type.attr, + &initial_util_ratio.attr, + NULL, +}; + +static const struct attribute_group ehmp_group = { + .attrs = ehmp_attrs, +}; + +static struct kobject *ehmp_kobj; + +static int __init init_sysfs(void) +{ + int ret; + + ehmp_kobj = kobject_create_and_add("ehmp", kernel_kobj); + ret = sysfs_create_group(ehmp_kobj, &ehmp_group); + + return 0; +} +late_initcall(init_sysfs); diff --git a/kernel/sched/ems/freqvar_tune.c b/kernel/sched/ems/freqvar_tune.c new file mode 100644 index 000000000000..fb11fbf76d2f --- /dev/null +++ b/kernel/sched/ems/freqvar_tune.c @@ -0,0 +1,639 @@ +/* + * Frequency variant cpufreq driver + * + * Copyright (C) 2017 Samsung Electronics Co., Ltd + * Park Bumgyu + */ + +#include +#include +#include + +#include "../sched.h" + +/********************************************************************** + * common APIs * + **********************************************************************/ +struct freqvar_table { + int frequency; + int value; +}; + +static int freqvar_get_value(int freq, struct freqvar_table *table) +{ + struct freqvar_table *pos = table; + int value = -EINVAL; + + for (; pos->frequency != CPUFREQ_TABLE_END; pos++) + if (freq == pos->frequency) { + value = pos->value; + break; + } + + return value; +} + +static int freqvar_get_table_size(struct cpufreq_policy *policy) +{ + struct cpufreq_frequency_table *cpufreq_table, *pos; + int size = 0; + + cpufreq_table = policy->freq_table; + if (unlikely(!cpufreq_table)) { + pr_debug("%s: Unable to find frequency table\n", __func__); + return -ENOENT; + } + + cpufreq_for_each_valid_entry(pos, cpufreq_table) + size++; + + return size; +} + +static int freqvar_fill_frequency_table(struct cpufreq_policy *policy, + struct freqvar_table *table) +{ + struct cpufreq_frequency_table *cpufreq_table, *pos; + int index; + + cpufreq_table = policy->freq_table; + if (unlikely(!cpufreq_table)) { + pr_debug("%s: Unable to find frequency table\n", __func__); + return -ENOENT; + } + + index = 0; + cpufreq_for_each_valid_entry(pos, cpufreq_table) { + table[index].frequency = pos->frequency; + index++; + } + table[index].frequency = CPUFREQ_TABLE_END; + + return 0; +} + +static int freqvar_update_table(unsigned int *src, int src_size, + struct freqvar_table *dst) +{ + struct freqvar_table *pos, *last_pos = dst; + unsigned int value = 0, freq = 0; + int i; + + for (i = src_size - 1; i >= 0; i--) { + value = src[i]; + freq = (i <= 0) ? 
0 : src[i - 1]; + + for (pos = last_pos; pos->frequency != CPUFREQ_TABLE_END; pos++) + if (pos->frequency >= freq) { + pos->value = value; + } else { + last_pos = pos; + break; + } + } + + return 0; +} + +static int freqvar_parse_value_dt(struct device_node *dn, const char *table_name, + struct freqvar_table *table) +{ + int size, ret = 0; + unsigned int *temp; + + /* get the table from device tree source */ + size = of_property_count_u32_elems(dn, table_name); + if (size <= 0) + return size; + + temp = kzalloc(sizeof(unsigned int) * size, GFP_KERNEL); + if (!temp) + return -ENOMEM; + + ret = of_property_read_u32_array(dn, table_name, temp, size); + if (ret) + goto fail_parsing; + + freqvar_update_table(temp, size, table); + +fail_parsing: + kfree(temp); + return ret; +} + +static void freqvar_free(void *data) +{ + if (data) + kfree(data); +} + +static unsigned int *get_tokenized_data(const char *buf, int *num_tokens) +{ + const char *cp; + int i; + int ntokens = 1; + unsigned int *tokenized_data; + int err = -EINVAL; + + cp = buf; + while ((cp = strpbrk(cp + 1, " :"))) + ntokens++; + + if (!(ntokens & 0x1)) + goto err; + + tokenized_data = kmalloc(ntokens * sizeof(unsigned int), GFP_KERNEL); + if (!tokenized_data) { + err = -ENOMEM; + goto err; + } + + cp = buf; + i = 0; + while (i < ntokens) { + if (sscanf(cp, "%u", &tokenized_data[i++]) != 1) + goto err_kfree; + + cp = strpbrk(cp, " :"); + if (!cp) + break; + cp++; + } + + if (i != ntokens) + goto err_kfree; + + *num_tokens = ntokens; + return tokenized_data; + +err_kfree: + kfree(tokenized_data); +err: + return ERR_PTR(err); +} + +#define attr_freqvar(type, name, table) \ +static ssize_t freqvar_##name##_show(struct gov_attr_set *attr_set, char *buf) \ +{ \ + struct cpufreq_policy *policy = sugov_get_attr_policy(attr_set); \ + struct freqvar_##type *data = per_cpu(freqvar_##type, policy->cpu); \ + struct freqvar_table *pos = data->table; \ + int ret = 0; \ + \ + for (; pos->frequency != CPUFREQ_TABLE_END; pos++) \ + ret += sprintf(buf + ret, "%8d ratio:%3d \n", \ + pos->frequency, pos->value); \ + \ + return ret; \ +} \ + \ +static ssize_t freqvar_##name##_store(struct gov_attr_set *attr_set, \ + const char *buf, size_t count) \ +{ \ + struct cpufreq_policy *policy = sugov_get_attr_policy(attr_set); \ + struct freqvar_##type *data = per_cpu(freqvar_##type, policy->cpu); \ + struct freqvar_table *old_table = data->table; \ + int *new_table = NULL; \ + int ntokens; \ + \ + new_table = get_tokenized_data(buf, &ntokens); \ + if (IS_ERR(new_table)) \ + return PTR_RET(new_table); \ + \ + freqvar_update_table(new_table, ntokens, old_table); \ + kfree(new_table); \ + \ + return count; \ +} \ + +int sugov_sysfs_add_attr(struct cpufreq_policy *policy, const struct attribute *attr); +struct cpufreq_policy *sugov_get_attr_policy(struct gov_attr_set *attr_set); + +/********************************************************************** + * freqvar boost * + **********************************************************************/ +struct freqvar_boost { + struct freqvar_table *table; + unsigned int ratio; +}; +DEFINE_PER_CPU(struct freqvar_boost *, freqvar_boost); + +attr_freqvar(boost, boost, table); +static struct governor_attr freqvar_boost_attr = __ATTR_RW(freqvar_boost); + +unsigned long freqvar_boost_vector(int cpu, unsigned long util, struct cfs_rq *cfs_rq) +{ + struct freqvar_boost *boost = per_cpu(freqvar_boost, cpu); + unsigned long cap = arch_scale_cpu_capacity(NULL, cpu); + unsigned long vector; + int margin; + + if (!boost) + return cap; 
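/*
 * Aside (worked example, values assumed): for the computation just below,
 * take cap = 1024, util = 512 with two runnable tasks and a table ratio of
 * 20 for the current frequency:
 *
 *	margin = 1024 - 512 / 2        = 768
 *	vector = 1024 + 768 * 20 / 100 = 1177
 *
 * i.e. the returned vector only ever adds a fraction of the remaining
 * headroom on top of the CPU capacity, and degrades to plain cap when
 * there is no headroom or no table installed for this CPU.
 */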
+ + /* + * boost task load(util_sum/avg) and load of cfs_rq is not included. + * boost ratio is changed with frequency scale. + * 1024 is default boost_vector. it is no effect. + * if boost_vector is 2048, it means adding twice bigger load than orinal load + */ + if (cfs_rq && cfs_rq->nr_running) + margin = cap - (util / cfs_rq->nr_running); + else + margin = cap - util; + + if (margin <= 0) + return cap; + + vector = cap + (margin * boost->ratio / 100); + + return vector; +} + +static void freqvar_boost_update(int cpu, int new_freq) +{ + struct freqvar_boost *boost; + + boost = per_cpu(freqvar_boost, cpu); + if (!boost) + return; + + boost->ratio = freqvar_get_value(new_freq, boost->table); +} + +static void freqvar_boost_free(struct freqvar_boost *boost) +{ + if (boost) + freqvar_free(boost->table); + + freqvar_free(boost); +} + +static struct +freqvar_boost *freqvar_boost_alloc(struct cpufreq_policy *policy) +{ + struct freqvar_boost *boost; + int size; + + boost = kzalloc(sizeof(*boost), GFP_KERNEL); + if (!boost) + return NULL; + + size = freqvar_get_table_size(policy); + if (size <= 0) + goto fail_alloc; + + boost->table = kzalloc(sizeof(struct freqvar_table) * (size + 1), GFP_KERNEL); + if (!boost->table) + goto fail_alloc; + + return boost; + +fail_alloc: + freqvar_boost_free(boost); + return NULL; +} + +static int freqvar_boost_init(struct device_node *dn, const struct cpumask *mask) +{ + struct freqvar_boost *boost; + struct cpufreq_policy *policy; + int cpu, ret = 0; + + policy = cpufreq_cpu_get(cpumask_first(mask)); + if (!policy) + return -ENODEV; + + boost = freqvar_boost_alloc(policy); + if (!boost) { + ret = -ENOMEM; + goto fail_init; + } + + ret = freqvar_fill_frequency_table(policy, boost->table); + if (ret) + goto fail_init; + + ret = freqvar_parse_value_dt(dn, "boost_table", boost->table); + if (ret) + goto fail_init; + + for_each_cpu(cpu, mask) + per_cpu(freqvar_boost, cpu) = boost; + + freqvar_boost_update(policy->cpu, policy->cur); + + ret = sugov_sysfs_add_attr(policy, &freqvar_boost_attr.attr); + if (ret) + goto fail_init; + + return 0; + +fail_init: + cpufreq_cpu_put(policy); + freqvar_boost_free(boost); + + return ret; +} + +/********************************************************************** + * freqvar rate limit * + **********************************************************************/ +struct freqvar_rate_limit { + struct freqvar_table *up_table; + struct freqvar_table *down_table; +}; +DEFINE_PER_CPU(struct freqvar_rate_limit *, freqvar_rate_limit); + +attr_freqvar(rate_limit, up_rate_limit, up_table); +attr_freqvar(rate_limit, down_rate_limit, down_table); +static struct governor_attr freqvar_up_rate_limit = __ATTR_RW(freqvar_up_rate_limit); +static struct governor_attr freqvar_down_rate_limit = __ATTR_RW(freqvar_down_rate_limit); + +void sugov_update_rate_limit_us(struct cpufreq_policy *policy, + int up_rate_limit_ms, int down_rate_limit_ms); +static void freqvar_rate_limit_update(int cpu, int new_freq) +{ + struct freqvar_rate_limit *rate_limit; + int up_rate_limit, down_rate_limit; + struct cpufreq_policy *policy; + + rate_limit = per_cpu(freqvar_rate_limit, cpu); + if (!rate_limit) + return; + + up_rate_limit = freqvar_get_value(new_freq, rate_limit->up_table); + down_rate_limit = freqvar_get_value(new_freq, rate_limit->down_table); + + policy = cpufreq_cpu_get(cpu); + if (!policy) + return; + + sugov_update_rate_limit_us(policy, up_rate_limit, down_rate_limit); + + cpufreq_cpu_put(policy); +} + +static void freqvar_rate_limit_free(struct 
freqvar_rate_limit *rate_limit) +{ + if (rate_limit) { + freqvar_free(rate_limit->up_table); + freqvar_free(rate_limit->down_table); + } + + freqvar_free(rate_limit); +} + +static struct +freqvar_rate_limit *freqvar_rate_limit_alloc(struct cpufreq_policy *policy) +{ + struct freqvar_rate_limit *rate_limit; + int size; + + rate_limit = kzalloc(sizeof(*rate_limit), GFP_KERNEL); + if (!rate_limit) + return NULL; + + size = freqvar_get_table_size(policy); + if (size <= 0) + goto fail_alloc; + + rate_limit->up_table = kzalloc(sizeof(struct freqvar_table) + * (size + 1), GFP_KERNEL); + if (!rate_limit->up_table) + goto fail_alloc; + + rate_limit->down_table = kzalloc(sizeof(struct freqvar_table) + * (size + 1), GFP_KERNEL); + if (!rate_limit->down_table) + goto fail_alloc; + + return rate_limit; + +fail_alloc: + freqvar_rate_limit_free(rate_limit); + return NULL; +} + +static int freqvar_rate_limit_init(struct device_node *dn, const struct cpumask *mask) +{ + struct freqvar_rate_limit *rate_limit; + struct cpufreq_policy *policy; + int cpu, ret = 0; + + policy = cpufreq_cpu_get(cpumask_first(mask)); + if (!policy) + return -ENODEV; + + rate_limit = freqvar_rate_limit_alloc(policy); + if (!rate_limit) { + ret = -ENOMEM; + goto fail_init; + } + + ret = freqvar_fill_frequency_table(policy, rate_limit->up_table); + if (ret) + goto fail_init; + + ret = freqvar_fill_frequency_table(policy, rate_limit->down_table); + if (ret) + goto fail_init; + + ret = freqvar_parse_value_dt(dn, "up_rate_limit_table", rate_limit->up_table); + if (ret) + goto fail_init; + + ret = freqvar_parse_value_dt(dn, "down_rate_limit_table", rate_limit->down_table); + if (ret) + goto fail_init; + + ret = sugov_sysfs_add_attr(policy, &freqvar_up_rate_limit.attr); + if (ret) + goto fail_init; + + ret = sugov_sysfs_add_attr(policy, &freqvar_down_rate_limit.attr); + if (ret) + goto fail_init; + + for_each_cpu(cpu, mask) + per_cpu(freqvar_rate_limit, cpu) = rate_limit; + + freqvar_rate_limit_update(policy->cpu, policy->cur); + + return 0; + +fail_init: + freqvar_rate_limit_free(rate_limit); + cpufreq_cpu_put(policy); + + return ret; +} + +/********************************************************************** + * freqvar up-scale ratio * + **********************************************************************/ +struct freqvar_upscale_ratio { + struct freqvar_table *table; + int ratio; +}; +DEFINE_PER_CPU(struct freqvar_upscale_ratio *, freqvar_upscale_ratio); + +attr_freqvar(upscale_ratio, upscale_ratio, table); +static struct governor_attr freqvar_upscale_ratio_attr = __ATTR_RW(freqvar_upscale_ratio); + +unsigned int freqvar_tipping_point(int cpu, unsigned int freq) +{ + struct freqvar_upscale_ratio *upscale = per_cpu(freqvar_upscale_ratio, cpu); + + if (!upscale) + return freq + (freq >> 2); + + return freq * 100 / upscale->ratio; +} + +static void freqvar_upscale_ratio_update(int cpu, int new_freq) +{ + struct freqvar_upscale_ratio *upscale; + + upscale = per_cpu(freqvar_upscale_ratio, cpu); + if (!upscale) + return; + + upscale->ratio = freqvar_get_value(new_freq, upscale->table); +} + +static void freqvar_upscale_ratio_free(struct freqvar_upscale_ratio *upscale) +{ + if (upscale) + freqvar_free(upscale->table); + + freqvar_free(upscale); +} + +static struct +freqvar_upscale_ratio *freqvar_upscale_ratio_alloc(struct cpufreq_policy *policy) +{ + struct freqvar_upscale_ratio *upscale; + int size; + + upscale = kzalloc(sizeof(*upscale), GFP_KERNEL); + if (!upscale) + return NULL; + + size = freqvar_get_table_size(policy); + if (size 
<= 0) + goto fail_alloc; + + upscale->table = kzalloc(sizeof(struct freqvar_table) * (size + 1), GFP_KERNEL); + if (!upscale->table) + goto fail_alloc; + + return upscale; + +fail_alloc: + freqvar_upscale_ratio_free(upscale); + return NULL; +} + +static int freqvar_upscale_ratio_init(struct device_node *dn, const struct cpumask *mask) +{ + struct freqvar_upscale_ratio *upscale; + struct cpufreq_policy *policy; + int cpu, ret = 0; + + policy = cpufreq_cpu_get(cpumask_first(mask)); + if (!policy) + return -ENODEV; + + upscale = freqvar_upscale_ratio_alloc(policy); + if (!upscale) { + ret = -ENOMEM; + goto fail_init; + } + + ret = freqvar_fill_frequency_table(policy, upscale->table); + if (ret) + goto fail_init; + + ret = freqvar_parse_value_dt(dn, "upscale_ratio_table", upscale->table); + if (ret) + goto fail_init; + + for_each_cpu(cpu, mask) + per_cpu(freqvar_upscale_ratio, cpu) = upscale; + + freqvar_upscale_ratio_update(policy->cpu, policy->cur); + + ret = sugov_sysfs_add_attr(policy, &freqvar_upscale_ratio_attr.attr); + if (ret) + goto fail_init; + + return 0; + +fail_init: + cpufreq_cpu_put(policy); + freqvar_upscale_ratio_free(upscale); + + return ret; +} + +/********************************************************************** + * cpufreq notifier callback * + **********************************************************************/ +static int freqvar_cpufreq_callback(struct notifier_block *nb, + unsigned long val, void *data) +{ + struct cpufreq_freqs *freq = data; + + if (freq->flags & CPUFREQ_CONST_LOOPS) + return NOTIFY_OK; + + if (val != CPUFREQ_POSTCHANGE) + return NOTIFY_OK; + + freqvar_boost_update(freq->cpu, freq->new); + freqvar_rate_limit_update(freq->cpu, freq->new); + freqvar_upscale_ratio_update(freq->cpu, freq->new); + + return 0; +} + +static struct notifier_block freqvar_cpufreq_notifier = { + .notifier_call = freqvar_cpufreq_callback, +}; + +/********************************************************************** + * initialization * + **********************************************************************/ +static int __init freqvar_tune_init(void) +{ + struct device_node *dn = NULL; + struct cpumask shared_mask; + const char *buf; + + while ((dn = of_find_node_by_type(dn, "freqvar-tune"))) { + /* + * shared-cpus includes cpus scaling at the sametime. 
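/*
 * Aside (worked equation): freqvar_tipping_point() above returns
 * freq + freq/4 (a factor of 1.25) when no table is installed, and
 * freq * 100 / ratio otherwise, so a per-frequency ratio of 80 reproduces
 * the default 1.25x while a smaller ratio pushes the tipping point higher,
 * e.g. ratio 50 gives 2 * freq.  The ratio itself is refreshed on every
 * CPUFREQ_POSTCHANGE notification by freqvar_upscale_ratio_update() above.
 */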
+ * it is called "sibling cpus" in the CPUFreq and + * masked on the realated_cpus of the policy + */ + if (of_property_read_string(dn, "shared-cpus", &buf)) + continue; + + cpumask_clear(&shared_mask); + cpulist_parse(buf, &shared_mask); + cpumask_and(&shared_mask, &shared_mask, cpu_possible_mask); + if (cpumask_weight(&shared_mask) == 0) + continue; + + freqvar_boost_init(dn, &shared_mask); + freqvar_rate_limit_init(dn, &shared_mask); + freqvar_upscale_ratio_init(dn, &shared_mask); + } + + cpufreq_register_notifier(&freqvar_cpufreq_notifier, + CPUFREQ_TRANSITION_NOTIFIER); + + return 0; +} +late_initcall(freqvar_tune_init); diff --git a/kernel/sched/freqvar_tune.c b/kernel/sched/freqvar_tune.c deleted file mode 100644 index d869549b7a67..000000000000 --- a/kernel/sched/freqvar_tune.c +++ /dev/null @@ -1,639 +0,0 @@ -/* - * Frequency variant cpufreq driver - * - * Copyright (C) 2017 Samsung Electronics Co., Ltd - * Park Bumgyu - */ - -#include -#include -#include - -#include "sched.h" - -/********************************************************************** - * common APIs * - **********************************************************************/ -struct freqvar_table { - int frequency; - int value; -}; - -static int freqvar_get_value(int freq, struct freqvar_table *table) -{ - struct freqvar_table *pos = table; - int value = -EINVAL; - - for (; pos->frequency != CPUFREQ_TABLE_END; pos++) - if (freq == pos->frequency) { - value = pos->value; - break; - } - - return value; -} - -static int freqvar_get_table_size(struct cpufreq_policy *policy) -{ - struct cpufreq_frequency_table *cpufreq_table, *pos; - int size = 0; - - cpufreq_table = policy->freq_table; - if (unlikely(!cpufreq_table)) { - pr_debug("%s: Unable to find frequency table\n", __func__); - return -ENOENT; - } - - cpufreq_for_each_valid_entry(pos, cpufreq_table) - size++; - - return size; -} - -static int freqvar_fill_frequency_table(struct cpufreq_policy *policy, - struct freqvar_table *table) -{ - struct cpufreq_frequency_table *cpufreq_table, *pos; - int index; - - cpufreq_table = policy->freq_table; - if (unlikely(!cpufreq_table)) { - pr_debug("%s: Unable to find frequency table\n", __func__); - return -ENOENT; - } - - index = 0; - cpufreq_for_each_valid_entry(pos, cpufreq_table) { - table[index].frequency = pos->frequency; - index++; - } - table[index].frequency = CPUFREQ_TABLE_END; - - return 0; -} - -static int freqvar_update_table(unsigned int *src, int src_size, - struct freqvar_table *dst) -{ - struct freqvar_table *pos, *last_pos = dst; - unsigned int value = 0, freq = 0; - int i; - - for (i = src_size - 1; i >= 0; i--) { - value = src[i]; - freq = (i <= 0) ? 
0 : src[i - 1]; - - for (pos = last_pos; pos->frequency != CPUFREQ_TABLE_END; pos++) - if (pos->frequency >= freq) { - pos->value = value; - } else { - last_pos = pos; - break; - } - } - - return 0; -} - -static int freqvar_parse_value_dt(struct device_node *dn, const char *table_name, - struct freqvar_table *table) -{ - int size, ret = 0; - unsigned int *temp; - - /* get the table from device tree source */ - size = of_property_count_u32_elems(dn, table_name); - if (size <= 0) - return size; - - temp = kzalloc(sizeof(unsigned int) * size, GFP_KERNEL); - if (!temp) - return -ENOMEM; - - ret = of_property_read_u32_array(dn, table_name, temp, size); - if (ret) - goto fail_parsing; - - freqvar_update_table(temp, size, table); - -fail_parsing: - kfree(temp); - return ret; -} - -static void freqvar_free(void *data) -{ - if (data) - kfree(data); -} - -static unsigned int *get_tokenized_data(const char *buf, int *num_tokens) -{ - const char *cp; - int i; - int ntokens = 1; - unsigned int *tokenized_data; - int err = -EINVAL; - - cp = buf; - while ((cp = strpbrk(cp + 1, " :"))) - ntokens++; - - if (!(ntokens & 0x1)) - goto err; - - tokenized_data = kmalloc(ntokens * sizeof(unsigned int), GFP_KERNEL); - if (!tokenized_data) { - err = -ENOMEM; - goto err; - } - - cp = buf; - i = 0; - while (i < ntokens) { - if (sscanf(cp, "%u", &tokenized_data[i++]) != 1) - goto err_kfree; - - cp = strpbrk(cp, " :"); - if (!cp) - break; - cp++; - } - - if (i != ntokens) - goto err_kfree; - - *num_tokens = ntokens; - return tokenized_data; - -err_kfree: - kfree(tokenized_data); -err: - return ERR_PTR(err); -} - -#define attr_freqvar(type, name, table) \ -static ssize_t freqvar_##name##_show(struct gov_attr_set *attr_set, char *buf) \ -{ \ - struct cpufreq_policy *policy = sugov_get_attr_policy(attr_set); \ - struct freqvar_##type *data = per_cpu(freqvar_##type, policy->cpu); \ - struct freqvar_table *pos = data->table; \ - int ret = 0; \ - \ - for (; pos->frequency != CPUFREQ_TABLE_END; pos++) \ - ret += sprintf(buf + ret, "%8d ratio:%3d \n", \ - pos->frequency, pos->value); \ - \ - return ret; \ -} \ - \ -static ssize_t freqvar_##name##_store(struct gov_attr_set *attr_set, \ - const char *buf, size_t count) \ -{ \ - struct cpufreq_policy *policy = sugov_get_attr_policy(attr_set); \ - struct freqvar_##type *data = per_cpu(freqvar_##type, policy->cpu); \ - struct freqvar_table *old_table = data->table; \ - int *new_table = NULL; \ - int ntokens; \ - \ - new_table = get_tokenized_data(buf, &ntokens); \ - if (IS_ERR(new_table)) \ - return PTR_RET(new_table); \ - \ - freqvar_update_table(new_table, ntokens, old_table); \ - kfree(new_table); \ - \ - return count; \ -} \ - -int sugov_sysfs_add_attr(struct cpufreq_policy *policy, const struct attribute *attr); -struct cpufreq_policy *sugov_get_attr_policy(struct gov_attr_set *attr_set); - -/********************************************************************** - * freqvar boost * - **********************************************************************/ -struct freqvar_boost { - struct freqvar_table *table; - unsigned int ratio; -}; -DEFINE_PER_CPU(struct freqvar_boost *, freqvar_boost); - -attr_freqvar(boost, boost, table); -static struct governor_attr freqvar_boost_attr = __ATTR_RW(freqvar_boost); - -unsigned long freqvar_boost_vector(int cpu, unsigned long util, struct cfs_rq *cfs_rq) -{ - struct freqvar_boost *boost = per_cpu(freqvar_boost, cpu); - unsigned long cap = arch_scale_cpu_capacity(NULL, cpu); - unsigned long vector; - int margin; - - if (!boost) - return cap; 
- - /* - * boost task load(util_sum/avg) and load of cfs_rq is not included. - * boost ratio is changed with frequency scale. - * 1024 is default boost_vector. it is no effect. - * if boost_vector is 2048, it means adding twice bigger load than orinal load - */ - if (cfs_rq && cfs_rq->nr_running) - margin = cap - (util / cfs_rq->nr_running); - else - margin = cap - util; - - if (margin <= 0) - return cap; - - vector = cap + (margin * boost->ratio / 100); - - return vector; -} - -static void freqvar_boost_update(int cpu, int new_freq) -{ - struct freqvar_boost *boost; - - boost = per_cpu(freqvar_boost, cpu); - if (!boost) - return; - - boost->ratio = freqvar_get_value(new_freq, boost->table); -} - -static void freqvar_boost_free(struct freqvar_boost *boost) -{ - if (boost) - freqvar_free(boost->table); - - freqvar_free(boost); -} - -static struct -freqvar_boost *freqvar_boost_alloc(struct cpufreq_policy *policy) -{ - struct freqvar_boost *boost; - int size; - - boost = kzalloc(sizeof(*boost), GFP_KERNEL); - if (!boost) - return NULL; - - size = freqvar_get_table_size(policy); - if (size <= 0) - goto fail_alloc; - - boost->table = kzalloc(sizeof(struct freqvar_table) * (size + 1), GFP_KERNEL); - if (!boost->table) - goto fail_alloc; - - return boost; - -fail_alloc: - freqvar_boost_free(boost); - return NULL; -} - -static int freqvar_boost_init(struct device_node *dn, const struct cpumask *mask) -{ - struct freqvar_boost *boost; - struct cpufreq_policy *policy; - int cpu, ret = 0; - - policy = cpufreq_cpu_get(cpumask_first(mask)); - if (!policy) - return -ENODEV; - - boost = freqvar_boost_alloc(policy); - if (!boost) { - ret = -ENOMEM; - goto fail_init; - } - - ret = freqvar_fill_frequency_table(policy, boost->table); - if (ret) - goto fail_init; - - ret = freqvar_parse_value_dt(dn, "boost_table", boost->table); - if (ret) - goto fail_init; - - for_each_cpu(cpu, mask) - per_cpu(freqvar_boost, cpu) = boost; - - freqvar_boost_update(policy->cpu, policy->cur); - - ret = sugov_sysfs_add_attr(policy, &freqvar_boost_attr.attr); - if (ret) - goto fail_init; - - return 0; - -fail_init: - cpufreq_cpu_put(policy); - freqvar_boost_free(boost); - - return ret; -} - -/********************************************************************** - * freqvar rate limit * - **********************************************************************/ -struct freqvar_rate_limit { - struct freqvar_table *up_table; - struct freqvar_table *down_table; -}; -DEFINE_PER_CPU(struct freqvar_rate_limit *, freqvar_rate_limit); - -attr_freqvar(rate_limit, up_rate_limit, up_table); -attr_freqvar(rate_limit, down_rate_limit, down_table); -static struct governor_attr freqvar_up_rate_limit = __ATTR_RW(freqvar_up_rate_limit); -static struct governor_attr freqvar_down_rate_limit = __ATTR_RW(freqvar_down_rate_limit); - -void sugov_update_rate_limit_us(struct cpufreq_policy *policy, - int up_rate_limit_ms, int down_rate_limit_ms); -static void freqvar_rate_limit_update(int cpu, int new_freq) -{ - struct freqvar_rate_limit *rate_limit; - int up_rate_limit, down_rate_limit; - struct cpufreq_policy *policy; - - rate_limit = per_cpu(freqvar_rate_limit, cpu); - if (!rate_limit) - return; - - up_rate_limit = freqvar_get_value(new_freq, rate_limit->up_table); - down_rate_limit = freqvar_get_value(new_freq, rate_limit->down_table); - - policy = cpufreq_cpu_get(cpu); - if (!policy) - return; - - sugov_update_rate_limit_us(policy, up_rate_limit, down_rate_limit); - - cpufreq_cpu_put(policy); -} - -static void freqvar_rate_limit_free(struct 
freqvar_rate_limit *rate_limit) -{ - if (rate_limit) { - freqvar_free(rate_limit->up_table); - freqvar_free(rate_limit->down_table); - } - - freqvar_free(rate_limit); -} - -static struct -freqvar_rate_limit *freqvar_rate_limit_alloc(struct cpufreq_policy *policy) -{ - struct freqvar_rate_limit *rate_limit; - int size; - - rate_limit = kzalloc(sizeof(*rate_limit), GFP_KERNEL); - if (!rate_limit) - return NULL; - - size = freqvar_get_table_size(policy); - if (size <= 0) - goto fail_alloc; - - rate_limit->up_table = kzalloc(sizeof(struct freqvar_table) - * (size + 1), GFP_KERNEL); - if (!rate_limit->up_table) - goto fail_alloc; - - rate_limit->down_table = kzalloc(sizeof(struct freqvar_table) - * (size + 1), GFP_KERNEL); - if (!rate_limit->down_table) - goto fail_alloc; - - return rate_limit; - -fail_alloc: - freqvar_rate_limit_free(rate_limit); - return NULL; -} - -static int freqvar_rate_limit_init(struct device_node *dn, const struct cpumask *mask) -{ - struct freqvar_rate_limit *rate_limit; - struct cpufreq_policy *policy; - int cpu, ret = 0; - - policy = cpufreq_cpu_get(cpumask_first(mask)); - if (!policy) - return -ENODEV; - - rate_limit = freqvar_rate_limit_alloc(policy); - if (!rate_limit) { - ret = -ENOMEM; - goto fail_init; - } - - ret = freqvar_fill_frequency_table(policy, rate_limit->up_table); - if (ret) - goto fail_init; - - ret = freqvar_fill_frequency_table(policy, rate_limit->down_table); - if (ret) - goto fail_init; - - ret = freqvar_parse_value_dt(dn, "up_rate_limit_table", rate_limit->up_table); - if (ret) - goto fail_init; - - ret = freqvar_parse_value_dt(dn, "down_rate_limit_table", rate_limit->down_table); - if (ret) - goto fail_init; - - ret = sugov_sysfs_add_attr(policy, &freqvar_up_rate_limit.attr); - if (ret) - goto fail_init; - - ret = sugov_sysfs_add_attr(policy, &freqvar_down_rate_limit.attr); - if (ret) - goto fail_init; - - for_each_cpu(cpu, mask) - per_cpu(freqvar_rate_limit, cpu) = rate_limit; - - freqvar_rate_limit_update(policy->cpu, policy->cur); - - return 0; - -fail_init: - freqvar_rate_limit_free(rate_limit); - cpufreq_cpu_put(policy); - - return ret; -} - -/********************************************************************** - * freqvar up-scale ratio * - **********************************************************************/ -struct freqvar_upscale_ratio { - struct freqvar_table *table; - int ratio; -}; -DEFINE_PER_CPU(struct freqvar_upscale_ratio *, freqvar_upscale_ratio); - -attr_freqvar(upscale_ratio, upscale_ratio, table); -static struct governor_attr freqvar_upscale_ratio_attr = __ATTR_RW(freqvar_upscale_ratio); - -unsigned int freqvar_tipping_point(int cpu, unsigned int freq) -{ - struct freqvar_upscale_ratio *upscale = per_cpu(freqvar_upscale_ratio, cpu); - - if (!upscale) - return freq + (freq >> 2); - - return freq * 100 / upscale->ratio; -} - -static void freqvar_upscale_ratio_update(int cpu, int new_freq) -{ - struct freqvar_upscale_ratio *upscale; - - upscale = per_cpu(freqvar_upscale_ratio, cpu); - if (!upscale) - return; - - upscale->ratio = freqvar_get_value(new_freq, upscale->table); -} - -static void freqvar_upscale_ratio_free(struct freqvar_upscale_ratio *upscale) -{ - if (upscale) - freqvar_free(upscale->table); - - freqvar_free(upscale); -} - -static struct -freqvar_upscale_ratio *freqvar_upscale_ratio_alloc(struct cpufreq_policy *policy) -{ - struct freqvar_upscale_ratio *upscale; - int size; - - upscale = kzalloc(sizeof(*upscale), GFP_KERNEL); - if (!upscale) - return NULL; - - size = freqvar_get_table_size(policy); - if (size 
<= 0) - goto fail_alloc; - - upscale->table = kzalloc(sizeof(struct freqvar_table) * (size + 1), GFP_KERNEL); - if (!upscale->table) - goto fail_alloc; - - return upscale; - -fail_alloc: - freqvar_upscale_ratio_free(upscale); - return NULL; -} - -static int freqvar_upscale_ratio_init(struct device_node *dn, const struct cpumask *mask) -{ - struct freqvar_upscale_ratio *upscale; - struct cpufreq_policy *policy; - int cpu, ret = 0; - - policy = cpufreq_cpu_get(cpumask_first(mask)); - if (!policy) - return -ENODEV; - - upscale = freqvar_upscale_ratio_alloc(policy); - if (!upscale) { - ret = -ENOMEM; - goto fail_init; - } - - ret = freqvar_fill_frequency_table(policy, upscale->table); - if (ret) - goto fail_init; - - ret = freqvar_parse_value_dt(dn, "upscale_ratio_table", upscale->table); - if (ret) - goto fail_init; - - for_each_cpu(cpu, mask) - per_cpu(freqvar_upscale_ratio, cpu) = upscale; - - freqvar_upscale_ratio_update(policy->cpu, policy->cur); - - ret = sugov_sysfs_add_attr(policy, &freqvar_upscale_ratio_attr.attr); - if (ret) - goto fail_init; - - return 0; - -fail_init: - cpufreq_cpu_put(policy); - freqvar_upscale_ratio_free(upscale); - - return ret; -} - -/********************************************************************** - * cpufreq notifier callback * - **********************************************************************/ -static int freqvar_cpufreq_callback(struct notifier_block *nb, - unsigned long val, void *data) -{ - struct cpufreq_freqs *freq = data; - - if (freq->flags & CPUFREQ_CONST_LOOPS) - return NOTIFY_OK; - - if (val != CPUFREQ_POSTCHANGE) - return NOTIFY_OK; - - freqvar_boost_update(freq->cpu, freq->new); - freqvar_rate_limit_update(freq->cpu, freq->new); - freqvar_upscale_ratio_update(freq->cpu, freq->new); - - return 0; -} - -static struct notifier_block freqvar_cpufreq_notifier = { - .notifier_call = freqvar_cpufreq_callback, -}; - -/********************************************************************** - * initialization * - **********************************************************************/ -static int __init freqvar_tune_init(void) -{ - struct device_node *dn = NULL; - struct cpumask shared_mask; - const char *buf; - - while ((dn = of_find_node_by_type(dn, "freqvar-tune"))) { - /* - * shared-cpus includes cpus scaling at the sametime. - * it is called "sibling cpus" in the CPUFreq and - * masked on the realated_cpus of the policy - */ - if (of_property_read_string(dn, "shared-cpus", &buf)) - continue; - - cpumask_clear(&shared_mask); - cpulist_parse(buf, &shared_mask); - cpumask_and(&shared_mask, &shared_mask, cpu_possible_mask); - if (cpumask_weight(&shared_mask) == 0) - continue; - - freqvar_boost_init(dn, &shared_mask); - freqvar_rate_limit_init(dn, &shared_mask); - freqvar_upscale_ratio_init(dn, &shared_mask); - } - - cpufreq_register_notifier(&freqvar_cpufreq_notifier, - CPUFREQ_TRANSITION_NOTIFIER); - - return 0; -} -late_initcall(freqvar_tune_init);
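Note on the device-tree interface used by freqvar_tune_init() above: the init loop binds to nodes whose device_type is "freqvar-tune" (via of_find_node_by_type()), parses the "shared-cpus" cpulist string with cpulist_parse(), and hands the flat u32 table properties to freqvar_parse_value_dt()/freqvar_update_table(). The node below is only a minimal illustrative sketch: the node name and all numeric values are placeholders, not taken from any real Exynos DTS, and only the properties this file actually reads are shown.

	freqvar-tune0 {					/* node name is illustrative */
		device_type = "freqvar-tune";		/* matched by of_find_node_by_type() */
		shared-cpus = "0-3";			/* cpulist, parsed by cpulist_parse() */
		boost_table = <30 1248000 25>;		/* placeholder values */
		up_rate_limit_table = <4>;		/* placeholder values */
		down_rate_limit_table = <4>;		/* placeholder values */
		upscale_ratio_table = <80 1248000 60>;	/* placeholder values */
	};

Each table property is consumed by the matching per-feature init in the diff (freqvar_boost_init(), freqvar_rate_limit_init(), freqvar_upscale_ratio_init()); a node that lacks "shared-cpus", or whose cpulist resolves to no possible CPU, is skipped.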