Commit ec7dc8ac authored by Dhaval Giani's avatar Dhaval Giani Committed by Ingo Molnar

sched: allow the group scheduler to have multiple levels

This patch makes the group scheduler multi hierarchy aware.

[a.p.zijlstra@chello.nl: rt-parts and assorted fixes]
Signed-off-by: default avatarDhaval Giani <dhaval@linux.vnet.ibm.com>
Signed-off-by: default avatarPeter Zijlstra <a.p.zijlstra@chello.nl>
Signed-off-by: default avatarIngo Molnar <mingo@elte.hu>
parent 354d60c2
...@@ -2052,7 +2052,7 @@ extern void normalize_rt_tasks(void); ...@@ -2052,7 +2052,7 @@ extern void normalize_rt_tasks(void);
extern struct task_group init_task_group; extern struct task_group init_task_group;
extern struct task_group *sched_create_group(void); extern struct task_group *sched_create_group(struct task_group *parent);
extern void sched_destroy_group(struct task_group *tg); extern void sched_destroy_group(struct task_group *tg);
extern void sched_move_task(struct task_struct *tsk); extern void sched_move_task(struct task_struct *tsk);
#ifdef CONFIG_FAIR_GROUP_SCHED #ifdef CONFIG_FAIR_GROUP_SCHED
......
...@@ -7438,10 +7438,11 @@ static void init_rt_rq(struct rt_rq *rt_rq, struct rq *rq) ...@@ -7438,10 +7438,11 @@ static void init_rt_rq(struct rt_rq *rt_rq, struct rq *rq)
} }
#ifdef CONFIG_FAIR_GROUP_SCHED #ifdef CONFIG_FAIR_GROUP_SCHED
static void init_tg_cfs_entry(struct rq *rq, struct task_group *tg, static void init_tg_cfs_entry(struct task_group *tg, struct cfs_rq *cfs_rq,
struct cfs_rq *cfs_rq, struct sched_entity *se, struct sched_entity *se, int cpu, int add,
int cpu, int add) struct sched_entity *parent)
{ {
struct rq *rq = cpu_rq(cpu);
tg->cfs_rq[cpu] = cfs_rq; tg->cfs_rq[cpu] = cfs_rq;
init_cfs_rq(cfs_rq, rq); init_cfs_rq(cfs_rq, rq);
cfs_rq->tg = tg; cfs_rq->tg = tg;
...@@ -7453,19 +7454,25 @@ static void init_tg_cfs_entry(struct rq *rq, struct task_group *tg, ...@@ -7453,19 +7454,25 @@ static void init_tg_cfs_entry(struct rq *rq, struct task_group *tg,
if (!se) if (!se)
return; return;
if (!parent)
se->cfs_rq = &rq->cfs; se->cfs_rq = &rq->cfs;
else
se->cfs_rq = parent->my_q;
se->my_q = cfs_rq; se->my_q = cfs_rq;
se->load.weight = tg->shares; se->load.weight = tg->shares;
se->load.inv_weight = div64_64(1ULL<<32, se->load.weight); se->load.inv_weight = div64_64(1ULL<<32, se->load.weight);
se->parent = NULL; se->parent = parent;
} }
#endif #endif
#ifdef CONFIG_RT_GROUP_SCHED #ifdef CONFIG_RT_GROUP_SCHED
static void init_tg_rt_entry(struct rq *rq, struct task_group *tg, static void init_tg_rt_entry(struct task_group *tg, struct rt_rq *rt_rq,
struct rt_rq *rt_rq, struct sched_rt_entity *rt_se, struct sched_rt_entity *rt_se, int cpu, int add,
int cpu, int add) struct sched_rt_entity *parent)
{ {
struct rq *rq = cpu_rq(cpu);
tg->rt_rq[cpu] = rt_rq; tg->rt_rq[cpu] = rt_rq;
init_rt_rq(rt_rq, rq); init_rt_rq(rt_rq, rq);
rt_rq->tg = tg; rt_rq->tg = tg;
...@@ -7478,9 +7485,14 @@ static void init_tg_rt_entry(struct rq *rq, struct task_group *tg, ...@@ -7478,9 +7485,14 @@ static void init_tg_rt_entry(struct rq *rq, struct task_group *tg,
if (!rt_se) if (!rt_se)
return; return;
if (!parent)
rt_se->rt_rq = &rq->rt;
else
rt_se->rt_rq = parent->my_q;
rt_se->rt_rq = &rq->rt; rt_se->rt_rq = &rq->rt;
rt_se->my_q = rt_rq; rt_se->my_q = rt_rq;
rt_se->parent = NULL; rt_se->parent = parent;
INIT_LIST_HEAD(&rt_se->run_list); INIT_LIST_HEAD(&rt_se->run_list);
} }
#endif #endif
...@@ -7568,7 +7580,7 @@ void __init sched_init(void) ...@@ -7568,7 +7580,7 @@ void __init sched_init(void)
* We achieve this by letting init_task_group's tasks sit * We achieve this by letting init_task_group's tasks sit
* directly in rq->cfs (i.e init_task_group->se[] = NULL). * directly in rq->cfs (i.e init_task_group->se[] = NULL).
*/ */
init_tg_cfs_entry(rq, &init_task_group, &rq->cfs, NULL, i, 1); init_tg_cfs_entry(&init_task_group, &rq->cfs, NULL, i, 1, NULL);
#elif defined CONFIG_USER_SCHED #elif defined CONFIG_USER_SCHED
/* /*
* In case of task-groups formed thr' the user id of tasks, * In case of task-groups formed thr' the user id of tasks,
...@@ -7581,9 +7593,9 @@ void __init sched_init(void) ...@@ -7581,9 +7593,9 @@ void __init sched_init(void)
* (init_cfs_rq) and having one entity represent this group of * (init_cfs_rq) and having one entity represent this group of
* tasks in rq->cfs (i.e init_task_group->se[] != NULL). * tasks in rq->cfs (i.e init_task_group->se[] != NULL).
*/ */
init_tg_cfs_entry(rq, &init_task_group, init_tg_cfs_entry(&init_task_group,
&per_cpu(init_cfs_rq, i), &per_cpu(init_cfs_rq, i),
&per_cpu(init_sched_entity, i), i, 1); &per_cpu(init_sched_entity, i), i, 1, NULL);
#endif #endif
#endif /* CONFIG_FAIR_GROUP_SCHED */ #endif /* CONFIG_FAIR_GROUP_SCHED */
...@@ -7592,11 +7604,11 @@ void __init sched_init(void) ...@@ -7592,11 +7604,11 @@ void __init sched_init(void)
#ifdef CONFIG_RT_GROUP_SCHED #ifdef CONFIG_RT_GROUP_SCHED
INIT_LIST_HEAD(&rq->leaf_rt_rq_list); INIT_LIST_HEAD(&rq->leaf_rt_rq_list);
#ifdef CONFIG_CGROUP_SCHED #ifdef CONFIG_CGROUP_SCHED
init_tg_rt_entry(rq, &init_task_group, &rq->rt, NULL, i, 1); init_tg_rt_entry(&init_task_group, &rq->rt, NULL, i, 1, NULL);
#elif defined CONFIG_USER_SCHED #elif defined CONFIG_USER_SCHED
init_tg_rt_entry(rq, &init_task_group, init_tg_rt_entry(&init_task_group,
&per_cpu(init_rt_rq, i), &per_cpu(init_rt_rq, i),
&per_cpu(init_sched_rt_entity, i), i, 1); &per_cpu(init_sched_rt_entity, i), i, 1, NULL);
#endif #endif
#endif #endif
...@@ -7798,10 +7810,11 @@ static void free_fair_sched_group(struct task_group *tg) ...@@ -7798,10 +7810,11 @@ static void free_fair_sched_group(struct task_group *tg)
kfree(tg->se); kfree(tg->se);
} }
static int alloc_fair_sched_group(struct task_group *tg) static
int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent)
{ {
struct cfs_rq *cfs_rq; struct cfs_rq *cfs_rq;
struct sched_entity *se; struct sched_entity *se, *parent_se;
struct rq *rq; struct rq *rq;
int i; int i;
...@@ -7827,7 +7840,8 @@ static int alloc_fair_sched_group(struct task_group *tg) ...@@ -7827,7 +7840,8 @@ static int alloc_fair_sched_group(struct task_group *tg)
if (!se) if (!se)
goto err; goto err;
init_tg_cfs_entry(rq, tg, cfs_rq, se, i, 0); parent_se = parent ? parent->se[i] : NULL;
init_tg_cfs_entry(tg, cfs_rq, se, i, 0, parent_se);
} }
return 1; return 1;
...@@ -7851,7 +7865,8 @@ static inline void free_fair_sched_group(struct task_group *tg) ...@@ -7851,7 +7865,8 @@ static inline void free_fair_sched_group(struct task_group *tg)
{ {
} }
static inline int alloc_fair_sched_group(struct task_group *tg) static inline
int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent)
{ {
return 1; return 1;
} }
...@@ -7883,10 +7898,11 @@ static void free_rt_sched_group(struct task_group *tg) ...@@ -7883,10 +7898,11 @@ static void free_rt_sched_group(struct task_group *tg)
kfree(tg->rt_se); kfree(tg->rt_se);
} }
static int alloc_rt_sched_group(struct task_group *tg) static
int alloc_rt_sched_group(struct task_group *tg, struct task_group *parent)
{ {
struct rt_rq *rt_rq; struct rt_rq *rt_rq;
struct sched_rt_entity *rt_se; struct sched_rt_entity *rt_se, *parent_se;
struct rq *rq; struct rq *rq;
int i; int i;
...@@ -7913,7 +7929,8 @@ static int alloc_rt_sched_group(struct task_group *tg) ...@@ -7913,7 +7929,8 @@ static int alloc_rt_sched_group(struct task_group *tg)
if (!rt_se) if (!rt_se)
goto err; goto err;
init_tg_rt_entry(rq, tg, rt_rq, rt_se, i, 0); parent_se = parent ? parent->rt_se[i] : NULL;
init_tg_rt_entry(tg, rt_rq, rt_se, i, 0, parent_se);
} }
return 1; return 1;
...@@ -7937,7 +7954,8 @@ static inline void free_rt_sched_group(struct task_group *tg) ...@@ -7937,7 +7954,8 @@ static inline void free_rt_sched_group(struct task_group *tg)
{ {
} }
static inline int alloc_rt_sched_group(struct task_group *tg) static inline
int alloc_rt_sched_group(struct task_group *tg, struct task_group *parent)
{ {
return 1; return 1;
} }
...@@ -7960,7 +7978,7 @@ static void free_sched_group(struct task_group *tg) ...@@ -7960,7 +7978,7 @@ static void free_sched_group(struct task_group *tg)
} }
/* allocate runqueue etc for a new task group */ /* allocate runqueue etc for a new task group */
struct task_group *sched_create_group(void) struct task_group *sched_create_group(struct task_group *parent)
{ {
struct task_group *tg; struct task_group *tg;
unsigned long flags; unsigned long flags;
...@@ -7970,10 +7988,10 @@ struct task_group *sched_create_group(void) ...@@ -7970,10 +7988,10 @@ struct task_group *sched_create_group(void)
if (!tg) if (!tg)
return ERR_PTR(-ENOMEM); return ERR_PTR(-ENOMEM);
if (!alloc_fair_sched_group(tg)) if (!alloc_fair_sched_group(tg, parent))
goto err; goto err;
if (!alloc_rt_sched_group(tg)) if (!alloc_rt_sched_group(tg, parent))
goto err; goto err;
spin_lock_irqsave(&task_group_lock, flags); spin_lock_irqsave(&task_group_lock, flags);
...@@ -8084,6 +8102,12 @@ int sched_group_set_shares(struct task_group *tg, unsigned long shares) ...@@ -8084,6 +8102,12 @@ int sched_group_set_shares(struct task_group *tg, unsigned long shares)
int i; int i;
unsigned long flags; unsigned long flags;
/*
* We can't change the weight of the root cgroup.
*/
if (!tg->se[0])
return -EINVAL;
/* /*
* A weight of 0 or 1 can cause arithmetics problems. * A weight of 0 or 1 can cause arithmetics problems.
* (The default weight is 1024 - so there's no practical * (The default weight is 1024 - so there's no practical
...@@ -8327,7 +8351,7 @@ static inline struct task_group *cgroup_tg(struct cgroup *cgrp) ...@@ -8327,7 +8351,7 @@ static inline struct task_group *cgroup_tg(struct cgroup *cgrp)
static struct cgroup_subsys_state * static struct cgroup_subsys_state *
cpu_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cgrp) cpu_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cgrp)
{ {
struct task_group *tg; struct task_group *tg, *parent;
if (!cgrp->parent) { if (!cgrp->parent) {
/* This is early initialization for the top cgroup */ /* This is early initialization for the top cgroup */
...@@ -8335,11 +8359,8 @@ cpu_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cgrp) ...@@ -8335,11 +8359,8 @@ cpu_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cgrp)
return &init_task_group.css; return &init_task_group.css;
} }
/* we support only 1-level deep hierarchical scheduler atm */ parent = cgroup_tg(cgrp->parent);
if (cgrp->parent->parent) tg = sched_create_group(parent);
return ERR_PTR(-EINVAL);
tg = sched_create_group();
if (IS_ERR(tg)) if (IS_ERR(tg))
return ERR_PTR(-ENOMEM); return ERR_PTR(-ENOMEM);
......
...@@ -101,7 +101,7 @@ static int sched_create_user(struct user_struct *up) ...@@ -101,7 +101,7 @@ static int sched_create_user(struct user_struct *up)
{ {
int rc = 0; int rc = 0;
up->tg = sched_create_group(); up->tg = sched_create_group(NULL);
if (IS_ERR(up->tg)) if (IS_ERR(up->tg))
rc = -ENOMEM; rc = -ENOMEM;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment