Skip to content

Commit c8a8539

Browse files
joelagnelPeter Zijlstra
authored andcommitted
sched/core: Fix picking of tasks for core scheduling with DL server
* Use simple CFS pick_task for DL pick_task DL server's pick_task calls CFS's pick_next_task_fair(), this is wrong because core scheduling's pick_task only calls CFS's pick_task() for evaluation / checking of the CFS task (comparing across CPUs), not for actually affirmatively picking the next task. This causes RB tree corruption issues in CFS that were found by syzbot. * Make pick_task_fair clear DL server A DL task pick might set ->dl_server, but it is possible the task will never run (say the other HT has a stop task). If the CFS task is picked in the future directly (say without DL server), ->dl_server will be set. So clear it in pick_task_fair(). This fixes the KASAN issue reported by syzbot in set_next_entity(). (DL refactoring suggestions by Vineeth Pillai). Reported-by: Suleiman Souhlal <[email protected]> Signed-off-by: "Joel Fernandes (Google)" <[email protected]> Signed-off-by: Daniel Bristot de Oliveira <[email protected]> Signed-off-by: Peter Zijlstra (Intel) <[email protected]> Reviewed-by: Vineeth Pillai <[email protected]> Tested-by: Juri Lelli <[email protected]> Link: https://lore.kernel.org/r/b10489ab1f03d23e08e6097acea47442e7d6466f.1716811044.git.bristot@kernel.org
1 parent 4b26cfd commit c8a8539

File tree

4 files changed

+47
-9
lines changed

4 files changed

+47
-9
lines changed

include/linux/sched.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -686,7 +686,8 @@ struct sched_dl_entity {
686686
*/
687687
struct rq *rq;
688688
dl_server_has_tasks_f server_has_tasks;
689-
dl_server_pick_f server_pick;
689+
dl_server_pick_f server_pick_next;
690+
dl_server_pick_f server_pick_task;
690691

691692
#ifdef CONFIG_RT_MUTEXES
692693
/*

kernel/sched/deadline.c

Lines changed: 22 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1664,11 +1664,13 @@ void dl_server_stop(struct sched_dl_entity *dl_se)
16641664

16651665
void dl_server_init(struct sched_dl_entity *dl_se, struct rq *rq,
16661666
dl_server_has_tasks_f has_tasks,
1667-
dl_server_pick_f pick)
1667+
dl_server_pick_f pick_next,
1668+
dl_server_pick_f pick_task)
16681669
{
16691670
dl_se->rq = rq;
16701671
dl_se->server_has_tasks = has_tasks;
1671-
dl_se->server_pick = pick;
1672+
dl_se->server_pick_next = pick_next;
1673+
dl_se->server_pick_task = pick_task;
16721674
}
16731675

16741676
void __dl_server_attach_root(struct sched_dl_entity *dl_se, struct rq *rq)
@@ -2399,7 +2401,12 @@ static struct sched_dl_entity *pick_next_dl_entity(struct dl_rq *dl_rq)
23992401
return __node_2_dle(left);
24002402
}
24012403

2402-
static struct task_struct *pick_task_dl(struct rq *rq)
2404+
/*
2405+
* __pick_next_task_dl - Helper to pick the next -deadline task to run.
2406+
* @rq: The runqueue to pick the next task from.
2407+
* @peek: If true, just peek at the next task. Only relevant for dlserver.
2408+
*/
2409+
static struct task_struct *__pick_next_task_dl(struct rq *rq, bool peek)
24032410
{
24042411
struct sched_dl_entity *dl_se;
24052412
struct dl_rq *dl_rq = &rq->dl;
@@ -2413,7 +2420,10 @@ static struct task_struct *pick_task_dl(struct rq *rq)
24132420
WARN_ON_ONCE(!dl_se);
24142421

24152422
if (dl_server(dl_se)) {
2416-
p = dl_se->server_pick(dl_se);
2423+
if (IS_ENABLED(CONFIG_SMP) && peek)
2424+
p = dl_se->server_pick_task(dl_se);
2425+
else
2426+
p = dl_se->server_pick_next(dl_se);
24172427
if (!p) {
24182428
WARN_ON_ONCE(1);
24192429
dl_se->dl_yielded = 1;
@@ -2428,11 +2438,18 @@ static struct task_struct *pick_task_dl(struct rq *rq)
24282438
return p;
24292439
}
24302440

2441+
#ifdef CONFIG_SMP
2442+
static struct task_struct *pick_task_dl(struct rq *rq)
2443+
{
2444+
return __pick_next_task_dl(rq, true);
2445+
}
2446+
#endif
2447+
24312448
static struct task_struct *pick_next_task_dl(struct rq *rq)
24322449
{
24332450
struct task_struct *p;
24342451

2435-
p = pick_task_dl(rq);
2452+
p = __pick_next_task_dl(rq, false);
24362453
if (!p)
24372454
return p;
24382455

kernel/sched/fair.c

Lines changed: 21 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8479,6 +8479,14 @@ static struct task_struct *pick_task_fair(struct rq *rq)
84798479
cfs_rq = group_cfs_rq(se);
84808480
} while (cfs_rq);
84818481

8482+
/*
8483+
* This can be called from directly from CFS's ->pick_task() or indirectly
8484+
* from DL's ->pick_task when fair server is enabled. In the indirect case,
8485+
* DL will set ->dl_server just after this function is called, so its Ok to
8486+
* clear. In the direct case, we are picking directly so we must clear it.
8487+
*/
8488+
task_of(se)->dl_server = NULL;
8489+
84828490
return task_of(se);
84838491
}
84848492
#endif
@@ -8638,7 +8646,16 @@ static bool fair_server_has_tasks(struct sched_dl_entity *dl_se)
86388646
return !!dl_se->rq->cfs.nr_running;
86398647
}
86408648

8641-
static struct task_struct *fair_server_pick(struct sched_dl_entity *dl_se)
8649+
static struct task_struct *fair_server_pick_task(struct sched_dl_entity *dl_se)
8650+
{
8651+
#ifdef CONFIG_SMP
8652+
return pick_task_fair(dl_se->rq);
8653+
#else
8654+
return NULL;
8655+
#endif
8656+
}
8657+
8658+
static struct task_struct *fair_server_pick_next(struct sched_dl_entity *dl_se)
86428659
{
86438660
return pick_next_task_fair(dl_se->rq, NULL, NULL);
86448661
}
@@ -8649,7 +8666,9 @@ void fair_server_init(struct rq *rq)
86498666

86508667
init_dl_entity(dl_se);
86518668

8652-
dl_server_init(dl_se, rq, fair_server_has_tasks, fair_server_pick);
8669+
dl_server_init(dl_se, rq, fair_server_has_tasks, fair_server_pick_next,
8670+
fair_server_pick_task);
8671+
86538672
}
86548673

86558674
/*

kernel/sched/sched.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -361,7 +361,8 @@ extern void dl_server_start(struct sched_dl_entity *dl_se);
361361
extern void dl_server_stop(struct sched_dl_entity *dl_se);
362362
extern void dl_server_init(struct sched_dl_entity *dl_se, struct rq *rq,
363363
dl_server_has_tasks_f has_tasks,
364-
dl_server_pick_f pick);
364+
dl_server_pick_f pick_next,
365+
dl_server_pick_f pick_task);
365366

366367
extern void dl_server_update_idle_time(struct rq *rq,
367368
struct task_struct *p);

0 commit comments

Comments
 (0)