Skip to content

Commit e636ffb

Browse files
author
Peter Zijlstra
committed
sched/deadline: Fix dl_server time accounting
The dl_server time accounting code is a little odd. The normal scheduler pattern is to update curr before doing something, such that the old state is fully accounted before changing state. Notably, the dl_server_timer() needs to propagate the current time accounting since the current task could be ran by dl_server and thus this can affect dl_se->runtime. Similarly for dl_server_start(). And since the (deferred) dl_server wants idle time accounted, rework sched_idle_class time accounting to be more like all the others. Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org> Link: https://patch.msgid.link/20251020141130.GJ3245006@noisy.programming.kicks-ass.net
1 parent e40cea3 commit e636ffb

4 files changed

Lines changed: 33 additions & 35 deletions

File tree

kernel/sched/deadline.c

Lines changed: 15 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -1166,8 +1166,12 @@ static enum hrtimer_restart dl_server_timer(struct hrtimer *timer, struct sched_
11661166
sched_clock_tick();
11671167
update_rq_clock(rq);
11681168

1169-
if (!dl_se->dl_runtime)
1170-
return HRTIMER_NORESTART;
1169+
/*
1170+
* Make sure current has propagated its pending runtime into
1171+
* any relevant server through calling dl_server_update() and
1172+
* friends.
1173+
*/
1174+
rq->donor->sched_class->update_curr(rq);
11711175

11721176
if (dl_se->dl_defer_armed) {
11731177
/*
@@ -1543,35 +1547,16 @@ static void update_curr_dl_se(struct rq *rq, struct sched_dl_entity *dl_se, s64
15431547
* as time available for the fair server, avoiding a penalty for the
15441548
* rt scheduler that did not consumed that time.
15451549
*/
1546-
void dl_server_update_idle_time(struct rq *rq, struct task_struct *p)
1550+
void dl_server_update_idle(struct sched_dl_entity *dl_se, s64 delta_exec)
15471551
{
1548-
s64 delta_exec;
1549-
1550-
if (!rq->fair_server.dl_defer)
1551-
return;
1552-
1553-
/* no need to discount more */
1554-
if (rq->fair_server.runtime < 0)
1555-
return;
1556-
1557-
delta_exec = rq_clock_task(rq) - p->se.exec_start;
1558-
if (delta_exec < 0)
1559-
return;
1560-
1561-
rq->fair_server.runtime -= delta_exec;
1562-
1563-
if (rq->fair_server.runtime < 0) {
1564-
rq->fair_server.dl_defer_running = 0;
1565-
rq->fair_server.runtime = 0;
1566-
}
1567-
1568-
p->se.exec_start = rq_clock_task(rq);
1552+
if (dl_se->dl_server_active && dl_se->dl_runtime && dl_se->dl_defer)
1553+
update_curr_dl_se(dl_se->rq, dl_se, delta_exec);
15691554
}
15701555

15711556
void dl_server_update(struct sched_dl_entity *dl_se, s64 delta_exec)
15721557
{
15731558
/* 0 runtime = fair server disabled */
1574-
if (dl_se->dl_runtime)
1559+
if (dl_se->dl_server_active && dl_se->dl_runtime)
15751560
update_curr_dl_se(dl_se->rq, dl_se, delta_exec);
15761561
}
15771562

@@ -1582,6 +1567,11 @@ void dl_server_start(struct sched_dl_entity *dl_se)
15821567
if (!dl_server(dl_se) || dl_se->dl_server_active)
15831568
return;
15841569

1570+
/*
1571+
* Update the current task to 'now'.
1572+
*/
1573+
rq->donor->sched_class->update_curr(rq);
1574+
15851575
if (WARN_ON_ONCE(!cpu_online(cpu_of(rq))))
15861576
return;
15871577

kernel/sched/fair.c

Lines changed: 2 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -1212,8 +1212,7 @@ static void update_curr(struct cfs_rq *cfs_rq)
12121212
* against fair_server such that it can account for this time
12131213
* and possibly avoid running this period.
12141214
*/
1215-
if (dl_server_active(&rq->fair_server))
1216-
dl_server_update(&rq->fair_server, delta_exec);
1215+
dl_server_update(&rq->fair_server, delta_exec);
12171216
}
12181217

12191218
account_cfs_rq_runtime(cfs_rq, delta_exec);
@@ -6961,12 +6960,8 @@ enqueue_task_fair(struct rq *rq, struct task_struct *p, int flags)
69616960
h_nr_idle = 1;
69626961
}
69636962

6964-
if (!rq_h_nr_queued && rq->cfs.h_nr_queued) {
6965-
/* Account for idle runtime */
6966-
if (!rq->nr_running)
6967-
dl_server_update_idle_time(rq, rq->curr);
6963+
if (!rq_h_nr_queued && rq->cfs.h_nr_queued)
69686964
dl_server_start(&rq->fair_server);
6969-
}
69706965

69716966
/* At this point se is NULL and we are at root level*/
69726967
add_nr_running(rq, 1);

kernel/sched/idle.c

Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -452,9 +452,11 @@ static void wakeup_preempt_idle(struct rq *rq, struct task_struct *p, int flags)
452452
resched_curr(rq);
453453
}
454454

455+
static void update_curr_idle(struct rq *rq);
456+
455457
static void put_prev_task_idle(struct rq *rq, struct task_struct *prev, struct task_struct *next)
456458
{
457-
dl_server_update_idle_time(rq, prev);
459+
update_curr_idle(rq);
458460
scx_update_idle(rq, false, true);
459461
}
460462

@@ -496,6 +498,7 @@ dequeue_task_idle(struct rq *rq, struct task_struct *p, int flags)
496498
*/
497499
static void task_tick_idle(struct rq *rq, struct task_struct *curr, int queued)
498500
{
501+
update_curr_idle(rq);
499502
}
500503

501504
static void switching_to_idle(struct rq *rq, struct task_struct *p)
@@ -514,6 +517,17 @@ prio_changed_idle(struct rq *rq, struct task_struct *p, u64 oldprio)
514517

515518
static void update_curr_idle(struct rq *rq)
516519
{
520+
struct sched_entity *se = &rq->idle->se;
521+
u64 now = rq_clock_task(rq);
522+
s64 delta_exec;
523+
524+
delta_exec = now - se->exec_start;
525+
if (unlikely(delta_exec <= 0))
526+
return;
527+
528+
se->exec_start = now;
529+
530+
dl_server_update_idle(&rq->fair_server, delta_exec);
517531
}
518532

519533
/*

kernel/sched/sched.h

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -404,15 +404,14 @@ extern s64 dl_scaled_delta_exec(struct rq *rq, struct sched_dl_entity *dl_se, s6
404404
* naturally thottled to once per period, avoiding high context switch
405405
* workloads from spamming the hrtimer program/cancel paths.
406406
*/
407+
extern void dl_server_update_idle(struct sched_dl_entity *dl_se, s64 delta_exec);
407408
extern void dl_server_update(struct sched_dl_entity *dl_se, s64 delta_exec);
408409
extern void dl_server_start(struct sched_dl_entity *dl_se);
409410
extern void dl_server_stop(struct sched_dl_entity *dl_se);
410411
extern void dl_server_init(struct sched_dl_entity *dl_se, struct rq *rq,
411412
dl_server_pick_f pick_task);
412413
extern void sched_init_dl_servers(void);
413414

414-
extern void dl_server_update_idle_time(struct rq *rq,
415-
struct task_struct *p);
416415
extern void fair_server_init(struct rq *rq);
417416
extern void __dl_server_attach_root(struct sched_dl_entity *dl_se, struct rq *rq);
418417
extern int dl_server_apply_params(struct sched_dl_entity *dl_se,

0 commit comments

Comments
 (0)