cfs_bandwidth_used is a static_key to control cfs bandwidth
feature. When adding a cfs_bandwidth group, we need increase
the key, and decrease it when removing. But currently when we
remove a cfs bandwidth group, we don't decrease the key and
this switch will always be on even if there is no cfs bandwidth
group in the system.
Fix the problem as two steps:
1.Rename cfs_bandwidth_usage_{dec, inc}() to
cfs_bandwidth_usage_{dec,inc}_cpuslocked() and its caller need to
hold the hotplug lock.
2.Add cfs_bandwidth_usage_dec() and its caller don't need
to hold the hotplug lock. And when removing a cfs bandwidth group,
we decrease cfs_bandwidth_used by calling cfs_bandwidth_usage_dec().
Fixes: 56f570e512ee ("sched: use jump labels to reduce overhead when bandwidth control is inactive")
Signed-off-by: Zhang Qiao <[email protected]>
Reviewed-by: Daniel Jordan <[email protected]>
---
Changes since v3:
- Rebase it on the latest code
- Add Reviewed-by tag from Daniel
- link to patch v3: https://lkml.org/lkml/2021/7/15/2101
Changes since v2:
- Remove cfs_bandwidth_usage_inc()
- Make cfs_bandwidth_usage_dec() static
Changes since v1:
- Add suffix _cpuslocked to cfs_bandwidth_usage_{dec,inc}.
- Use static_key_slow_{dec,inc}_cpuslocked() in origin
cfs_bandwidth_usage_{dec,inc}().
---
kernel/sched/core.c | 4 ++--
kernel/sched/fair.c | 18 ++++++++++++++----
kernel/sched/sched.h | 4 ++--
3 files changed, 18 insertions(+), 8 deletions(-)
diff --git a/kernel/sched/core.c b/kernel/sched/core.c
index c4462c454ab9..0e8c789e84a9 100644
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -10221,7 +10221,7 @@ static int tg_set_cfs_bandwidth(struct task_group *tg, u64 period, u64 quota,
* before making related changes, and on->off must occur afterwards
*/
if (runtime_enabled && !runtime_was_enabled)
- cfs_bandwidth_usage_inc();
+ cfs_bandwidth_usage_inc_cpuslocked();
raw_spin_lock_irq(&cfs_b->lock);
cfs_b->period = ns_to_ktime(period);
cfs_b->quota = quota;
@@ -10249,7 +10249,7 @@ static int tg_set_cfs_bandwidth(struct task_group *tg, u64 period, u64 quota,
rq_unlock_irq(rq, &rf);
}
if (runtime_was_enabled && !runtime_enabled)
- cfs_bandwidth_usage_dec();
+ cfs_bandwidth_usage_dec_cpuslocked();
out_unlock:
mutex_unlock(&cfs_constraints_mutex);
cpus_read_unlock();
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c
index ff69f245b939..28f2e7600b53 100644
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -4645,23 +4645,30 @@ static inline bool cfs_bandwidth_used(void)
return static_key_false(&__cfs_bandwidth_used);
}
-void cfs_bandwidth_usage_inc(void)
+void cfs_bandwidth_usage_inc_cpuslocked(void)
{
static_key_slow_inc_cpuslocked(&__cfs_bandwidth_used);
}
-void cfs_bandwidth_usage_dec(void)
+void cfs_bandwidth_usage_dec_cpuslocked(void)
{
static_key_slow_dec_cpuslocked(&__cfs_bandwidth_used);
}
+
+static void cfs_bandwidth_usage_dec(void)
+{
+ static_key_slow_dec(&__cfs_bandwidth_used);
+}
#else /* CONFIG_JUMP_LABEL */
static bool cfs_bandwidth_used(void)
{
return true;
}
-void cfs_bandwidth_usage_inc(void) {}
-void cfs_bandwidth_usage_dec(void) {}
+void cfs_bandwidth_usage_inc_cpuslocked(void) {}
+void cfs_bandwidth_usage_dec_cpuslocked(void) {}
+
+static void cfs_bandwidth_usage_dec(void) {}
#endif /* CONFIG_JUMP_LABEL */
/*
@@ -5389,6 +5396,9 @@ static void destroy_cfs_bandwidth(struct cfs_bandwidth *cfs_b)
if (!cfs_b->throttled_cfs_rq.next)
return;
+ if (cfs_b->quota != RUNTIME_INF)
+ cfs_bandwidth_usage_dec();
+
hrtimer_cancel(&cfs_b->period_timer);
hrtimer_cancel(&cfs_b->slack_timer);
}
diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h
index 3d3e5793e117..05fed8f5e15c 100644
--- a/kernel/sched/sched.h
+++ b/kernel/sched/sched.h
@@ -2702,8 +2702,8 @@ extern void init_cfs_rq(struct cfs_rq *cfs_rq);
extern void init_rt_rq(struct rt_rq *rt_rq);
extern void init_dl_rq(struct dl_rq *dl_rq);
-extern void cfs_bandwidth_usage_inc(void);
-extern void cfs_bandwidth_usage_dec(void);
+extern void cfs_bandwidth_usage_inc_cpuslocked(void);
+extern void cfs_bandwidth_usage_dec_cpuslocked(void);
#ifdef CONFIG_NO_HZ_COMMON
#define NOHZ_BALANCE_KICK_BIT 0
--
2.18.0