1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */ 297fb7a0aSIngo Molnar /* 397fb7a0aSIngo Molnar * Scheduler internal types and methods: 497fb7a0aSIngo Molnar */ 595458477SIngo Molnar #ifndef _KERNEL_SCHED_SCHED_H 695458477SIngo Molnar #define _KERNEL_SCHED_SCHED_H 7325ea10cSIngo Molnar 8801c1419SIngo Molnar #include <linux/sched/affinity.h> 9dfc3401aSIngo Molnar #include <linux/sched/autogroup.h> 1055687da1SIngo Molnar #include <linux/sched/cpufreq.h> 11325ea10cSIngo Molnar #include <linux/sched/deadline.h> 124ff8f2caSIngo Molnar #include <linux/sched.h> 13325ea10cSIngo Molnar #include <linux/sched/loadavg.h> 14325ea10cSIngo Molnar #include <linux/sched/mm.h> 15801c1419SIngo Molnar #include <linux/sched/rseq_api.h> 16325ea10cSIngo Molnar #include <linux/sched/signal.h> 17321a874aSThomas Gleixner #include <linux/sched/smt.h> 18325ea10cSIngo Molnar #include <linux/sched/stat.h> 19325ea10cSIngo Molnar #include <linux/sched/sysctl.h> 204ff8f2caSIngo Molnar #include <linux/sched/task_flags.h> 2129930025SIngo Molnar #include <linux/sched/task.h> 22325ea10cSIngo Molnar #include <linux/sched/topology.h> 23ef8bd77fSIngo Molnar 244ff8f2caSIngo Molnar #include <linux/atomic.h> 254ff8f2caSIngo Molnar #include <linux/bitmap.h> 264ff8f2caSIngo Molnar #include <linux/bug.h> 274ff8f2caSIngo Molnar #include <linux/capability.h> 284ff8f2caSIngo Molnar #include <linux/cgroup_api.h> 294ff8f2caSIngo Molnar #include <linux/cgroup.h> 30325ea10cSIngo Molnar #include <linux/cpufreq.h> 314ff8f2caSIngo Molnar #include <linux/cpumask_api.h> 32325ea10cSIngo Molnar #include <linux/ctype.h> 334ff8f2caSIngo Molnar #include <linux/file.h> 344ff8f2caSIngo Molnar #include <linux/fs_api.h> 354ff8f2caSIngo Molnar #include <linux/hrtimer_api.h> 364ff8f2caSIngo Molnar #include <linux/interrupt.h> 374ff8f2caSIngo Molnar #include <linux/irq_work.h> 384ff8f2caSIngo Molnar #include <linux/jiffies.h> 394ff8f2caSIngo Molnar #include <linux/kref_api.h> 40325ea10cSIngo Molnar #include <linux/kthread.h> 414ff8f2caSIngo Molnar #include <linux/ktime_api.h> 424ff8f2caSIngo Molnar #include <linux/lockdep_api.h> 434ff8f2caSIngo Molnar #include <linux/lockdep.h> 444ff8f2caSIngo Molnar #include <linux/minmax.h> 454ff8f2caSIngo Molnar #include <linux/mm.h> 464ff8f2caSIngo Molnar #include <linux/module.h> 474ff8f2caSIngo Molnar #include <linux/mutex_api.h> 484ff8f2caSIngo Molnar #include <linux/plist.h> 494ff8f2caSIngo Molnar #include <linux/poll.h> 50325ea10cSIngo Molnar #include <linux/proc_fs.h> 51325ea10cSIngo Molnar #include <linux/profile.h> 52eb414681SJohannes Weiner #include <linux/psi.h> 534ff8f2caSIngo Molnar #include <linux/rcupdate.h> 544ff8f2caSIngo Molnar #include <linux/seq_file.h> 554ff8f2caSIngo Molnar #include <linux/seqlock.h> 564ff8f2caSIngo Molnar #include <linux/softirq.h> 574ff8f2caSIngo Molnar #include <linux/spinlock_api.h> 584ff8f2caSIngo Molnar #include <linux/static_key.h> 59391e43daSPeter Zijlstra #include <linux/stop_machine.h> 604ff8f2caSIngo Molnar #include <linux/syscalls_api.h> 61325ea10cSIngo Molnar #include <linux/syscalls.h> 624ff8f2caSIngo Molnar #include <linux/tick.h> 634ff8f2caSIngo Molnar #include <linux/topology.h> 644ff8f2caSIngo Molnar #include <linux/types.h> 654ff8f2caSIngo Molnar #include <linux/u64_stats_sync_api.h> 664ff8f2caSIngo Molnar #include <linux/uaccess.h> 674ff8f2caSIngo Molnar #include <linux/wait_api.h> 684ff8f2caSIngo Molnar #include <linux/wait_bit.h> 694ff8f2caSIngo Molnar #include <linux/workqueue_api.h> 70325ea10cSIngo Molnar 714ff8f2caSIngo Molnar #include 
<trace/events/power.h> 72b9e9c6caSIngo Molnar #include <trace/events/sched.h> 73b9e9c6caSIngo Molnar 744ff8f2caSIngo Molnar #include "../workqueue_internal.h" 754ff8f2caSIngo Molnar 76b9e9c6caSIngo Molnar #ifdef CONFIG_CGROUP_SCHED 77b9e9c6caSIngo Molnar #include <linux/cgroup.h> 78b9e9c6caSIngo Molnar #include <linux/psi.h> 79b9e9c6caSIngo Molnar #endif 80b9e9c6caSIngo Molnar 81b9e9c6caSIngo Molnar #ifdef CONFIG_SCHED_DEBUG 82b9e9c6caSIngo Molnar # include <linux/static_key.h> 83b9e9c6caSIngo Molnar #endif 84391e43daSPeter Zijlstra 857fce777cSIngo Molnar #ifdef CONFIG_PARAVIRT 867fce777cSIngo Molnar # include <asm/paravirt.h> 874ff8f2caSIngo Molnar # include <asm/paravirt_api_clock.h> 887fce777cSIngo Molnar #endif 897fce777cSIngo Molnar 90391e43daSPeter Zijlstra #include "cpupri.h" 916bfd6d72SJuri Lelli #include "cpudeadline.h" 92391e43daSPeter Zijlstra 939148a3a1SPeter Zijlstra #ifdef CONFIG_SCHED_DEBUG 949148a3a1SPeter Zijlstra # define SCHED_WARN_ON(x) WARN_ONCE(x, #x) 959148a3a1SPeter Zijlstra #else 966d3aed3dSIngo Molnar # define SCHED_WARN_ON(x) ({ (void)(x), 0; }) 979148a3a1SPeter Zijlstra #endif 989148a3a1SPeter Zijlstra 9945ceebf7SPaul Gortmaker struct rq; 100442bf3aaSDaniel Lezcano struct cpuidle_state; 10145ceebf7SPaul Gortmaker 102da0c1e65SKirill Tkhai /* task_struct::on_rq states: */ 103da0c1e65SKirill Tkhai #define TASK_ON_RQ_QUEUED 1 104cca26e80SKirill Tkhai #define TASK_ON_RQ_MIGRATING 2 105da0c1e65SKirill Tkhai 106391e43daSPeter Zijlstra extern __read_mostly int scheduler_running; 107391e43daSPeter Zijlstra 10845ceebf7SPaul Gortmaker extern unsigned long calc_load_update; 10945ceebf7SPaul Gortmaker extern atomic_long_t calc_load_tasks; 11045ceebf7SPaul Gortmaker 1113289bdb4SPeter Zijlstra extern void calc_global_load_tick(struct rq *this_rq); 112d60585c5SThomas Gleixner extern long calc_load_fold_active(struct rq *this_rq, long adjust); 1133289bdb4SPeter Zijlstra 1149d246053SPhil Auld extern void call_trace_sched_update_nr_running(struct rq *rq, int count); 115391e43daSPeter Zijlstra /* 116391e43daSPeter Zijlstra * Helpers for converting nanosecond timing to jiffy resolution 117391e43daSPeter Zijlstra */ 118391e43daSPeter Zijlstra #define NS_TO_JIFFIES(TIME) ((unsigned long)(TIME) / (NSEC_PER_SEC / HZ)) 119391e43daSPeter Zijlstra 120cc1f4b1fSLi Zefan /* 121cc1f4b1fSLi Zefan * Increase resolution of nice-level calculations for 64-bit architectures. 122cc1f4b1fSLi Zefan * The extra resolution improves shares distribution and load balancing of 123cc1f4b1fSLi Zefan * low-weight task groups (eg. nice +19 on an autogroup), deeper taskgroup 124cc1f4b1fSLi Zefan * hierarchies, especially on larger systems. This is not a user-visible change 125cc1f4b1fSLi Zefan * and does not change the user-interface for setting shares/weights. 126cc1f4b1fSLi Zefan * 127cc1f4b1fSLi Zefan * We increase resolution only if we have enough bits to allow this increased 12897fb7a0aSIngo Molnar * resolution (i.e. 64-bit). The costs for increasing resolution when 32-bit 12997fb7a0aSIngo Molnar * are pretty high and the returns do not justify the increased costs. 1302159197dSPeter Zijlstra * 13197fb7a0aSIngo Molnar * Really only required when CONFIG_FAIR_GROUP_SCHED=y is also set, but to 13297fb7a0aSIngo Molnar * increase coverage and consistency always enable it on 64-bit platforms. 
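 *
 * A rough illustration of what the extra resolution buys (assuming a
 * 64-bit build, where SCHED_FIXEDPOINT_SHIFT is 10 and NICE_0_LOAD is
 * therefore 1 << 20):
 *
 *	unsigned long w  = sched_prio_to_weight[NICE_TO_PRIO(0) - MAX_RT_PRIO];
 *	unsigned long lw = scale_load(w);	// 1024 << 10 == NICE_0_LOAD
 *	unsigned long uw = scale_load_down(lw);	// back to the user-visible 1024
 *
 * Note that scale_load_down() clamps any non-zero weight to at least 2,
 * so a deeply scaled-down group weight can never collapse to 0 or 1.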
133cc1f4b1fSLi Zefan */ 1342159197dSPeter Zijlstra #ifdef CONFIG_64BIT 135172895e6SYuyang Du # define NICE_0_LOAD_SHIFT (SCHED_FIXEDPOINT_SHIFT + SCHED_FIXEDPOINT_SHIFT) 1366ecdd749SYuyang Du # define scale_load(w) ((w) << SCHED_FIXEDPOINT_SHIFT) 13726cf5222SMichael Wang # define scale_load_down(w) \ 13826cf5222SMichael Wang ({ \ 13926cf5222SMichael Wang unsigned long __w = (w); \ 14026cf5222SMichael Wang if (__w) \ 14126cf5222SMichael Wang __w = max(2UL, __w >> SCHED_FIXEDPOINT_SHIFT); \ 14226cf5222SMichael Wang __w; \ 14326cf5222SMichael Wang }) 144cc1f4b1fSLi Zefan #else 145172895e6SYuyang Du # define NICE_0_LOAD_SHIFT (SCHED_FIXEDPOINT_SHIFT) 146cc1f4b1fSLi Zefan # define scale_load(w) (w) 147cc1f4b1fSLi Zefan # define scale_load_down(w) (w) 148cc1f4b1fSLi Zefan #endif 149cc1f4b1fSLi Zefan 1506ecdd749SYuyang Du /* 151172895e6SYuyang Du * Task weight (visible to users) and its load (invisible to users) have 152172895e6SYuyang Du * independent resolution, but they should be well calibrated. We use 153172895e6SYuyang Du * scale_load() and scale_load_down(w) to convert between them. The 154172895e6SYuyang Du * following must be true: 155172895e6SYuyang Du * 1569d061ba6SDietmar Eggemann * scale_load(sched_prio_to_weight[NICE_TO_PRIO(0)-MAX_RT_PRIO]) == NICE_0_LOAD 157172895e6SYuyang Du * 1586ecdd749SYuyang Du */ 159172895e6SYuyang Du #define NICE_0_LOAD (1L << NICE_0_LOAD_SHIFT) 160391e43daSPeter Zijlstra 161391e43daSPeter Zijlstra /* 162332ac17eSDario Faggioli * Single value that decides SCHED_DEADLINE internal math precision. 163332ac17eSDario Faggioli * 10 -> just above 1us 164332ac17eSDario Faggioli * 9 -> just above 0.5us 165332ac17eSDario Faggioli */ 16697fb7a0aSIngo Molnar #define DL_SCALE 10 167332ac17eSDario Faggioli 168332ac17eSDario Faggioli /* 16997fb7a0aSIngo Molnar * Single value that denotes runtime == period, ie unlimited time. 
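 *
 * Bandwidth code compares against this sentinel before doing any
 * throttling arithmetic; an illustrative sketch of the usual pattern
 * (as in the RT runtime accounting):
 *
 *	if (sched_rt_runtime(rt_rq) == RUNTIME_INF)
 *		return;	// unlimited runtime, nothing to throttle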
170391e43daSPeter Zijlstra */ 171391e43daSPeter Zijlstra #define RUNTIME_INF ((u64)~0ULL) 172391e43daSPeter Zijlstra 17320f9cd2aSHenrik Austad static inline int idle_policy(int policy) 17420f9cd2aSHenrik Austad { 17520f9cd2aSHenrik Austad return policy == SCHED_IDLE; 17620f9cd2aSHenrik Austad } 177d50dde5aSDario Faggioli static inline int fair_policy(int policy) 178d50dde5aSDario Faggioli { 179d50dde5aSDario Faggioli return policy == SCHED_NORMAL || policy == SCHED_BATCH; 180d50dde5aSDario Faggioli } 181d50dde5aSDario Faggioli 182391e43daSPeter Zijlstra static inline int rt_policy(int policy) 183391e43daSPeter Zijlstra { 184d50dde5aSDario Faggioli return policy == SCHED_FIFO || policy == SCHED_RR; 185391e43daSPeter Zijlstra } 186391e43daSPeter Zijlstra 187aab03e05SDario Faggioli static inline int dl_policy(int policy) 188aab03e05SDario Faggioli { 189aab03e05SDario Faggioli return policy == SCHED_DEADLINE; 190aab03e05SDario Faggioli } 19120f9cd2aSHenrik Austad static inline bool valid_policy(int policy) 19220f9cd2aSHenrik Austad { 19320f9cd2aSHenrik Austad return idle_policy(policy) || fair_policy(policy) || 19420f9cd2aSHenrik Austad rt_policy(policy) || dl_policy(policy); 19520f9cd2aSHenrik Austad } 196aab03e05SDario Faggioli 1971da1843fSViresh Kumar static inline int task_has_idle_policy(struct task_struct *p) 1981da1843fSViresh Kumar { 1991da1843fSViresh Kumar return idle_policy(p->policy); 2001da1843fSViresh Kumar } 2011da1843fSViresh Kumar 202391e43daSPeter Zijlstra static inline int task_has_rt_policy(struct task_struct *p) 203391e43daSPeter Zijlstra { 204391e43daSPeter Zijlstra return rt_policy(p->policy); 205391e43daSPeter Zijlstra } 206391e43daSPeter Zijlstra 207aab03e05SDario Faggioli static inline int task_has_dl_policy(struct task_struct *p) 208aab03e05SDario Faggioli { 209aab03e05SDario Faggioli return dl_policy(p->policy); 210aab03e05SDario Faggioli } 211aab03e05SDario Faggioli 21207881166SJuri Lelli #define cap_scale(v, s) ((v)*(s) >> SCHED_CAPACITY_SHIFT) 21307881166SJuri Lelli 214d76343c6SValentin Schneider static inline void update_avg(u64 *avg, u64 sample) 215d76343c6SValentin Schneider { 216d76343c6SValentin Schneider s64 diff = sample - *avg; 217d76343c6SValentin Schneider *avg += diff / 8; 218d76343c6SValentin Schneider } 219d76343c6SValentin Schneider 2202d3d891dSDario Faggioli /* 22139a2a6ebSValentin Schneider * Shifting a value by an exponent greater *or equal* to the size of said value 22239a2a6ebSValentin Schneider * is UB; cap at size-1. 22339a2a6ebSValentin Schneider */ 22439a2a6ebSValentin Schneider #define shr_bound(val, shift) \ 22539a2a6ebSValentin Schneider (val >> min_t(typeof(shift), shift, BITS_PER_TYPE(typeof(val)) - 1)) 22639a2a6ebSValentin Schneider 22739a2a6ebSValentin Schneider /* 228794a56ebSJuri Lelli * !! For sched_setattr_nocheck() (kernel) only !! 229794a56ebSJuri Lelli * 230794a56ebSJuri Lelli * This is actually gross. :( 231794a56ebSJuri Lelli * 232794a56ebSJuri Lelli * It is used to make schedutil kworker(s) higher priority than SCHED_DEADLINE 233794a56ebSJuri Lelli * tasks, but still be able to sleep. We need this on platforms that cannot 234794a56ebSJuri Lelli * atomically change clock frequency. Remove once fast switching will be 235794a56ebSJuri Lelli * available on such platforms. 236794a56ebSJuri Lelli * 237794a56ebSJuri Lelli * SUGOV stands for SchedUtil GOVernor. 
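 *
 * For illustration, the schedutil governor sets its kworker up roughly
 * like this: a SCHED_DEADLINE task carrying the special flag (sketch of
 * sugov_kthread_create(); exact attr values vary across versions):
 *
 *	struct sched_attr attr = {
 *		.size		= sizeof(struct sched_attr),
 *		.sched_policy	= SCHED_DEADLINE,
 *		.sched_flags	= SCHED_FLAG_SUGOV,
 *		// nominal runtime/deadline/period, unused for SUGOV tasks
 *	};
 *
 *	sched_setattr_nocheck(thread, &attr);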
 */
#define SCHED_FLAG_SUGOV	0x10000000

#define SCHED_DL_FLAGS (SCHED_FLAG_RECLAIM | SCHED_FLAG_DL_OVERRUN | SCHED_FLAG_SUGOV)

static inline bool dl_entity_is_special(struct sched_dl_entity *dl_se)
{
#ifdef CONFIG_CPU_FREQ_GOV_SCHEDUTIL
	return unlikely(dl_se->flags & SCHED_FLAG_SUGOV);
#else
	return false;
#endif
}

/*
 * Tells if entity @a should preempt entity @b.
 */
static inline bool
dl_entity_preempt(struct sched_dl_entity *a, struct sched_dl_entity *b)
{
	return dl_entity_is_special(a) ||
	       dl_time_before(a->deadline, b->deadline);
}

/*
 * This is the priority-queue data structure of the RT scheduling class:
 */
struct rt_prio_array {
	DECLARE_BITMAP(bitmap, MAX_RT_PRIO+1); /* include 1 bit for delimiter */
	struct list_head queue[MAX_RT_PRIO];
};

struct rt_bandwidth {
	/* nests inside the rq lock: */
	raw_spinlock_t		rt_runtime_lock;
	ktime_t			rt_period;
	u64			rt_runtime;
	struct hrtimer		rt_period_timer;
	unsigned int		rt_period_active;
};

void __dl_clear_params(struct task_struct *p);

struct dl_bandwidth {
	raw_spinlock_t		dl_runtime_lock;
	u64			dl_runtime;
	u64			dl_period;
};

static inline int dl_bandwidth_enabled(void)
{
	return sysctl_sched_rt_runtime >= 0;
}

/*
 * To keep the bandwidth of -deadline tasks under control
 * we need some place where we can:
 *  - store the maximum -deadline bandwidth of each CPU;
 *  - cache the fraction of bandwidth that is currently allocated in
 *    each root domain;
 *
 * This is all done in the data structure below. It is similar to the
 * one used for RT-throttling (rt_bandwidth), with the main difference
 * that, since here we are only interested in admission control, we
 * do not decrease any runtime while the group "executes", nor do we
 * need a timer to replenish it.
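 *
 * Admission control then reduces to fixed-point arithmetic on these two
 * quantities; a sketch of the overflow test (modelled on __dl_overflow(),
 * simplified and ignoring CPU capacity scaling):
 *
 *	u64 new_bw = to_ratio(attr->sched_period, attr->sched_runtime);
 *
 *	if (dl_b->bw != -1 &&
 *	    dl_b->bw * cpus < dl_b->total_bw - old_bw + new_bw)
 *		return -EBUSY;	// admitting the task would overcommit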
 *
 * With respect to SMP, bandwidth is given on a per root domain basis,
 * meaning that:
 *  - bw (< 100%) is the deadline bandwidth of each CPU;
 *  - total_bw is the currently allocated bandwidth in each root domain;
 */
struct dl_bw {
	raw_spinlock_t		lock;
	u64			bw;
	u64			total_bw;
};

/*
 * Verify the fitness of task @p to run on @cpu, taking into account the
 * original capacity of the CPU and the runtime/deadline ratio of the task.
 *
 * Returns true if the CPU's original capacity, expressed as a fraction of
 * SCHED_CAPACITY_SCALE, is at least the task's runtime/deadline ratio,
 * and false otherwise.
 */
static inline bool dl_task_fits_capacity(struct task_struct *p, int cpu)
{
	unsigned long cap = arch_scale_cpu_capacity(cpu);

	return cap_scale(p->dl.dl_deadline, cap) >= p->dl.dl_runtime;
}

extern void init_dl_bw(struct dl_bw *dl_b);
extern int  sched_dl_global_validate(void);
extern void sched_dl_do_global(void);
extern int  sched_dl_overflow(struct task_struct *p, int policy, const struct sched_attr *attr);
extern void __setparam_dl(struct task_struct *p, const struct sched_attr *attr);
extern void __getparam_dl(struct task_struct *p, struct sched_attr *attr);
extern bool __checkparam_dl(const struct sched_attr *attr);
extern bool dl_param_changed(struct task_struct *p, const struct sched_attr *attr);
extern int  dl_cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial);
extern int  dl_cpu_busy(int cpu, struct task_struct *p);

#ifdef CONFIG_CGROUP_SCHED

struct cfs_rq;
struct rt_rq;

extern struct list_head task_groups;

struct cfs_bandwidth {
#ifdef CONFIG_CFS_BANDWIDTH
	raw_spinlock_t		lock;
	ktime_t			period;
	u64			quota;
	u64			runtime;
	u64			burst;
	u64			runtime_snap;
	s64			hierarchical_quota;

	u8			idle;
	u8			period_active;
	u8			slack_started;
	struct hrtimer		period_timer;
	struct hrtimer		slack_timer;
	struct list_head	throttled_cfs_rq;

	/* Statistics: */
	int			nr_periods;
	int			nr_throttled;
	int			nr_burst;
	u64			throttled_time;
	u64			burst_time;
#endif
};

/* Task group related information */
struct task_group {
	struct cgroup_subsys_state css;

#ifdef CONFIG_FAIR_GROUP_SCHED
	/* schedulable entities of this group on each CPU */
	struct sched_entity	**se;
	/* runqueue "owned" by this group on each CPU */
	struct cfs_rq		**cfs_rq;
	unsigned long		shares;

	/* A positive value indicates that this is a SCHED_IDLE group. */
	int			idle;

#ifdef	CONFIG_SMP
	/*
	 * load_avg can be heavily contended at clock tick time, so put
	 * it in its own cacheline separated from the fields above which
	 * will also be accessed at each tick.
	 */
	atomic_long_t		load_avg ____cacheline_aligned;
#endif
#endif

#ifdef CONFIG_RT_GROUP_SCHED
	struct sched_rt_entity	**rt_se;
	struct rt_rq		**rt_rq;

	struct rt_bandwidth	rt_bandwidth;
#endif

	struct rcu_head		rcu;
	struct list_head	list;

	struct task_group	*parent;
	struct list_head	siblings;
	struct list_head	children;

#ifdef CONFIG_SCHED_AUTOGROUP
	struct autogroup	*autogroup;
#endif

	struct cfs_bandwidth	cfs_bandwidth;

#ifdef CONFIG_UCLAMP_TASK_GROUP
	/* The two decimal precision [%] value requested from user-space */
	unsigned int		uclamp_pct[UCLAMP_CNT];
	/* Clamp values requested for a task group */
	struct uclamp_se	uclamp_req[UCLAMP_CNT];
	/* Effective clamp values used for a task group */
	struct uclamp_se	uclamp[UCLAMP_CNT];
#endif

};

#ifdef CONFIG_FAIR_GROUP_SCHED
#define ROOT_TASK_GROUP_LOAD	NICE_0_LOAD

/*
 * A weight of 0 or 1 can cause arithmetic problems.
 * The weight of a cfs_rq is the sum of the weights of the entities
 * queued on it, so the weight of a single entity should not be too
 * large; neither should the shares value of a task group.
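 *
 * For example, a write to the cgroup "cpu.shares" file ends up in
 * sched_group_set_shares(), with the value scaled up to load resolution
 * (illustrative sketch; see cpu_shares_write_u64() in core.c):
 *
 *	// "echo 2048 > cpu.shares": twice the default group weight
 *	sched_group_set_shares(css_tg(css), scale_load(2048));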
438391e43daSPeter Zijlstra * (The default weight is 1024 - so there's no practical 439391e43daSPeter Zijlstra * limitation from this.) 440391e43daSPeter Zijlstra */ 441391e43daSPeter Zijlstra #define MIN_SHARES (1UL << 1) 442391e43daSPeter Zijlstra #define MAX_SHARES (1UL << 18) 443391e43daSPeter Zijlstra #endif 444391e43daSPeter Zijlstra 445391e43daSPeter Zijlstra typedef int (*tg_visitor)(struct task_group *, void *); 446391e43daSPeter Zijlstra 447391e43daSPeter Zijlstra extern int walk_tg_tree_from(struct task_group *from, 448391e43daSPeter Zijlstra tg_visitor down, tg_visitor up, void *data); 449391e43daSPeter Zijlstra 450391e43daSPeter Zijlstra /* 451391e43daSPeter Zijlstra * Iterate the full tree, calling @down when first entering a node and @up when 452391e43daSPeter Zijlstra * leaving it for the final time. 453391e43daSPeter Zijlstra * 454391e43daSPeter Zijlstra * Caller must hold rcu_lock or sufficient equivalent. 455391e43daSPeter Zijlstra */ 456391e43daSPeter Zijlstra static inline int walk_tg_tree(tg_visitor down, tg_visitor up, void *data) 457391e43daSPeter Zijlstra { 458391e43daSPeter Zijlstra return walk_tg_tree_from(&root_task_group, down, up, data); 459391e43daSPeter Zijlstra } 460391e43daSPeter Zijlstra 461391e43daSPeter Zijlstra extern int tg_nop(struct task_group *tg, void *data); 462391e43daSPeter Zijlstra 463391e43daSPeter Zijlstra extern void free_fair_sched_group(struct task_group *tg); 464391e43daSPeter Zijlstra extern int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent); 4658663e24dSPeter Zijlstra extern void online_fair_sched_group(struct task_group *tg); 4666fe1f348SPeter Zijlstra extern void unregister_fair_sched_group(struct task_group *tg); 467391e43daSPeter Zijlstra extern void init_tg_cfs_entry(struct task_group *tg, struct cfs_rq *cfs_rq, 468391e43daSPeter Zijlstra struct sched_entity *se, int cpu, 469391e43daSPeter Zijlstra struct sched_entity *parent); 470391e43daSPeter Zijlstra extern void init_cfs_bandwidth(struct cfs_bandwidth *cfs_b); 471391e43daSPeter Zijlstra 472391e43daSPeter Zijlstra extern void __refill_cfs_bandwidth_runtime(struct cfs_bandwidth *cfs_b); 47377a4d1a1SPeter Zijlstra extern void start_cfs_bandwidth(struct cfs_bandwidth *cfs_b); 474391e43daSPeter Zijlstra extern void unthrottle_cfs_rq(struct cfs_rq *cfs_rq); 475391e43daSPeter Zijlstra 476b027789eSMathias Krause extern void unregister_rt_sched_group(struct task_group *tg); 477391e43daSPeter Zijlstra extern void free_rt_sched_group(struct task_group *tg); 478391e43daSPeter Zijlstra extern int alloc_rt_sched_group(struct task_group *tg, struct task_group *parent); 479391e43daSPeter Zijlstra extern void init_tg_rt_entry(struct task_group *tg, struct rt_rq *rt_rq, 480391e43daSPeter Zijlstra struct sched_rt_entity *rt_se, int cpu, 481391e43daSPeter Zijlstra struct sched_rt_entity *parent); 4828887cd99SNicolas Pitre extern int sched_group_set_rt_runtime(struct task_group *tg, long rt_runtime_us); 4838887cd99SNicolas Pitre extern int sched_group_set_rt_period(struct task_group *tg, u64 rt_period_us); 4848887cd99SNicolas Pitre extern long sched_group_rt_runtime(struct task_group *tg); 4858887cd99SNicolas Pitre extern long sched_group_rt_period(struct task_group *tg); 4868887cd99SNicolas Pitre extern int sched_rt_can_attach(struct task_group *tg, struct task_struct *tsk); 487391e43daSPeter Zijlstra 48825cc7da7SLi Zefan extern struct task_group *sched_create_group(struct task_group *parent); 48925cc7da7SLi Zefan extern void sched_online_group(struct task_group *tg, 
49025cc7da7SLi Zefan struct task_group *parent); 49125cc7da7SLi Zefan extern void sched_destroy_group(struct task_group *tg); 492b027789eSMathias Krause extern void sched_release_group(struct task_group *tg); 49325cc7da7SLi Zefan 49425cc7da7SLi Zefan extern void sched_move_task(struct task_struct *tsk); 49525cc7da7SLi Zefan 49625cc7da7SLi Zefan #ifdef CONFIG_FAIR_GROUP_SCHED 49725cc7da7SLi Zefan extern int sched_group_set_shares(struct task_group *tg, unsigned long shares); 498ad936d86SByungchul Park 49930400039SJosh Don extern int sched_group_set_idle(struct task_group *tg, long idle); 50030400039SJosh Don 501ad936d86SByungchul Park #ifdef CONFIG_SMP 502ad936d86SByungchul Park extern void set_task_rq_fair(struct sched_entity *se, 503ad936d86SByungchul Park struct cfs_rq *prev, struct cfs_rq *next); 504ad936d86SByungchul Park #else /* !CONFIG_SMP */ 505ad936d86SByungchul Park static inline void set_task_rq_fair(struct sched_entity *se, 506ad936d86SByungchul Park struct cfs_rq *prev, struct cfs_rq *next) { } 507ad936d86SByungchul Park #endif /* CONFIG_SMP */ 508ad936d86SByungchul Park #endif /* CONFIG_FAIR_GROUP_SCHED */ 50925cc7da7SLi Zefan 510391e43daSPeter Zijlstra #else /* CONFIG_CGROUP_SCHED */ 511391e43daSPeter Zijlstra 512391e43daSPeter Zijlstra struct cfs_bandwidth { }; 513391e43daSPeter Zijlstra 514391e43daSPeter Zijlstra #endif /* CONFIG_CGROUP_SCHED */ 515391e43daSPeter Zijlstra 516391e43daSPeter Zijlstra /* CFS-related fields in a runqueue */ 517391e43daSPeter Zijlstra struct cfs_rq { 518391e43daSPeter Zijlstra struct load_weight load; 51997fb7a0aSIngo Molnar unsigned int nr_running; 52043e9f7f2SViresh Kumar unsigned int h_nr_running; /* SCHED_{NORMAL,BATCH,IDLE} */ 521a480addeSJosh Don unsigned int idle_nr_running; /* SCHED_IDLE */ 52243e9f7f2SViresh Kumar unsigned int idle_h_nr_running; /* SCHED_IDLE */ 523391e43daSPeter Zijlstra 524391e43daSPeter Zijlstra u64 exec_clock; 525391e43daSPeter Zijlstra u64 min_vruntime; 526c6047c2eSJoel Fernandes (Google) #ifdef CONFIG_SCHED_CORE 527c6047c2eSJoel Fernandes (Google) unsigned int forceidle_seq; 528c6047c2eSJoel Fernandes (Google) u64 min_vruntime_fi; 529c6047c2eSJoel Fernandes (Google) #endif 530c6047c2eSJoel Fernandes (Google) 531391e43daSPeter Zijlstra #ifndef CONFIG_64BIT 532391e43daSPeter Zijlstra u64 min_vruntime_copy; 533391e43daSPeter Zijlstra #endif 534391e43daSPeter Zijlstra 535bfb06889SDavidlohr Bueso struct rb_root_cached tasks_timeline; 536391e43daSPeter Zijlstra 537391e43daSPeter Zijlstra /* 538391e43daSPeter Zijlstra * 'curr' points to currently running entity on this cfs_rq. 539391e43daSPeter Zijlstra * It is set to NULL otherwise (i.e when none are currently running). 
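 *
 * update_curr(), for instance, starts with exactly this guard (sketch):
 *
 *	struct sched_entity *curr = cfs_rq->curr;
 *
 *	if (unlikely(!curr))
 *		return;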
540391e43daSPeter Zijlstra */ 54197fb7a0aSIngo Molnar struct sched_entity *curr; 54297fb7a0aSIngo Molnar struct sched_entity *next; 54397fb7a0aSIngo Molnar struct sched_entity *last; 54497fb7a0aSIngo Molnar struct sched_entity *skip; 545391e43daSPeter Zijlstra 546391e43daSPeter Zijlstra #ifdef CONFIG_SCHED_DEBUG 547391e43daSPeter Zijlstra unsigned int nr_spread_over; 548391e43daSPeter Zijlstra #endif 549391e43daSPeter Zijlstra 5502dac754eSPaul Turner #ifdef CONFIG_SMP 5512dac754eSPaul Turner /* 5529d89c257SYuyang Du * CFS load tracking 5532dac754eSPaul Turner */ 5549d89c257SYuyang Du struct sched_avg avg; 5552a2f5d4eSPeter Zijlstra #ifndef CONFIG_64BIT 5562a2f5d4eSPeter Zijlstra u64 load_last_update_time_copy; 5572a2f5d4eSPeter Zijlstra #endif 5582a2f5d4eSPeter Zijlstra struct { 5592a2f5d4eSPeter Zijlstra raw_spinlock_t lock ____cacheline_aligned; 5602a2f5d4eSPeter Zijlstra int nr; 5612a2f5d4eSPeter Zijlstra unsigned long load_avg; 5622a2f5d4eSPeter Zijlstra unsigned long util_avg; 5639f683953SVincent Guittot unsigned long runnable_avg; 5642a2f5d4eSPeter Zijlstra } removed; 565141965c7SAlex Shi 566c566e8e9SPaul Turner #ifdef CONFIG_FAIR_GROUP_SCHED 5670e2d2aaaSPeter Zijlstra unsigned long tg_load_avg_contrib; 5680e2d2aaaSPeter Zijlstra long propagate; 5690e2d2aaaSPeter Zijlstra long prop_runnable_sum; 5700e2d2aaaSPeter Zijlstra 57182958366SPaul Turner /* 57282958366SPaul Turner * h_load = weight * f(tg) 57382958366SPaul Turner * 57482958366SPaul Turner * Where f(tg) is the recursive weight fraction assigned to 57582958366SPaul Turner * this group. 57682958366SPaul Turner */ 57782958366SPaul Turner unsigned long h_load; 57868520796SVladimir Davydov u64 last_h_load_update; 57968520796SVladimir Davydov struct sched_entity *h_load_next; 58068520796SVladimir Davydov #endif /* CONFIG_FAIR_GROUP_SCHED */ 58182958366SPaul Turner #endif /* CONFIG_SMP */ 58282958366SPaul Turner 583391e43daSPeter Zijlstra #ifdef CONFIG_FAIR_GROUP_SCHED 58497fb7a0aSIngo Molnar struct rq *rq; /* CPU runqueue to which this cfs_rq is attached */ 585391e43daSPeter Zijlstra 586391e43daSPeter Zijlstra /* 587391e43daSPeter Zijlstra * leaf cfs_rqs are those that hold tasks (lowest schedulable entity in 588391e43daSPeter Zijlstra * a hierarchy). Non-leaf lrqs hold other higher schedulable entities 589391e43daSPeter Zijlstra * (like users, containers etc.) 590391e43daSPeter Zijlstra * 59197fb7a0aSIngo Molnar * leaf_cfs_rq_list ties together list of leaf cfs_rq's in a CPU. 59297fb7a0aSIngo Molnar * This list is used during load balance. 
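 *
 * A sketch of the traversal, modelled on __update_blocked_fair() and the
 * for_each_leaf_cfs_rq_safe() helper in fair.c (names are version
 * dependent):
 *
 *	struct cfs_rq *cfs_rq, *pos;
 *
 *	for_each_leaf_cfs_rq_safe(rq, cfs_rq, pos) {
 *		if (update_cfs_rq_load_avg(cfs_rq_clock_pelt(cfs_rq), cfs_rq))
 *			update_tg_load_avg(cfs_rq);
 *	}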
593391e43daSPeter Zijlstra */ 594391e43daSPeter Zijlstra int on_list; 595391e43daSPeter Zijlstra struct list_head leaf_cfs_rq_list; 596391e43daSPeter Zijlstra struct task_group *tg; /* group that "owns" this runqueue */ 597391e43daSPeter Zijlstra 59830400039SJosh Don /* Locally cached copy of our task_group's idle value */ 59930400039SJosh Don int idle; 60030400039SJosh Don 601391e43daSPeter Zijlstra #ifdef CONFIG_CFS_BANDWIDTH 602391e43daSPeter Zijlstra int runtime_enabled; 603391e43daSPeter Zijlstra s64 runtime_remaining; 604391e43daSPeter Zijlstra 60597fb7a0aSIngo Molnar u64 throttled_clock; 60664eaf507SChengming Zhou u64 throttled_clock_pelt; 60764eaf507SChengming Zhou u64 throttled_clock_pelt_time; 60897fb7a0aSIngo Molnar int throttled; 60997fb7a0aSIngo Molnar int throttle_count; 610391e43daSPeter Zijlstra struct list_head throttled_list; 611391e43daSPeter Zijlstra #endif /* CONFIG_CFS_BANDWIDTH */ 612391e43daSPeter Zijlstra #endif /* CONFIG_FAIR_GROUP_SCHED */ 613391e43daSPeter Zijlstra }; 614391e43daSPeter Zijlstra 615391e43daSPeter Zijlstra static inline int rt_bandwidth_enabled(void) 616391e43daSPeter Zijlstra { 617391e43daSPeter Zijlstra return sysctl_sched_rt_runtime >= 0; 618391e43daSPeter Zijlstra } 619391e43daSPeter Zijlstra 620b6366f04SSteven Rostedt /* RT IPI pull logic requires IRQ_WORK */ 6214bdced5cSSteven Rostedt (Red Hat) #if defined(CONFIG_IRQ_WORK) && defined(CONFIG_SMP) 622b6366f04SSteven Rostedt # define HAVE_RT_PUSH_IPI 623b6366f04SSteven Rostedt #endif 624b6366f04SSteven Rostedt 625391e43daSPeter Zijlstra /* Real-Time classes' related field in a runqueue: */ 626391e43daSPeter Zijlstra struct rt_rq { 627391e43daSPeter Zijlstra struct rt_prio_array active; 628c82513e5SPeter Zijlstra unsigned int rt_nr_running; 62901d36d0aSFrederic Weisbecker unsigned int rr_nr_running; 630391e43daSPeter Zijlstra #if defined CONFIG_SMP || defined CONFIG_RT_GROUP_SCHED 631391e43daSPeter Zijlstra struct { 632391e43daSPeter Zijlstra int curr; /* highest queued rt task prio */ 633391e43daSPeter Zijlstra #ifdef CONFIG_SMP 634391e43daSPeter Zijlstra int next; /* next highest */ 635391e43daSPeter Zijlstra #endif 636391e43daSPeter Zijlstra } highest_prio; 637391e43daSPeter Zijlstra #endif 638391e43daSPeter Zijlstra #ifdef CONFIG_SMP 639e6fe3f42SAlexey Dobriyan unsigned int rt_nr_migratory; 640e6fe3f42SAlexey Dobriyan unsigned int rt_nr_total; 641391e43daSPeter Zijlstra int overloaded; 642391e43daSPeter Zijlstra struct plist_head pushable_tasks; 643371bf427SVincent Guittot 644b6366f04SSteven Rostedt #endif /* CONFIG_SMP */ 645f4ebcbc0SKirill Tkhai int rt_queued; 646f4ebcbc0SKirill Tkhai 647391e43daSPeter Zijlstra int rt_throttled; 648391e43daSPeter Zijlstra u64 rt_time; 649391e43daSPeter Zijlstra u64 rt_runtime; 650391e43daSPeter Zijlstra /* Nests inside the rq lock: */ 651391e43daSPeter Zijlstra raw_spinlock_t rt_runtime_lock; 652391e43daSPeter Zijlstra 653391e43daSPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED 654e6fe3f42SAlexey Dobriyan unsigned int rt_nr_boosted; 655391e43daSPeter Zijlstra 656391e43daSPeter Zijlstra struct rq *rq; 657391e43daSPeter Zijlstra struct task_group *tg; 658391e43daSPeter Zijlstra #endif 659391e43daSPeter Zijlstra }; 660391e43daSPeter Zijlstra 661296b2ffeSVincent Guittot static inline bool rt_rq_is_runnable(struct rt_rq *rt_rq) 662296b2ffeSVincent Guittot { 663296b2ffeSVincent Guittot return rt_rq->rt_queued && rt_rq->rt_nr_running; 664296b2ffeSVincent Guittot } 665296b2ffeSVincent Guittot 666aab03e05SDario Faggioli /* Deadline class' related fields in a runqueue 
*/ 667aab03e05SDario Faggioli struct dl_rq { 668aab03e05SDario Faggioli /* runqueue is an rbtree, ordered by deadline */ 6692161573eSDavidlohr Bueso struct rb_root_cached root; 670aab03e05SDario Faggioli 671e6fe3f42SAlexey Dobriyan unsigned int dl_nr_running; 6721baca4ceSJuri Lelli 6731baca4ceSJuri Lelli #ifdef CONFIG_SMP 6741baca4ceSJuri Lelli /* 6751baca4ceSJuri Lelli * Deadline values of the currently executing and the 6761baca4ceSJuri Lelli * earliest ready task on this rq. Caching these facilitates 677dfcb245eSIngo Molnar * the decision whether or not a ready but not running task 6781baca4ceSJuri Lelli * should migrate somewhere else. 6791baca4ceSJuri Lelli */ 6801baca4ceSJuri Lelli struct { 6811baca4ceSJuri Lelli u64 curr; 6821baca4ceSJuri Lelli u64 next; 6831baca4ceSJuri Lelli } earliest_dl; 6841baca4ceSJuri Lelli 685e6fe3f42SAlexey Dobriyan unsigned int dl_nr_migratory; 6861baca4ceSJuri Lelli int overloaded; 6871baca4ceSJuri Lelli 6881baca4ceSJuri Lelli /* 6891baca4ceSJuri Lelli * Tasks on this rq that can be pushed away. They are kept in 6901baca4ceSJuri Lelli * an rb-tree, ordered by tasks' deadlines, with caching 6911baca4ceSJuri Lelli * of the leftmost (earliest deadline) element. 6921baca4ceSJuri Lelli */ 6932161573eSDavidlohr Bueso struct rb_root_cached pushable_dl_tasks_root; 694332ac17eSDario Faggioli #else 695332ac17eSDario Faggioli struct dl_bw dl_bw; 6961baca4ceSJuri Lelli #endif 697e36d8677SLuca Abeni /* 698e36d8677SLuca Abeni * "Active utilization" for this runqueue: increased when a 699e36d8677SLuca Abeni * task wakes up (becomes TASK_RUNNING) and decreased when a 700e36d8677SLuca Abeni * task blocks 701e36d8677SLuca Abeni */ 702e36d8677SLuca Abeni u64 running_bw; 7034da3abceSLuca Abeni 7044da3abceSLuca Abeni /* 7058fd27231SLuca Abeni * Utilization of the tasks "assigned" to this runqueue (including 7068fd27231SLuca Abeni * the tasks that are in runqueue and the tasks that executed on this 7078fd27231SLuca Abeni * CPU and blocked). Increased when a task moves to this runqueue, and 7088fd27231SLuca Abeni * decreased when the task moves away (migrates, changes scheduling 7098fd27231SLuca Abeni * policy, or terminates). 7108fd27231SLuca Abeni * This is needed to compute the "inactive utilization" for the 7118fd27231SLuca Abeni * runqueue (inactive utilization = this_bw - running_bw). 7128fd27231SLuca Abeni */ 7138fd27231SLuca Abeni u64 this_bw; 714daec5798SLuca Abeni u64 extra_bw; 7158fd27231SLuca Abeni 7168fd27231SLuca Abeni /* 7174da3abceSLuca Abeni * Inverse of the fraction of CPU utilization that can be reclaimed 7184da3abceSLuca Abeni * by the GRUB algorithm. 
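 *
 * A simplified sketch of how it is used (modelled on grub_reclaim() in
 * deadline.c): runtime charged to a SCHED_FLAG_RECLAIM task is scaled by
 * the active utilization, which is never allowed to drop below the
 * task's own bandwidth multiplied by this ratio:
 *
 *	u64 u_inact   = dl_rq->this_bw - dl_rq->running_bw;
 *	u64 u_act_min = (dl_se->dl_bw * dl_rq->bw_ratio) >> RATIO_SHIFT;
 *	u64 u_act;
 *
 *	if (u_inact + dl_rq->extra_bw > BW_UNIT - u_act_min)
 *		u_act = u_act_min;
 *	else
 *		u_act = BW_UNIT - u_inact - dl_rq->extra_bw;
 *
 *	scaled_delta_exec = (delta_exec * u_act) >> BW_SHIFT;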
7194da3abceSLuca Abeni */ 7204da3abceSLuca Abeni u64 bw_ratio; 721aab03e05SDario Faggioli }; 722aab03e05SDario Faggioli 723c0796298SVincent Guittot #ifdef CONFIG_FAIR_GROUP_SCHED 724c0796298SVincent Guittot /* An entity is a task if it doesn't "own" a runqueue */ 725c0796298SVincent Guittot #define entity_is_task(se) (!se->my_q) 7260dacee1bSVincent Guittot 7279f683953SVincent Guittot static inline void se_update_runnable(struct sched_entity *se) 7289f683953SVincent Guittot { 7299f683953SVincent Guittot if (!entity_is_task(se)) 7309f683953SVincent Guittot se->runnable_weight = se->my_q->h_nr_running; 7319f683953SVincent Guittot } 7329f683953SVincent Guittot 7339f683953SVincent Guittot static inline long se_runnable(struct sched_entity *se) 7349f683953SVincent Guittot { 7359f683953SVincent Guittot if (entity_is_task(se)) 7369f683953SVincent Guittot return !!se->on_rq; 7379f683953SVincent Guittot else 7389f683953SVincent Guittot return se->runnable_weight; 7399f683953SVincent Guittot } 7409f683953SVincent Guittot 741c0796298SVincent Guittot #else 742c0796298SVincent Guittot #define entity_is_task(se) 1 7430dacee1bSVincent Guittot 7449f683953SVincent Guittot static inline void se_update_runnable(struct sched_entity *se) {} 7459f683953SVincent Guittot 7469f683953SVincent Guittot static inline long se_runnable(struct sched_entity *se) 7479f683953SVincent Guittot { 7489f683953SVincent Guittot return !!se->on_rq; 7499f683953SVincent Guittot } 750c0796298SVincent Guittot #endif 751c0796298SVincent Guittot 752391e43daSPeter Zijlstra #ifdef CONFIG_SMP 753c0796298SVincent Guittot /* 754c0796298SVincent Guittot * XXX we want to get rid of these helpers and use the full load resolution. 755c0796298SVincent Guittot */ 756c0796298SVincent Guittot static inline long se_weight(struct sched_entity *se) 757c0796298SVincent Guittot { 758c0796298SVincent Guittot return scale_load_down(se->load.weight); 759c0796298SVincent Guittot } 760c0796298SVincent Guittot 761391e43daSPeter Zijlstra 762afe06efdSTim Chen static inline bool sched_asym_prefer(int a, int b) 763afe06efdSTim Chen { 764afe06efdSTim Chen return arch_asym_cpu_priority(a) > arch_asym_cpu_priority(b); 765afe06efdSTim Chen } 766afe06efdSTim Chen 7676aa140faSQuentin Perret struct perf_domain { 7686aa140faSQuentin Perret struct em_perf_domain *em_pd; 7696aa140faSQuentin Perret struct perf_domain *next; 7706aa140faSQuentin Perret struct rcu_head rcu; 7716aa140faSQuentin Perret }; 7726aa140faSQuentin Perret 773630246a0SQuentin Perret /* Scheduling group status flags */ 774630246a0SQuentin Perret #define SG_OVERLOAD 0x1 /* More than one runnable task on a CPU. */ 7752802bf3cSMorten Rasmussen #define SG_OVERUTILIZED 0x2 /* One or more CPUs are over-utilized. */ 776630246a0SQuentin Perret 777391e43daSPeter Zijlstra /* 778391e43daSPeter Zijlstra * We add the notion of a root-domain which will be used to define per-domain 779391e43daSPeter Zijlstra * variables. Each exclusive cpuset essentially defines an island domain by 78097fb7a0aSIngo Molnar * fully partitioning the member CPUs from any other cpuset. Whenever a new 781391e43daSPeter Zijlstra * exclusive cpuset is created, we also create and attach a new root-domain 782391e43daSPeter Zijlstra * object. 
 *
 */
struct root_domain {
	atomic_t		refcount;
	atomic_t		rto_count;
	struct rcu_head		rcu;
	cpumask_var_t		span;
	cpumask_var_t		online;

	/*
	 * Indicate pullable load on at least one CPU, e.g.:
	 *   - More than one runnable task
	 *   - Running task is misfit
	 */
	int			overload;

	/* Indicate one or more CPUs over-utilized (tipping point) */
	int			overutilized;

	/*
	 * The bit corresponding to a CPU gets set here if such CPU has more
	 * than one runnable -deadline task (as it is below for RT tasks).
	 */
	cpumask_var_t		dlo_mask;
	atomic_t		dlo_count;
	struct dl_bw		dl_bw;
	struct cpudl		cpudl;

	/*
	 * Indicate whether a root_domain's dl_bw has been checked or
	 * updated. It is a monotonically increasing value.
	 *
	 * Corner cases such as wrap-around would normally be a concern,
	 * but a u64 is big enough that in practice they are not.
	 */
	u64			visit_gen;

#ifdef HAVE_RT_PUSH_IPI
	/*
	 * For IPI pull requests, loop across the rto_mask.
	 */
	struct irq_work		rto_push_work;
	raw_spinlock_t		rto_lock;
	/* These are only updated and read within rto_lock */
	int			rto_loop;
	int			rto_cpu;
	/* These atomics are updated outside of a lock */
	atomic_t		rto_loop_next;
	atomic_t		rto_loop_start;
#endif
	/*
	 * The "RT overload" flag: it gets set if a CPU has more than
	 * one runnable RT task.
	 */
	cpumask_var_t		rto_mask;
	struct cpupri		cpupri;

	unsigned long		max_cpu_capacity;

	/*
	 * NULL-terminated list of performance domains intersecting with the
	 * CPUs of the rd. Protected by RCU.
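 *
 * Readers walk this list under rcu_read_lock(); a sketch of the pattern
 * used by energy-aware wake-up placement (find_energy_efficient_cpu()):
 *
 *	struct perf_domain *pd;
 *
 *	rcu_read_lock();
 *	pd = rcu_dereference(rd->pd);
 *	for (; pd; pd = pd->next) {
 *		// consider the CPUs spanned by this performance domain
 *	}
 *	rcu_read_unlock();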
8456aa140faSQuentin Perret */ 8467ba7319fSJoel Fernandes (Google) struct perf_domain __rcu *pd; 847391e43daSPeter Zijlstra }; 848391e43daSPeter Zijlstra 849f2cb1360SIngo Molnar extern void init_defrootdomain(void); 8508d5dc512SPeter Zijlstra extern int sched_init_domains(const struct cpumask *cpu_map); 851f2cb1360SIngo Molnar extern void rq_attach_root(struct rq *rq, struct root_domain *rd); 852364f5665SSteven Rostedt (VMware) extern void sched_get_rd(struct root_domain *rd); 853364f5665SSteven Rostedt (VMware) extern void sched_put_rd(struct root_domain *rd); 854391e43daSPeter Zijlstra 8554bdced5cSSteven Rostedt (Red Hat) #ifdef HAVE_RT_PUSH_IPI 8564bdced5cSSteven Rostedt (Red Hat) extern void rto_push_irq_work_func(struct irq_work *work); 8574bdced5cSSteven Rostedt (Red Hat) #endif 858391e43daSPeter Zijlstra #endif /* CONFIG_SMP */ 859391e43daSPeter Zijlstra 86069842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 86169842cbaSPatrick Bellasi /* 86269842cbaSPatrick Bellasi * struct uclamp_bucket - Utilization clamp bucket 86369842cbaSPatrick Bellasi * @value: utilization clamp value for tasks on this clamp bucket 86469842cbaSPatrick Bellasi * @tasks: number of RUNNABLE tasks on this clamp bucket 86569842cbaSPatrick Bellasi * 86669842cbaSPatrick Bellasi * Keep track of how many tasks are RUNNABLE for a given utilization 86769842cbaSPatrick Bellasi * clamp value. 86869842cbaSPatrick Bellasi */ 86969842cbaSPatrick Bellasi struct uclamp_bucket { 87069842cbaSPatrick Bellasi unsigned long value : bits_per(SCHED_CAPACITY_SCALE); 87169842cbaSPatrick Bellasi unsigned long tasks : BITS_PER_LONG - bits_per(SCHED_CAPACITY_SCALE); 87269842cbaSPatrick Bellasi }; 87369842cbaSPatrick Bellasi 87469842cbaSPatrick Bellasi /* 87569842cbaSPatrick Bellasi * struct uclamp_rq - rq's utilization clamp 87669842cbaSPatrick Bellasi * @value: currently active clamp values for a rq 87769842cbaSPatrick Bellasi * @bucket: utilization clamp buckets affecting a rq 87869842cbaSPatrick Bellasi * 87969842cbaSPatrick Bellasi * Keep track of RUNNABLE tasks on a rq to aggregate their clamp values. 88069842cbaSPatrick Bellasi * A clamp value is affecting a rq when there is at least one task RUNNABLE 88169842cbaSPatrick Bellasi * (or actually running) with that value. 88269842cbaSPatrick Bellasi * 88369842cbaSPatrick Bellasi * There are up to UCLAMP_CNT possible different clamp values, currently there 88469842cbaSPatrick Bellasi * are only two: minimum utilization and maximum utilization. 88569842cbaSPatrick Bellasi * 88669842cbaSPatrick Bellasi * All utilization clamping values are MAX aggregated, since: 88769842cbaSPatrick Bellasi * - for util_min: we want to run the CPU at least at the max of the minimum 88869842cbaSPatrick Bellasi * utilization required by its currently RUNNABLE tasks. 88969842cbaSPatrick Bellasi * - for util_max: we want to allow the CPU to run up to the max of the 89069842cbaSPatrick Bellasi * maximum utilization allowed by its currently RUNNABLE tasks. 89169842cbaSPatrick Bellasi * 89269842cbaSPatrick Bellasi * Since on each system we expect only a limited number of different 89369842cbaSPatrick Bellasi * utilization clamp values (UCLAMP_BUCKETS), use a simple array to track 89469842cbaSPatrick Bellasi * the metrics required to compute all the per-rq utilization clamp values. 
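 *
 * For example (values on the SCHED_CAPACITY_SCALE == 1024 scale): with
 * two RUNNABLE tasks whose effective util_min clamps are 200 and 512,
 *
 *	rq->uclamp[UCLAMP_MIN].value == 512
 *
 * and once the 512-clamped task dequeues (and its bucket empties) the
 * rq value drops back towards 200, the next-highest runnable clamp.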
89569842cbaSPatrick Bellasi */ 89669842cbaSPatrick Bellasi struct uclamp_rq { 89769842cbaSPatrick Bellasi unsigned int value; 89869842cbaSPatrick Bellasi struct uclamp_bucket bucket[UCLAMP_BUCKETS]; 89969842cbaSPatrick Bellasi }; 90046609ce2SQais Yousef 90146609ce2SQais Yousef DECLARE_STATIC_KEY_FALSE(sched_uclamp_used); 90269842cbaSPatrick Bellasi #endif /* CONFIG_UCLAMP_TASK */ 90369842cbaSPatrick Bellasi 904391e43daSPeter Zijlstra /* 905391e43daSPeter Zijlstra * This is the main, per-CPU runqueue data structure. 906391e43daSPeter Zijlstra * 907391e43daSPeter Zijlstra * Locking rule: those places that want to lock multiple runqueues 908391e43daSPeter Zijlstra * (such as the load balancing or the thread migration code), lock 909391e43daSPeter Zijlstra * acquire operations must be ordered by ascending &runqueue. 910391e43daSPeter Zijlstra */ 911391e43daSPeter Zijlstra struct rq { 912391e43daSPeter Zijlstra /* runqueue lock: */ 9135cb9eaa3SPeter Zijlstra raw_spinlock_t __lock; 914391e43daSPeter Zijlstra 915391e43daSPeter Zijlstra /* 916391e43daSPeter Zijlstra * nr_running and cpu_load should be in the same cacheline because 917391e43daSPeter Zijlstra * remote CPUs use both these fields when doing load calculation. 918391e43daSPeter Zijlstra */ 919c82513e5SPeter Zijlstra unsigned int nr_running; 9200ec8aa00SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING 9210ec8aa00SPeter Zijlstra unsigned int nr_numa_running; 9220ec8aa00SPeter Zijlstra unsigned int nr_preferred_running; 923a4739ecaSSrikar Dronamraju unsigned int numa_migrate_on; 9240ec8aa00SPeter Zijlstra #endif 9253451d024SFrederic Weisbecker #ifdef CONFIG_NO_HZ_COMMON 9269fd81dd5SFrederic Weisbecker #ifdef CONFIG_SMP 927e022e0d3SPeter Zijlstra unsigned long last_blocked_load_update_tick; 928f643ea22SVincent Guittot unsigned int has_blocked_load; 92990b5363aSPeter Zijlstra (Intel) call_single_data_t nohz_csd; 9309fd81dd5SFrederic Weisbecker #endif /* CONFIG_SMP */ 93100357f5eSPeter Zijlstra unsigned int nohz_tick_stopped; 932a22e47a4SPeter Zijlstra atomic_t nohz_flags; 9339fd81dd5SFrederic Weisbecker #endif /* CONFIG_NO_HZ_COMMON */ 934dcdedb24SFrederic Weisbecker 935126c2092SPeter Zijlstra #ifdef CONFIG_SMP 936126c2092SPeter Zijlstra unsigned int ttwu_pending; 937126c2092SPeter Zijlstra #endif 938391e43daSPeter Zijlstra u64 nr_switches; 939391e43daSPeter Zijlstra 94069842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 94169842cbaSPatrick Bellasi /* Utilization clamp values based on CPU's RUNNABLE tasks */ 94269842cbaSPatrick Bellasi struct uclamp_rq uclamp[UCLAMP_CNT] ____cacheline_aligned; 943e496187dSPatrick Bellasi unsigned int uclamp_flags; 944e496187dSPatrick Bellasi #define UCLAMP_FLAG_IDLE 0x01 94569842cbaSPatrick Bellasi #endif 94669842cbaSPatrick Bellasi 947391e43daSPeter Zijlstra struct cfs_rq cfs; 948391e43daSPeter Zijlstra struct rt_rq rt; 949aab03e05SDario Faggioli struct dl_rq dl; 950391e43daSPeter Zijlstra 951391e43daSPeter Zijlstra #ifdef CONFIG_FAIR_GROUP_SCHED 95297fb7a0aSIngo Molnar /* list of leaf cfs_rq on this CPU: */ 953391e43daSPeter Zijlstra struct list_head leaf_cfs_rq_list; 9549c2791f9SVincent Guittot struct list_head *tmp_alone_branch; 955a35b6466SPeter Zijlstra #endif /* CONFIG_FAIR_GROUP_SCHED */ 956a35b6466SPeter Zijlstra 957391e43daSPeter Zijlstra /* 958391e43daSPeter Zijlstra * This is part of a global counter where only the total sum 959391e43daSPeter Zijlstra * over all CPUs matters. 
A task can increase this counter on 960391e43daSPeter Zijlstra * one CPU and if it got migrated afterwards it may decrease 961391e43daSPeter Zijlstra * it on another CPU. Always updated under the runqueue lock: 962391e43daSPeter Zijlstra */ 963e6fe3f42SAlexey Dobriyan unsigned int nr_uninterruptible; 964391e43daSPeter Zijlstra 9654104a562SMadhuparna Bhowmik struct task_struct __rcu *curr; 96697fb7a0aSIngo Molnar struct task_struct *idle; 96797fb7a0aSIngo Molnar struct task_struct *stop; 968391e43daSPeter Zijlstra unsigned long next_balance; 969391e43daSPeter Zijlstra struct mm_struct *prev_mm; 970391e43daSPeter Zijlstra 971cb42c9a3SMatt Fleming unsigned int clock_update_flags; 972391e43daSPeter Zijlstra u64 clock; 97323127296SVincent Guittot /* Ensure that all clocks are in the same cache line */ 97423127296SVincent Guittot u64 clock_task ____cacheline_aligned; 97523127296SVincent Guittot u64 clock_pelt; 97623127296SVincent Guittot unsigned long lost_idle_time; 977391e43daSPeter Zijlstra 978391e43daSPeter Zijlstra atomic_t nr_iowait; 979391e43daSPeter Zijlstra 980c006fac5SPaul Turner #ifdef CONFIG_SCHED_DEBUG 981c006fac5SPaul Turner u64 last_seen_need_resched_ns; 982c006fac5SPaul Turner int ticks_without_resched; 983c006fac5SPaul Turner #endif 984c006fac5SPaul Turner 985227a4aadSMathieu Desnoyers #ifdef CONFIG_MEMBARRIER 986227a4aadSMathieu Desnoyers int membarrier_state; 987227a4aadSMathieu Desnoyers #endif 988227a4aadSMathieu Desnoyers 989391e43daSPeter Zijlstra #ifdef CONFIG_SMP 990391e43daSPeter Zijlstra struct root_domain *rd; 991994aeb7aSJoel Fernandes (Google) struct sched_domain __rcu *sd; 992391e43daSPeter Zijlstra 993ced549faSNicolas Pitre unsigned long cpu_capacity; 994ca6d75e6SVincent Guittot unsigned long cpu_capacity_orig; 995391e43daSPeter Zijlstra 996e3fca9e7SPeter Zijlstra struct callback_head *balance_callback; 997e3fca9e7SPeter Zijlstra 99819a1f5ecSPeter Zijlstra unsigned char nohz_idle_balance; 999391e43daSPeter Zijlstra unsigned char idle_balance; 100097fb7a0aSIngo Molnar 10013b1baa64SMorten Rasmussen unsigned long misfit_task_load; 10023b1baa64SMorten Rasmussen 1003391e43daSPeter Zijlstra /* For active balancing */ 1004391e43daSPeter Zijlstra int active_balance; 1005391e43daSPeter Zijlstra int push_cpu; 1006391e43daSPeter Zijlstra struct cpu_stop_work active_balance_work; 100797fb7a0aSIngo Molnar 100897fb7a0aSIngo Molnar /* CPU of this runqueue: */ 1009391e43daSPeter Zijlstra int cpu; 1010391e43daSPeter Zijlstra int online; 1011391e43daSPeter Zijlstra 1012367456c7SPeter Zijlstra struct list_head cfs_tasks; 1013367456c7SPeter Zijlstra 1014371bf427SVincent Guittot struct sched_avg avg_rt; 10153727e0e1SVincent Guittot struct sched_avg avg_dl; 101611d4afd4SVincent Guittot #ifdef CONFIG_HAVE_SCHED_AVG_IRQ 101791c27493SVincent Guittot struct sched_avg avg_irq; 101891c27493SVincent Guittot #endif 101976504793SThara Gopinath #ifdef CONFIG_SCHED_THERMAL_PRESSURE 102076504793SThara Gopinath struct sched_avg avg_thermal; 102176504793SThara Gopinath #endif 1022391e43daSPeter Zijlstra u64 idle_stamp; 1023391e43daSPeter Zijlstra u64 avg_idle; 10249bd721c5SJason Low 102594aafc3eSPeter Zijlstra unsigned long wake_stamp; 102694aafc3eSPeter Zijlstra u64 wake_avg_idle; 102794aafc3eSPeter Zijlstra 10289bd721c5SJason Low /* This is used to determine avg_idle's max value */ 10299bd721c5SJason Low u64 max_idle_balance_cost; 1030f2469a1fSThomas Gleixner 1031f2469a1fSThomas Gleixner #ifdef CONFIG_HOTPLUG_CPU 1032f2469a1fSThomas Gleixner struct rcuwait hotplug_wait; 1033f2469a1fSThomas 
Gleixner #endif 103490b5363aSPeter Zijlstra (Intel) #endif /* CONFIG_SMP */ 1035391e43daSPeter Zijlstra 1036391e43daSPeter Zijlstra #ifdef CONFIG_IRQ_TIME_ACCOUNTING 1037391e43daSPeter Zijlstra u64 prev_irq_time; 1038391e43daSPeter Zijlstra #endif 1039391e43daSPeter Zijlstra #ifdef CONFIG_PARAVIRT 1040391e43daSPeter Zijlstra u64 prev_steal_time; 1041391e43daSPeter Zijlstra #endif 1042391e43daSPeter Zijlstra #ifdef CONFIG_PARAVIRT_TIME_ACCOUNTING 1043391e43daSPeter Zijlstra u64 prev_steal_time_rq; 1044391e43daSPeter Zijlstra #endif 1045391e43daSPeter Zijlstra 1046391e43daSPeter Zijlstra /* calc_load related fields */ 1047391e43daSPeter Zijlstra unsigned long calc_load_update; 1048391e43daSPeter Zijlstra long calc_load_active; 1049391e43daSPeter Zijlstra 1050391e43daSPeter Zijlstra #ifdef CONFIG_SCHED_HRTICK 1051391e43daSPeter Zijlstra #ifdef CONFIG_SMP 1052966a9671SYing Huang call_single_data_t hrtick_csd; 1053391e43daSPeter Zijlstra #endif 1054391e43daSPeter Zijlstra struct hrtimer hrtick_timer; 1055156ec6f4SJuri Lelli ktime_t hrtick_time; 1056391e43daSPeter Zijlstra #endif 1057391e43daSPeter Zijlstra 1058391e43daSPeter Zijlstra #ifdef CONFIG_SCHEDSTATS 1059391e43daSPeter Zijlstra /* latency stats */ 1060391e43daSPeter Zijlstra struct sched_info rq_sched_info; 1061391e43daSPeter Zijlstra unsigned long long rq_cpu_time; 1062391e43daSPeter Zijlstra /* could above be rq->cfs_rq.exec_clock + rq->rt_rq.rt_runtime ? */ 1063391e43daSPeter Zijlstra 1064391e43daSPeter Zijlstra /* sys_sched_yield() stats */ 1065391e43daSPeter Zijlstra unsigned int yld_count; 1066391e43daSPeter Zijlstra 1067391e43daSPeter Zijlstra /* schedule() stats */ 1068391e43daSPeter Zijlstra unsigned int sched_count; 1069391e43daSPeter Zijlstra unsigned int sched_goidle; 1070391e43daSPeter Zijlstra 1071391e43daSPeter Zijlstra /* try_to_wake_up() stats */ 1072391e43daSPeter Zijlstra unsigned int ttwu_count; 1073391e43daSPeter Zijlstra unsigned int ttwu_local; 1074391e43daSPeter Zijlstra #endif 1075391e43daSPeter Zijlstra 1076442bf3aaSDaniel Lezcano #ifdef CONFIG_CPU_IDLE 1077442bf3aaSDaniel Lezcano /* Must be inspected within a rcu lock section */ 1078442bf3aaSDaniel Lezcano struct cpuidle_state *idle_state; 1079442bf3aaSDaniel Lezcano #endif 10803015ef4bSThomas Gleixner 108174d862b6SThomas Gleixner #ifdef CONFIG_SMP 10823015ef4bSThomas Gleixner unsigned int nr_pinned; 10833015ef4bSThomas Gleixner #endif 1084a7c81556SPeter Zijlstra unsigned int push_busy; 1085a7c81556SPeter Zijlstra struct cpu_stop_work push_work; 10869edeaea1SPeter Zijlstra 10879edeaea1SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 10889edeaea1SPeter Zijlstra /* per rq */ 10899edeaea1SPeter Zijlstra struct rq *core; 1090539f6512SPeter Zijlstra struct task_struct *core_pick; 10919edeaea1SPeter Zijlstra unsigned int core_enabled; 1092539f6512SPeter Zijlstra unsigned int core_sched_seq; 10938a311c74SPeter Zijlstra struct rb_root core_tree; 10948a311c74SPeter Zijlstra 10953c474b32SPeter Zijlstra /* shared state -- careful with sched_core_cpu_deactivate() */ 10968a311c74SPeter Zijlstra unsigned int core_task_seq; 1097539f6512SPeter Zijlstra unsigned int core_pick_seq; 1098539f6512SPeter Zijlstra unsigned long core_cookie; 10994feee7d1SJosh Don unsigned int core_forceidle_count; 1100c6047c2eSJoel Fernandes (Google) unsigned int core_forceidle_seq; 11014feee7d1SJosh Don unsigned int core_forceidle_occupation; 11024feee7d1SJosh Don u64 core_forceidle_start; 11039edeaea1SPeter Zijlstra #endif 1104391e43daSPeter Zijlstra }; 1105391e43daSPeter Zijlstra 110662478d99SVincent 
Guittot #ifdef CONFIG_FAIR_GROUP_SCHED 110762478d99SVincent Guittot 110862478d99SVincent Guittot /* CPU runqueue to which this cfs_rq is attached */ 110962478d99SVincent Guittot static inline struct rq *rq_of(struct cfs_rq *cfs_rq) 111062478d99SVincent Guittot { 111162478d99SVincent Guittot return cfs_rq->rq; 111262478d99SVincent Guittot } 111362478d99SVincent Guittot 111462478d99SVincent Guittot #else 111562478d99SVincent Guittot 111662478d99SVincent Guittot static inline struct rq *rq_of(struct cfs_rq *cfs_rq) 111762478d99SVincent Guittot { 111862478d99SVincent Guittot return container_of(cfs_rq, struct rq, cfs); 111962478d99SVincent Guittot } 112062478d99SVincent Guittot #endif 112162478d99SVincent Guittot 1122391e43daSPeter Zijlstra static inline int cpu_of(struct rq *rq) 1123391e43daSPeter Zijlstra { 1124391e43daSPeter Zijlstra #ifdef CONFIG_SMP 1125391e43daSPeter Zijlstra return rq->cpu; 1126391e43daSPeter Zijlstra #else 1127391e43daSPeter Zijlstra return 0; 1128391e43daSPeter Zijlstra #endif 1129391e43daSPeter Zijlstra } 1130391e43daSPeter Zijlstra 1131a7c81556SPeter Zijlstra #define MDF_PUSH 0x01 1132a7c81556SPeter Zijlstra 1133a7c81556SPeter Zijlstra static inline bool is_migration_disabled(struct task_struct *p) 1134a7c81556SPeter Zijlstra { 113574d862b6SThomas Gleixner #ifdef CONFIG_SMP 1136a7c81556SPeter Zijlstra return p->migration_disabled; 1137a7c81556SPeter Zijlstra #else 1138a7c81556SPeter Zijlstra return false; 1139a7c81556SPeter Zijlstra #endif 1140a7c81556SPeter Zijlstra } 11411b568f0aSPeter Zijlstra 114297886d9dSAubrey Li struct sched_group; 11439edeaea1SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 114497886d9dSAubrey Li static inline struct cpumask *sched_group_span(struct sched_group *sg); 11459edeaea1SPeter Zijlstra 11469edeaea1SPeter Zijlstra DECLARE_STATIC_KEY_FALSE(__sched_core_enabled); 11479edeaea1SPeter Zijlstra 11489edeaea1SPeter Zijlstra static inline bool sched_core_enabled(struct rq *rq) 11499edeaea1SPeter Zijlstra { 11509edeaea1SPeter Zijlstra return static_branch_unlikely(&__sched_core_enabled) && rq->core_enabled; 11519edeaea1SPeter Zijlstra } 11529edeaea1SPeter Zijlstra 11539edeaea1SPeter Zijlstra static inline bool sched_core_disabled(void) 11549edeaea1SPeter Zijlstra { 11559edeaea1SPeter Zijlstra return !static_branch_unlikely(&__sched_core_enabled); 11569edeaea1SPeter Zijlstra } 11579edeaea1SPeter Zijlstra 11589ef7e7e3SPeter Zijlstra /* 11599ef7e7e3SPeter Zijlstra * Be careful with this function; not for general use. The return value isn't 11609ef7e7e3SPeter Zijlstra * stable unless you actually hold a relevant rq->__lock. 
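 *
 * Under core scheduling all SMT siblings of a core share the core rq's
 * rq->core->__lock, so the pointer returned here changes whenever
 * sched_core_enabled() flips for this runqueue.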
11619ef7e7e3SPeter Zijlstra */ 11629edeaea1SPeter Zijlstra static inline raw_spinlock_t *rq_lockp(struct rq *rq) 11639edeaea1SPeter Zijlstra { 11649edeaea1SPeter Zijlstra if (sched_core_enabled(rq)) 11659edeaea1SPeter Zijlstra return &rq->core->__lock; 11669edeaea1SPeter Zijlstra 11679edeaea1SPeter Zijlstra return &rq->__lock; 11689edeaea1SPeter Zijlstra } 11699edeaea1SPeter Zijlstra 11709ef7e7e3SPeter Zijlstra static inline raw_spinlock_t *__rq_lockp(struct rq *rq) 11719ef7e7e3SPeter Zijlstra { 11729ef7e7e3SPeter Zijlstra if (rq->core_enabled) 11739ef7e7e3SPeter Zijlstra return &rq->core->__lock; 11749ef7e7e3SPeter Zijlstra 11759ef7e7e3SPeter Zijlstra return &rq->__lock; 11769ef7e7e3SPeter Zijlstra } 11779ef7e7e3SPeter Zijlstra 1178c6047c2eSJoel Fernandes (Google) bool cfs_prio_less(struct task_struct *a, struct task_struct *b, bool fi); 1179c6047c2eSJoel Fernandes (Google) 118097886d9dSAubrey Li /* 118197886d9dSAubrey Li * Helpers to check if the CPU's core cookie matches with the task's cookie 118297886d9dSAubrey Li * when core scheduling is enabled. 118397886d9dSAubrey Li * A special case is that the task's cookie always matches with CPU's core 118497886d9dSAubrey Li * cookie if the CPU is in an idle core. 118597886d9dSAubrey Li */ 118697886d9dSAubrey Li static inline bool sched_cpu_cookie_match(struct rq *rq, struct task_struct *p) 118797886d9dSAubrey Li { 118897886d9dSAubrey Li /* Ignore cookie match if core scheduler is not enabled on the CPU. */ 118997886d9dSAubrey Li if (!sched_core_enabled(rq)) 119097886d9dSAubrey Li return true; 119197886d9dSAubrey Li 119297886d9dSAubrey Li return rq->core->core_cookie == p->core_cookie; 119397886d9dSAubrey Li } 119497886d9dSAubrey Li 119597886d9dSAubrey Li static inline bool sched_core_cookie_match(struct rq *rq, struct task_struct *p) 119697886d9dSAubrey Li { 119797886d9dSAubrey Li bool idle_core = true; 119897886d9dSAubrey Li int cpu; 119997886d9dSAubrey Li 120097886d9dSAubrey Li /* Ignore cookie match if core scheduler is not enabled on the CPU. */ 120197886d9dSAubrey Li if (!sched_core_enabled(rq)) 120297886d9dSAubrey Li return true; 120397886d9dSAubrey Li 120497886d9dSAubrey Li for_each_cpu(cpu, cpu_smt_mask(cpu_of(rq))) { 120597886d9dSAubrey Li if (!available_idle_cpu(cpu)) { 120697886d9dSAubrey Li idle_core = false; 120797886d9dSAubrey Li break; 120897886d9dSAubrey Li } 120997886d9dSAubrey Li } 121097886d9dSAubrey Li 121197886d9dSAubrey Li /* 121297886d9dSAubrey Li * A CPU in an idle core is always the best choice for tasks with 121397886d9dSAubrey Li * cookies. 121497886d9dSAubrey Li */ 121597886d9dSAubrey Li return idle_core || rq->core->core_cookie == p->core_cookie; 121697886d9dSAubrey Li } 121797886d9dSAubrey Li 121897886d9dSAubrey Li static inline bool sched_group_cookie_match(struct rq *rq, 121997886d9dSAubrey Li struct task_struct *p, 122097886d9dSAubrey Li struct sched_group *group) 122197886d9dSAubrey Li { 122297886d9dSAubrey Li int cpu; 122397886d9dSAubrey Li 122497886d9dSAubrey Li /* Ignore cookie match if core scheduler is not enabled on the CPU. 
*/ 122597886d9dSAubrey Li if (!sched_core_enabled(rq)) 122697886d9dSAubrey Li return true; 122797886d9dSAubrey Li 122897886d9dSAubrey Li for_each_cpu_and(cpu, sched_group_span(group), p->cpus_ptr) { 122997886d9dSAubrey Li if (sched_core_cookie_match(rq, p)) 123097886d9dSAubrey Li return true; 123197886d9dSAubrey Li } 123297886d9dSAubrey Li return false; 123397886d9dSAubrey Li } 123497886d9dSAubrey Li 1235d2dfa17bSPeter Zijlstra extern void queue_core_balance(struct rq *rq); 1236d2dfa17bSPeter Zijlstra 12376e33cad0SPeter Zijlstra static inline bool sched_core_enqueued(struct task_struct *p) 12386e33cad0SPeter Zijlstra { 12396e33cad0SPeter Zijlstra return !RB_EMPTY_NODE(&p->core_node); 12406e33cad0SPeter Zijlstra } 12416e33cad0SPeter Zijlstra 12426e33cad0SPeter Zijlstra extern void sched_core_enqueue(struct rq *rq, struct task_struct *p); 12434feee7d1SJosh Don extern void sched_core_dequeue(struct rq *rq, struct task_struct *p, int flags); 12446e33cad0SPeter Zijlstra 12456e33cad0SPeter Zijlstra extern void sched_core_get(void); 12466e33cad0SPeter Zijlstra extern void sched_core_put(void); 12476e33cad0SPeter Zijlstra 12489edeaea1SPeter Zijlstra #else /* !CONFIG_SCHED_CORE */ 12499edeaea1SPeter Zijlstra 12509edeaea1SPeter Zijlstra static inline bool sched_core_enabled(struct rq *rq) 12519edeaea1SPeter Zijlstra { 12529edeaea1SPeter Zijlstra return false; 12539edeaea1SPeter Zijlstra } 12549edeaea1SPeter Zijlstra 1255d66f1b06SPeter Zijlstra static inline bool sched_core_disabled(void) 1256d66f1b06SPeter Zijlstra { 1257d66f1b06SPeter Zijlstra return true; 1258d66f1b06SPeter Zijlstra } 1259d66f1b06SPeter Zijlstra 126039d371b7SPeter Zijlstra static inline raw_spinlock_t *rq_lockp(struct rq *rq) 126139d371b7SPeter Zijlstra { 12625cb9eaa3SPeter Zijlstra return &rq->__lock; 126339d371b7SPeter Zijlstra } 126439d371b7SPeter Zijlstra 12659ef7e7e3SPeter Zijlstra static inline raw_spinlock_t *__rq_lockp(struct rq *rq) 12669ef7e7e3SPeter Zijlstra { 12679ef7e7e3SPeter Zijlstra return &rq->__lock; 12689ef7e7e3SPeter Zijlstra } 12699ef7e7e3SPeter Zijlstra 1270d2dfa17bSPeter Zijlstra static inline void queue_core_balance(struct rq *rq) 1271d2dfa17bSPeter Zijlstra { 1272d2dfa17bSPeter Zijlstra } 1273d2dfa17bSPeter Zijlstra 127497886d9dSAubrey Li static inline bool sched_cpu_cookie_match(struct rq *rq, struct task_struct *p) 127597886d9dSAubrey Li { 127697886d9dSAubrey Li return true; 127797886d9dSAubrey Li } 127897886d9dSAubrey Li 127997886d9dSAubrey Li static inline bool sched_core_cookie_match(struct rq *rq, struct task_struct *p) 128097886d9dSAubrey Li { 128197886d9dSAubrey Li return true; 128297886d9dSAubrey Li } 128397886d9dSAubrey Li 128497886d9dSAubrey Li static inline bool sched_group_cookie_match(struct rq *rq, 128597886d9dSAubrey Li struct task_struct *p, 128697886d9dSAubrey Li struct sched_group *group) 128797886d9dSAubrey Li { 128897886d9dSAubrey Li return true; 128997886d9dSAubrey Li } 12909edeaea1SPeter Zijlstra #endif /* CONFIG_SCHED_CORE */ 12919edeaea1SPeter Zijlstra 129239d371b7SPeter Zijlstra static inline void lockdep_assert_rq_held(struct rq *rq) 129339d371b7SPeter Zijlstra { 12949ef7e7e3SPeter Zijlstra lockdep_assert_held(__rq_lockp(rq)); 129539d371b7SPeter Zijlstra } 129639d371b7SPeter Zijlstra 129739d371b7SPeter Zijlstra extern void raw_spin_rq_lock_nested(struct rq *rq, int subclass); 129839d371b7SPeter Zijlstra extern bool raw_spin_rq_trylock(struct rq *rq); 129939d371b7SPeter Zijlstra extern void raw_spin_rq_unlock(struct rq *rq); 130039d371b7SPeter Zijlstra 130139d371b7SPeter Zijlstra 
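/*
 * Illustrative locking sketch for the wrappers below; callers that also need
 * lockdep pinning and clock-flag bookkeeping use the rq_lock*()/rq_unlock*()
 * helpers further down, which wrap these and add rq_pin_lock()/rq_unpin_lock():
 *
 *	unsigned long flags;
 *
 *	raw_spin_rq_lock_irqsave(rq, flags);
 *	...
 *	raw_spin_rq_unlock_irqrestore(rq, flags);
 */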
static inline void raw_spin_rq_lock(struct rq *rq) 130239d371b7SPeter Zijlstra { 130339d371b7SPeter Zijlstra raw_spin_rq_lock_nested(rq, 0); 130439d371b7SPeter Zijlstra } 130539d371b7SPeter Zijlstra 130639d371b7SPeter Zijlstra static inline void raw_spin_rq_lock_irq(struct rq *rq) 130739d371b7SPeter Zijlstra { 130839d371b7SPeter Zijlstra local_irq_disable(); 130939d371b7SPeter Zijlstra raw_spin_rq_lock(rq); 131039d371b7SPeter Zijlstra } 131139d371b7SPeter Zijlstra 131239d371b7SPeter Zijlstra static inline void raw_spin_rq_unlock_irq(struct rq *rq) 131339d371b7SPeter Zijlstra { 131439d371b7SPeter Zijlstra raw_spin_rq_unlock(rq); 131539d371b7SPeter Zijlstra local_irq_enable(); 131639d371b7SPeter Zijlstra } 131739d371b7SPeter Zijlstra 131839d371b7SPeter Zijlstra static inline unsigned long _raw_spin_rq_lock_irqsave(struct rq *rq) 131939d371b7SPeter Zijlstra { 132039d371b7SPeter Zijlstra unsigned long flags; 132139d371b7SPeter Zijlstra local_irq_save(flags); 132239d371b7SPeter Zijlstra raw_spin_rq_lock(rq); 132339d371b7SPeter Zijlstra return flags; 132439d371b7SPeter Zijlstra } 132539d371b7SPeter Zijlstra 132639d371b7SPeter Zijlstra static inline void raw_spin_rq_unlock_irqrestore(struct rq *rq, unsigned long flags) 132739d371b7SPeter Zijlstra { 132839d371b7SPeter Zijlstra raw_spin_rq_unlock(rq); 132939d371b7SPeter Zijlstra local_irq_restore(flags); 133039d371b7SPeter Zijlstra } 133139d371b7SPeter Zijlstra 133239d371b7SPeter Zijlstra #define raw_spin_rq_lock_irqsave(rq, flags) \ 133339d371b7SPeter Zijlstra do { \ 133439d371b7SPeter Zijlstra flags = _raw_spin_rq_lock_irqsave(rq); \ 133539d371b7SPeter Zijlstra } while (0) 133639d371b7SPeter Zijlstra 13371b568f0aSPeter Zijlstra #ifdef CONFIG_SCHED_SMT 13381b568f0aSPeter Zijlstra extern void __update_idle_core(struct rq *rq); 13391b568f0aSPeter Zijlstra 13401b568f0aSPeter Zijlstra static inline void update_idle_core(struct rq *rq) 13411b568f0aSPeter Zijlstra { 13421b568f0aSPeter Zijlstra if (static_branch_unlikely(&sched_smt_present)) 13431b568f0aSPeter Zijlstra __update_idle_core(rq); 13441b568f0aSPeter Zijlstra } 13451b568f0aSPeter Zijlstra 13461b568f0aSPeter Zijlstra #else 13471b568f0aSPeter Zijlstra static inline void update_idle_core(struct rq *rq) { } 13481b568f0aSPeter Zijlstra #endif 13491b568f0aSPeter Zijlstra 13508b06c55bSPranith Kumar DECLARE_PER_CPU_SHARED_ALIGNED(struct rq, runqueues); 1351391e43daSPeter Zijlstra 1352518cd623SPeter Zijlstra #define cpu_rq(cpu) (&per_cpu(runqueues, (cpu))) 13534a32fea9SChristoph Lameter #define this_rq() this_cpu_ptr(&runqueues) 1354518cd623SPeter Zijlstra #define task_rq(p) cpu_rq(task_cpu(p)) 1355518cd623SPeter Zijlstra #define cpu_curr(cpu) (cpu_rq(cpu)->curr) 13564a32fea9SChristoph Lameter #define raw_rq() raw_cpu_ptr(&runqueues) 1357518cd623SPeter Zijlstra 13588a311c74SPeter Zijlstra #ifdef CONFIG_FAIR_GROUP_SCHED 13598a311c74SPeter Zijlstra static inline struct task_struct *task_of(struct sched_entity *se) 13608a311c74SPeter Zijlstra { 13618a311c74SPeter Zijlstra SCHED_WARN_ON(!entity_is_task(se)); 13628a311c74SPeter Zijlstra return container_of(se, struct task_struct, se); 13638a311c74SPeter Zijlstra } 13648a311c74SPeter Zijlstra 13658a311c74SPeter Zijlstra static inline struct cfs_rq *task_cfs_rq(struct task_struct *p) 13668a311c74SPeter Zijlstra { 13678a311c74SPeter Zijlstra return p->se.cfs_rq; 13688a311c74SPeter Zijlstra } 13698a311c74SPeter Zijlstra 13708a311c74SPeter Zijlstra /* runqueue on which this entity is (to be) queued */ 13718a311c74SPeter Zijlstra static inline struct cfs_rq 
*cfs_rq_of(struct sched_entity *se) 13728a311c74SPeter Zijlstra { 13738a311c74SPeter Zijlstra return se->cfs_rq; 13748a311c74SPeter Zijlstra } 13758a311c74SPeter Zijlstra 13768a311c74SPeter Zijlstra /* runqueue "owned" by this group */ 13778a311c74SPeter Zijlstra static inline struct cfs_rq *group_cfs_rq(struct sched_entity *grp) 13788a311c74SPeter Zijlstra { 13798a311c74SPeter Zijlstra return grp->my_q; 13808a311c74SPeter Zijlstra } 13818a311c74SPeter Zijlstra 13828a311c74SPeter Zijlstra #else 13838a311c74SPeter Zijlstra 13848a311c74SPeter Zijlstra static inline struct task_struct *task_of(struct sched_entity *se) 13858a311c74SPeter Zijlstra { 13868a311c74SPeter Zijlstra return container_of(se, struct task_struct, se); 13878a311c74SPeter Zijlstra } 13888a311c74SPeter Zijlstra 13898a311c74SPeter Zijlstra static inline struct cfs_rq *task_cfs_rq(struct task_struct *p) 13908a311c74SPeter Zijlstra { 13918a311c74SPeter Zijlstra return &task_rq(p)->cfs; 13928a311c74SPeter Zijlstra } 13938a311c74SPeter Zijlstra 13948a311c74SPeter Zijlstra static inline struct cfs_rq *cfs_rq_of(struct sched_entity *se) 13958a311c74SPeter Zijlstra { 13968a311c74SPeter Zijlstra struct task_struct *p = task_of(se); 13978a311c74SPeter Zijlstra struct rq *rq = task_rq(p); 13988a311c74SPeter Zijlstra 13998a311c74SPeter Zijlstra return &rq->cfs; 14008a311c74SPeter Zijlstra } 14018a311c74SPeter Zijlstra 14028a311c74SPeter Zijlstra /* runqueue "owned" by this group */ 14038a311c74SPeter Zijlstra static inline struct cfs_rq *group_cfs_rq(struct sched_entity *grp) 14048a311c74SPeter Zijlstra { 14058a311c74SPeter Zijlstra return NULL; 14068a311c74SPeter Zijlstra } 14078a311c74SPeter Zijlstra #endif 14088a311c74SPeter Zijlstra 14091f351d7fSJohannes Weiner extern void update_rq_clock(struct rq *rq); 14101f351d7fSJohannes Weiner 1411cb42c9a3SMatt Fleming /* 1412cb42c9a3SMatt Fleming * rq::clock_update_flags bits 1413cb42c9a3SMatt Fleming * 1414cb42c9a3SMatt Fleming * %RQCF_REQ_SKIP - will request skipping of clock update on the next 1415cb42c9a3SMatt Fleming * call to __schedule(). This is an optimisation to avoid 1416cb42c9a3SMatt Fleming * neighbouring rq clock updates. 1417cb42c9a3SMatt Fleming * 1418cb42c9a3SMatt Fleming * %RQCF_ACT_SKIP - is set from inside of __schedule() when skipping is 1419cb42c9a3SMatt Fleming * in effect and calls to update_rq_clock() are being ignored. 1420cb42c9a3SMatt Fleming * 1421cb42c9a3SMatt Fleming * %RQCF_UPDATED - is a debug flag that indicates whether a call has been 1422cb42c9a3SMatt Fleming * made to update_rq_clock() since the last time rq::lock was pinned. 1423cb42c9a3SMatt Fleming * 1424cb42c9a3SMatt Fleming * If inside of __schedule(), clock_update_flags will have been 1425cb42c9a3SMatt Fleming * shifted left (a left shift is a cheap operation for the fast path 1426cb42c9a3SMatt Fleming * to promote %RQCF_REQ_SKIP to %RQCF_ACT_SKIP), so you must use, 1427cb42c9a3SMatt Fleming * 1428cb42c9a3SMatt Fleming * if (rq->clock_update_flags >= RQCF_UPDATED) 1429cb42c9a3SMatt Fleming * 14303b03706fSIngo Molnar * to check if %RQCF_UPDATED is set. It'll never be shifted more than 1431cb42c9a3SMatt Fleming * one position though, because the next rq_unpin_lock() will shift it * back.
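 *
 * Concretely: rq_pin_lock() clears %RQCF_UPDATED, __schedule() promotes
 * %RQCF_REQ_SKIP (0x01) into %RQCF_ACT_SKIP (0x02) via that left shift, and a
 * later update_rq_clock() sets %RQCF_UPDATED (0x04) when the update is not
 * skipped.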
1433cb42c9a3SMatt Fleming */ 1434cb42c9a3SMatt Fleming #define RQCF_REQ_SKIP 0x01 1435cb42c9a3SMatt Fleming #define RQCF_ACT_SKIP 0x02 1436cb42c9a3SMatt Fleming #define RQCF_UPDATED 0x04 1437cb42c9a3SMatt Fleming 1438cb42c9a3SMatt Fleming static inline void assert_clock_updated(struct rq *rq) 1439cb42c9a3SMatt Fleming { 1440cb42c9a3SMatt Fleming /* 1441cb42c9a3SMatt Fleming * The only reason for not seeing a clock update since the 1442cb42c9a3SMatt Fleming * last rq_pin_lock() is if we're currently skipping updates. 1443cb42c9a3SMatt Fleming */ 1444cb42c9a3SMatt Fleming SCHED_WARN_ON(rq->clock_update_flags < RQCF_ACT_SKIP); 1445cb42c9a3SMatt Fleming } 1446cb42c9a3SMatt Fleming 144778becc27SFrederic Weisbecker static inline u64 rq_clock(struct rq *rq) 144878becc27SFrederic Weisbecker { 14495cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 1450cb42c9a3SMatt Fleming assert_clock_updated(rq); 1451cb42c9a3SMatt Fleming 145278becc27SFrederic Weisbecker return rq->clock; 145378becc27SFrederic Weisbecker } 145478becc27SFrederic Weisbecker 145578becc27SFrederic Weisbecker static inline u64 rq_clock_task(struct rq *rq) 145678becc27SFrederic Weisbecker { 14575cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 1458cb42c9a3SMatt Fleming assert_clock_updated(rq); 1459cb42c9a3SMatt Fleming 146078becc27SFrederic Weisbecker return rq->clock_task; 146178becc27SFrederic Weisbecker } 146278becc27SFrederic Weisbecker 146305289b90SThara Gopinath /** 146405289b90SThara Gopinath * By default the decay is the default pelt decay period. 146505289b90SThara Gopinath * The decay shift can change the decay period in 146605289b90SThara Gopinath * multiples of 32. 146705289b90SThara Gopinath * Decay shift Decay period(ms) 146805289b90SThara Gopinath * 0 32 146905289b90SThara Gopinath * 1 64 147005289b90SThara Gopinath * 2 128 147105289b90SThara Gopinath * 3 256 147205289b90SThara Gopinath * 4 512 147305289b90SThara Gopinath */ 147405289b90SThara Gopinath extern int sched_thermal_decay_shift; 147505289b90SThara Gopinath 147605289b90SThara Gopinath static inline u64 rq_clock_thermal(struct rq *rq) 147705289b90SThara Gopinath { 147805289b90SThara Gopinath return rq_clock_task(rq) >> sched_thermal_decay_shift; 147905289b90SThara Gopinath } 148005289b90SThara Gopinath 1481adcc8da8SDavidlohr Bueso static inline void rq_clock_skip_update(struct rq *rq) 14829edfbfedSPeter Zijlstra { 14835cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 1484cb42c9a3SMatt Fleming rq->clock_update_flags |= RQCF_REQ_SKIP; 1485adcc8da8SDavidlohr Bueso } 1486adcc8da8SDavidlohr Bueso 1487adcc8da8SDavidlohr Bueso /* 1488595058b6SDavidlohr Bueso * See rt task throttling, which is the only time a skip 14893b03706fSIngo Molnar * request is canceled. 1490adcc8da8SDavidlohr Bueso */ 1491adcc8da8SDavidlohr Bueso static inline void rq_clock_cancel_skipupdate(struct rq *rq) 1492adcc8da8SDavidlohr Bueso { 14935cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 1494cb42c9a3SMatt Fleming rq->clock_update_flags &= ~RQCF_REQ_SKIP; 14959edfbfedSPeter Zijlstra } 14969edfbfedSPeter Zijlstra 1497d8ac8971SMatt Fleming struct rq_flags { 1498d8ac8971SMatt Fleming unsigned long flags; 1499d8ac8971SMatt Fleming struct pin_cookie cookie; 1500cb42c9a3SMatt Fleming #ifdef CONFIG_SCHED_DEBUG 1501cb42c9a3SMatt Fleming /* 1502cb42c9a3SMatt Fleming * A copy of (rq::clock_update_flags & RQCF_UPDATED) for the 1503cb42c9a3SMatt Fleming * current pin context is stashed here in case it needs to be 1504cb42c9a3SMatt Fleming * restored in rq_repin_lock(). 
1505cb42c9a3SMatt Fleming */ 1506cb42c9a3SMatt Fleming unsigned int clock_update_flags; 1507cb42c9a3SMatt Fleming #endif 1508d8ac8971SMatt Fleming }; 1509d8ac8971SMatt Fleming 1510ae792702SPeter Zijlstra extern struct callback_head balance_push_callback; 1511ae792702SPeter Zijlstra 151258877d34SPeter Zijlstra /* 151358877d34SPeter Zijlstra * Lockdep annotation that avoids accidental unlocks; it's like a 151458877d34SPeter Zijlstra * sticky/continuous lockdep_assert_held(). 151558877d34SPeter Zijlstra * 151658877d34SPeter Zijlstra * This avoids code that has access to 'struct rq *rq' (basically everything in 151758877d34SPeter Zijlstra * the scheduler) from accidentally unlocking the rq if they do not also have a 151858877d34SPeter Zijlstra * copy of the (on-stack) 'struct rq_flags rf'. 151958877d34SPeter Zijlstra * 152058877d34SPeter Zijlstra * Also see Documentation/locking/lockdep-design.rst. 152158877d34SPeter Zijlstra */ 1522d8ac8971SMatt Fleming static inline void rq_pin_lock(struct rq *rq, struct rq_flags *rf) 1523d8ac8971SMatt Fleming { 15249ef7e7e3SPeter Zijlstra rf->cookie = lockdep_pin_lock(__rq_lockp(rq)); 1525cb42c9a3SMatt Fleming 1526cb42c9a3SMatt Fleming #ifdef CONFIG_SCHED_DEBUG 1527cb42c9a3SMatt Fleming rq->clock_update_flags &= (RQCF_REQ_SKIP|RQCF_ACT_SKIP); 1528cb42c9a3SMatt Fleming rf->clock_update_flags = 0; 1529565790d2SPeter Zijlstra #ifdef CONFIG_SMP 1530ae792702SPeter Zijlstra SCHED_WARN_ON(rq->balance_callback && rq->balance_callback != &balance_push_callback); 1531ae792702SPeter Zijlstra #endif 1532565790d2SPeter Zijlstra #endif 1533d8ac8971SMatt Fleming } 1534d8ac8971SMatt Fleming 1535d8ac8971SMatt Fleming static inline void rq_unpin_lock(struct rq *rq, struct rq_flags *rf) 1536d8ac8971SMatt Fleming { 1537cb42c9a3SMatt Fleming #ifdef CONFIG_SCHED_DEBUG 1538cb42c9a3SMatt Fleming if (rq->clock_update_flags > RQCF_ACT_SKIP) 1539cb42c9a3SMatt Fleming rf->clock_update_flags = RQCF_UPDATED; 1540cb42c9a3SMatt Fleming #endif 1541cb42c9a3SMatt Fleming 15429ef7e7e3SPeter Zijlstra lockdep_unpin_lock(__rq_lockp(rq), rf->cookie); 1543d8ac8971SMatt Fleming } 1544d8ac8971SMatt Fleming 1545d8ac8971SMatt Fleming static inline void rq_repin_lock(struct rq *rq, struct rq_flags *rf) 1546d8ac8971SMatt Fleming { 15479ef7e7e3SPeter Zijlstra lockdep_repin_lock(__rq_lockp(rq), rf->cookie); 1548cb42c9a3SMatt Fleming 1549cb42c9a3SMatt Fleming #ifdef CONFIG_SCHED_DEBUG 1550cb42c9a3SMatt Fleming /* 1551cb42c9a3SMatt Fleming * Restore the value we stashed in @rf for this pin context. 
1552cb42c9a3SMatt Fleming */ 1553cb42c9a3SMatt Fleming rq->clock_update_flags |= rf->clock_update_flags; 1554cb42c9a3SMatt Fleming #endif 1555d8ac8971SMatt Fleming } 1556d8ac8971SMatt Fleming 15571f351d7fSJohannes Weiner struct rq *__task_rq_lock(struct task_struct *p, struct rq_flags *rf) 15581f351d7fSJohannes Weiner __acquires(rq->lock); 15591f351d7fSJohannes Weiner 15601f351d7fSJohannes Weiner struct rq *task_rq_lock(struct task_struct *p, struct rq_flags *rf) 15611f351d7fSJohannes Weiner __acquires(p->pi_lock) 15621f351d7fSJohannes Weiner __acquires(rq->lock); 15631f351d7fSJohannes Weiner 15641f351d7fSJohannes Weiner static inline void __task_rq_unlock(struct rq *rq, struct rq_flags *rf) 15651f351d7fSJohannes Weiner __releases(rq->lock) 15661f351d7fSJohannes Weiner { 15671f351d7fSJohannes Weiner rq_unpin_lock(rq, rf); 15685cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(rq); 15691f351d7fSJohannes Weiner } 15701f351d7fSJohannes Weiner 15711f351d7fSJohannes Weiner static inline void 15721f351d7fSJohannes Weiner task_rq_unlock(struct rq *rq, struct task_struct *p, struct rq_flags *rf) 15731f351d7fSJohannes Weiner __releases(rq->lock) 15741f351d7fSJohannes Weiner __releases(p->pi_lock) 15751f351d7fSJohannes Weiner { 15761f351d7fSJohannes Weiner rq_unpin_lock(rq, rf); 15775cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(rq); 15781f351d7fSJohannes Weiner raw_spin_unlock_irqrestore(&p->pi_lock, rf->flags); 15791f351d7fSJohannes Weiner } 15801f351d7fSJohannes Weiner 15811f351d7fSJohannes Weiner static inline void 15821f351d7fSJohannes Weiner rq_lock_irqsave(struct rq *rq, struct rq_flags *rf) 15831f351d7fSJohannes Weiner __acquires(rq->lock) 15841f351d7fSJohannes Weiner { 15855cb9eaa3SPeter Zijlstra raw_spin_rq_lock_irqsave(rq, rf->flags); 15861f351d7fSJohannes Weiner rq_pin_lock(rq, rf); 15871f351d7fSJohannes Weiner } 15881f351d7fSJohannes Weiner 15891f351d7fSJohannes Weiner static inline void 15901f351d7fSJohannes Weiner rq_lock_irq(struct rq *rq, struct rq_flags *rf) 15911f351d7fSJohannes Weiner __acquires(rq->lock) 15921f351d7fSJohannes Weiner { 15935cb9eaa3SPeter Zijlstra raw_spin_rq_lock_irq(rq); 15941f351d7fSJohannes Weiner rq_pin_lock(rq, rf); 15951f351d7fSJohannes Weiner } 15961f351d7fSJohannes Weiner 15971f351d7fSJohannes Weiner static inline void 15981f351d7fSJohannes Weiner rq_lock(struct rq *rq, struct rq_flags *rf) 15991f351d7fSJohannes Weiner __acquires(rq->lock) 16001f351d7fSJohannes Weiner { 16015cb9eaa3SPeter Zijlstra raw_spin_rq_lock(rq); 16021f351d7fSJohannes Weiner rq_pin_lock(rq, rf); 16031f351d7fSJohannes Weiner } 16041f351d7fSJohannes Weiner 16051f351d7fSJohannes Weiner static inline void 16061f351d7fSJohannes Weiner rq_unlock_irqrestore(struct rq *rq, struct rq_flags *rf) 16071f351d7fSJohannes Weiner __releases(rq->lock) 16081f351d7fSJohannes Weiner { 16091f351d7fSJohannes Weiner rq_unpin_lock(rq, rf); 16105cb9eaa3SPeter Zijlstra raw_spin_rq_unlock_irqrestore(rq, rf->flags); 16111f351d7fSJohannes Weiner } 16121f351d7fSJohannes Weiner 16131f351d7fSJohannes Weiner static inline void 16141f351d7fSJohannes Weiner rq_unlock_irq(struct rq *rq, struct rq_flags *rf) 16151f351d7fSJohannes Weiner __releases(rq->lock) 16161f351d7fSJohannes Weiner { 16171f351d7fSJohannes Weiner rq_unpin_lock(rq, rf); 16185cb9eaa3SPeter Zijlstra raw_spin_rq_unlock_irq(rq); 16191f351d7fSJohannes Weiner } 16201f351d7fSJohannes Weiner 16211f351d7fSJohannes Weiner static inline void 16221f351d7fSJohannes Weiner rq_unlock(struct rq *rq, struct rq_flags *rf) 16231f351d7fSJohannes Weiner __releases(rq->lock) 
16241f351d7fSJohannes Weiner { 16251f351d7fSJohannes Weiner rq_unpin_lock(rq, rf); 16265cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(rq); 16271f351d7fSJohannes Weiner } 16281f351d7fSJohannes Weiner 1629246b3b33SJohannes Weiner static inline struct rq * 1630246b3b33SJohannes Weiner this_rq_lock_irq(struct rq_flags *rf) 1631246b3b33SJohannes Weiner __acquires(rq->lock) 1632246b3b33SJohannes Weiner { 1633246b3b33SJohannes Weiner struct rq *rq; 1634246b3b33SJohannes Weiner 1635246b3b33SJohannes Weiner local_irq_disable(); 1636246b3b33SJohannes Weiner rq = this_rq(); 1637246b3b33SJohannes Weiner rq_lock(rq, rf); 1638246b3b33SJohannes Weiner return rq; 1639246b3b33SJohannes Weiner } 1640246b3b33SJohannes Weiner 16419942f79bSRik van Riel #ifdef CONFIG_NUMA 1642e3fe70b1SRik van Riel enum numa_topology_type { 1643e3fe70b1SRik van Riel NUMA_DIRECT, 1644e3fe70b1SRik van Riel NUMA_GLUELESS_MESH, 1645e3fe70b1SRik van Riel NUMA_BACKPLANE, 1646e3fe70b1SRik van Riel }; 1647e3fe70b1SRik van Riel extern enum numa_topology_type sched_numa_topology_type; 16489942f79bSRik van Riel extern int sched_max_numa_distance; 16499942f79bSRik van Riel extern bool find_numa_distance(int distance); 16500fb3978bSHuang Ying extern void sched_init_numa(int offline_node); 16510fb3978bSHuang Ying extern void sched_update_numa(int cpu, bool online); 1652f2cb1360SIngo Molnar extern void sched_domains_numa_masks_set(unsigned int cpu); 1653f2cb1360SIngo Molnar extern void sched_domains_numa_masks_clear(unsigned int cpu); 1654e0e8d491SWanpeng Li extern int sched_numa_find_closest(const struct cpumask *cpus, int cpu); 1655f2cb1360SIngo Molnar #else 16560fb3978bSHuang Ying static inline void sched_init_numa(int offline_node) { } 16570fb3978bSHuang Ying static inline void sched_update_numa(int cpu, bool online) { } 1658f2cb1360SIngo Molnar static inline void sched_domains_numa_masks_set(unsigned int cpu) { } 1659f2cb1360SIngo Molnar static inline void sched_domains_numa_masks_clear(unsigned int cpu) { } 1660e0e8d491SWanpeng Li static inline int sched_numa_find_closest(const struct cpumask *cpus, int cpu) 1661e0e8d491SWanpeng Li { 1662e0e8d491SWanpeng Li return nr_cpu_ids; 1663e0e8d491SWanpeng Li } 1664f2cb1360SIngo Molnar #endif 1665f2cb1360SIngo Molnar 1666f809ca9aSMel Gorman #ifdef CONFIG_NUMA_BALANCING 166744dba3d5SIulia Manda /* The regions in numa_faults array from task_struct */ 166844dba3d5SIulia Manda enum numa_faults_stats { 166944dba3d5SIulia Manda NUMA_MEM = 0, 167044dba3d5SIulia Manda NUMA_CPU, 167144dba3d5SIulia Manda NUMA_MEMBUF, 167244dba3d5SIulia Manda NUMA_CPUBUF 167344dba3d5SIulia Manda }; 16740ec8aa00SPeter Zijlstra extern void sched_setnuma(struct task_struct *p, int node); 1675e6628d5bSMel Gorman extern int migrate_task_to(struct task_struct *p, int cpu); 16760ad4e3dfSSrikar Dronamraju extern int migrate_swap(struct task_struct *p, struct task_struct *t, 16770ad4e3dfSSrikar Dronamraju int cpu, int scpu); 167813784475SMel Gorman extern void init_numa_balancing(unsigned long clone_flags, struct task_struct *p); 167913784475SMel Gorman #else 168013784475SMel Gorman static inline void 168113784475SMel Gorman init_numa_balancing(unsigned long clone_flags, struct task_struct *p) 168213784475SMel Gorman { 168313784475SMel Gorman } 1684f809ca9aSMel Gorman #endif /* CONFIG_NUMA_BALANCING */ 1685f809ca9aSMel Gorman 1686518cd623SPeter Zijlstra #ifdef CONFIG_SMP 1687518cd623SPeter Zijlstra 1688e3fca9e7SPeter Zijlstra static inline void 1689e3fca9e7SPeter Zijlstra queue_balance_callback(struct rq *rq, 1690e3fca9e7SPeter Zijlstra 
struct callback_head *head, 1691e3fca9e7SPeter Zijlstra void (*func)(struct rq *rq)) 1692e3fca9e7SPeter Zijlstra { 16935cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 1694e3fca9e7SPeter Zijlstra 1695ae792702SPeter Zijlstra if (unlikely(head->next || rq->balance_callback == &balance_push_callback)) 1696e3fca9e7SPeter Zijlstra return; 1697e3fca9e7SPeter Zijlstra 1698e3fca9e7SPeter Zijlstra head->func = (void (*)(struct callback_head *))func; 1699e3fca9e7SPeter Zijlstra head->next = rq->balance_callback; 1700e3fca9e7SPeter Zijlstra rq->balance_callback = head; 1701e3fca9e7SPeter Zijlstra } 1702e3fca9e7SPeter Zijlstra 1703391e43daSPeter Zijlstra #define rcu_dereference_check_sched_domain(p) \ 1704391e43daSPeter Zijlstra rcu_dereference_check((p), \ 1705391e43daSPeter Zijlstra lockdep_is_held(&sched_domains_mutex)) 1706391e43daSPeter Zijlstra 1707391e43daSPeter Zijlstra /* 1708391e43daSPeter Zijlstra * The domain tree (rq->sd) is protected by RCU's quiescent state transition. 1709337e9b07SPaul E. McKenney * See destroy_sched_domains: call_rcu for details. 1710391e43daSPeter Zijlstra * 1711391e43daSPeter Zijlstra * The domain tree of any CPU may only be accessed from within 1712391e43daSPeter Zijlstra * preempt-disabled sections. 1713391e43daSPeter Zijlstra */ 1714391e43daSPeter Zijlstra #define for_each_domain(cpu, __sd) \ 1715518cd623SPeter Zijlstra for (__sd = rcu_dereference_check_sched_domain(cpu_rq(cpu)->sd); \ 1716518cd623SPeter Zijlstra __sd; __sd = __sd->parent) 1717391e43daSPeter Zijlstra 1718518cd623SPeter Zijlstra /** 1719518cd623SPeter Zijlstra * highest_flag_domain - Return highest sched_domain containing flag. 172097fb7a0aSIngo Molnar * @cpu: The CPU whose highest level of sched domain is to 1721518cd623SPeter Zijlstra * be returned. 1722518cd623SPeter Zijlstra * @flag: The flag to check for the highest sched_domain 172397fb7a0aSIngo Molnar * for the given CPU. 1724518cd623SPeter Zijlstra * 172597fb7a0aSIngo Molnar * Returns the highest sched_domain of a CPU which contains the given flag. 
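 *
 * The walk starts at the lowest domain and stops at the first level that does
 * not carry @flag, so it assumes the flag is set contiguously from the bottom
 * of the hierarchy; e.g. the per-CPU sd_llc pointer is typically derived from
 * highest_flag_domain(cpu, SD_SHARE_PKG_RESOURCES).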
1726518cd623SPeter Zijlstra */ 1727518cd623SPeter Zijlstra static inline struct sched_domain *highest_flag_domain(int cpu, int flag) 1728518cd623SPeter Zijlstra { 1729518cd623SPeter Zijlstra struct sched_domain *sd, *hsd = NULL; 1730518cd623SPeter Zijlstra 1731518cd623SPeter Zijlstra for_each_domain(cpu, sd) { 1732518cd623SPeter Zijlstra if (!(sd->flags & flag)) 1733518cd623SPeter Zijlstra break; 1734518cd623SPeter Zijlstra hsd = sd; 1735518cd623SPeter Zijlstra } 1736518cd623SPeter Zijlstra 1737518cd623SPeter Zijlstra return hsd; 1738518cd623SPeter Zijlstra } 1739518cd623SPeter Zijlstra 1740fb13c7eeSMel Gorman static inline struct sched_domain *lowest_flag_domain(int cpu, int flag) 1741fb13c7eeSMel Gorman { 1742fb13c7eeSMel Gorman struct sched_domain *sd; 1743fb13c7eeSMel Gorman 1744fb13c7eeSMel Gorman for_each_domain(cpu, sd) { 1745fb13c7eeSMel Gorman if (sd->flags & flag) 1746fb13c7eeSMel Gorman break; 1747fb13c7eeSMel Gorman } 1748fb13c7eeSMel Gorman 1749fb13c7eeSMel Gorman return sd; 1750fb13c7eeSMel Gorman } 1751fb13c7eeSMel Gorman 1752994aeb7aSJoel Fernandes (Google) DECLARE_PER_CPU(struct sched_domain __rcu *, sd_llc); 17537d9ffa89SPeter Zijlstra DECLARE_PER_CPU(int, sd_llc_size); 1754518cd623SPeter Zijlstra DECLARE_PER_CPU(int, sd_llc_id); 1755994aeb7aSJoel Fernandes (Google) DECLARE_PER_CPU(struct sched_domain_shared __rcu *, sd_llc_shared); 1756994aeb7aSJoel Fernandes (Google) DECLARE_PER_CPU(struct sched_domain __rcu *, sd_numa); 1757994aeb7aSJoel Fernandes (Google) DECLARE_PER_CPU(struct sched_domain __rcu *, sd_asym_packing); 1758994aeb7aSJoel Fernandes (Google) DECLARE_PER_CPU(struct sched_domain __rcu *, sd_asym_cpucapacity); 1759df054e84SMorten Rasmussen extern struct static_key_false sched_asym_cpucapacity; 1760518cd623SPeter Zijlstra 176163b2ca30SNicolas Pitre struct sched_group_capacity { 17625e6521eaSLi Zefan atomic_t ref; 17635e6521eaSLi Zefan /* 1764172895e6SYuyang Du * CPU capacity of this group, SCHED_CAPACITY_SCALE being max capacity 176563b2ca30SNicolas Pitre * for a single CPU. 17665e6521eaSLi Zefan */ 1767bf475ce0SMorten Rasmussen unsigned long capacity; 1768bf475ce0SMorten Rasmussen unsigned long min_capacity; /* Min per-CPU capacity in group */ 1769e3d6d0cbSMorten Rasmussen unsigned long max_capacity; /* Max per-CPU capacity in group */ 17705e6521eaSLi Zefan unsigned long next_update; 177163b2ca30SNicolas Pitre int imbalance; /* XXX unrelated to capacity but shared group state */ 17725e6521eaSLi Zefan 1773005f874dSPeter Zijlstra #ifdef CONFIG_SCHED_DEBUG 1774005f874dSPeter Zijlstra int id; 1775005f874dSPeter Zijlstra #endif 1776005f874dSPeter Zijlstra 1777eba9f082Szhuguangqing unsigned long cpumask[]; /* Balance mask */ 17785e6521eaSLi Zefan }; 17795e6521eaSLi Zefan 17805e6521eaSLi Zefan struct sched_group { 17815e6521eaSLi Zefan struct sched_group *next; /* Must be a circular list */ 17825e6521eaSLi Zefan atomic_t ref; 17835e6521eaSLi Zefan 17845e6521eaSLi Zefan unsigned int group_weight; 178563b2ca30SNicolas Pitre struct sched_group_capacity *sgc; 178697fb7a0aSIngo Molnar int asym_prefer_cpu; /* CPU of highest priority in group */ 178716d364baSRicardo Neri int flags; 17885e6521eaSLi Zefan 17895e6521eaSLi Zefan /* 17905e6521eaSLi Zefan * The CPUs this group covers. 17915e6521eaSLi Zefan * 17925e6521eaSLi Zefan * NOTE: this field is variable length. 
(Allocated dynamically 17935e6521eaSLi Zefan * by attaching extra space to the end of the structure, 17945e6521eaSLi Zefan * depending on how many CPUs the kernel has booted up with) 17955e6521eaSLi Zefan */ 179604f5c362SGustavo A. R. Silva unsigned long cpumask[]; 17975e6521eaSLi Zefan }; 17985e6521eaSLi Zefan 1799ae4df9d6SPeter Zijlstra static inline struct cpumask *sched_group_span(struct sched_group *sg) 18005e6521eaSLi Zefan { 18015e6521eaSLi Zefan return to_cpumask(sg->cpumask); 18025e6521eaSLi Zefan } 18035e6521eaSLi Zefan 18045e6521eaSLi Zefan /* 1805e5c14b1fSPeter Zijlstra * See build_balance_mask(). 18065e6521eaSLi Zefan */ 1807e5c14b1fSPeter Zijlstra static inline struct cpumask *group_balance_mask(struct sched_group *sg) 18085e6521eaSLi Zefan { 180963b2ca30SNicolas Pitre return to_cpumask(sg->sgc->cpumask); 18105e6521eaSLi Zefan } 18115e6521eaSLi Zefan 18125e6521eaSLi Zefan /** 181397fb7a0aSIngo Molnar * group_first_cpu - Returns the first CPU in the cpumask of a sched_group. 181497fb7a0aSIngo Molnar * @group: The group whose first CPU is to be returned. 18155e6521eaSLi Zefan */ 18165e6521eaSLi Zefan static inline unsigned int group_first_cpu(struct sched_group *group) 18175e6521eaSLi Zefan { 1818ae4df9d6SPeter Zijlstra return cpumask_first(sched_group_span(group)); 18195e6521eaSLi Zefan } 18205e6521eaSLi Zefan 1821c1174876SPeter Zijlstra extern int group_balance_cpu(struct sched_group *sg); 1822c1174876SPeter Zijlstra 18233b87f136SPeter Zijlstra #ifdef CONFIG_SCHED_DEBUG 18243b87f136SPeter Zijlstra void update_sched_domain_debugfs(void); 1825bbdacdfeSPeter Zijlstra void dirty_sched_domain_sysctl(int cpu); 18263866e845SSteven Rostedt (Red Hat) #else 18273b87f136SPeter Zijlstra static inline void update_sched_domain_debugfs(void) 18283866e845SSteven Rostedt (Red Hat) { 18293866e845SSteven Rostedt (Red Hat) } 1830bbdacdfeSPeter Zijlstra static inline void dirty_sched_domain_sysctl(int cpu) 1831bbdacdfeSPeter Zijlstra { 1832bbdacdfeSPeter Zijlstra } 18333866e845SSteven Rostedt (Red Hat) #endif 18343866e845SSteven Rostedt (Red Hat) 18358a99b683SPeter Zijlstra extern int sched_update_scaling(void); 1836*d664e399SThomas Gleixner #endif /* CONFIG_SMP */ 1837391e43daSPeter Zijlstra 1838391e43daSPeter Zijlstra #include "stats.h" 1839391e43daSPeter Zijlstra 18404feee7d1SJosh Don #if defined(CONFIG_SCHED_CORE) && defined(CONFIG_SCHEDSTATS) 18414feee7d1SJosh Don 18424feee7d1SJosh Don extern void __sched_core_account_forceidle(struct rq *rq); 18434feee7d1SJosh Don 18444feee7d1SJosh Don static inline void sched_core_account_forceidle(struct rq *rq) 18454feee7d1SJosh Don { 18464feee7d1SJosh Don if (schedstat_enabled()) 18474feee7d1SJosh Don __sched_core_account_forceidle(rq); 18484feee7d1SJosh Don } 18494feee7d1SJosh Don 18504feee7d1SJosh Don extern void __sched_core_tick(struct rq *rq); 18514feee7d1SJosh Don 18524feee7d1SJosh Don static inline void sched_core_tick(struct rq *rq) 18534feee7d1SJosh Don { 18544feee7d1SJosh Don if (sched_core_enabled(rq) && schedstat_enabled()) 18554feee7d1SJosh Don __sched_core_tick(rq); 18564feee7d1SJosh Don } 18574feee7d1SJosh Don 18584feee7d1SJosh Don #else 18594feee7d1SJosh Don 18604feee7d1SJosh Don static inline void sched_core_account_forceidle(struct rq *rq) {} 18614feee7d1SJosh Don 18624feee7d1SJosh Don static inline void sched_core_tick(struct rq *rq) {} 18634feee7d1SJosh Don 18644feee7d1SJosh Don #endif /* CONFIG_SCHED_CORE && CONFIG_SCHEDSTATS */ 18654feee7d1SJosh Don 1866391e43daSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED 1867391e43daSPeter Zijlstra 
1868391e43daSPeter Zijlstra /* 1869391e43daSPeter Zijlstra * Return the group to which this task belongs. 1870391e43daSPeter Zijlstra * 18718af01f56STejun Heo * We cannot use task_css() and friends because the cgroup subsystem 18728af01f56STejun Heo * changes that value before the cgroup_subsys::attach() method is called, 18738af01f56STejun Heo * therefore we cannot pin it and might observe the wrong value. 18748323f26cSPeter Zijlstra * 18758323f26cSPeter Zijlstra * The same is true for autogroup's p->signal->autogroup->tg, the autogroup 18768323f26cSPeter Zijlstra * core changes this before calling sched_move_task(). 18778323f26cSPeter Zijlstra * 18788323f26cSPeter Zijlstra * Instead we use a 'copy' which is updated from sched_move_task() while 18798323f26cSPeter Zijlstra * holding both task_struct::pi_lock and rq::lock. 1880391e43daSPeter Zijlstra */ 1881391e43daSPeter Zijlstra static inline struct task_group *task_group(struct task_struct *p) 1882391e43daSPeter Zijlstra { 18838323f26cSPeter Zijlstra return p->sched_task_group; 1884391e43daSPeter Zijlstra } 1885391e43daSPeter Zijlstra 1886391e43daSPeter Zijlstra /* Change a task's cfs_rq and parent entity if it moves across CPUs/groups */ 1887391e43daSPeter Zijlstra static inline void set_task_rq(struct task_struct *p, unsigned int cpu) 1888391e43daSPeter Zijlstra { 1889391e43daSPeter Zijlstra #if defined(CONFIG_FAIR_GROUP_SCHED) || defined(CONFIG_RT_GROUP_SCHED) 1890391e43daSPeter Zijlstra struct task_group *tg = task_group(p); 1891391e43daSPeter Zijlstra #endif 1892391e43daSPeter Zijlstra 1893391e43daSPeter Zijlstra #ifdef CONFIG_FAIR_GROUP_SCHED 1894ad936d86SByungchul Park set_task_rq_fair(&p->se, p->se.cfs_rq, tg->cfs_rq[cpu]); 1895391e43daSPeter Zijlstra p->se.cfs_rq = tg->cfs_rq[cpu]; 1896391e43daSPeter Zijlstra p->se.parent = tg->se[cpu]; 1897391e43daSPeter Zijlstra #endif 1898391e43daSPeter Zijlstra 1899391e43daSPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED 1900391e43daSPeter Zijlstra p->rt.rt_rq = tg->rt_rq[cpu]; 1901391e43daSPeter Zijlstra p->rt.parent = tg->rt_se[cpu]; 1902391e43daSPeter Zijlstra #endif 1903391e43daSPeter Zijlstra } 1904391e43daSPeter Zijlstra 1905391e43daSPeter Zijlstra #else /* CONFIG_CGROUP_SCHED */ 1906391e43daSPeter Zijlstra 1907391e43daSPeter Zijlstra static inline void set_task_rq(struct task_struct *p, unsigned int cpu) { } 1908391e43daSPeter Zijlstra static inline struct task_group *task_group(struct task_struct *p) 1909391e43daSPeter Zijlstra { 1910391e43daSPeter Zijlstra return NULL; 1911391e43daSPeter Zijlstra } 1912391e43daSPeter Zijlstra 1913391e43daSPeter Zijlstra #endif /* CONFIG_CGROUP_SCHED */ 1914391e43daSPeter Zijlstra 1915391e43daSPeter Zijlstra static inline void __set_task_cpu(struct task_struct *p, unsigned int cpu) 1916391e43daSPeter Zijlstra { 1917391e43daSPeter Zijlstra set_task_rq(p, cpu); 1918391e43daSPeter Zijlstra #ifdef CONFIG_SMP 1919391e43daSPeter Zijlstra /* 1920391e43daSPeter Zijlstra * After ->cpu is set up to a new value, task_rq_lock(p, ...) can be 1921dfcb245eSIngo Molnar * successfully executed on another CPU. We must ensure that updates of 1922391e43daSPeter Zijlstra * per-task data have been completed by this moment.
1923391e43daSPeter Zijlstra */ 1924391e43daSPeter Zijlstra smp_wmb(); 1925c546951dSAndrea Parri WRITE_ONCE(task_thread_info(p)->cpu, cpu); 1926ac66f547SPeter Zijlstra p->wake_cpu = cpu; 1927391e43daSPeter Zijlstra #endif 1928391e43daSPeter Zijlstra } 1929391e43daSPeter Zijlstra 1930391e43daSPeter Zijlstra /* 1931391e43daSPeter Zijlstra * Tunables that become constants when CONFIG_SCHED_DEBUG is off: 1932391e43daSPeter Zijlstra */ 1933391e43daSPeter Zijlstra #ifdef CONFIG_SCHED_DEBUG 1934391e43daSPeter Zijlstra # define const_debug __read_mostly 1935391e43daSPeter Zijlstra #else 1936391e43daSPeter Zijlstra # define const_debug const 1937391e43daSPeter Zijlstra #endif 1938391e43daSPeter Zijlstra 1939391e43daSPeter Zijlstra #define SCHED_FEAT(name, enabled) \ 1940391e43daSPeter Zijlstra __SCHED_FEAT_##name , 1941391e43daSPeter Zijlstra 1942391e43daSPeter Zijlstra enum { 1943391e43daSPeter Zijlstra #include "features.h" 1944f8b6d1ccSPeter Zijlstra __SCHED_FEAT_NR, 1945391e43daSPeter Zijlstra }; 1946391e43daSPeter Zijlstra 1947391e43daSPeter Zijlstra #undef SCHED_FEAT 1948391e43daSPeter Zijlstra 1949a73f863aSJuri Lelli #ifdef CONFIG_SCHED_DEBUG 1950765cc3a4SPatrick Bellasi 1951765cc3a4SPatrick Bellasi /* 1952765cc3a4SPatrick Bellasi * To support run-time toggling of sched features, all the translation units 1953765cc3a4SPatrick Bellasi * (but core.c) reference the sysctl_sched_features defined in core.c. 1954765cc3a4SPatrick Bellasi */ 1955765cc3a4SPatrick Bellasi extern const_debug unsigned int sysctl_sched_features; 1956765cc3a4SPatrick Bellasi 1957a73f863aSJuri Lelli #ifdef CONFIG_JUMP_LABEL 1958f8b6d1ccSPeter Zijlstra #define SCHED_FEAT(name, enabled) \ 1959c5905afbSIngo Molnar static __always_inline bool static_branch_##name(struct static_key *key) \ 1960f8b6d1ccSPeter Zijlstra { \ 19616e76ea8aSJason Baron return static_key_##enabled(key); \ 1962f8b6d1ccSPeter Zijlstra } 1963f8b6d1ccSPeter Zijlstra 1964f8b6d1ccSPeter Zijlstra #include "features.h" 1965f8b6d1ccSPeter Zijlstra #undef SCHED_FEAT 1966f8b6d1ccSPeter Zijlstra 1967c5905afbSIngo Molnar extern struct static_key sched_feat_keys[__SCHED_FEAT_NR]; 1968f8b6d1ccSPeter Zijlstra #define sched_feat(x) (static_branch_##x(&sched_feat_keys[__SCHED_FEAT_##x])) 1969765cc3a4SPatrick Bellasi 1970a73f863aSJuri Lelli #else /* !CONFIG_JUMP_LABEL */ 1971a73f863aSJuri Lelli 1972a73f863aSJuri Lelli #define sched_feat(x) (sysctl_sched_features & (1UL << __SCHED_FEAT_##x)) 1973a73f863aSJuri Lelli 1974a73f863aSJuri Lelli #endif /* CONFIG_JUMP_LABEL */ 1975a73f863aSJuri Lelli 1976a73f863aSJuri Lelli #else /* !SCHED_DEBUG */ 1977765cc3a4SPatrick Bellasi 1978765cc3a4SPatrick Bellasi /* 1979765cc3a4SPatrick Bellasi * Each translation unit has its own copy of sysctl_sched_features to allow 1980765cc3a4SPatrick Bellasi * constants propagation at compile time and compiler optimization based on 1981765cc3a4SPatrick Bellasi * features default. 
1982765cc3a4SPatrick Bellasi */ 1983765cc3a4SPatrick Bellasi #define SCHED_FEAT(name, enabled) \ 1984765cc3a4SPatrick Bellasi (1UL << __SCHED_FEAT_##name) * enabled | 1985765cc3a4SPatrick Bellasi static const_debug __maybe_unused unsigned int sysctl_sched_features = 1986765cc3a4SPatrick Bellasi #include "features.h" 1987765cc3a4SPatrick Bellasi 0; 1988765cc3a4SPatrick Bellasi #undef SCHED_FEAT 1989765cc3a4SPatrick Bellasi 19907e6f4c5dSPeter Zijlstra #define sched_feat(x) !!(sysctl_sched_features & (1UL << __SCHED_FEAT_##x)) 1991765cc3a4SPatrick Bellasi 1992a73f863aSJuri Lelli #endif /* SCHED_DEBUG */ 1993391e43daSPeter Zijlstra 19942a595721SSrikar Dronamraju extern struct static_key_false sched_numa_balancing; 1995cb251765SMel Gorman extern struct static_key_false sched_schedstats; 1996cbee9f88SPeter Zijlstra 1997391e43daSPeter Zijlstra static inline u64 global_rt_period(void) 1998391e43daSPeter Zijlstra { 1999391e43daSPeter Zijlstra return (u64)sysctl_sched_rt_period * NSEC_PER_USEC; 2000391e43daSPeter Zijlstra } 2001391e43daSPeter Zijlstra 2002391e43daSPeter Zijlstra static inline u64 global_rt_runtime(void) 2003391e43daSPeter Zijlstra { 2004391e43daSPeter Zijlstra if (sysctl_sched_rt_runtime < 0) 2005391e43daSPeter Zijlstra return RUNTIME_INF; 2006391e43daSPeter Zijlstra 2007391e43daSPeter Zijlstra return (u64)sysctl_sched_rt_runtime * NSEC_PER_USEC; 2008391e43daSPeter Zijlstra } 2009391e43daSPeter Zijlstra 2010391e43daSPeter Zijlstra static inline int task_current(struct rq *rq, struct task_struct *p) 2011391e43daSPeter Zijlstra { 2012391e43daSPeter Zijlstra return rq->curr == p; 2013391e43daSPeter Zijlstra } 2014391e43daSPeter Zijlstra 2015391e43daSPeter Zijlstra static inline int task_running(struct rq *rq, struct task_struct *p) 2016391e43daSPeter Zijlstra { 2017391e43daSPeter Zijlstra #ifdef CONFIG_SMP 2018391e43daSPeter Zijlstra return p->on_cpu; 2019391e43daSPeter Zijlstra #else 2020391e43daSPeter Zijlstra return task_current(rq, p); 2021391e43daSPeter Zijlstra #endif 2022391e43daSPeter Zijlstra } 2023391e43daSPeter Zijlstra 2024da0c1e65SKirill Tkhai static inline int task_on_rq_queued(struct task_struct *p) 2025da0c1e65SKirill Tkhai { 2026da0c1e65SKirill Tkhai return p->on_rq == TASK_ON_RQ_QUEUED; 2027da0c1e65SKirill Tkhai } 2028391e43daSPeter Zijlstra 2029cca26e80SKirill Tkhai static inline int task_on_rq_migrating(struct task_struct *p) 2030cca26e80SKirill Tkhai { 2031c546951dSAndrea Parri return READ_ONCE(p->on_rq) == TASK_ON_RQ_MIGRATING; 2032cca26e80SKirill Tkhai } 2033cca26e80SKirill Tkhai 203417770579SValentin Schneider /* Wake flags. 
The first three directly map to some SD flag value */ 203517770579SValentin Schneider #define WF_EXEC 0x02 /* Wakeup after exec; maps to SD_BALANCE_EXEC */ 203617770579SValentin Schneider #define WF_FORK 0x04 /* Wakeup after fork; maps to SD_BALANCE_FORK */ 203717770579SValentin Schneider #define WF_TTWU 0x08 /* Wakeup; maps to SD_BALANCE_WAKE */ 203817770579SValentin Schneider 203917770579SValentin Schneider #define WF_SYNC 0x10 /* Waker goes to sleep after wakeup */ 204017770579SValentin Schneider #define WF_MIGRATED 0x20 /* Internal use, task got migrated */ 204117770579SValentin Schneider #define WF_ON_CPU 0x40 /* Wakee is on_cpu */ 204217770579SValentin Schneider 204317770579SValentin Schneider #ifdef CONFIG_SMP 204417770579SValentin Schneider static_assert(WF_EXEC == SD_BALANCE_EXEC); 204517770579SValentin Schneider static_assert(WF_FORK == SD_BALANCE_FORK); 204617770579SValentin Schneider static_assert(WF_TTWU == SD_BALANCE_WAKE); 204717770579SValentin Schneider #endif 2048b13095f0SLi Zefan 2049391e43daSPeter Zijlstra /* 2050391e43daSPeter Zijlstra * To aid in avoiding the subversion of "niceness" due to uneven distribution 2051391e43daSPeter Zijlstra * of tasks with abnormal "nice" values across CPUs the contribution that 2052391e43daSPeter Zijlstra * each task makes to its run queue's load is weighted according to its 2053391e43daSPeter Zijlstra * scheduling class and "nice" value. For SCHED_NORMAL tasks this is just a 2054391e43daSPeter Zijlstra * scaled version of the new time slice allocation that they receive on time 2055391e43daSPeter Zijlstra * slice expiry etc. 2056391e43daSPeter Zijlstra */ 2057391e43daSPeter Zijlstra 2058391e43daSPeter Zijlstra #define WEIGHT_IDLEPRIO 3 2059391e43daSPeter Zijlstra #define WMULT_IDLEPRIO 1431655765 2060391e43daSPeter Zijlstra 2061ed82b8a1SAndi Kleen extern const int sched_prio_to_weight[40]; 2062ed82b8a1SAndi Kleen extern const u32 sched_prio_to_wmult[40]; 2063391e43daSPeter Zijlstra 2064ff77e468SPeter Zijlstra /* 2065ff77e468SPeter Zijlstra * {de,en}queue flags: 2066ff77e468SPeter Zijlstra * 2067ff77e468SPeter Zijlstra * DEQUEUE_SLEEP - task is no longer runnable 2068ff77e468SPeter Zijlstra * ENQUEUE_WAKEUP - task just became runnable 2069ff77e468SPeter Zijlstra * 2070ff77e468SPeter Zijlstra * SAVE/RESTORE - an otherwise spurious dequeue/enqueue, done to ensure tasks 2071ff77e468SPeter Zijlstra * are in a known state which allows modification. Such pairs 2072ff77e468SPeter Zijlstra * should preserve as much state as possible. 2073ff77e468SPeter Zijlstra * 2074ff77e468SPeter Zijlstra * MOVE - paired with SAVE/RESTORE, explicitly does not preserve the location 2075ff77e468SPeter Zijlstra * in the runqueue. 
2076ff77e468SPeter Zijlstra * 2077ff77e468SPeter Zijlstra * ENQUEUE_HEAD - place at front of runqueue (tail if not specified) 2078ff77e468SPeter Zijlstra * ENQUEUE_REPLENISH - CBS (replenish runtime and postpone deadline) 207959efa0baSPeter Zijlstra * ENQUEUE_MIGRATED - the task was migrated during wakeup 2080ff77e468SPeter Zijlstra * 2081ff77e468SPeter Zijlstra */ 2082ff77e468SPeter Zijlstra 2083ff77e468SPeter Zijlstra #define DEQUEUE_SLEEP 0x01 208497fb7a0aSIngo Molnar #define DEQUEUE_SAVE 0x02 /* Matches ENQUEUE_RESTORE */ 208597fb7a0aSIngo Molnar #define DEQUEUE_MOVE 0x04 /* Matches ENQUEUE_MOVE */ 208697fb7a0aSIngo Molnar #define DEQUEUE_NOCLOCK 0x08 /* Matches ENQUEUE_NOCLOCK */ 2087ff77e468SPeter Zijlstra 20881de64443SPeter Zijlstra #define ENQUEUE_WAKEUP 0x01 2089ff77e468SPeter Zijlstra #define ENQUEUE_RESTORE 0x02 2090ff77e468SPeter Zijlstra #define ENQUEUE_MOVE 0x04 20910a67d1eeSPeter Zijlstra #define ENQUEUE_NOCLOCK 0x08 2092ff77e468SPeter Zijlstra 20930a67d1eeSPeter Zijlstra #define ENQUEUE_HEAD 0x10 20940a67d1eeSPeter Zijlstra #define ENQUEUE_REPLENISH 0x20 2095c82ba9faSLi Zefan #ifdef CONFIG_SMP 20960a67d1eeSPeter Zijlstra #define ENQUEUE_MIGRATED 0x40 2097c82ba9faSLi Zefan #else 209859efa0baSPeter Zijlstra #define ENQUEUE_MIGRATED 0x00 2099c82ba9faSLi Zefan #endif 2100c82ba9faSLi Zefan 210137e117c0SPeter Zijlstra #define RETRY_TASK ((void *)-1UL) 210237e117c0SPeter Zijlstra 2103c82ba9faSLi Zefan struct sched_class { 2104c82ba9faSLi Zefan 210569842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 210669842cbaSPatrick Bellasi int uclamp_enabled; 210769842cbaSPatrick Bellasi #endif 210869842cbaSPatrick Bellasi 2109c82ba9faSLi Zefan void (*enqueue_task) (struct rq *rq, struct task_struct *p, int flags); 2110c82ba9faSLi Zefan void (*dequeue_task) (struct rq *rq, struct task_struct *p, int flags); 2111c82ba9faSLi Zefan void (*yield_task) (struct rq *rq); 21120900acf2SDietmar Eggemann bool (*yield_to_task)(struct rq *rq, struct task_struct *p); 2113c82ba9faSLi Zefan 2114c82ba9faSLi Zefan void (*check_preempt_curr)(struct rq *rq, struct task_struct *p, int flags); 2115c82ba9faSLi Zefan 211698c2f700SPeter Zijlstra struct task_struct *(*pick_next_task)(struct rq *rq); 211798c2f700SPeter Zijlstra 21186e2df058SPeter Zijlstra void (*put_prev_task)(struct rq *rq, struct task_struct *p); 2119a0e813f2SPeter Zijlstra void (*set_next_task)(struct rq *rq, struct task_struct *p, bool first); 2120c82ba9faSLi Zefan 2121c82ba9faSLi Zefan #ifdef CONFIG_SMP 21226e2df058SPeter Zijlstra int (*balance)(struct rq *rq, struct task_struct *prev, struct rq_flags *rf); 21233aef1551SValentin Schneider int (*select_task_rq)(struct task_struct *p, int task_cpu, int flags); 212421f56ffeSPeter Zijlstra 212521f56ffeSPeter Zijlstra struct task_struct * (*pick_task)(struct rq *rq); 212621f56ffeSPeter Zijlstra 21271327237aSSrikar Dronamraju void (*migrate_task_rq)(struct task_struct *p, int new_cpu); 2128c82ba9faSLi Zefan 2129c82ba9faSLi Zefan void (*task_woken)(struct rq *this_rq, struct task_struct *task); 2130c82ba9faSLi Zefan 2131c82ba9faSLi Zefan void (*set_cpus_allowed)(struct task_struct *p, 21329cfc3e18SPeter Zijlstra const struct cpumask *newmask, 21339cfc3e18SPeter Zijlstra u32 flags); 2134c82ba9faSLi Zefan 2135c82ba9faSLi Zefan void (*rq_online)(struct rq *rq); 2136c82ba9faSLi Zefan void (*rq_offline)(struct rq *rq); 2137a7c81556SPeter Zijlstra 2138a7c81556SPeter Zijlstra struct rq *(*find_lock_rq)(struct task_struct *p, struct rq *rq); 2139c82ba9faSLi Zefan #endif 2140c82ba9faSLi Zefan 2141c82ba9faSLi Zefan 
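/*
 * Periodic bookkeeping: called with the rq lock held from scheduler_tick()
 * (queued == 0) and, when HRTICK is active, from the hrtick timer
 * (queued == 1).
 */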
void (*task_tick)(struct rq *rq, struct task_struct *p, int queued); 2142c82ba9faSLi Zefan void (*task_fork)(struct task_struct *p); 2143e6c390f2SDario Faggioli void (*task_dead)(struct task_struct *p); 2144c82ba9faSLi Zefan 214567dfa1b7SKirill Tkhai /* 214667dfa1b7SKirill Tkhai * The switched_from() call is allowed to drop rq->lock, therefore we 21473b03706fSIngo Molnar * cannot assume the switched_from/switched_to pair is serialized by 214867dfa1b7SKirill Tkhai * rq->lock. They are however serialized by p->pi_lock. 214967dfa1b7SKirill Tkhai */ 2150c82ba9faSLi Zefan void (*switched_from)(struct rq *this_rq, struct task_struct *task); 2151c82ba9faSLi Zefan void (*switched_to) (struct rq *this_rq, struct task_struct *task); 2152c82ba9faSLi Zefan void (*prio_changed) (struct rq *this_rq, struct task_struct *task, 2153c82ba9faSLi Zefan int oldprio); 2154c82ba9faSLi Zefan 2155c82ba9faSLi Zefan unsigned int (*get_rr_interval)(struct rq *rq, 2156c82ba9faSLi Zefan struct task_struct *task); 2157c82ba9faSLi Zefan 21586e998916SStanislaw Gruszka void (*update_curr)(struct rq *rq); 21596e998916SStanislaw Gruszka 2160ea86cb4bSVincent Guittot #define TASK_SET_GROUP 0 2161ea86cb4bSVincent Guittot #define TASK_MOVE_GROUP 1 2162ea86cb4bSVincent Guittot 2163c82ba9faSLi Zefan #ifdef CONFIG_FAIR_GROUP_SCHED 2164ea86cb4bSVincent Guittot void (*task_change_group)(struct task_struct *p, int type); 2165c82ba9faSLi Zefan #endif 216643c31ac0SPeter Zijlstra }; 2167391e43daSPeter Zijlstra 21683f1d2a31SPeter Zijlstra static inline void put_prev_task(struct rq *rq, struct task_struct *prev) 21693f1d2a31SPeter Zijlstra { 217010e7071bSPeter Zijlstra WARN_ON_ONCE(rq->curr != prev); 21716e2df058SPeter Zijlstra prev->sched_class->put_prev_task(rq, prev); 21723f1d2a31SPeter Zijlstra } 21733f1d2a31SPeter Zijlstra 217403b7fad1SPeter Zijlstra static inline void set_next_task(struct rq *rq, struct task_struct *next) 2175b2bf6c31SPeter Zijlstra { 2176a0e813f2SPeter Zijlstra next->sched_class->set_next_task(rq, next, false); 2177b2bf6c31SPeter Zijlstra } 2178b2bf6c31SPeter Zijlstra 217943c31ac0SPeter Zijlstra 218043c31ac0SPeter Zijlstra /* 218143c31ac0SPeter Zijlstra * Helper to define a sched_class instance; each one is placed in a separate 218243c31ac0SPeter Zijlstra * section which is ordered by the linker script: 218343c31ac0SPeter Zijlstra * 218443c31ac0SPeter Zijlstra * include/asm-generic/vmlinux.lds.h 218543c31ac0SPeter Zijlstra * 218643c31ac0SPeter Zijlstra * Also enforce alignment on the instance, not the type, to guarantee layout. 
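 *
 * Typical usage (see e.g. fair.c):
 *
 *	DEFINE_SCHED_CLASS(fair) = {
 *		.enqueue_task	= enqueue_task_fair,
 *		...
 *	};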
218743c31ac0SPeter Zijlstra */ 218843c31ac0SPeter Zijlstra #define DEFINE_SCHED_CLASS(name) \ 218943c31ac0SPeter Zijlstra const struct sched_class name##_sched_class \ 219043c31ac0SPeter Zijlstra __aligned(__alignof__(struct sched_class)) \ 219143c31ac0SPeter Zijlstra __section("__" #name "_sched_class") 219243c31ac0SPeter Zijlstra 2193c3a340f7SSteven Rostedt (VMware) /* Defined in include/asm-generic/vmlinux.lds.h */ 2194c3a340f7SSteven Rostedt (VMware) extern struct sched_class __begin_sched_classes[]; 2195c3a340f7SSteven Rostedt (VMware) extern struct sched_class __end_sched_classes[]; 2196c3a340f7SSteven Rostedt (VMware) 2197c3a340f7SSteven Rostedt (VMware) #define sched_class_highest (__end_sched_classes - 1) 2198c3a340f7SSteven Rostedt (VMware) #define sched_class_lowest (__begin_sched_classes - 1) 21996e2df058SPeter Zijlstra 22006e2df058SPeter Zijlstra #define for_class_range(class, _from, _to) \ 2201c3a340f7SSteven Rostedt (VMware) for (class = (_from); class != (_to); class--) 22026e2df058SPeter Zijlstra 2203391e43daSPeter Zijlstra #define for_each_class(class) \ 2204c3a340f7SSteven Rostedt (VMware) for_class_range(class, sched_class_highest, sched_class_lowest) 2205391e43daSPeter Zijlstra 2206391e43daSPeter Zijlstra extern const struct sched_class stop_sched_class; 2207aab03e05SDario Faggioli extern const struct sched_class dl_sched_class; 2208391e43daSPeter Zijlstra extern const struct sched_class rt_sched_class; 2209391e43daSPeter Zijlstra extern const struct sched_class fair_sched_class; 2210391e43daSPeter Zijlstra extern const struct sched_class idle_sched_class; 2211391e43daSPeter Zijlstra 22126e2df058SPeter Zijlstra static inline bool sched_stop_runnable(struct rq *rq) 22136e2df058SPeter Zijlstra { 22146e2df058SPeter Zijlstra return rq->stop && task_on_rq_queued(rq->stop); 22156e2df058SPeter Zijlstra } 22166e2df058SPeter Zijlstra 22176e2df058SPeter Zijlstra static inline bool sched_dl_runnable(struct rq *rq) 22186e2df058SPeter Zijlstra { 22196e2df058SPeter Zijlstra return rq->dl.dl_nr_running > 0; 22206e2df058SPeter Zijlstra } 22216e2df058SPeter Zijlstra 22226e2df058SPeter Zijlstra static inline bool sched_rt_runnable(struct rq *rq) 22236e2df058SPeter Zijlstra { 22246e2df058SPeter Zijlstra return rq->rt.rt_queued > 0; 22256e2df058SPeter Zijlstra } 22266e2df058SPeter Zijlstra 22276e2df058SPeter Zijlstra static inline bool sched_fair_runnable(struct rq *rq) 22286e2df058SPeter Zijlstra { 22296e2df058SPeter Zijlstra return rq->cfs.nr_running > 0; 22306e2df058SPeter Zijlstra } 2231391e43daSPeter Zijlstra 22325d7d6056SPeter Zijlstra extern struct task_struct *pick_next_task_fair(struct rq *rq, struct task_struct *prev, struct rq_flags *rf); 223398c2f700SPeter Zijlstra extern struct task_struct *pick_next_task_idle(struct rq *rq); 22345d7d6056SPeter Zijlstra 2235af449901SPeter Zijlstra #define SCA_CHECK 0x01 2236af449901SPeter Zijlstra #define SCA_MIGRATE_DISABLE 0x02 2237af449901SPeter Zijlstra #define SCA_MIGRATE_ENABLE 0x04 223807ec77a1SWill Deacon #define SCA_USER 0x08 2239af449901SPeter Zijlstra 2240391e43daSPeter Zijlstra #ifdef CONFIG_SMP 2241391e43daSPeter Zijlstra 224263b2ca30SNicolas Pitre extern void update_group_capacity(struct sched_domain *sd, int cpu); 2243b719203bSLi Zefan 22447caff66fSDaniel Lezcano extern void trigger_load_balance(struct rq *rq); 2245391e43daSPeter Zijlstra 22469cfc3e18SPeter Zijlstra extern void set_cpus_allowed_common(struct task_struct *p, const struct cpumask *new_mask, u32 flags); 2247c5b28038SPeter Zijlstra 2248a7c81556SPeter Zijlstra 
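/*
 * Grab a reference on rq->curr if it is a candidate for being pushed away:
 * returns NULL when a push is already in flight (rq->push_busy), or when the
 * task is restricted to a single CPU or has migration disabled. On success
 * the caller owns a task reference and is expected to clear rq->push_busy
 * again, typically from push_cpu_stop().
 */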
static inline struct task_struct *get_push_task(struct rq *rq) 2249a7c81556SPeter Zijlstra { 2250a7c81556SPeter Zijlstra struct task_struct *p = rq->curr; 2251a7c81556SPeter Zijlstra 22525cb9eaa3SPeter Zijlstra lockdep_assert_rq_held(rq); 2253a7c81556SPeter Zijlstra 2254a7c81556SPeter Zijlstra if (rq->push_busy) 2255a7c81556SPeter Zijlstra return NULL; 2256a7c81556SPeter Zijlstra 2257a7c81556SPeter Zijlstra if (p->nr_cpus_allowed == 1) 2258a7c81556SPeter Zijlstra return NULL; 2259a7c81556SPeter Zijlstra 2260e681dcbaSSebastian Andrzej Siewior if (p->migration_disabled) 2261e681dcbaSSebastian Andrzej Siewior return NULL; 2262e681dcbaSSebastian Andrzej Siewior 2263a7c81556SPeter Zijlstra rq->push_busy = true; 2264a7c81556SPeter Zijlstra return get_task_struct(p); 2265a7c81556SPeter Zijlstra } 2266a7c81556SPeter Zijlstra 2267a7c81556SPeter Zijlstra extern int push_cpu_stop(void *arg); 2268dc877341SPeter Zijlstra 2269391e43daSPeter Zijlstra #endif 2270391e43daSPeter Zijlstra 2271442bf3aaSDaniel Lezcano #ifdef CONFIG_CPU_IDLE 2272442bf3aaSDaniel Lezcano static inline void idle_set_state(struct rq *rq, 2273442bf3aaSDaniel Lezcano struct cpuidle_state *idle_state) 2274442bf3aaSDaniel Lezcano { 2275442bf3aaSDaniel Lezcano rq->idle_state = idle_state; 2276442bf3aaSDaniel Lezcano } 2277442bf3aaSDaniel Lezcano 2278442bf3aaSDaniel Lezcano static inline struct cpuidle_state *idle_get_state(struct rq *rq) 2279442bf3aaSDaniel Lezcano { 22809148a3a1SPeter Zijlstra SCHED_WARN_ON(!rcu_read_lock_held()); 228197fb7a0aSIngo Molnar 2282442bf3aaSDaniel Lezcano return rq->idle_state; 2283442bf3aaSDaniel Lezcano } 2284442bf3aaSDaniel Lezcano #else 2285442bf3aaSDaniel Lezcano static inline void idle_set_state(struct rq *rq, 2286442bf3aaSDaniel Lezcano struct cpuidle_state *idle_state) 2287442bf3aaSDaniel Lezcano { 2288442bf3aaSDaniel Lezcano } 2289442bf3aaSDaniel Lezcano 2290442bf3aaSDaniel Lezcano static inline struct cpuidle_state *idle_get_state(struct rq *rq) 2291442bf3aaSDaniel Lezcano { 2292442bf3aaSDaniel Lezcano return NULL; 2293442bf3aaSDaniel Lezcano } 2294442bf3aaSDaniel Lezcano #endif 2295442bf3aaSDaniel Lezcano 22968663effbSSteven Rostedt (VMware) extern void schedule_idle(void); 22978663effbSSteven Rostedt (VMware) 2298391e43daSPeter Zijlstra extern void sysrq_sched_debug_show(void); 2299391e43daSPeter Zijlstra extern void sched_init_granularity(void); 2300391e43daSPeter Zijlstra extern void update_max_interval(void); 23011baca4ceSJuri Lelli 23021baca4ceSJuri Lelli extern void init_sched_dl_class(void); 2303391e43daSPeter Zijlstra extern void init_sched_rt_class(void); 2304391e43daSPeter Zijlstra extern void init_sched_fair_class(void); 2305391e43daSPeter Zijlstra 23069059393eSVincent Guittot extern void reweight_task(struct task_struct *p, int prio); 23079059393eSVincent Guittot 23088875125eSKirill Tkhai extern void resched_curr(struct rq *rq); 2309391e43daSPeter Zijlstra extern void resched_cpu(int cpu); 2310391e43daSPeter Zijlstra 2311391e43daSPeter Zijlstra extern struct rt_bandwidth def_rt_bandwidth; 2312391e43daSPeter Zijlstra extern void init_rt_bandwidth(struct rt_bandwidth *rt_b, u64 period, u64 runtime); 2313*d664e399SThomas Gleixner extern bool sched_rt_bandwidth_account(struct rt_rq *rt_rq); 2314391e43daSPeter Zijlstra 2315332ac17eSDario Faggioli extern void init_dl_bandwidth(struct dl_bandwidth *dl_b, u64 period, u64 runtime); 2316aab03e05SDario Faggioli extern void init_dl_task_timer(struct sched_dl_entity *dl_se); 2317209a0cbdSLuca Abeni extern void init_dl_inactive_task_timer(struct 
sched_dl_entity *dl_se); 2318aab03e05SDario Faggioli 2319c52f14d3SLuca Abeni #define BW_SHIFT 20 2320c52f14d3SLuca Abeni #define BW_UNIT (1 << BW_SHIFT) 23214da3abceSLuca Abeni #define RATIO_SHIFT 8 2322d505b8afSHuaixin Chang #define MAX_BW_BITS (64 - BW_SHIFT) 2323d505b8afSHuaixin Chang #define MAX_BW ((1ULL << MAX_BW_BITS) - 1) 2324332ac17eSDario Faggioli unsigned long to_ratio(u64 period, u64 runtime); 2325332ac17eSDario Faggioli 2326540247fbSYuyang Du extern void init_entity_runnable_average(struct sched_entity *se); 2327d0fe0b9cSDietmar Eggemann extern void post_init_entity_util_avg(struct task_struct *p); 2328a75cdaa9SAlex Shi 232976d92ac3SFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL 233076d92ac3SFrederic Weisbecker extern bool sched_can_stop_tick(struct rq *rq); 2331d84b3131SFrederic Weisbecker extern int __init sched_tick_offload_init(void); 233276d92ac3SFrederic Weisbecker 233376d92ac3SFrederic Weisbecker /* 233476d92ac3SFrederic Weisbecker * Tick may be needed by tasks in the runqueue depending on their policy and 233576d92ac3SFrederic Weisbecker * requirements. If tick is needed, lets send the target an IPI to kick it out of 233676d92ac3SFrederic Weisbecker * nohz mode if necessary. 233776d92ac3SFrederic Weisbecker */ 233876d92ac3SFrederic Weisbecker static inline void sched_update_tick_dependency(struct rq *rq) 233976d92ac3SFrederic Weisbecker { 234021a6ee14SMiaohe Lin int cpu = cpu_of(rq); 234176d92ac3SFrederic Weisbecker 234276d92ac3SFrederic Weisbecker if (!tick_nohz_full_cpu(cpu)) 234376d92ac3SFrederic Weisbecker return; 234476d92ac3SFrederic Weisbecker 234576d92ac3SFrederic Weisbecker if (sched_can_stop_tick(rq)) 234676d92ac3SFrederic Weisbecker tick_nohz_dep_clear_cpu(cpu, TICK_DEP_BIT_SCHED); 234776d92ac3SFrederic Weisbecker else 234876d92ac3SFrederic Weisbecker tick_nohz_dep_set_cpu(cpu, TICK_DEP_BIT_SCHED); 234976d92ac3SFrederic Weisbecker } 235076d92ac3SFrederic Weisbecker #else 2351d84b3131SFrederic Weisbecker static inline int sched_tick_offload_init(void) { return 0; } 235276d92ac3SFrederic Weisbecker static inline void sched_update_tick_dependency(struct rq *rq) { } 235376d92ac3SFrederic Weisbecker #endif 235476d92ac3SFrederic Weisbecker 235572465447SKirill Tkhai static inline void add_nr_running(struct rq *rq, unsigned count) 2356391e43daSPeter Zijlstra { 235772465447SKirill Tkhai unsigned prev_nr = rq->nr_running; 235872465447SKirill Tkhai 235972465447SKirill Tkhai rq->nr_running = prev_nr + count; 23609d246053SPhil Auld if (trace_sched_update_nr_running_tp_enabled()) { 23619d246053SPhil Auld call_trace_sched_update_nr_running(rq, count); 23629d246053SPhil Auld } 23639f3660c2SFrederic Weisbecker 23644486edd1STim Chen #ifdef CONFIG_SMP 23653e184501SViresh Kumar if (prev_nr < 2 && rq->nr_running >= 2) { 2366e90c8fe1SValentin Schneider if (!READ_ONCE(rq->rd->overload)) 2367e90c8fe1SValentin Schneider WRITE_ONCE(rq->rd->overload, 1); 236876d92ac3SFrederic Weisbecker } 23693e184501SViresh Kumar #endif 23704486edd1STim Chen 237176d92ac3SFrederic Weisbecker sched_update_tick_dependency(rq); 23724486edd1STim Chen } 2373391e43daSPeter Zijlstra 237472465447SKirill Tkhai static inline void sub_nr_running(struct rq *rq, unsigned count) 2375391e43daSPeter Zijlstra { 237672465447SKirill Tkhai rq->nr_running -= count; 23779d246053SPhil Auld if (trace_sched_update_nr_running_tp_enabled()) { 2378a1bd0685SPhil Auld call_trace_sched_update_nr_running(rq, -count); 23799d246053SPhil Auld } 23809d246053SPhil Auld 238176d92ac3SFrederic Weisbecker /* Check if we still need preemption 
*/ 238276d92ac3SFrederic Weisbecker sched_update_tick_dependency(rq); 2383391e43daSPeter Zijlstra } 2384391e43daSPeter Zijlstra 2385391e43daSPeter Zijlstra extern void activate_task(struct rq *rq, struct task_struct *p, int flags); 2386391e43daSPeter Zijlstra extern void deactivate_task(struct rq *rq, struct task_struct *p, int flags); 2387391e43daSPeter Zijlstra 2388391e43daSPeter Zijlstra extern void check_preempt_curr(struct rq *rq, struct task_struct *p, int flags); 2389391e43daSPeter Zijlstra 2390391e43daSPeter Zijlstra extern const_debug unsigned int sysctl_sched_nr_migrate; 2391391e43daSPeter Zijlstra extern const_debug unsigned int sysctl_sched_migration_cost; 2392391e43daSPeter Zijlstra 239318765447SHailong Liu #ifdef CONFIG_SCHED_DEBUG 239418765447SHailong Liu extern unsigned int sysctl_sched_latency; 239518765447SHailong Liu extern unsigned int sysctl_sched_min_granularity; 239651ce83edSJosh Don extern unsigned int sysctl_sched_idle_min_granularity; 239718765447SHailong Liu extern unsigned int sysctl_sched_wakeup_granularity; 239818765447SHailong Liu extern int sysctl_resched_latency_warn_ms; 239918765447SHailong Liu extern int sysctl_resched_latency_warn_once; 240018765447SHailong Liu 240118765447SHailong Liu extern unsigned int sysctl_sched_tunable_scaling; 240218765447SHailong Liu 240318765447SHailong Liu extern unsigned int sysctl_numa_balancing_scan_delay; 240418765447SHailong Liu extern unsigned int sysctl_numa_balancing_scan_period_min; 240518765447SHailong Liu extern unsigned int sysctl_numa_balancing_scan_period_max; 240618765447SHailong Liu extern unsigned int sysctl_numa_balancing_scan_size; 240718765447SHailong Liu #endif 240818765447SHailong Liu 2409391e43daSPeter Zijlstra #ifdef CONFIG_SCHED_HRTICK 2410391e43daSPeter Zijlstra 2411391e43daSPeter Zijlstra /* 2412391e43daSPeter Zijlstra * Use hrtick when: 2413391e43daSPeter Zijlstra * - enabled by features 2414391e43daSPeter Zijlstra * - hrtimer is actually high res 2415391e43daSPeter Zijlstra */ 2416391e43daSPeter Zijlstra static inline int hrtick_enabled(struct rq *rq) 2417391e43daSPeter Zijlstra { 2418391e43daSPeter Zijlstra if (!cpu_active(cpu_of(rq))) 2419391e43daSPeter Zijlstra return 0; 2420391e43daSPeter Zijlstra return hrtimer_is_hres_active(&rq->hrtick_timer); 2421391e43daSPeter Zijlstra } 2422391e43daSPeter Zijlstra 2423e0ee463cSJuri Lelli static inline int hrtick_enabled_fair(struct rq *rq) 2424e0ee463cSJuri Lelli { 2425e0ee463cSJuri Lelli if (!sched_feat(HRTICK)) 2426e0ee463cSJuri Lelli return 0; 2427e0ee463cSJuri Lelli return hrtick_enabled(rq); 2428e0ee463cSJuri Lelli } 2429e0ee463cSJuri Lelli 2430e0ee463cSJuri Lelli static inline int hrtick_enabled_dl(struct rq *rq) 2431e0ee463cSJuri Lelli { 2432e0ee463cSJuri Lelli if (!sched_feat(HRTICK_DL)) 2433e0ee463cSJuri Lelli return 0; 2434e0ee463cSJuri Lelli return hrtick_enabled(rq); 2435e0ee463cSJuri Lelli } 2436e0ee463cSJuri Lelli 2437391e43daSPeter Zijlstra void hrtick_start(struct rq *rq, u64 delay); 2438391e43daSPeter Zijlstra 2439b39e66eaSMike Galbraith #else 2440b39e66eaSMike Galbraith 2441e0ee463cSJuri Lelli static inline int hrtick_enabled_fair(struct rq *rq) 2442e0ee463cSJuri Lelli { 2443e0ee463cSJuri Lelli return 0; 2444e0ee463cSJuri Lelli } 2445e0ee463cSJuri Lelli 2446e0ee463cSJuri Lelli static inline int hrtick_enabled_dl(struct rq *rq) 2447e0ee463cSJuri Lelli { 2448e0ee463cSJuri Lelli return 0; 2449e0ee463cSJuri Lelli } 2450e0ee463cSJuri Lelli 2451b39e66eaSMike Galbraith static inline int hrtick_enabled(struct rq *rq) 2452b39e66eaSMike Galbraith 
{ 2453b39e66eaSMike Galbraith return 0; 2454b39e66eaSMike Galbraith } 2455b39e66eaSMike Galbraith 2456391e43daSPeter Zijlstra #endif /* CONFIG_SCHED_HRTICK */ 2457391e43daSPeter Zijlstra 24581567c3e3SGiovanni Gherdovich #ifndef arch_scale_freq_tick 24591567c3e3SGiovanni Gherdovich static __always_inline 24601567c3e3SGiovanni Gherdovich void arch_scale_freq_tick(void) 24611567c3e3SGiovanni Gherdovich { 24621567c3e3SGiovanni Gherdovich } 24631567c3e3SGiovanni Gherdovich #endif 24641567c3e3SGiovanni Gherdovich 2465dfbca41fSPeter Zijlstra #ifndef arch_scale_freq_capacity 2466f4470cdfSValentin Schneider /** 2467f4470cdfSValentin Schneider * arch_scale_freq_capacity - get the frequency scale factor of a given CPU. 2468f4470cdfSValentin Schneider * @cpu: the CPU in question. 2469f4470cdfSValentin Schneider * 2470f4470cdfSValentin Schneider * Return: the frequency scale factor normalized against SCHED_CAPACITY_SCALE, i.e. 2471f4470cdfSValentin Schneider * 2472f4470cdfSValentin Schneider * f_curr 2473f4470cdfSValentin Schneider * ------ * SCHED_CAPACITY_SCALE 2474f4470cdfSValentin Schneider * f_max 2475f4470cdfSValentin Schneider */ 2476dfbca41fSPeter Zijlstra static __always_inline 24777673c8a4SJuri Lelli unsigned long arch_scale_freq_capacity(int cpu) 2478dfbca41fSPeter Zijlstra { 2479dfbca41fSPeter Zijlstra return SCHED_CAPACITY_SCALE; 2480dfbca41fSPeter Zijlstra } 2481dfbca41fSPeter Zijlstra #endif 2482b5b4860dSVincent Guittot 2483391e43daSPeter Zijlstra 2484d66f1b06SPeter Zijlstra #ifdef CONFIG_SMP 2485d66f1b06SPeter Zijlstra 2486d66f1b06SPeter Zijlstra static inline bool rq_order_less(struct rq *rq1, struct rq *rq2) 2487d66f1b06SPeter Zijlstra { 24889edeaea1SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 24899edeaea1SPeter Zijlstra /* 24909edeaea1SPeter Zijlstra * In order to not have {0,2},{1,3} turn into an AB-BA, 24919edeaea1SPeter Zijlstra * order by core-id first and cpu-id second. 24929edeaea1SPeter Zijlstra * 24939edeaea1SPeter Zijlstra * Notably: 24949edeaea1SPeter Zijlstra * 24959edeaea1SPeter Zijlstra * double_rq_lock(0,3); will take core-0, core-1 lock 24969edeaea1SPeter Zijlstra * double_rq_lock(1,2); will take core-1, core-0 lock 24979edeaea1SPeter Zijlstra * 24989edeaea1SPeter Zijlstra * when only cpu-id is considered. 24999edeaea1SPeter Zijlstra */ 25009edeaea1SPeter Zijlstra if (rq1->core->cpu < rq2->core->cpu) 25019edeaea1SPeter Zijlstra return true; 25029edeaea1SPeter Zijlstra if (rq1->core->cpu > rq2->core->cpu) 25039edeaea1SPeter Zijlstra return false; 25049edeaea1SPeter Zijlstra 25059edeaea1SPeter Zijlstra /* 25069edeaea1SPeter Zijlstra * __sched_core_flip() relies on SMT having cpu-id lock order. 25079edeaea1SPeter Zijlstra */ 25089edeaea1SPeter Zijlstra #endif 2509d66f1b06SPeter Zijlstra return rq1->cpu < rq2->cpu; 2510d66f1b06SPeter Zijlstra } 2511d66f1b06SPeter Zijlstra 2512d66f1b06SPeter Zijlstra extern void double_rq_lock(struct rq *rq1, struct rq *rq2); 2513d66f1b06SPeter Zijlstra 2514d66f1b06SPeter Zijlstra #ifdef CONFIG_PREEMPTION 2515391e43daSPeter Zijlstra 2516391e43daSPeter Zijlstra /* 2517391e43daSPeter Zijlstra * fair double_lock_balance: Safely acquires both rq->locks in a fair 2518391e43daSPeter Zijlstra * way at the expense of forcing extra atomic operations in all 2519391e43daSPeter Zijlstra * invocations. This assures that the double_lock is acquired using the 2520391e43daSPeter Zijlstra * same underlying policy as the spinlock_t on this architecture, which 2521391e43daSPeter Zijlstra * reduces latency compared to the unfair variant below.
However, it 2522391e43daSPeter Zijlstra * also adds more overhead and therefore may reduce throughput. 2523391e43daSPeter Zijlstra */ 2524391e43daSPeter Zijlstra static inline int _double_lock_balance(struct rq *this_rq, struct rq *busiest) 2525391e43daSPeter Zijlstra __releases(this_rq->lock) 2526391e43daSPeter Zijlstra __acquires(busiest->lock) 2527391e43daSPeter Zijlstra __acquires(this_rq->lock) 2528391e43daSPeter Zijlstra { 25295cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(this_rq); 2530391e43daSPeter Zijlstra double_rq_lock(this_rq, busiest); 2531391e43daSPeter Zijlstra 2532391e43daSPeter Zijlstra return 1; 2533391e43daSPeter Zijlstra } 2534391e43daSPeter Zijlstra 2535391e43daSPeter Zijlstra #else 2536391e43daSPeter Zijlstra /* 2537391e43daSPeter Zijlstra * Unfair double_lock_balance: Optimizes throughput at the expense of 2538391e43daSPeter Zijlstra * latency by eliminating extra atomic operations when the locks are 253997fb7a0aSIngo Molnar * already in proper order on entry. This favors lower CPU-ids and will 254097fb7a0aSIngo Molnar * grant the double lock to lower CPUs over higher ids under contention, 2541391e43daSPeter Zijlstra * regardless of entry order into the function. 2542391e43daSPeter Zijlstra */ 2543391e43daSPeter Zijlstra static inline int _double_lock_balance(struct rq *this_rq, struct rq *busiest) 2544391e43daSPeter Zijlstra __releases(this_rq->lock) 2545391e43daSPeter Zijlstra __acquires(busiest->lock) 2546391e43daSPeter Zijlstra __acquires(this_rq->lock) 2547391e43daSPeter Zijlstra { 25489ef7e7e3SPeter Zijlstra if (__rq_lockp(this_rq) == __rq_lockp(busiest)) 25495cb9eaa3SPeter Zijlstra return 0; 2550391e43daSPeter Zijlstra 25515cb9eaa3SPeter Zijlstra if (likely(raw_spin_rq_trylock(busiest))) 25525cb9eaa3SPeter Zijlstra return 0; 25535cb9eaa3SPeter Zijlstra 2554d66f1b06SPeter Zijlstra if (rq_order_less(this_rq, busiest)) { 25555cb9eaa3SPeter Zijlstra raw_spin_rq_lock_nested(busiest, SINGLE_DEPTH_NESTING); 25565cb9eaa3SPeter Zijlstra return 0; 2557391e43daSPeter Zijlstra } 25585cb9eaa3SPeter Zijlstra 25595cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(this_rq); 2560d66f1b06SPeter Zijlstra double_rq_lock(this_rq, busiest); 25615cb9eaa3SPeter Zijlstra 25625cb9eaa3SPeter Zijlstra return 1; 2563391e43daSPeter Zijlstra } 2564391e43daSPeter Zijlstra 2565c1a280b6SThomas Gleixner #endif /* CONFIG_PREEMPTION */ 2566391e43daSPeter Zijlstra 2567391e43daSPeter Zijlstra /* 2568391e43daSPeter Zijlstra * double_lock_balance - lock the busiest runqueue, this_rq is locked already. 
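 *
 * Typical calling pattern (an illustrative sketch, not a verbatim caller):
 * this_rq->lock is held on entry; a non-zero return value means that lock was
 * dropped and re-acquired, so rq state observed beforehand must be
 * re-validated:
 *
 *	if (double_lock_balance(this_rq, busiest))
 *		...re-check this_rq and the task being moved...
 *
 *	...pull or push tasks between the two runqueues...
 *	double_unlock_balance(this_rq, busiest);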
2569391e43daSPeter Zijlstra */ 2570391e43daSPeter Zijlstra static inline int double_lock_balance(struct rq *this_rq, struct rq *busiest) 2571391e43daSPeter Zijlstra { 25725cb9eaa3SPeter Zijlstra lockdep_assert_irqs_disabled(); 2573391e43daSPeter Zijlstra 2574391e43daSPeter Zijlstra return _double_lock_balance(this_rq, busiest); 2575391e43daSPeter Zijlstra } 2576391e43daSPeter Zijlstra 2577391e43daSPeter Zijlstra static inline void double_unlock_balance(struct rq *this_rq, struct rq *busiest) 2578391e43daSPeter Zijlstra __releases(busiest->lock) 2579391e43daSPeter Zijlstra { 25809ef7e7e3SPeter Zijlstra if (__rq_lockp(this_rq) != __rq_lockp(busiest)) 25815cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(busiest); 25829ef7e7e3SPeter Zijlstra lock_set_subclass(&__rq_lockp(this_rq)->dep_map, 0, _RET_IP_); 2583391e43daSPeter Zijlstra } 2584391e43daSPeter Zijlstra 258574602315SPeter Zijlstra static inline void double_lock(spinlock_t *l1, spinlock_t *l2) 258674602315SPeter Zijlstra { 258774602315SPeter Zijlstra if (l1 > l2) 258874602315SPeter Zijlstra swap(l1, l2); 258974602315SPeter Zijlstra 259074602315SPeter Zijlstra spin_lock(l1); 259174602315SPeter Zijlstra spin_lock_nested(l2, SINGLE_DEPTH_NESTING); 259274602315SPeter Zijlstra } 259374602315SPeter Zijlstra 259460e69eedSMike Galbraith static inline void double_lock_irq(spinlock_t *l1, spinlock_t *l2) 259560e69eedSMike Galbraith { 259660e69eedSMike Galbraith if (l1 > l2) 259760e69eedSMike Galbraith swap(l1, l2); 259860e69eedSMike Galbraith 259960e69eedSMike Galbraith spin_lock_irq(l1); 260060e69eedSMike Galbraith spin_lock_nested(l2, SINGLE_DEPTH_NESTING); 260160e69eedSMike Galbraith } 260260e69eedSMike Galbraith 260374602315SPeter Zijlstra static inline void double_raw_lock(raw_spinlock_t *l1, raw_spinlock_t *l2) 260474602315SPeter Zijlstra { 260574602315SPeter Zijlstra if (l1 > l2) 260674602315SPeter Zijlstra swap(l1, l2); 260774602315SPeter Zijlstra 260874602315SPeter Zijlstra raw_spin_lock(l1); 260974602315SPeter Zijlstra raw_spin_lock_nested(l2, SINGLE_DEPTH_NESTING); 261074602315SPeter Zijlstra } 261174602315SPeter Zijlstra 2612391e43daSPeter Zijlstra /* 2613391e43daSPeter Zijlstra * double_rq_unlock - safely unlock two runqueues 2614391e43daSPeter Zijlstra * 2615391e43daSPeter Zijlstra * Note this does not restore interrupts like task_rq_unlock, 2616391e43daSPeter Zijlstra * you need to do so manually after calling. 
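 *
 * Expected usage, with interrupt state managed by the caller (an illustrative
 * sketch):
 *
 *	local_irq_save(flags);
 *	double_rq_lock(rq1, rq2);
 *	...update both runqueues...
 *	double_rq_unlock(rq1, rq2);
 *	local_irq_restore(flags);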
2617391e43daSPeter Zijlstra */ 2618391e43daSPeter Zijlstra static inline void double_rq_unlock(struct rq *rq1, struct rq *rq2) 2619391e43daSPeter Zijlstra __releases(rq1->lock) 2620391e43daSPeter Zijlstra __releases(rq2->lock) 2621391e43daSPeter Zijlstra { 26229ef7e7e3SPeter Zijlstra if (__rq_lockp(rq1) != __rq_lockp(rq2)) 26235cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(rq2); 2624391e43daSPeter Zijlstra else 2625391e43daSPeter Zijlstra __release(rq2->lock); 2626d66f1b06SPeter Zijlstra raw_spin_rq_unlock(rq1); 2627391e43daSPeter Zijlstra } 2628391e43daSPeter Zijlstra 2629f2cb1360SIngo Molnar extern void set_rq_online (struct rq *rq); 2630f2cb1360SIngo Molnar extern void set_rq_offline(struct rq *rq); 2631f2cb1360SIngo Molnar extern bool sched_smp_initialized; 2632f2cb1360SIngo Molnar 2633391e43daSPeter Zijlstra #else /* CONFIG_SMP */ 2634391e43daSPeter Zijlstra 2635391e43daSPeter Zijlstra /* 2636391e43daSPeter Zijlstra * double_rq_lock - safely lock two runqueues 2637391e43daSPeter Zijlstra * 2638391e43daSPeter Zijlstra * Note this does not disable interrupts like task_rq_lock, 2639391e43daSPeter Zijlstra * you need to do so manually before calling. 2640391e43daSPeter Zijlstra */ 2641391e43daSPeter Zijlstra static inline void double_rq_lock(struct rq *rq1, struct rq *rq2) 2642391e43daSPeter Zijlstra __acquires(rq1->lock) 2643391e43daSPeter Zijlstra __acquires(rq2->lock) 2644391e43daSPeter Zijlstra { 2645391e43daSPeter Zijlstra BUG_ON(!irqs_disabled()); 2646391e43daSPeter Zijlstra BUG_ON(rq1 != rq2); 26475cb9eaa3SPeter Zijlstra raw_spin_rq_lock(rq1); 2648391e43daSPeter Zijlstra __acquire(rq2->lock); /* Fake it out ;) */ 2649391e43daSPeter Zijlstra } 2650391e43daSPeter Zijlstra 2651391e43daSPeter Zijlstra /* 2652391e43daSPeter Zijlstra * double_rq_unlock - safely unlock two runqueues 2653391e43daSPeter Zijlstra * 2654391e43daSPeter Zijlstra * Note this does not restore interrupts like task_rq_unlock, 2655391e43daSPeter Zijlstra * you need to do so manually after calling. 
2656391e43daSPeter Zijlstra */ 2657391e43daSPeter Zijlstra static inline void double_rq_unlock(struct rq *rq1, struct rq *rq2) 2658391e43daSPeter Zijlstra __releases(rq1->lock) 2659391e43daSPeter Zijlstra __releases(rq2->lock) 2660391e43daSPeter Zijlstra { 2661391e43daSPeter Zijlstra BUG_ON(rq1 != rq2); 26625cb9eaa3SPeter Zijlstra raw_spin_rq_unlock(rq1); 2663391e43daSPeter Zijlstra __release(rq2->lock); 2664391e43daSPeter Zijlstra } 2665391e43daSPeter Zijlstra 2666391e43daSPeter Zijlstra #endif 2667391e43daSPeter Zijlstra 2668391e43daSPeter Zijlstra extern struct sched_entity *__pick_first_entity(struct cfs_rq *cfs_rq); 2669391e43daSPeter Zijlstra extern struct sched_entity *__pick_last_entity(struct cfs_rq *cfs_rq); 26706b55c965SSrikar Dronamraju 26716b55c965SSrikar Dronamraju #ifdef CONFIG_SCHED_DEBUG 26729406415fSPeter Zijlstra extern bool sched_debug_verbose; 26739469eb01SPeter Zijlstra 2674391e43daSPeter Zijlstra extern void print_cfs_stats(struct seq_file *m, int cpu); 2675391e43daSPeter Zijlstra extern void print_rt_stats(struct seq_file *m, int cpu); 2676acb32132SWanpeng Li extern void print_dl_stats(struct seq_file *m, int cpu); 2677f6a34630SMathieu Malaterre extern void print_cfs_rq(struct seq_file *m, int cpu, struct cfs_rq *cfs_rq); 2678f6a34630SMathieu Malaterre extern void print_rt_rq(struct seq_file *m, int cpu, struct rt_rq *rt_rq); 2679f6a34630SMathieu Malaterre extern void print_dl_rq(struct seq_file *m, int cpu, struct dl_rq *dl_rq); 2680c006fac5SPaul Turner 2681c006fac5SPaul Turner extern void resched_latency_warn(int cpu, u64 latency); 2682397f2378SSrikar Dronamraju #ifdef CONFIG_NUMA_BALANCING 2683397f2378SSrikar Dronamraju extern void 2684397f2378SSrikar Dronamraju show_numa_stats(struct task_struct *p, struct seq_file *m); 2685397f2378SSrikar Dronamraju extern void 2686397f2378SSrikar Dronamraju print_numa_stats(struct seq_file *m, int node, unsigned long tsf, 2687397f2378SSrikar Dronamraju unsigned long tpf, unsigned long gsf, unsigned long gpf); 2688397f2378SSrikar Dronamraju #endif /* CONFIG_NUMA_BALANCING */ 2689c006fac5SPaul Turner #else 2690c006fac5SPaul Turner static inline void resched_latency_warn(int cpu, u64 latency) {} 2691397f2378SSrikar Dronamraju #endif /* CONFIG_SCHED_DEBUG */ 2692391e43daSPeter Zijlstra 2693391e43daSPeter Zijlstra extern void init_cfs_rq(struct cfs_rq *cfs_rq); 269407c54f7aSAbel Vesa extern void init_rt_rq(struct rt_rq *rt_rq); 269507c54f7aSAbel Vesa extern void init_dl_rq(struct dl_rq *dl_rq); 2696391e43daSPeter Zijlstra 26971ee14e6cSBen Segall extern void cfs_bandwidth_usage_inc(void); 26981ee14e6cSBen Segall extern void cfs_bandwidth_usage_dec(void); 26991c792db7SSuresh Siddha 27003451d024SFrederic Weisbecker #ifdef CONFIG_NO_HZ_COMMON 270100357f5eSPeter Zijlstra #define NOHZ_BALANCE_KICK_BIT 0 270200357f5eSPeter Zijlstra #define NOHZ_STATS_KICK_BIT 1 2703c6f88654SVincent Guittot #define NOHZ_NEWILB_KICK_BIT 2 2704efd984c4SValentin Schneider #define NOHZ_NEXT_KICK_BIT 3 2705a22e47a4SPeter Zijlstra 2706efd984c4SValentin Schneider /* Run rebalance_domains() */ 2707a22e47a4SPeter Zijlstra #define NOHZ_BALANCE_KICK BIT(NOHZ_BALANCE_KICK_BIT) 2708efd984c4SValentin Schneider /* Update blocked load */ 2709b7031a02SPeter Zijlstra #define NOHZ_STATS_KICK BIT(NOHZ_STATS_KICK_BIT) 2710efd984c4SValentin Schneider /* Update blocked load when entering idle */ 2711c6f88654SVincent Guittot #define NOHZ_NEWILB_KICK BIT(NOHZ_NEWILB_KICK_BIT) 2712efd984c4SValentin Schneider /* Update nohz.next_balance */ 2713efd984c4SValentin Schneider #define 
NOHZ_NEXT_KICK BIT(NOHZ_NEXT_KICK_BIT) 2714b7031a02SPeter Zijlstra 2715efd984c4SValentin Schneider #define NOHZ_KICK_MASK (NOHZ_BALANCE_KICK | NOHZ_STATS_KICK | NOHZ_NEXT_KICK) 27161c792db7SSuresh Siddha 27171c792db7SSuresh Siddha #define nohz_flags(cpu) (&cpu_rq(cpu)->nohz_flags) 271820a5c8ccSThomas Gleixner 271900357f5eSPeter Zijlstra extern void nohz_balance_exit_idle(struct rq *rq); 272020a5c8ccSThomas Gleixner #else 272100357f5eSPeter Zijlstra static inline void nohz_balance_exit_idle(struct rq *rq) { } 27221c792db7SSuresh Siddha #endif 272373fbec60SFrederic Weisbecker 2724c6f88654SVincent Guittot #if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON) 2725c6f88654SVincent Guittot extern void nohz_run_idle_balance(int cpu); 2726c6f88654SVincent Guittot #else 2727c6f88654SVincent Guittot static inline void nohz_run_idle_balance(int cpu) { } 2728c6f88654SVincent Guittot #endif 2729daec5798SLuca Abeni 273073fbec60SFrederic Weisbecker #ifdef CONFIG_IRQ_TIME_ACCOUNTING 273119d23dbfSFrederic Weisbecker struct irqtime { 273225e2d8c1SFrederic Weisbecker u64 total; 2733a499a5a1SFrederic Weisbecker u64 tick_delta; 273419d23dbfSFrederic Weisbecker u64 irq_start_time; 273519d23dbfSFrederic Weisbecker struct u64_stats_sync sync; 273619d23dbfSFrederic Weisbecker }; 273773fbec60SFrederic Weisbecker 273819d23dbfSFrederic Weisbecker DECLARE_PER_CPU(struct irqtime, cpu_irqtime); 273973fbec60SFrederic Weisbecker 274025e2d8c1SFrederic Weisbecker /* 274125e2d8c1SFrederic Weisbecker * Returns the irqtime minus the softirq time computed by ksoftirqd. 27423b03706fSIngo Molnar * Otherwise ksoftirqd's sum_exec_runtime would have its own runtime subtracted 274325e2d8c1SFrederic Weisbecker * from it and would never move forward. 274425e2d8c1SFrederic Weisbecker */ 274573fbec60SFrederic Weisbecker static inline u64 irq_time_read(int cpu) 274673fbec60SFrederic Weisbecker { 274719d23dbfSFrederic Weisbecker struct irqtime *irqtime = &per_cpu(cpu_irqtime, cpu); 274819d23dbfSFrederic Weisbecker unsigned int seq; 274919d23dbfSFrederic Weisbecker u64 total; 275073fbec60SFrederic Weisbecker 275173fbec60SFrederic Weisbecker do { 275219d23dbfSFrederic Weisbecker seq = __u64_stats_fetch_begin(&irqtime->sync); 275325e2d8c1SFrederic Weisbecker total = irqtime->total; 275419d23dbfSFrederic Weisbecker } while (__u64_stats_fetch_retry(&irqtime->sync, seq)); 275573fbec60SFrederic Weisbecker 275619d23dbfSFrederic Weisbecker return total; 275773fbec60SFrederic Weisbecker } 275873fbec60SFrederic Weisbecker #endif /* CONFIG_IRQ_TIME_ACCOUNTING */ 2759adaf9fcdSRafael J. Wysocki 2760adaf9fcdSRafael J. Wysocki #ifdef CONFIG_CPU_FREQ 2761b10abd0aSJoel Fernandes (Google) DECLARE_PER_CPU(struct update_util_data __rcu *, cpufreq_update_util_data); 2762adaf9fcdSRafael J. Wysocki 2763adaf9fcdSRafael J. Wysocki /** 2764adaf9fcdSRafael J. Wysocki * cpufreq_update_util - Take a note about CPU utilization changes. 276512bde33dSRafael J. Wysocki * @rq: Runqueue to carry out the update for. 276658919e83SRafael J. Wysocki * @flags: Update reason flags. 2767adaf9fcdSRafael J. Wysocki * 276858919e83SRafael J. Wysocki * This function is called by the scheduler on the CPU whose utilization is 276958919e83SRafael J. Wysocki * being updated. 2770adaf9fcdSRafael J. Wysocki * 2771adaf9fcdSRafael J. Wysocki * It can only be called from RCU-sched read-side critical sections. 2772adaf9fcdSRafael J. Wysocki * 2773adaf9fcdSRafael J. Wysocki * The way cpufreq is currently arranged requires it to evaluate the CPU 2774adaf9fcdSRafael J.
Wysocki * performance state (frequency/voltage) on a regular basis to prevent it from 2775adaf9fcdSRafael J. Wysocki * being stuck in a completely inadequate performance level for too long. 2776e0367b12SJuri Lelli * That is not guaranteed to happen if the updates are only triggered from CFS 2777e0367b12SJuri Lelli * and DL, though, because they may not be coming in if only RT tasks are 2778e0367b12SJuri Lelli * active all the time (or there are RT tasks only). 2779adaf9fcdSRafael J. Wysocki * 2780e0367b12SJuri Lelli * As a workaround for that issue, this function is called periodically by the 2781e0367b12SJuri Lelli * RT sched class to trigger extra cpufreq updates to prevent it from stalling, 2782adaf9fcdSRafael J. Wysocki * but that really is a band-aid. Going forward it should be replaced with 2783e0367b12SJuri Lelli * solutions targeted more specifically at RT tasks. 2784adaf9fcdSRafael J. Wysocki */ 278512bde33dSRafael J. Wysocki static inline void cpufreq_update_util(struct rq *rq, unsigned int flags) 2786adaf9fcdSRafael J. Wysocki { 278758919e83SRafael J. Wysocki struct update_util_data *data; 278858919e83SRafael J. Wysocki 2789674e7541SViresh Kumar data = rcu_dereference_sched(*per_cpu_ptr(&cpufreq_update_util_data, 2790674e7541SViresh Kumar cpu_of(rq))); 279158919e83SRafael J. Wysocki if (data) 279212bde33dSRafael J. Wysocki data->func(data, rq_clock(rq), flags); 279312bde33dSRafael J. Wysocki } 2794adaf9fcdSRafael J. Wysocki #else 279512bde33dSRafael J. Wysocki static inline void cpufreq_update_util(struct rq *rq, unsigned int flags) {} 2796adaf9fcdSRafael J. Wysocki #endif /* CONFIG_CPU_FREQ */ 2797be53f58fSLinus Torvalds 27989bdcb44eSRafael J. Wysocki #ifdef arch_scale_freq_capacity 27999bdcb44eSRafael J. Wysocki # ifndef arch_scale_freq_invariant 280097fb7a0aSIngo Molnar # define arch_scale_freq_invariant() true 28019bdcb44eSRafael J. Wysocki # endif 280297fb7a0aSIngo Molnar #else 280397fb7a0aSIngo Molnar # define arch_scale_freq_invariant() false 28049bdcb44eSRafael J. Wysocki #endif 2805d4edd662SJuri Lelli 280610a35e68SVincent Guittot #ifdef CONFIG_SMP 280710a35e68SVincent Guittot static inline unsigned long capacity_orig_of(int cpu) 280810a35e68SVincent Guittot { 280910a35e68SVincent Guittot return cpu_rq(cpu)->cpu_capacity_orig; 281010a35e68SVincent Guittot } 281110a35e68SVincent Guittot 2812938e5e4bSQuentin Perret /** 2813a5418be9SViresh Kumar * enum cpu_util_type - CPU utilization type 2814938e5e4bSQuentin Perret * @FREQUENCY_UTIL: Utilization used to select frequency 2815938e5e4bSQuentin Perret * @ENERGY_UTIL: Utilization used during energy calculation 2816938e5e4bSQuentin Perret * 2817938e5e4bSQuentin Perret * The utilization signals of all scheduling classes (CFS/RT/DL) and IRQ time 2818938e5e4bSQuentin Perret * need to be aggregated differently depending on the usage made of them. This 2819a5418be9SViresh Kumar * enum is used within effective_cpu_util() to differentiate the types of 2820938e5e4bSQuentin Perret * utilization expected by the callers, and adjust the aggregation accordingly. 
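 *
 * Illustrative call (a sketch, not taken from an actual caller): computing the
 * frequency-selection view of a CPU's utilization, capped at 'max' and not
 * biased towards any particular task:
 *
 *	util = effective_cpu_util(cpu, cpu_util_cfs(cpu), max,
 *				  FREQUENCY_UTIL, NULL);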
2821938e5e4bSQuentin Perret */ 2822a5418be9SViresh Kumar enum cpu_util_type { 2823938e5e4bSQuentin Perret FREQUENCY_UTIL, 2824938e5e4bSQuentin Perret ENERGY_UTIL, 2825938e5e4bSQuentin Perret }; 2826938e5e4bSQuentin Perret 2827a5418be9SViresh Kumar unsigned long effective_cpu_util(int cpu, unsigned long util_cfs, 2828a5418be9SViresh Kumar unsigned long max, enum cpu_util_type type, 2829af24bde8SPatrick Bellasi struct task_struct *p); 2830938e5e4bSQuentin Perret 28318cc90515SVincent Guittot static inline unsigned long cpu_bw_dl(struct rq *rq) 2832d4edd662SJuri Lelli { 2833d4edd662SJuri Lelli return (rq->dl.running_bw * SCHED_CAPACITY_SCALE) >> BW_SHIFT; 2834d4edd662SJuri Lelli } 2835d4edd662SJuri Lelli 28368cc90515SVincent Guittot static inline unsigned long cpu_util_dl(struct rq *rq) 28378cc90515SVincent Guittot { 28388cc90515SVincent Guittot return READ_ONCE(rq->avg_dl.util_avg); 28398cc90515SVincent Guittot } 28408cc90515SVincent Guittot 284182762d2aSDietmar Eggemann /** 284282762d2aSDietmar Eggemann * cpu_util_cfs() - Estimates the amount of CPU capacity used by CFS tasks. 284382762d2aSDietmar Eggemann * @cpu: the CPU to get the utilization for. 284482762d2aSDietmar Eggemann * 284582762d2aSDietmar Eggemann * The unit of the return value must be the same as the one of CPU capacity 284682762d2aSDietmar Eggemann * so that CPU utilization can be compared with CPU capacity. 284782762d2aSDietmar Eggemann * 284882762d2aSDietmar Eggemann * CPU utilization is the sum of running time of runnable tasks plus the 284982762d2aSDietmar Eggemann * recent utilization of currently non-runnable tasks on that CPU. 285082762d2aSDietmar Eggemann * It represents the amount of CPU capacity currently used by CFS tasks in 285182762d2aSDietmar Eggemann * the range [0..max CPU capacity] with max CPU capacity being the CPU 285282762d2aSDietmar Eggemann * capacity at f_max. 285382762d2aSDietmar Eggemann * 285482762d2aSDietmar Eggemann * The estimated CPU utilization is defined as the maximum between CPU 285582762d2aSDietmar Eggemann * utilization and sum of the estimated utilization of the currently 285682762d2aSDietmar Eggemann * runnable tasks on that CPU. It preserves a utilization "snapshot" of 285782762d2aSDietmar Eggemann * previously-executed tasks, which helps better deduce how busy a CPU will 285882762d2aSDietmar Eggemann * be when a long-sleeping task wakes up. The contribution to CPU utilization 285982762d2aSDietmar Eggemann * of such a task would be significantly decayed at this point of time. 286082762d2aSDietmar Eggemann * 286182762d2aSDietmar Eggemann * CPU utilization can be higher than the current CPU capacity 286282762d2aSDietmar Eggemann * (f_curr/f_max * max CPU capacity) or even the max CPU capacity because 286382762d2aSDietmar Eggemann * of rounding errors as well as task migrations or wakeups of new tasks. 286482762d2aSDietmar Eggemann * CPU utilization has to be capped to fit into the [0..max CPU capacity] 286582762d2aSDietmar Eggemann * range. Otherwise a group of CPUs (CPU0 util = 121% + CPU1 util = 80%) 286682762d2aSDietmar Eggemann * could be seen as over-utilized even though CPU1 has 20% of spare CPU 286782762d2aSDietmar Eggemann * capacity. CPU utilization is allowed to overshoot current CPU capacity 286882762d2aSDietmar Eggemann * though since this is useful for predicting the CPU capacity required 286982762d2aSDietmar Eggemann * after task migrations (scheduler-driven DVFS). 
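 *
 * A minimal usage sketch (illustrative; the 80% threshold is an arbitrary
 * example, not a kernel constant):
 *
 *	unsigned long util = cpu_util_cfs(cpu);
 *	unsigned long cap = capacity_orig_of(cpu);
 *	bool cpu_is_busy = (util * 10 >= cap * 8);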
287082762d2aSDietmar Eggemann * 287182762d2aSDietmar Eggemann * Return: (Estimated) utilization for the specified CPU. 287282762d2aSDietmar Eggemann */ 287382762d2aSDietmar Eggemann static inline unsigned long cpu_util_cfs(int cpu) 2874d4edd662SJuri Lelli { 287582762d2aSDietmar Eggemann struct cfs_rq *cfs_rq; 287682762d2aSDietmar Eggemann unsigned long util; 287782762d2aSDietmar Eggemann 287882762d2aSDietmar Eggemann cfs_rq = &cpu_rq(cpu)->cfs; 287982762d2aSDietmar Eggemann util = READ_ONCE(cfs_rq->avg.util_avg); 2880a07630b8SPatrick Bellasi 2881a07630b8SPatrick Bellasi if (sched_feat(UTIL_EST)) { 2882a07630b8SPatrick Bellasi util = max_t(unsigned long, util, 288382762d2aSDietmar Eggemann READ_ONCE(cfs_rq->avg.util_est.enqueued)); 2884a07630b8SPatrick Bellasi } 2885a07630b8SPatrick Bellasi 288682762d2aSDietmar Eggemann return min(util, capacity_orig_of(cpu)); 2887d4edd662SJuri Lelli } 2888371bf427SVincent Guittot 2889371bf427SVincent Guittot static inline unsigned long cpu_util_rt(struct rq *rq) 2890371bf427SVincent Guittot { 2891dfa444dcSVincent Guittot return READ_ONCE(rq->avg_rt.util_avg); 2892371bf427SVincent Guittot } 28937d6a905fSViresh Kumar #endif 28949033ea11SVincent Guittot 28957a17e1dbSQais Yousef #ifdef CONFIG_UCLAMP_TASK 28967a17e1dbSQais Yousef unsigned long uclamp_eff_value(struct task_struct *p, enum uclamp_id clamp_id); 28977a17e1dbSQais Yousef 28987a17e1dbSQais Yousef /** 28997a17e1dbSQais Yousef * uclamp_rq_util_with - clamp @util with @rq and @p effective uclamp values. 29007a17e1dbSQais Yousef * @rq: The rq to clamp against. Must not be NULL. 29017a17e1dbSQais Yousef * @util: The util value to clamp. 29027a17e1dbSQais Yousef * @p: The task to clamp against. Can be NULL if you want to clamp 29037a17e1dbSQais Yousef * against @rq only. 29047a17e1dbSQais Yousef * 29057a17e1dbSQais Yousef * Clamps the passed @util to the max(@rq, @p) effective uclamp values. 29067a17e1dbSQais Yousef * 29077a17e1dbSQais Yousef * If sched_uclamp_used static key is disabled, then just return the util 29087a17e1dbSQais Yousef * without any clamping since uclamp aggregation at the rq level in the fast 29097a17e1dbSQais Yousef * path is disabled, rendering this operation a NOP. 29107a17e1dbSQais Yousef * 29117a17e1dbSQais Yousef * Use uclamp_eff_value() if you don't care about uclamp values at rq level. It 29127a17e1dbSQais Yousef * will return the correct effective uclamp value of the task even if the 29137a17e1dbSQais Yousef * static key is disabled. 29147a17e1dbSQais Yousef */ 29157a17e1dbSQais Yousef static __always_inline 29167a17e1dbSQais Yousef unsigned long uclamp_rq_util_with(struct rq *rq, unsigned long util, 29177a17e1dbSQais Yousef struct task_struct *p) 29187a17e1dbSQais Yousef { 29197a17e1dbSQais Yousef unsigned long min_util = 0; 29207a17e1dbSQais Yousef unsigned long max_util = 0; 29217a17e1dbSQais Yousef 29227a17e1dbSQais Yousef if (!static_branch_likely(&sched_uclamp_used)) 29237a17e1dbSQais Yousef return util; 29247a17e1dbSQais Yousef 29257a17e1dbSQais Yousef if (p) { 29267a17e1dbSQais Yousef min_util = uclamp_eff_value(p, UCLAMP_MIN); 29277a17e1dbSQais Yousef max_util = uclamp_eff_value(p, UCLAMP_MAX); 29287a17e1dbSQais Yousef 29297a17e1dbSQais Yousef /* 29307a17e1dbSQais Yousef * Ignore last runnable task's max clamp, as this task will 29317a17e1dbSQais Yousef * reset it. Similarly, no need to read the rq's min clamp. 
29327a17e1dbSQais Yousef */ 29337a17e1dbSQais Yousef if (rq->uclamp_flags & UCLAMP_FLAG_IDLE) 29347a17e1dbSQais Yousef goto out; 29357a17e1dbSQais Yousef } 29367a17e1dbSQais Yousef 29377a17e1dbSQais Yousef min_util = max_t(unsigned long, min_util, READ_ONCE(rq->uclamp[UCLAMP_MIN].value)); 29387a17e1dbSQais Yousef max_util = max_t(unsigned long, max_util, READ_ONCE(rq->uclamp[UCLAMP_MAX].value)); 29397a17e1dbSQais Yousef out: 29407a17e1dbSQais Yousef /* 29417a17e1dbSQais Yousef * Since CPU's {min,max}_util clamps are MAX aggregated considering 29427a17e1dbSQais Yousef * RUNNABLE tasks with _different_ clamps, we can end up with an 29437a17e1dbSQais Yousef * inversion. Fix it now when the clamps are applied. 29447a17e1dbSQais Yousef */ 29457a17e1dbSQais Yousef if (unlikely(min_util >= max_util)) 29467a17e1dbSQais Yousef return min_util; 29477a17e1dbSQais Yousef 29487a17e1dbSQais Yousef return clamp(util, min_util, max_util); 29497a17e1dbSQais Yousef } 29507a17e1dbSQais Yousef 29517a17e1dbSQais Yousef /* Is the rq being capped/throttled by uclamp_max? */ 29527a17e1dbSQais Yousef static inline bool uclamp_rq_is_capped(struct rq *rq) 29537a17e1dbSQais Yousef { 29547a17e1dbSQais Yousef unsigned long rq_util; 29557a17e1dbSQais Yousef unsigned long max_util; 29567a17e1dbSQais Yousef 29577a17e1dbSQais Yousef if (!static_branch_likely(&sched_uclamp_used)) 29587a17e1dbSQais Yousef return false; 29597a17e1dbSQais Yousef 29607a17e1dbSQais Yousef rq_util = cpu_util_cfs(cpu_of(rq)) + cpu_util_rt(rq); 29617a17e1dbSQais Yousef max_util = READ_ONCE(rq->uclamp[UCLAMP_MAX].value); 29627a17e1dbSQais Yousef 29637a17e1dbSQais Yousef return max_util != SCHED_CAPACITY_SCALE && rq_util >= max_util; 29647a17e1dbSQais Yousef } 29657a17e1dbSQais Yousef 29667a17e1dbSQais Yousef /* 29677a17e1dbSQais Yousef * When uclamp is compiled in, the aggregation at rq level is 'turned off' 29687a17e1dbSQais Yousef * by default in the fast path and only gets turned on once userspace performs 29697a17e1dbSQais Yousef * an operation that requires it. 29707a17e1dbSQais Yousef * 29717a17e1dbSQais Yousef * Returns true if userspace opted-in to use uclamp and aggregation at rq level 29727a17e1dbSQais Yousef * hence is active. 
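 *
 * Illustrative guard (a sketch): a fast path can bail out before doing any
 * rq-level clamp aggregation when nothing has opted in:
 *
 *	if (!uclamp_is_used())
 *		return util;
 *	util = uclamp_rq_util_with(rq, util, NULL);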
29737a17e1dbSQais Yousef */ 29747a17e1dbSQais Yousef static inline bool uclamp_is_used(void) 29757a17e1dbSQais Yousef { 29767a17e1dbSQais Yousef return static_branch_likely(&sched_uclamp_used); 29777a17e1dbSQais Yousef } 29787a17e1dbSQais Yousef #else /* CONFIG_UCLAMP_TASK */ 29797a17e1dbSQais Yousef static inline 29807a17e1dbSQais Yousef unsigned long uclamp_rq_util_with(struct rq *rq, unsigned long util, 29817a17e1dbSQais Yousef struct task_struct *p) 29827a17e1dbSQais Yousef { 29837a17e1dbSQais Yousef return util; 29847a17e1dbSQais Yousef } 29857a17e1dbSQais Yousef 29867a17e1dbSQais Yousef static inline bool uclamp_rq_is_capped(struct rq *rq) { return false; } 29877a17e1dbSQais Yousef 29887a17e1dbSQais Yousef static inline bool uclamp_is_used(void) 29897a17e1dbSQais Yousef { 29907a17e1dbSQais Yousef return false; 29917a17e1dbSQais Yousef } 29927a17e1dbSQais Yousef #endif /* CONFIG_UCLAMP_TASK */ 29937a17e1dbSQais Yousef 299411d4afd4SVincent Guittot #ifdef CONFIG_HAVE_SCHED_AVG_IRQ 29959033ea11SVincent Guittot static inline unsigned long cpu_util_irq(struct rq *rq) 29969033ea11SVincent Guittot { 29979033ea11SVincent Guittot return rq->avg_irq.util_avg; 29989033ea11SVincent Guittot } 29992e62c474SVincent Guittot 30002e62c474SVincent Guittot static inline 30012e62c474SVincent Guittot unsigned long scale_irq_capacity(unsigned long util, unsigned long irq, unsigned long max) 30022e62c474SVincent Guittot { 30032e62c474SVincent Guittot util *= (max - irq); 30042e62c474SVincent Guittot util /= max; 30052e62c474SVincent Guittot 30062e62c474SVincent Guittot return util; 30072e62c474SVincent Guittot 30082e62c474SVincent Guittot } 30099033ea11SVincent Guittot #else 30109033ea11SVincent Guittot static inline unsigned long cpu_util_irq(struct rq *rq) 30119033ea11SVincent Guittot { 30129033ea11SVincent Guittot return 0; 30139033ea11SVincent Guittot } 30149033ea11SVincent Guittot 30152e62c474SVincent Guittot static inline 30162e62c474SVincent Guittot unsigned long scale_irq_capacity(unsigned long util, unsigned long irq, unsigned long max) 30172e62c474SVincent Guittot { 30182e62c474SVincent Guittot return util; 30192e62c474SVincent Guittot } 3020794a56ebSJuri Lelli #endif 30216aa140faSQuentin Perret 3022531b5c9fSQuentin Perret #if defined(CONFIG_ENERGY_MODEL) && defined(CONFIG_CPU_FREQ_GOV_SCHEDUTIL) 30231f74de87SQuentin Perret 3024f8a696f2SPeter Zijlstra #define perf_domain_span(pd) (to_cpumask(((pd)->em_pd->cpus))) 3025f8a696f2SPeter Zijlstra 3026f8a696f2SPeter Zijlstra DECLARE_STATIC_KEY_FALSE(sched_energy_present); 3027f8a696f2SPeter Zijlstra 3028f8a696f2SPeter Zijlstra static inline bool sched_energy_enabled(void) 3029f8a696f2SPeter Zijlstra { 3030f8a696f2SPeter Zijlstra return static_branch_unlikely(&sched_energy_present); 3031f8a696f2SPeter Zijlstra } 3032f8a696f2SPeter Zijlstra 3033f8a696f2SPeter Zijlstra #else /* ! 
(CONFIG_ENERGY_MODEL && CONFIG_CPU_FREQ_GOV_SCHEDUTIL) */ 3034f8a696f2SPeter Zijlstra 3035f8a696f2SPeter Zijlstra #define perf_domain_span(pd) NULL 3036f8a696f2SPeter Zijlstra static inline bool sched_energy_enabled(void) { return false; } 3037f8a696f2SPeter Zijlstra 3038f8a696f2SPeter Zijlstra #endif /* CONFIG_ENERGY_MODEL && CONFIG_CPU_FREQ_GOV_SCHEDUTIL */ 3039227a4aadSMathieu Desnoyers 3040227a4aadSMathieu Desnoyers #ifdef CONFIG_MEMBARRIER 3041227a4aadSMathieu Desnoyers /* 3042227a4aadSMathieu Desnoyers * The scheduler provides memory barriers required by membarrier between: 3043227a4aadSMathieu Desnoyers * - prior user-space memory accesses and store to rq->membarrier_state, 3044227a4aadSMathieu Desnoyers * - store to rq->membarrier_state and following user-space memory accesses. 3045227a4aadSMathieu Desnoyers * In the same way it provides those guarantees around store to rq->curr. 3046227a4aadSMathieu Desnoyers */ 3047227a4aadSMathieu Desnoyers static inline void membarrier_switch_mm(struct rq *rq, 3048227a4aadSMathieu Desnoyers struct mm_struct *prev_mm, 3049227a4aadSMathieu Desnoyers struct mm_struct *next_mm) 3050227a4aadSMathieu Desnoyers { 3051227a4aadSMathieu Desnoyers int membarrier_state; 3052227a4aadSMathieu Desnoyers 3053227a4aadSMathieu Desnoyers if (prev_mm == next_mm) 3054227a4aadSMathieu Desnoyers return; 3055227a4aadSMathieu Desnoyers 3056227a4aadSMathieu Desnoyers membarrier_state = atomic_read(&next_mm->membarrier_state); 3057227a4aadSMathieu Desnoyers if (READ_ONCE(rq->membarrier_state) == membarrier_state) 3058227a4aadSMathieu Desnoyers return; 3059227a4aadSMathieu Desnoyers 3060227a4aadSMathieu Desnoyers WRITE_ONCE(rq->membarrier_state, membarrier_state); 3061227a4aadSMathieu Desnoyers } 3062227a4aadSMathieu Desnoyers #else 3063227a4aadSMathieu Desnoyers static inline void membarrier_switch_mm(struct rq *rq, 3064227a4aadSMathieu Desnoyers struct mm_struct *prev_mm, 3065227a4aadSMathieu Desnoyers struct mm_struct *next_mm) 3066227a4aadSMathieu Desnoyers { 3067227a4aadSMathieu Desnoyers } 3068227a4aadSMathieu Desnoyers #endif 306952262ee5SMel Gorman 307052262ee5SMel Gorman #ifdef CONFIG_SMP 307152262ee5SMel Gorman static inline bool is_per_cpu_kthread(struct task_struct *p) 307252262ee5SMel Gorman { 307352262ee5SMel Gorman if (!(p->flags & PF_KTHREAD)) 307452262ee5SMel Gorman return false; 307552262ee5SMel Gorman 307652262ee5SMel Gorman if (p->nr_cpus_allowed != 1) 307752262ee5SMel Gorman return false; 307852262ee5SMel Gorman 307952262ee5SMel Gorman return true; 308052262ee5SMel Gorman } 308152262ee5SMel Gorman #endif 3082b3212fe2SThomas Gleixner 30831011dcceSPeter Zijlstra extern void swake_up_all_locked(struct swait_queue_head *q); 30841011dcceSPeter Zijlstra extern void __prepare_to_swait(struct swait_queue_head *q, struct swait_queue *wait); 30851011dcceSPeter Zijlstra 30861011dcceSPeter Zijlstra #ifdef CONFIG_PREEMPT_DYNAMIC 30871011dcceSPeter Zijlstra extern int preempt_dynamic_mode; 30881011dcceSPeter Zijlstra extern int sched_dynamic_mode(const char *str); 30891011dcceSPeter Zijlstra extern void sched_dynamic_update(int mode); 30901011dcceSPeter Zijlstra #endif 30911011dcceSPeter Zijlstra 309295458477SIngo Molnar #endif /* _KERNEL_SCHED_SCHED_H */ 3093