1 // SPDX-License-Identifier: GPL-2.0-only
3 * itmt.c: Support Intel Turbo Boost Max Technology 3.0
5 * (C) Copyright 2016 Intel Corporation
6 * Author: Tim Chen <tim.c.chen@linux.intel.com>
8 * On platforms supporting Intel Turbo Boost Max Technology 3.0, (ITMT),
9 * the maximum turbo frequencies of some cores in a CPU package may be
10 * higher than for the other cores in the same package. In that case,
11 * better performance can be achieved by making the scheduler prefer
12 * to run tasks on the CPUs with higher max turbo frequencies.
14 * This file provides functions and data structures for enabling the
15 * scheduler to favor scheduling on cores can be boosted to a higher
16 * frequency under ITMT.
19 #include <linux/sched.h>
20 #include <linux/cpumask.h>
21 #include <linux/cpuset.h>
22 #include <linux/mutex.h>
23 #include <linux/sysctl.h>
24 #include <linux/nodemask.h>
26 static DEFINE_MUTEX(itmt_update_mutex
);
27 DEFINE_PER_CPU_READ_MOSTLY(int, sched_core_priority
);
29 /* Boolean to track if system has ITMT capabilities */
30 static bool __read_mostly sched_itmt_capable
;
33 * Boolean to control whether we want to move processes to cpu capable
34 * of higher turbo frequency for cpus supporting Intel Turbo Boost Max
37 * It can be set via /proc/sys/kernel/sched_itmt_enabled
39 unsigned int __read_mostly sysctl_sched_itmt_enabled
;
41 static int sched_itmt_update_handler(const struct ctl_table
*table
, int write
,
42 void *buffer
, size_t *lenp
, loff_t
*ppos
)
44 unsigned int old_sysctl
;
47 mutex_lock(&itmt_update_mutex
);
49 if (!sched_itmt_capable
) {
50 mutex_unlock(&itmt_update_mutex
);
54 old_sysctl
= sysctl_sched_itmt_enabled
;
55 ret
= proc_dointvec_minmax(table
, write
, buffer
, lenp
, ppos
);
57 if (!ret
&& write
&& old_sysctl
!= sysctl_sched_itmt_enabled
) {
58 x86_topology_update
= true;
59 rebuild_sched_domains();
62 mutex_unlock(&itmt_update_mutex
);
67 static struct ctl_table itmt_kern_table
[] = {
69 .procname
= "sched_itmt_enabled",
70 .data
= &sysctl_sched_itmt_enabled
,
71 .maxlen
= sizeof(unsigned int),
73 .proc_handler
= sched_itmt_update_handler
,
74 .extra1
= SYSCTL_ZERO
,
79 static struct ctl_table_header
*itmt_sysctl_header
;
82 * sched_set_itmt_support() - Indicate platform supports ITMT
84 * This function is used by the OS to indicate to scheduler that the platform
85 * is capable of supporting the ITMT feature.
87 * The current scheme has the pstate driver detects if the system
88 * is ITMT capable and call sched_set_itmt_support.
90 * This must be done only after sched_set_itmt_core_prio
91 * has been called to set the cpus' priorities.
92 * It must not be called with cpu hot plug lock
93 * held as we need to acquire the lock to rebuild sched domains
96 * Return: 0 on success
98 int sched_set_itmt_support(void)
100 mutex_lock(&itmt_update_mutex
);
102 if (sched_itmt_capable
) {
103 mutex_unlock(&itmt_update_mutex
);
107 itmt_sysctl_header
= register_sysctl("kernel", itmt_kern_table
);
108 if (!itmt_sysctl_header
) {
109 mutex_unlock(&itmt_update_mutex
);
113 sched_itmt_capable
= true;
115 sysctl_sched_itmt_enabled
= 1;
117 x86_topology_update
= true;
118 rebuild_sched_domains();
120 mutex_unlock(&itmt_update_mutex
);
126 * sched_clear_itmt_support() - Revoke platform's support of ITMT
128 * This function is used by the OS to indicate that it has
129 * revoked the platform's support of ITMT feature.
131 * It must not be called with cpu hot plug lock
132 * held as we need to acquire the lock to rebuild sched domains
135 void sched_clear_itmt_support(void)
137 mutex_lock(&itmt_update_mutex
);
139 if (!sched_itmt_capable
) {
140 mutex_unlock(&itmt_update_mutex
);
143 sched_itmt_capable
= false;
145 if (itmt_sysctl_header
) {
146 unregister_sysctl_table(itmt_sysctl_header
);
147 itmt_sysctl_header
= NULL
;
150 if (sysctl_sched_itmt_enabled
) {
151 /* disable sched_itmt if we are no longer ITMT capable */
152 sysctl_sched_itmt_enabled
= 0;
153 x86_topology_update
= true;
154 rebuild_sched_domains();
157 mutex_unlock(&itmt_update_mutex
);
160 int arch_asym_cpu_priority(int cpu
)
162 return per_cpu(sched_core_priority
, cpu
);
166 * sched_set_itmt_core_prio() - Set CPU priority based on ITMT
167 * @prio: Priority of @cpu
168 * @cpu: The CPU number
170 * The pstate driver will find out the max boost frequency
171 * and call this function to set a priority proportional
172 * to the max boost frequency. CPUs with higher boost
173 * frequency will receive higher priority.
175 * No need to rebuild sched domain after updating
176 * the CPU priorities. The sched domains have no
177 * dependency on CPU priorities.
179 void sched_set_itmt_core_prio(int prio
, int cpu
)
181 per_cpu(sched_core_priority
, cpu
) = prio
;