/*
 * itmt.c: Support Intel Turbo Boost Max Technology 3.0
 *
 * (C) Copyright 2016 Intel Corporation
 * Author: Tim Chen <tim.c.chen@linux.intel.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; version 2
 * of the License.
 *
 * On platforms supporting Intel Turbo Boost Max Technology 3.0, (ITMT),
 * the maximum turbo frequencies of some cores in a CPU package may be
 * higher than for the other cores in the same package. In that case,
 * better performance can be achieved by making the scheduler prefer
 * to run tasks on the CPUs with higher max turbo frequencies.
 *
 * This file provides functions and data structures for enabling the
 * scheduler to favor scheduling on cores that can be boosted to a higher
 * frequency under ITMT.
 */

#include <linux/sched.h>
#include <linux/cpumask.h>
#include <linux/cpuset.h>
#include <linux/mutex.h>
#include <linux/sysctl.h>
#include <linux/nodemask.h>
#include <linux/errno.h>

30 static DEFINE_MUTEX(itmt_update_mutex
);
31 DEFINE_PER_CPU_READ_MOSTLY(int, sched_core_priority
);
33 /* Boolean to track if system has ITMT capabilities */
34 static bool __read_mostly sched_itmt_capable
;
37 * Boolean to control whether we want to move processes to cpu capable
38 * of higher turbo frequency for cpus supporting Intel Turbo Boost Max
41 * It can be set via /proc/sys/kernel/sched_itmt_enabled
43 unsigned int __read_mostly sysctl_sched_itmt_enabled
;
45 static int sched_itmt_update_handler(struct ctl_table
*table
, int write
,
46 void __user
*buffer
, size_t *lenp
,
49 unsigned int old_sysctl
;
52 mutex_lock(&itmt_update_mutex
);
54 if (!sched_itmt_capable
) {
55 mutex_unlock(&itmt_update_mutex
);
59 old_sysctl
= sysctl_sched_itmt_enabled
;
60 ret
= proc_dointvec_minmax(table
, write
, buffer
, lenp
, ppos
);
62 if (!ret
&& write
&& old_sysctl
!= sysctl_sched_itmt_enabled
) {
63 x86_topology_update
= true;
64 rebuild_sched_domains();
67 mutex_unlock(&itmt_update_mutex
);
72 static unsigned int zero
;
73 static unsigned int one
= 1;
74 static struct ctl_table itmt_kern_table
[] = {
76 .procname
= "sched_itmt_enabled",
77 .data
= &sysctl_sched_itmt_enabled
,
78 .maxlen
= sizeof(unsigned int),
80 .proc_handler
= sched_itmt_update_handler
,
87 static struct ctl_table itmt_root_table
[] = {
91 .child
= itmt_kern_table
,
/*
 * Handle returned by register_sysctl_table() in sched_set_itmt_support();
 * reset to NULL once sched_clear_itmt_support() has unregistered it.
 */
static struct ctl_table_header *itmt_sysctl_header;

99 * sched_set_itmt_support() - Indicate platform supports ITMT
101 * This function is used by the OS to indicate to scheduler that the platform
102 * is capable of supporting the ITMT feature.
104 * The current scheme has the pstate driver detects if the system
105 * is ITMT capable and call sched_set_itmt_support.
107 * This must be done only after sched_set_itmt_core_prio
108 * has been called to set the cpus' priorities.
109 * It must not be called with cpu hot plug lock
110 * held as we need to acquire the lock to rebuild sched domains
113 * Return: 0 on success
115 int sched_set_itmt_support(void)
117 mutex_lock(&itmt_update_mutex
);
119 if (sched_itmt_capable
) {
120 mutex_unlock(&itmt_update_mutex
);
124 itmt_sysctl_header
= register_sysctl_table(itmt_root_table
);
125 if (!itmt_sysctl_header
) {
126 mutex_unlock(&itmt_update_mutex
);
130 sched_itmt_capable
= true;
132 sysctl_sched_itmt_enabled
= 1;
134 x86_topology_update
= true;
135 rebuild_sched_domains();
137 mutex_unlock(&itmt_update_mutex
);
143 * sched_clear_itmt_support() - Revoke platform's support of ITMT
145 * This function is used by the OS to indicate that it has
146 * revoked the platform's support of ITMT feature.
148 * It must not be called with cpu hot plug lock
149 * held as we need to acquire the lock to rebuild sched domains
152 void sched_clear_itmt_support(void)
154 mutex_lock(&itmt_update_mutex
);
156 if (!sched_itmt_capable
) {
157 mutex_unlock(&itmt_update_mutex
);
160 sched_itmt_capable
= false;
162 if (itmt_sysctl_header
) {
163 unregister_sysctl_table(itmt_sysctl_header
);
164 itmt_sysctl_header
= NULL
;
167 if (sysctl_sched_itmt_enabled
) {
168 /* disable sched_itmt if we are no longer ITMT capable */
169 sysctl_sched_itmt_enabled
= 0;
170 x86_topology_update
= true;
171 rebuild_sched_domains();
174 mutex_unlock(&itmt_update_mutex
);
177 int arch_asym_cpu_priority(int cpu
)
179 return per_cpu(sched_core_priority
, cpu
);
183 * sched_set_itmt_core_prio() - Set CPU priority based on ITMT
184 * @prio: Priority of cpu core
185 * @core_cpu: The cpu number associated with the core
187 * The pstate driver will find out the max boost frequency
188 * and call this function to set a priority proportional
189 * to the max boost frequency. CPU with higher boost
190 * frequency will receive higher priority.
192 * No need to rebuild sched domain after updating
193 * the CPU priorities. The sched domains have no
194 * dependency on CPU priorities.
196 void sched_set_itmt_core_prio(int prio
, int core_cpu
)
200 for_each_cpu(cpu
, topology_sibling_cpumask(core_cpu
)) {
204 * Ensure that the siblings are moved to the end
205 * of the priority chain and only used when
206 * all other high priority cpus are out of capacity.
208 smt_prio
= prio
* smp_num_siblings
/ i
;
209 per_cpu(sched_core_priority
, cpu
) = smt_prio
;