2 * devfreq_cooling: Thermal cooling device implementation for devices using
5 * Copyright (C) 2014-2015 ARM Limited
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
11 * This program is distributed "as is" WITHOUT ANY WARRANTY of any
12 * kind, whether express or implied; without even the implied warranty
13 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
17 * - If OPPs are added or removed after devfreq cooling has
18 * registered, the devfreq cooling won't react to it.
21 #include <linux/devfreq.h>
22 #include <linux/devfreq_cooling.h>
23 #include <linux/export.h>
24 #include <linux/slab.h>
25 #include <linux/pm_opp.h>
26 #include <linux/thermal.h>
28 #include <trace/events/thermal.h>
30 static DEFINE_MUTEX(devfreq_lock
);
31 static DEFINE_IDR(devfreq_idr
);
34 * struct devfreq_cooling_device - Devfreq cooling device
35 * @id: unique integer value corresponding to each
36 * devfreq_cooling_device registered.
37 * @cdev: Pointer to associated thermal cooling device.
38 * @devfreq: Pointer to associated devfreq device.
39 * @cooling_state: Current cooling state.
40 * @power_table: Pointer to table with maximum power draw for each
41 * cooling state. State is the index into the table, and
43 * @freq_table: Pointer to a table with the frequencies sorted in descending
44 * order. You can index the table by cooling device state
45 * @freq_table_size: Size of the @freq_table and @power_table
46 * @power_ops: Pointer to devfreq_cooling_power, used to generate the
49 struct devfreq_cooling_device
{
51 struct thermal_cooling_device
*cdev
;
52 struct devfreq
*devfreq
;
53 unsigned long cooling_state
;
56 size_t freq_table_size
;
57 struct devfreq_cooling_power
*power_ops
;
61 * get_idr - function to get a unique id.
62 * @idr: struct idr * handle used to create a id.
63 * @id: int * value generated by this function.
65 * This function will populate @id with an unique
66 * id, using the idr API.
68 * Return: 0 on success, an error code on failure.
70 static int get_idr(struct idr
*idr
, int *id
)
74 mutex_lock(&devfreq_lock
);
75 ret
= idr_alloc(idr
, NULL
, 0, 0, GFP_KERNEL
);
76 mutex_unlock(&devfreq_lock
);
77 if (unlikely(ret
< 0))
85 * release_idr - function to free the unique id.
86 * @idr: struct idr * handle used for creating the id.
87 * @id: int value representing the unique id.
89 static void release_idr(struct idr
*idr
, int id
)
91 mutex_lock(&devfreq_lock
);
93 mutex_unlock(&devfreq_lock
);
97 * partition_enable_opps() - disable all opps above a given state
98 * @dfc: Pointer to devfreq we are operating on
99 * @cdev_state: cooling device state we're setting
101 * Go through the OPPs of the device, enabling all OPPs until
102 * @cdev_state and disabling those frequencies above it.
104 static int partition_enable_opps(struct devfreq_cooling_device
*dfc
,
105 unsigned long cdev_state
)
108 struct device
*dev
= dfc
->devfreq
->dev
.parent
;
110 for (i
= 0; i
< dfc
->freq_table_size
; i
++) {
111 struct dev_pm_opp
*opp
;
113 unsigned int freq
= dfc
->freq_table
[i
];
114 bool want_enable
= i
>= cdev_state
? true : false;
117 opp
= dev_pm_opp_find_freq_exact(dev
, freq
, !want_enable
);
120 if (PTR_ERR(opp
) == -ERANGE
)
122 else if (IS_ERR(opp
))
126 ret
= dev_pm_opp_enable(dev
, freq
);
128 ret
= dev_pm_opp_disable(dev
, freq
);
137 static int devfreq_cooling_get_max_state(struct thermal_cooling_device
*cdev
,
138 unsigned long *state
)
140 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
142 *state
= dfc
->freq_table_size
- 1;
147 static int devfreq_cooling_get_cur_state(struct thermal_cooling_device
*cdev
,
148 unsigned long *state
)
150 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
152 *state
= dfc
->cooling_state
;
157 static int devfreq_cooling_set_cur_state(struct thermal_cooling_device
*cdev
,
160 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
161 struct devfreq
*df
= dfc
->devfreq
;
162 struct device
*dev
= df
->dev
.parent
;
165 if (state
== dfc
->cooling_state
)
168 dev_dbg(dev
, "Setting cooling state %lu\n", state
);
170 if (state
>= dfc
->freq_table_size
)
173 ret
= partition_enable_opps(dfc
, state
);
177 dfc
->cooling_state
= state
;
183 * freq_get_state() - get the cooling state corresponding to a frequency
184 * @dfc: Pointer to devfreq cooling device
185 * @freq: frequency in Hz
187 * Return: the cooling state associated with the @freq, or
188 * THERMAL_CSTATE_INVALID if it wasn't found.
191 freq_get_state(struct devfreq_cooling_device
*dfc
, unsigned long freq
)
195 for (i
= 0; i
< dfc
->freq_table_size
; i
++) {
196 if (dfc
->freq_table
[i
] == freq
)
200 return THERMAL_CSTATE_INVALID
;
204 * get_static_power() - calculate the static power
205 * @dfc: Pointer to devfreq cooling device
206 * @freq: Frequency in Hz
208 * Calculate the static power in milliwatts using the supplied
209 * get_static_power(). The current voltage is calculated using the
210 * OPP library. If no get_static_power() was supplied, assume the
211 * static power is negligible.
214 get_static_power(struct devfreq_cooling_device
*dfc
, unsigned long freq
)
216 struct devfreq
*df
= dfc
->devfreq
;
217 struct device
*dev
= df
->dev
.parent
;
218 unsigned long voltage
;
219 struct dev_pm_opp
*opp
;
221 if (!dfc
->power_ops
->get_static_power
)
226 opp
= dev_pm_opp_find_freq_exact(dev
, freq
, true);
227 if (IS_ERR(opp
) && (PTR_ERR(opp
) == -ERANGE
))
228 opp
= dev_pm_opp_find_freq_exact(dev
, freq
, false);
230 voltage
= dev_pm_opp_get_voltage(opp
) / 1000; /* mV */
235 dev_warn_ratelimited(dev
,
236 "Failed to get voltage for frequency %lu: %ld\n",
237 freq
, IS_ERR(opp
) ? PTR_ERR(opp
) : 0);
241 return dfc
->power_ops
->get_static_power(voltage
);
245 * get_dynamic_power - calculate the dynamic power
246 * @dfc: Pointer to devfreq cooling device
247 * @freq: Frequency in Hz
248 * @voltage: Voltage in millivolts
250 * Calculate the dynamic power in milliwatts consumed by the device at
251 * frequency @freq and voltage @voltage. If the get_dynamic_power()
252 * was supplied as part of the devfreq_cooling_power struct, then that
253 * function is used. Otherwise, a simple power model (Pdyn = Coeff *
254 * Voltage^2 * Frequency) is used.
257 get_dynamic_power(struct devfreq_cooling_device
*dfc
, unsigned long freq
,
258 unsigned long voltage
)
262 struct devfreq_cooling_power
*dfc_power
= dfc
->power_ops
;
264 if (dfc_power
->get_dynamic_power
)
265 return dfc_power
->get_dynamic_power(freq
, voltage
);
267 freq_mhz
= freq
/ 1000000;
268 power
= (u64
)dfc_power
->dyn_power_coeff
* freq_mhz
* voltage
* voltage
;
269 do_div(power
, 1000000000);
274 static int devfreq_cooling_get_requested_power(struct thermal_cooling_device
*cdev
,
275 struct thermal_zone_device
*tz
,
278 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
279 struct devfreq
*df
= dfc
->devfreq
;
280 struct devfreq_dev_status
*status
= &df
->last_status
;
282 unsigned long freq
= status
->current_frequency
;
283 u32 dyn_power
, static_power
;
285 /* Get dynamic power for state */
286 state
= freq_get_state(dfc
, freq
);
287 if (state
== THERMAL_CSTATE_INVALID
)
290 dyn_power
= dfc
->power_table
[state
];
292 /* Scale dynamic power for utilization */
293 dyn_power
= (dyn_power
* status
->busy_time
) / status
->total_time
;
295 /* Get static power */
296 static_power
= get_static_power(dfc
, freq
);
298 trace_thermal_power_devfreq_get_power(cdev
, status
, freq
, dyn_power
,
301 *power
= dyn_power
+ static_power
;
306 static int devfreq_cooling_state2power(struct thermal_cooling_device
*cdev
,
307 struct thermal_zone_device
*tz
,
311 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
315 if (state
< 0 || state
>= dfc
->freq_table_size
)
318 freq
= dfc
->freq_table
[state
];
319 static_power
= get_static_power(dfc
, freq
);
321 *power
= dfc
->power_table
[state
] + static_power
;
325 static int devfreq_cooling_power2state(struct thermal_cooling_device
*cdev
,
326 struct thermal_zone_device
*tz
,
327 u32 power
, unsigned long *state
)
329 struct devfreq_cooling_device
*dfc
= cdev
->devdata
;
330 struct devfreq
*df
= dfc
->devfreq
;
331 struct devfreq_dev_status
*status
= &df
->last_status
;
332 unsigned long freq
= status
->current_frequency
;
333 unsigned long busy_time
;
338 static_power
= get_static_power(dfc
, freq
);
340 dyn_power
= power
- static_power
;
341 dyn_power
= dyn_power
> 0 ? dyn_power
: 0;
343 /* Scale dynamic power for utilization */
344 busy_time
= status
->busy_time
?: 1;
345 dyn_power
= (dyn_power
* status
->total_time
) / busy_time
;
348 * Find the first cooling state that is within the power
349 * budget for dynamic power.
351 for (i
= 0; i
< dfc
->freq_table_size
- 1; i
++)
352 if (dyn_power
>= dfc
->power_table
[i
])
356 trace_thermal_power_devfreq_limit(cdev
, freq
, *state
, power
);
360 static struct thermal_cooling_device_ops devfreq_cooling_ops
= {
361 .get_max_state
= devfreq_cooling_get_max_state
,
362 .get_cur_state
= devfreq_cooling_get_cur_state
,
363 .set_cur_state
= devfreq_cooling_set_cur_state
,
367 * devfreq_cooling_gen_tables() - Generate power and freq tables.
368 * @dfc: Pointer to devfreq cooling device.
370 * Generate power and frequency tables: the power table hold the
371 * device's maximum power usage at each cooling state (OPP). The
372 * static and dynamic power using the appropriate voltage and
373 * frequency for the state, is acquired from the struct
374 * devfreq_cooling_power, and summed to make the maximum power draw.
376 * The frequency table holds the frequencies in descending order.
377 * That way its indexed by cooling device state.
379 * The tables are malloced, and pointers put in dfc. They must be
380 * freed when unregistering the devfreq cooling device.
382 * Return: 0 on success, negative error code on failure.
384 static int devfreq_cooling_gen_tables(struct devfreq_cooling_device
*dfc
)
386 struct devfreq
*df
= dfc
->devfreq
;
387 struct device
*dev
= df
->dev
.parent
;
390 u32
*power_table
= NULL
;
394 num_opps
= dev_pm_opp_get_opp_count(dev
);
396 if (dfc
->power_ops
) {
397 power_table
= kcalloc(num_opps
, sizeof(*power_table
),
403 freq_table
= kcalloc(num_opps
, sizeof(*freq_table
),
407 goto free_power_table
;
410 for (i
= 0, freq
= ULONG_MAX
; i
< num_opps
; i
++, freq
--) {
411 unsigned long power_dyn
, voltage
;
412 struct dev_pm_opp
*opp
;
416 opp
= dev_pm_opp_find_freq_floor(dev
, &freq
);
423 voltage
= dev_pm_opp_get_voltage(opp
) / 1000; /* mV */
427 if (dfc
->power_ops
) {
428 power_dyn
= get_dynamic_power(dfc
, freq
, voltage
);
430 dev_dbg(dev
, "Dynamic power table: %lu MHz @ %lu mV: %lu = %lu mW\n",
431 freq
/ 1000000, voltage
, power_dyn
, power_dyn
);
433 power_table
[i
] = power_dyn
;
436 freq_table
[i
] = freq
;
440 dfc
->power_table
= power_table
;
442 dfc
->freq_table
= freq_table
;
443 dfc
->freq_table_size
= num_opps
;
456 * of_devfreq_cooling_register_power() - Register devfreq cooling device,
457 * with OF and power information.
458 * @np: Pointer to OF device_node.
459 * @df: Pointer to devfreq device.
460 * @dfc_power: Pointer to devfreq_cooling_power.
462 * Register a devfreq cooling device. The available OPPs must be
463 * registered on the device.
465 * If @dfc_power is provided, the cooling device is registered with the
466 * power extensions. For the power extensions to work correctly,
467 * devfreq should use the simple_ondemand governor, other governors
468 * are not currently supported.
470 struct thermal_cooling_device
*
471 of_devfreq_cooling_register_power(struct device_node
*np
, struct devfreq
*df
,
472 struct devfreq_cooling_power
*dfc_power
)
474 struct thermal_cooling_device
*cdev
;
475 struct devfreq_cooling_device
*dfc
;
476 char dev_name
[THERMAL_NAME_LENGTH
];
479 dfc
= kzalloc(sizeof(*dfc
), GFP_KERNEL
);
481 return ERR_PTR(-ENOMEM
);
486 dfc
->power_ops
= dfc_power
;
488 devfreq_cooling_ops
.get_requested_power
=
489 devfreq_cooling_get_requested_power
;
490 devfreq_cooling_ops
.state2power
= devfreq_cooling_state2power
;
491 devfreq_cooling_ops
.power2state
= devfreq_cooling_power2state
;
494 err
= devfreq_cooling_gen_tables(dfc
);
498 err
= get_idr(&devfreq_idr
, &dfc
->id
);
502 snprintf(dev_name
, sizeof(dev_name
), "thermal-devfreq-%d", dfc
->id
);
504 cdev
= thermal_of_cooling_device_register(np
, dev_name
, dfc
,
505 &devfreq_cooling_ops
);
508 dev_err(df
->dev
.parent
,
509 "Failed to register devfreq cooling device (%d)\n",
519 release_idr(&devfreq_idr
, dfc
->id
);
521 kfree(dfc
->power_table
);
522 kfree(dfc
->freq_table
);
528 EXPORT_SYMBOL_GPL(of_devfreq_cooling_register_power
);
531 * of_devfreq_cooling_register() - Register devfreq cooling device,
532 * with OF information.
533 * @np: Pointer to OF device_node.
534 * @df: Pointer to devfreq device.
536 struct thermal_cooling_device
*
537 of_devfreq_cooling_register(struct device_node
*np
, struct devfreq
*df
)
539 return of_devfreq_cooling_register_power(np
, df
, NULL
);
541 EXPORT_SYMBOL_GPL(of_devfreq_cooling_register
);
544 * devfreq_cooling_register() - Register devfreq cooling device.
545 * @df: Pointer to devfreq device.
547 struct thermal_cooling_device
*devfreq_cooling_register(struct devfreq
*df
)
549 return of_devfreq_cooling_register(NULL
, df
);
551 EXPORT_SYMBOL_GPL(devfreq_cooling_register
);
554 * devfreq_cooling_unregister() - Unregister devfreq cooling device.
555 * @dfc: Pointer to devfreq cooling device to unregister.
557 void devfreq_cooling_unregister(struct thermal_cooling_device
*cdev
)
559 struct devfreq_cooling_device
*dfc
;
566 thermal_cooling_device_unregister(dfc
->cdev
);
567 release_idr(&devfreq_idr
, dfc
->id
);
568 kfree(dfc
->power_table
);
569 kfree(dfc
->freq_table
);
573 EXPORT_SYMBOL_GPL(devfreq_cooling_unregister
);