2 * Idle daemon for PowerPC. Idle daemon will handle any action
3 * that needs to be taken when the system becomes idle.
5 * Originally Written by Cort Dougan (cort@cs.nmt.edu)
7 * iSeries supported added by Mike Corrigan <mikejc@us.ibm.com>
9 * Additional shared processor, SMT, and firmware support
10 * Copyright (c) 2003 Dave Engebretsen <engebret@us.ibm.com>
12 * This program is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU General Public License
14 * as published by the Free Software Foundation; either version
15 * 2 of the License, or (at your option) any later version.
18 #include <linux/config.h>
19 #include <linux/sched.h>
20 #include <linux/kernel.h>
21 #include <linux/smp.h>
22 #include <linux/cpu.h>
23 #include <linux/module.h>
24 #include <linux/sysctl.h>
25 #include <linux/smp.h>
27 #include <asm/system.h>
28 #include <asm/processor.h>
30 #include <asm/cputable.h>
32 #include <asm/iSeries/HvCall.h>
33 #include <asm/iSeries/ItLpQueue.h>
34 #include <asm/plpar_wrappers.h>
35 #include <asm/systemcfg.h>
37 extern void power4_idle(void);
39 static int (*idle_loop
)(void);
41 #ifdef CONFIG_PPC_ISERIES
42 static unsigned long maxYieldTime
= 0;
43 static unsigned long minYieldTime
= 0xffffffffffffffffUL
;
45 static void yield_shared_processor(void)
48 unsigned long yieldTime
;
50 HvCall_setEnabledInterrupts(HvCall_MaskIPI
|
56 /* Compute future tb value when yield should expire */
57 HvCall_yieldProcessor(HvCall_YieldTimed
, tb
+tb_ticks_per_jiffy
);
59 yieldTime
= get_tb() - tb
;
60 if (yieldTime
> maxYieldTime
)
61 maxYieldTime
= yieldTime
;
63 if (yieldTime
< minYieldTime
)
64 minYieldTime
= yieldTime
;
67 * The decrementer stops during the yield. Force a fake decrementer
68 * here and let the timer_interrupt code sort out the actual time.
70 get_paca()->lppaca
.int_dword
.fields
.decr_int
= 1;
71 process_iSeries_events();
74 static int iSeries_idle(void)
76 struct paca_struct
*lpaca
;
80 /* ensure iSeries run light will be out when idle */
81 clear_thread_flag(TIF_RUN_LIGHT
);
89 if (lpaca
->lppaca
.shared_proc
) {
90 if (ItLpQueue_isLpIntPending(lpaca
->lpqueue_ptr
))
91 process_iSeries_events();
93 yield_shared_processor();
95 oldval
= test_and_clear_thread_flag(TIF_NEED_RESCHED
);
98 set_thread_flag(TIF_POLLING_NRFLAG
);
100 while (!need_resched()) {
102 if (ItLpQueue_isLpIntPending(lpaca
->lpqueue_ptr
))
103 process_iSeries_events();
108 clear_thread_flag(TIF_POLLING_NRFLAG
);
122 static int default_idle(void)
125 unsigned int cpu
= smp_processor_id();
128 oldval
= test_and_clear_thread_flag(TIF_NEED_RESCHED
);
131 set_thread_flag(TIF_POLLING_NRFLAG
);
133 while (!need_resched() && !cpu_is_offline(cpu
)) {
136 * Go into low thread priority and possibly
144 clear_thread_flag(TIF_POLLING_NRFLAG
);
150 if (cpu_is_offline(cpu
) && system_state
== SYSTEM_RUNNING
)
157 #ifdef CONFIG_PPC_PSERIES
159 DECLARE_PER_CPU(unsigned long, smt_snooze_delay
);
161 int dedicated_idle(void)
164 struct paca_struct
*lpaca
= get_paca(), *ppaca
;
165 unsigned long start_snooze
;
166 unsigned long *smt_snooze_delay
= &__get_cpu_var(smt_snooze_delay
);
167 unsigned int cpu
= smp_processor_id();
169 ppaca
= &paca
[cpu
^ 1];
173 * Indicate to the HV that we are idle. Now would be
174 * a good time to find other work to dispatch.
176 lpaca
->lppaca
.idle
= 1;
178 oldval
= test_and_clear_thread_flag(TIF_NEED_RESCHED
);
180 set_thread_flag(TIF_POLLING_NRFLAG
);
181 start_snooze
= __get_tb() +
182 *smt_snooze_delay
* tb_ticks_per_usec
;
183 while (!need_resched() && !cpu_is_offline(cpu
)) {
185 * Go into low thread priority and possibly
191 if (*smt_snooze_delay
== 0 ||
192 __get_tb() < start_snooze
)
197 if (!(ppaca
->lppaca
.idle
)) {
201 * We are about to sleep the thread
202 * and so wont be polling any
205 clear_thread_flag(TIF_POLLING_NRFLAG
);
208 * SMT dynamic mode. Cede will result
209 * in this thread going dormant, if the
210 * partner thread is still doing work.
211 * Thread wakes up if partner goes idle,
212 * an interrupt is presented, or a prod
213 * occurs. Returning from the cede
214 * enables external interrupts.
222 * Give the HV an opportunity at the
223 * processor, since we are not doing
230 clear_thread_flag(TIF_POLLING_NRFLAG
);
236 lpaca
->lppaca
.idle
= 0;
238 if (cpu_is_offline(cpu
) && system_state
== SYSTEM_RUNNING
)
244 static int shared_idle(void)
246 struct paca_struct
*lpaca
= get_paca();
247 unsigned int cpu
= smp_processor_id();
251 * Indicate to the HV that we are idle. Now would be
252 * a good time to find other work to dispatch.
254 lpaca
->lppaca
.idle
= 1;
256 while (!need_resched() && !cpu_is_offline(cpu
)) {
260 * Yield the processor to the hypervisor. We return if
261 * an external interrupt occurs (which are driven prior
262 * to returning here) or if a prod occurs from another
263 * processor. When returning here, external interrupts
266 * Check need_resched() again with interrupts disabled
276 lpaca
->lppaca
.idle
= 0;
278 if (cpu_is_offline(smp_processor_id()) &&
279 system_state
== SYSTEM_RUNNING
)
286 #endif /* CONFIG_PPC_PSERIES */
288 static int native_idle(void)
291 /* check CPU type here */
297 if (cpu_is_offline(_smp_processor_id()) &&
298 system_state
== SYSTEM_RUNNING
)
304 #endif /* CONFIG_PPC_ISERIES */
315 * Register the sysctl to set/clear powersave_nap.
317 static ctl_table powersave_nap_ctl_table
[]={
319 .ctl_name
= KERN_PPC_POWERSAVE_NAP
,
320 .procname
= "powersave-nap",
321 .data
= &powersave_nap
,
322 .maxlen
= sizeof(int),
324 .proc_handler
= &proc_dointvec
,
328 static ctl_table powersave_nap_sysctl_root
[] = {
329 { 1, "kernel", NULL
, 0, 0755, powersave_nap_ctl_table
, },
334 register_powersave_nap_sysctl(void)
336 register_sysctl_table(powersave_nap_sysctl_root
, 0);
340 __initcall(register_powersave_nap_sysctl
);
346 * Move that junk to each platform specific file, eventually define
347 * a pSeries_idle for shared processor stuff
349 #ifdef CONFIG_PPC_ISERIES
350 idle_loop
= iSeries_idle
;
353 idle_loop
= default_idle
;
355 #ifdef CONFIG_PPC_PSERIES
356 if (systemcfg
->platform
& PLATFORM_PSERIES
) {
357 if (cur_cpu_spec
->firmware_features
& FW_FEATURE_SPLPAR
) {
358 if (get_paca()->lppaca
.shared_proc
) {
359 printk(KERN_INFO
"Using shared processor idle loop\n");
360 idle_loop
= shared_idle
;
362 printk(KERN_INFO
"Using dedicated idle loop\n");
363 idle_loop
= dedicated_idle
;
366 printk(KERN_INFO
"Using default idle loop\n");
367 idle_loop
= default_idle
;
370 #endif /* CONFIG_PPC_PSERIES */
371 #ifndef CONFIG_PPC_ISERIES
372 if (systemcfg
->platform
== PLATFORM_POWERMAC
||
373 systemcfg
->platform
== PLATFORM_MAPLE
) {
374 printk(KERN_INFO
"Using native/NAP idle loop\n");
375 idle_loop
= native_idle
;
377 #endif /* CONFIG_PPC_ISERIES */