sched: retune wake granularity
[wrt350n-kernel.git] / arch / powerpc / kernel / smp.c
blobbe35ffae10f0726b5e2ac3746b80f464f976222c
1 /*
2 * SMP support for ppc.
4 * Written by Cort Dougan (cort@cs.nmt.edu) borrowing a great
5 * deal of code from the sparc and intel versions.
7 * Copyright (C) 1999 Cort Dougan <cort@cs.nmt.edu>
9 * PowerPC-64 Support added by Dave Engebretsen, Peter Bergner, and
10 * Mike Corrigan {engebret|bergner|mikec}@us.ibm.com
12 * This program is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU General Public License
14 * as published by the Free Software Foundation; either version
15 * 2 of the License, or (at your option) any later version.
18 #undef DEBUG
20 #include <linux/kernel.h>
21 #include <linux/module.h>
22 #include <linux/sched.h>
23 #include <linux/smp.h>
24 #include <linux/interrupt.h>
25 #include <linux/delay.h>
26 #include <linux/init.h>
27 #include <linux/spinlock.h>
28 #include <linux/cache.h>
29 #include <linux/err.h>
30 #include <linux/sysdev.h>
31 #include <linux/cpu.h>
32 #include <linux/notifier.h>
33 #include <linux/topology.h>
35 #include <asm/ptrace.h>
36 #include <asm/atomic.h>
37 #include <asm/irq.h>
38 #include <asm/page.h>
39 #include <asm/pgtable.h>
40 #include <asm/prom.h>
41 #include <asm/smp.h>
42 #include <asm/time.h>
43 #include <asm/machdep.h>
44 #include <asm/cputable.h>
45 #include <asm/system.h>
46 #include <asm/mpic.h>
47 #include <asm/vdso_datapage.h>
48 #ifdef CONFIG_PPC64
49 #include <asm/paca.h>
50 #endif
/*
 * DBG(): debug tracing helper.  Expands to nothing unless DEBUG is defined,
 * in which case the arguments are forwarded to udbg_printf().
 */
#ifndef DEBUG
#define DBG(fmt...)
#else
#include <asm/udbg.h>
#define DBG(fmt...) udbg_printf(fmt)
#endif
59 int smp_hw_index[NR_CPUS];
60 struct thread_info *secondary_ti;
62 cpumask_t cpu_possible_map = CPU_MASK_NONE;
63 cpumask_t cpu_online_map = CPU_MASK_NONE;
64 DEFINE_PER_CPU(cpumask_t, cpu_sibling_map) = CPU_MASK_NONE;
66 EXPORT_SYMBOL(cpu_online_map);
67 EXPORT_SYMBOL(cpu_possible_map);
68 EXPORT_PER_CPU_SYMBOL(cpu_sibling_map);
70 /* SMP operations for this machine */
71 struct smp_ops_t *smp_ops;
73 static volatile unsigned int cpu_callin_map[NR_CPUS];
75 void smp_call_function_interrupt(void);
77 int smt_enabled_at_boot = 1;
79 static int ipi_fail_ok;
81 static void (*crash_ipi_function_ptr)(struct pt_regs *) = NULL;
83 #ifdef CONFIG_PPC64
84 void __devinit smp_generic_kick_cpu(int nr)
86 BUG_ON(nr < 0 || nr >= NR_CPUS);
89 * The processor is currently spinning, waiting for the
90 * cpu_start field to become non-zero After we set cpu_start,
91 * the processor will continue on to secondary_start
93 paca[nr].cpu_start = 1;
94 smp_mb();
96 #endif
98 void smp_message_recv(int msg)
100 switch(msg) {
101 case PPC_MSG_CALL_FUNCTION:
102 smp_call_function_interrupt();
103 break;
104 case PPC_MSG_RESCHEDULE:
105 /* XXX Do we have to do this? */
106 set_need_resched();
107 break;
108 case PPC_MSG_DEBUGGER_BREAK:
109 if (crash_ipi_function_ptr) {
110 crash_ipi_function_ptr(get_irq_regs());
111 break;
113 #ifdef CONFIG_DEBUGGER
114 debugger_ipi(get_irq_regs());
115 break;
116 #endif /* CONFIG_DEBUGGER */
117 /* FALLTHROUGH */
118 default:
119 printk("SMP %d: smp_message_recv(): unknown msg %d\n",
120 smp_processor_id(), msg);
121 break;
125 void smp_send_reschedule(int cpu)
127 if (likely(smp_ops))
128 smp_ops->message_pass(cpu, PPC_MSG_RESCHEDULE);
131 #ifdef CONFIG_DEBUGGER
132 void smp_send_debugger_break(int cpu)
134 if (likely(smp_ops))
135 smp_ops->message_pass(cpu, PPC_MSG_DEBUGGER_BREAK);
137 #endif
139 #ifdef CONFIG_KEXEC
140 void crash_send_ipi(void (*crash_ipi_callback)(struct pt_regs *))
142 crash_ipi_function_ptr = crash_ipi_callback;
143 if (crash_ipi_callback && smp_ops) {
144 mb();
145 smp_ops->message_pass(MSG_ALL_BUT_SELF, PPC_MSG_DEBUGGER_BREAK);
148 #endif
/*
 * Park the calling CPU: disable local interrupts and spin forever.
 * @dummy is unused; the signature matches the smp_call_function callback.
 */
static void stop_this_cpu(void *dummy)
{
	local_irq_disable();
	for (;;)
		;
}
158 * Structure and data for smp_call_function(). This is designed to minimise
159 * static memory requirements. It also looks cleaner.
160 * Stolen from the i386 version.
162 static __cacheline_aligned_in_smp DEFINE_SPINLOCK(call_lock);
164 static struct call_data_struct {
165 void (*func) (void *info);
166 void *info;
167 atomic_t started;
168 atomic_t finished;
169 int wait;
170 } *call_data;
172 /* delay of at least 8 seconds */
173 #define SMP_CALL_TIMEOUT 8
176 * These functions send a 'generic call function' IPI to other online
177 * CPUS in the system.
179 * [SUMMARY] Run a function on other CPUs.
180 * <func> The function to run. This must be fast and non-blocking.
181 * <info> An arbitrary pointer to pass to the function.
182 * <nonatomic> currently unused.
183 * <wait> If true, wait (atomically) until function has completed on other CPUs.
184 * [RETURNS] 0 on success, else a negative status code. Does not return until
185 * remote CPUs are nearly ready to execute <<func>> or are or have executed.
186 * <map> is a cpu map of the cpus to send IPI to.
188 * You must not call this function with disabled interrupts or from a
189 * hardware interrupt handler or from a bottom half handler.
191 static int __smp_call_function_map(void (*func) (void *info), void *info,
192 int nonatomic, int wait, cpumask_t map)
194 struct call_data_struct data;
195 int ret = -1, num_cpus;
196 int cpu;
197 u64 timeout;
199 if (unlikely(smp_ops == NULL))
200 return ret;
202 data.func = func;
203 data.info = info;
204 atomic_set(&data.started, 0);
205 data.wait = wait;
206 if (wait)
207 atomic_set(&data.finished, 0);
209 /* remove 'self' from the map */
210 if (cpu_isset(smp_processor_id(), map))
211 cpu_clear(smp_processor_id(), map);
213 /* sanity check the map, remove any non-online processors. */
214 cpus_and(map, map, cpu_online_map);
216 num_cpus = cpus_weight(map);
217 if (!num_cpus)
218 goto done;
220 call_data = &data;
221 smp_wmb();
222 /* Send a message to all CPUs in the map */
223 for_each_cpu_mask(cpu, map)
224 smp_ops->message_pass(cpu, PPC_MSG_CALL_FUNCTION);
226 timeout = get_tb() + (u64) SMP_CALL_TIMEOUT * tb_ticks_per_sec;
228 /* Wait for indication that they have received the message */
229 while (atomic_read(&data.started) != num_cpus) {
230 HMT_low();
231 if (get_tb() >= timeout) {
232 printk("smp_call_function on cpu %d: other cpus not "
233 "responding (%d)\n", smp_processor_id(),
234 atomic_read(&data.started));
235 if (!ipi_fail_ok)
236 debugger(NULL);
237 goto out;
241 /* optionally wait for the CPUs to complete */
242 if (wait) {
243 while (atomic_read(&data.finished) != num_cpus) {
244 HMT_low();
245 if (get_tb() >= timeout) {
246 printk("smp_call_function on cpu %d: other "
247 "cpus not finishing (%d/%d)\n",
248 smp_processor_id(),
249 atomic_read(&data.finished),
250 atomic_read(&data.started));
251 debugger(NULL);
252 goto out;
257 done:
258 ret = 0;
260 out:
261 call_data = NULL;
262 HMT_medium();
263 return ret;
266 static int __smp_call_function(void (*func)(void *info), void *info,
267 int nonatomic, int wait)
269 int ret;
270 spin_lock(&call_lock);
271 ret =__smp_call_function_map(func, info, nonatomic, wait,
272 cpu_online_map);
273 spin_unlock(&call_lock);
274 return ret;
/*
 * Public entry point: run @func(@info) on all other online CPUs.
 * Warns if called with interrupts disabled, since that can deadlock.
 * Returns 0 on success, a negative value otherwise.
 */
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
{
	/* Can deadlock when called with interrupts disabled */
	WARN_ON(irqs_disabled());

	return __smp_call_function(func, info, nonatomic, wait);
}
EXPORT_SYMBOL(smp_call_function);
287 int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
288 int nonatomic, int wait)
290 cpumask_t map = CPU_MASK_NONE;
291 int ret = 0;
293 /* Can deadlock when called with interrupts disabled */
294 WARN_ON(irqs_disabled());
296 if (!cpu_online(cpu))
297 return -EINVAL;
299 cpu_set(cpu, map);
300 if (cpu != get_cpu()) {
301 spin_lock(&call_lock);
302 ret = __smp_call_function_map(func, info, nonatomic, wait, map);
303 spin_unlock(&call_lock);
304 } else {
305 local_irq_disable();
306 func(info);
307 local_irq_enable();
309 put_cpu();
310 return ret;
312 EXPORT_SYMBOL(smp_call_function_single);
314 void smp_send_stop(void)
316 int nolock;
318 /* It's OK to fail sending the IPI, since the alternative is to
319 * be stuck forever waiting on the other CPU to take the interrupt.
321 * It's better to at least continue and go through reboot, since this
322 * function is usually called at panic or reboot time in the first
323 * place.
325 ipi_fail_ok = 1;
327 /* Don't deadlock in case we got called through panic */
328 nolock = !spin_trylock(&call_lock);
329 __smp_call_function_map(stop_this_cpu, NULL, 1, 0, cpu_online_map);
330 if (!nolock)
331 spin_unlock(&call_lock);
334 void smp_call_function_interrupt(void)
336 void (*func) (void *info);
337 void *info;
338 int wait;
340 /* call_data will be NULL if the sender timed out while
341 * waiting on us to receive the call.
343 if (!call_data)
344 return;
346 func = call_data->func;
347 info = call_data->info;
348 wait = call_data->wait;
350 if (!wait)
351 smp_mb__before_atomic_inc();
354 * Notify initiating CPU that I've grabbed the data and am
355 * about to execute the function
357 atomic_inc(&call_data->started);
359 * At this point the info structure may be out of scope unless wait==1
361 (*func)(info);
362 if (wait) {
363 smp_mb__before_atomic_inc();
364 atomic_inc(&call_data->finished);
368 extern struct gettimeofday_struct do_gtod;
370 struct thread_info *current_set[NR_CPUS];
372 DECLARE_PER_CPU(unsigned int, pvr);
374 static void __devinit smp_store_cpu_info(int id)
376 per_cpu(pvr, id) = mfspr(SPRN_PVR);
379 static void __init smp_create_idle(unsigned int cpu)
381 struct task_struct *p;
383 /* create a process for the processor */
384 p = fork_idle(cpu);
385 if (IS_ERR(p))
386 panic("failed fork for CPU %u: %li", cpu, PTR_ERR(p));
387 #ifdef CONFIG_PPC64
388 paca[cpu].__current = p;
389 #endif
390 current_set[cpu] = task_thread_info(p);
391 task_thread_info(p)->cpu = cpu;
394 void __init smp_prepare_cpus(unsigned int max_cpus)
396 unsigned int cpu;
398 DBG("smp_prepare_cpus\n");
401 * setup_cpu may need to be called on the boot cpu. We havent
402 * spun any cpus up but lets be paranoid.
404 BUG_ON(boot_cpuid != smp_processor_id());
406 /* Fixup boot cpu */
407 smp_store_cpu_info(boot_cpuid);
408 cpu_callin_map[boot_cpuid] = 1;
410 if (smp_ops)
411 max_cpus = smp_ops->probe();
412 else
413 max_cpus = 1;
415 smp_space_timers(max_cpus);
417 for_each_possible_cpu(cpu)
418 if (cpu != boot_cpuid)
419 smp_create_idle(cpu);
422 void __devinit smp_prepare_boot_cpu(void)
424 BUG_ON(smp_processor_id() != boot_cpuid);
426 cpu_set(boot_cpuid, cpu_online_map);
427 #ifdef CONFIG_PPC64
428 paca[boot_cpuid].__current = current;
429 #endif
430 current_set[boot_cpuid] = task_thread_info(current);
433 #ifdef CONFIG_HOTPLUG_CPU
434 /* State of each CPU during hotplug phases */
435 DEFINE_PER_CPU(int, cpu_state) = { 0 };
437 int generic_cpu_disable(void)
439 unsigned int cpu = smp_processor_id();
441 if (cpu == boot_cpuid)
442 return -EBUSY;
444 cpu_clear(cpu, cpu_online_map);
445 #ifdef CONFIG_PPC64
446 vdso_data->processorCount--;
447 fixup_irqs(cpu_online_map);
448 #endif
449 return 0;
452 int generic_cpu_enable(unsigned int cpu)
454 /* Do the normal bootup if we haven't
455 * already bootstrapped. */
456 if (system_state != SYSTEM_RUNNING)
457 return -ENOSYS;
459 /* get the target out of it's holding state */
460 per_cpu(cpu_state, cpu) = CPU_UP_PREPARE;
461 smp_wmb();
463 while (!cpu_online(cpu))
464 cpu_relax();
466 #ifdef CONFIG_PPC64
467 fixup_irqs(cpu_online_map);
468 /* counter the irq disable in fixup_irqs */
469 local_irq_enable();
470 #endif
471 return 0;
474 void generic_cpu_die(unsigned int cpu)
476 int i;
478 for (i = 0; i < 100; i++) {
479 smp_rmb();
480 if (per_cpu(cpu_state, cpu) == CPU_DEAD)
481 return;
482 msleep(100);
484 printk(KERN_ERR "CPU%d didn't die...\n", cpu);
487 void generic_mach_cpu_die(void)
489 unsigned int cpu;
491 local_irq_disable();
492 cpu = smp_processor_id();
493 printk(KERN_DEBUG "CPU%d offline\n", cpu);
494 __get_cpu_var(cpu_state) = CPU_DEAD;
495 smp_wmb();
496 while (__get_cpu_var(cpu_state) != CPU_UP_PREPARE)
497 cpu_relax();
498 cpu_set(cpu, cpu_online_map);
499 local_irq_enable();
501 #endif
503 static int __devinit cpu_enable(unsigned int cpu)
505 if (smp_ops && smp_ops->cpu_enable)
506 return smp_ops->cpu_enable(cpu);
508 return -ENOSYS;
511 int __cpuinit __cpu_up(unsigned int cpu)
513 int c;
515 secondary_ti = current_set[cpu];
516 if (!cpu_enable(cpu))
517 return 0;
519 if (smp_ops == NULL ||
520 (smp_ops->cpu_bootable && !smp_ops->cpu_bootable(cpu)))
521 return -EINVAL;
523 /* Make sure callin-map entry is 0 (can be leftover a CPU
524 * hotplug
526 cpu_callin_map[cpu] = 0;
528 /* The information for processor bringup must
529 * be written out to main store before we release
530 * the processor.
532 smp_mb();
534 /* wake up cpus */
535 DBG("smp: kicking cpu %d\n", cpu);
536 smp_ops->kick_cpu(cpu);
539 * wait to see if the cpu made a callin (is actually up).
540 * use this value that I found through experimentation.
541 * -- Cort
543 if (system_state < SYSTEM_RUNNING)
544 for (c = 50000; c && !cpu_callin_map[cpu]; c--)
545 udelay(100);
546 #ifdef CONFIG_HOTPLUG_CPU
547 else
549 * CPUs can take much longer to come up in the
550 * hotplug case. Wait five seconds.
552 for (c = 25; c && !cpu_callin_map[cpu]; c--) {
553 msleep(200);
555 #endif
557 if (!cpu_callin_map[cpu]) {
558 printk("Processor %u is stuck.\n", cpu);
559 return -ENOENT;
562 printk("Processor %u found.\n", cpu);
564 if (smp_ops->give_timebase)
565 smp_ops->give_timebase();
567 /* Wait until cpu puts itself in the online map */
568 while (!cpu_online(cpu))
569 cpu_relax();
571 return 0;
575 /* Activate a secondary processor. */
576 int __devinit start_secondary(void *unused)
578 unsigned int cpu = smp_processor_id();
580 atomic_inc(&init_mm.mm_count);
581 current->active_mm = &init_mm;
583 smp_store_cpu_info(cpu);
584 set_dec(tb_ticks_per_jiffy);
585 preempt_disable();
586 cpu_callin_map[cpu] = 1;
588 smp_ops->setup_cpu(cpu);
589 if (smp_ops->take_timebase)
590 smp_ops->take_timebase();
592 if (system_state > SYSTEM_BOOTING)
593 snapshot_timebase();
595 secondary_cpu_time_init();
597 spin_lock(&call_lock);
598 cpu_set(cpu, cpu_online_map);
599 spin_unlock(&call_lock);
601 local_irq_enable();
603 cpu_idle();
604 return 0;
/*
 * Profiling timer setup hook.  This implementation does nothing with
 * @multiplier and always returns 0.
 */
int setup_profiling_timer(unsigned int multiplier)
{
	return 0;
}
612 void __init smp_cpus_done(unsigned int max_cpus)
614 cpumask_t old_mask;
616 /* We want the setup_cpu() here to be called from CPU 0, but our
617 * init thread may have been "borrowed" by another CPU in the meantime
618 * se we pin us down to CPU 0 for a short while
620 old_mask = current->cpus_allowed;
621 set_cpus_allowed(current, cpumask_of_cpu(boot_cpuid));
623 if (smp_ops)
624 smp_ops->setup_cpu(boot_cpuid);
626 set_cpus_allowed(current, old_mask);
628 snapshot_timebases();
630 dump_numa_cpu_topology();
633 #ifdef CONFIG_HOTPLUG_CPU
634 int __cpu_disable(void)
636 if (smp_ops->cpu_disable)
637 return smp_ops->cpu_disable();
639 return -ENOSYS;
642 void __cpu_die(unsigned int cpu)
644 if (smp_ops->cpu_die)
645 smp_ops->cpu_die(cpu);
647 #endif