2 * This program is free software; you can redistribute it and/or
3 * modify it under the terms of the GNU General Public License
4 * as published by the Free Software Foundation; either version 2
5 * of the License, or (at your option) any later version.
7 * This program is distributed in the hope that it will be useful,
8 * but WITHOUT ANY WARRANTY; without even the implied warranty of
9 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10 * GNU General Public License for more details.
12 * You should have received a copy of the GNU General Public License
13 * along with this program; if not, write to the Free Software
14 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
16 * Copyright (C) 2000, 2001 Kanoj Sarcar
17 * Copyright (C) 2000, 2001 Ralf Baechle
18 * Copyright (C) 2000, 2001 Silicon Graphics, Inc.
19 * Copyright (C) 2000, 2001, 2003 Broadcom Corporation
21 #include <linux/cache.h>
22 #include <linux/delay.h>
23 #include <linux/init.h>
24 #include <linux/interrupt.h>
25 #include <linux/spinlock.h>
26 #include <linux/threads.h>
27 #include <linux/module.h>
28 #include <linux/time.h>
29 #include <linux/timex.h>
30 #include <linux/sched.h>
31 #include <linux/cpumask.h>
33 #include <asm/atomic.h>
35 #include <asm/processor.h>
36 #include <asm/system.h>
37 #include <asm/mmu_context.h>
40 cpumask_t phys_cpu_present_map
; /* Bitmask of available CPUs */
41 volatile cpumask_t cpu_callin_map
; /* Bitmask of started secondaries */
42 cpumask_t cpu_online_map
; /* Bitmask of currently online CPUs */
43 int __cpu_number_map
[NR_CPUS
]; /* Map physical to logical */
44 int __cpu_logical_map
[NR_CPUS
]; /* Map logical to physical */
46 EXPORT_SYMBOL(phys_cpu_present_map
);
47 EXPORT_SYMBOL(cpu_online_map
);
49 static void smp_tune_scheduling (void)
51 struct cache_desc
*cd
= ¤t_cpu_data
.scache
;
52 unsigned long cachesize
; /* kB */
53 unsigned long bandwidth
= 350; /* MB/s */
54 unsigned long cpu_khz
;
57 * Crude estimate until we actually meassure ...
59 cpu_khz
= loops_per_jiffy
* 2 * HZ
/ 1000;
62 * Rough estimation for SMP scheduling, this is the number of
63 * cycles it takes for a fully memory-limited process to flush
64 * the SMP-local cache.
66 * (For a P5 this pretty much means we will choose another idle
67 * CPU almost always at wakeup time (this is due to the small
68 * L1 cache), on PIIs it's around 50-100 usecs, depending on
74 cachesize
= cd
->linesz
* cd
->sets
* cd
->ways
;
77 extern void __init
calibrate_delay(void);
78 extern ATTRIB_NORET
void cpu_idle(void);
81 * First C code run on the secondary CPUs after being started up by
84 asmlinkage
void start_secondary(void)
86 unsigned int cpu
= smp_processor_id();
91 prom_init_secondary();
94 * XXX parity protection should be folded in here when it's converted
95 * to an option instead of something based on .cputype
99 cpu_data
[cpu
].udelay_val
= loops_per_jiffy
;
103 cpu_set(cpu
, cpu_callin_map
);
108 DEFINE_SPINLOCK(smp_call_lock
);
110 struct call_data_struct
*call_data
;
113 * Run a function on all other CPUs.
114 * <func> The function to run. This must be fast and non-blocking.
115 * <info> An arbitrary pointer to pass to the function.
116 * <retry> If true, keep retrying until ready.
117 * <wait> If true, wait until function has completed on other CPUs.
118 * [RETURNS] 0 on success, else a negative status code.
120 * Does not return until remote CPUs are nearly ready to execute <func>
121 * or are or have executed.
123 * You must not call this function with disabled interrupts or from a
124 * hardware interrupt handler or from a bottom half handler.
126 int smp_call_function (void (*func
) (void *info
), void *info
, int retry
,
129 struct call_data_struct data
;
130 int i
, cpus
= num_online_cpus() - 1;
131 int cpu
= smp_processor_id();
136 /* Can deadlock when called with interrupts disabled */
137 WARN_ON(irqs_disabled());
141 atomic_set(&data
.started
, 0);
144 atomic_set(&data
.finished
, 0);
146 spin_lock(&smp_call_lock
);
150 /* Send a message to all other CPUs and wait for them to respond */
151 for (i
= 0; i
< NR_CPUS
; i
++)
152 if (cpu_online(i
) && i
!= cpu
)
153 core_send_ipi(i
, SMP_CALL_FUNCTION
);
155 /* Wait for response */
156 /* FIXME: lock-up detection, backtrace on lock-up */
157 while (atomic_read(&data
.started
) != cpus
)
161 while (atomic_read(&data
.finished
) != cpus
)
163 spin_unlock(&smp_call_lock
);
168 void smp_call_function_interrupt(void)
170 void (*func
) (void *info
) = call_data
->func
;
171 void *info
= call_data
->info
;
172 int wait
= call_data
->wait
;
175 * Notify initiating CPU that I've grabbed the data and am
176 * about to execute the function.
179 atomic_inc(&call_data
->started
);
182 * At this point the info structure may be out of scope unless wait==1.
190 atomic_inc(&call_data
->finished
);
194 static void stop_this_cpu(void *dummy
)
199 cpu_clear(smp_processor_id(), cpu_online_map
);
200 local_irq_enable(); /* May need to service _machine_restart IPI */
201 for (;;); /* Wait if available. */
204 void smp_send_stop(void)
206 smp_call_function(stop_this_cpu
, NULL
, 1, 0);
209 void __init
smp_cpus_done(unsigned int max_cpus
)
214 /* called from main before smp_init() */
215 void __init
smp_prepare_cpus(unsigned int max_cpus
)
217 cpu_data
[0].udelay_val
= loops_per_jiffy
;
218 init_new_context(current
, &init_mm
);
219 current_thread_info()->cpu
= 0;
220 smp_tune_scheduling();
221 prom_prepare_cpus(max_cpus
);
224 /* preload SMP state for boot cpu */
225 void __devinit
smp_prepare_boot_cpu(void)
228 * This assumes that bootup is always handled by the processor
229 * with the logic and physical number 0.
231 __cpu_number_map
[0] = 0;
232 __cpu_logical_map
[0] = 0;
233 cpu_set(0, phys_cpu_present_map
);
234 cpu_set(0, cpu_online_map
);
235 cpu_set(0, cpu_callin_map
);
239 * Startup the CPU with this logical number
241 static int __init
do_boot_cpu(int cpu
)
243 struct task_struct
*idle
;
246 * The following code is purely to make sure
247 * Linux can schedule processes on this slave.
249 idle
= fork_idle(cpu
);
251 panic("failed fork for CPU %d\n", cpu
);
253 prom_boot_secondary(cpu
, idle
);
256 while (!cpu_isset(cpu
, cpu_callin_map
))
259 cpu_set(cpu
, cpu_online_map
);
265 * Called once for each "cpu_possible(cpu)". Needs to spin up the cpu
266 * and keep control until "cpu_online(cpu)" is set. Note: cpu is
267 * physical, not logical.
269 int __devinit
__cpu_up(unsigned int cpu
)
273 /* Processor goes to start_secondary(), sets online flag */
274 ret
= do_boot_cpu(cpu
);
281 /* Not really SMP stuff ... */
282 int setup_profiling_timer(unsigned int multiplier
)
287 static void flush_tlb_all_ipi(void *info
)
289 local_flush_tlb_all();
292 void flush_tlb_all(void)
294 on_each_cpu(flush_tlb_all_ipi
, 0, 1, 1);
297 static void flush_tlb_mm_ipi(void *mm
)
299 local_flush_tlb_mm((struct mm_struct
*)mm
);
303 * The following tlb flush calls are invoked when old translations are
304 * being torn down, or pte attributes are changing. For single threaded
305 * address spaces, a new context is obtained on the current cpu, and tlb
306 * context on other cpus are invalidated to force a new context allocation
307 * at switch_mm time, should the mm ever be used on other cpus. For
308 * multithreaded address spaces, intercpu interrupts have to be sent.
309 * Another case where intercpu interrupts are required is when the target
310 * mm might be active on another cpu (eg debuggers doing the flushes on
311 * behalf of debugees, kswapd stealing pages from another process etc).
315 void flush_tlb_mm(struct mm_struct
*mm
)
319 if ((atomic_read(&mm
->mm_users
) != 1) || (current
->mm
!= mm
)) {
320 smp_call_function(flush_tlb_mm_ipi
, (void *)mm
, 1, 1);
323 for (i
= 0; i
< num_online_cpus(); i
++)
324 if (smp_processor_id() != i
)
325 cpu_context(i
, mm
) = 0;
327 local_flush_tlb_mm(mm
);
332 struct flush_tlb_data
{
333 struct vm_area_struct
*vma
;
338 static void flush_tlb_range_ipi(void *info
)
340 struct flush_tlb_data
*fd
= (struct flush_tlb_data
*)info
;
342 local_flush_tlb_range(fd
->vma
, fd
->addr1
, fd
->addr2
);
345 void flush_tlb_range(struct vm_area_struct
*vma
, unsigned long start
, unsigned long end
)
347 struct mm_struct
*mm
= vma
->vm_mm
;
350 if ((atomic_read(&mm
->mm_users
) != 1) || (current
->mm
!= mm
)) {
351 struct flush_tlb_data fd
;
356 smp_call_function(flush_tlb_range_ipi
, (void *)&fd
, 1, 1);
359 for (i
= 0; i
< num_online_cpus(); i
++)
360 if (smp_processor_id() != i
)
361 cpu_context(i
, mm
) = 0;
363 local_flush_tlb_range(vma
, start
, end
);
367 static void flush_tlb_kernel_range_ipi(void *info
)
369 struct flush_tlb_data
*fd
= (struct flush_tlb_data
*)info
;
371 local_flush_tlb_kernel_range(fd
->addr1
, fd
->addr2
);
374 void flush_tlb_kernel_range(unsigned long start
, unsigned long end
)
376 struct flush_tlb_data fd
;
380 on_each_cpu(flush_tlb_kernel_range_ipi
, (void *)&fd
, 1, 1);
383 static void flush_tlb_page_ipi(void *info
)
385 struct flush_tlb_data
*fd
= (struct flush_tlb_data
*)info
;
387 local_flush_tlb_page(fd
->vma
, fd
->addr1
);
390 void flush_tlb_page(struct vm_area_struct
*vma
, unsigned long page
)
393 if ((atomic_read(&vma
->vm_mm
->mm_users
) != 1) || (current
->mm
!= vma
->vm_mm
)) {
394 struct flush_tlb_data fd
;
398 smp_call_function(flush_tlb_page_ipi
, (void *)&fd
, 1, 1);
401 for (i
= 0; i
< num_online_cpus(); i
++)
402 if (smp_processor_id() != i
)
403 cpu_context(i
, vma
->vm_mm
) = 0;
405 local_flush_tlb_page(vma
, page
);
409 static void flush_tlb_one_ipi(void *info
)
411 unsigned long vaddr
= (unsigned long) info
;
413 local_flush_tlb_one(vaddr
);
416 void flush_tlb_one(unsigned long vaddr
)
418 smp_call_function(flush_tlb_one_ipi
, (void *) vaddr
, 1, 1);
419 local_flush_tlb_one(vaddr
);
422 EXPORT_SYMBOL(flush_tlb_page
);
423 EXPORT_SYMBOL(flush_tlb_one
);
424 EXPORT_SYMBOL(cpu_data
);
425 EXPORT_SYMBOL(synchronize_irq
);