Merge branch 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...
[cris-mirror.git] / arch / sparc / include / asm / trap_block.h
blobec9c04de3664910d81b7a55bbb09084d5e235d39
1 #ifndef _SPARC_TRAP_BLOCK_H
2 #define _SPARC_TRAP_BLOCK_H
4 #include <asm/hypervisor.h>
5 #include <asm/asi.h>
7 #ifndef __ASSEMBLY__
9 /* Trap handling code needs to get at a few critical values upon
10 * trap entry and to process TSB misses. These cannot be in the
11 * per_cpu() area as we really need to lock them into the TLB and
12 * thus make them part of the main kernel image. As a result we
13 * try to make this as small as possible.
15 * This is padded out and aligned to 64-bytes to avoid false sharing
16 * on SMP.
19 /* If you modify the size of this structure, please update
20 * TRAP_BLOCK_SZ_SHIFT below.
22 struct thread_info;
23 struct trap_per_cpu {
24 /* D-cache line 1: Basic thread information, cpu and device mondo queues */
25 struct thread_info *thread;
26 unsigned long pgd_paddr;
27 unsigned long cpu_mondo_pa;
28 unsigned long dev_mondo_pa;
30 /* D-cache line 2: Error Mondo Queue and kernel buffer pointers */
31 unsigned long resum_mondo_pa;
32 unsigned long resum_kernel_buf_pa;
33 unsigned long nonresum_mondo_pa;
34 unsigned long nonresum_kernel_buf_pa;
36 /* Dcache lines 3, 4, 5, and 6: Hypervisor Fault Status */
37 struct hv_fault_status fault_info;
39 /* Dcache line 7: Physical addresses of CPU send mondo block and CPU list. */
40 unsigned long cpu_mondo_block_pa;
41 unsigned long cpu_list_pa;
42 unsigned long tsb_huge;
43 unsigned long tsb_huge_temp;
45 /* Dcache line 8: IRQ work list, and keep trap_block a power-of-2 in size. */
46 unsigned long irq_worklist_pa;
47 unsigned int cpu_mondo_qmask;
48 unsigned int dev_mondo_qmask;
49 unsigned int resum_qmask;
50 unsigned int nonresum_qmask;
51 unsigned long __per_cpu_base;
52 } __attribute__((aligned(64)));
53 extern struct trap_per_cpu trap_block[NR_CPUS];
54 void init_cur_cpu_trap(struct thread_info *);
55 void setup_tba(void);
56 extern int ncpus_probed;
58 unsigned long real_hard_smp_processor_id(void);
60 struct cpuid_patch_entry {
61 unsigned int addr;
62 unsigned int cheetah_safari[4];
63 unsigned int cheetah_jbus[4];
64 unsigned int starfire[4];
65 unsigned int sun4v[4];
67 extern struct cpuid_patch_entry __cpuid_patch, __cpuid_patch_end;
69 struct sun4v_1insn_patch_entry {
70 unsigned int addr;
71 unsigned int insn;
73 extern struct sun4v_1insn_patch_entry __sun4v_1insn_patch,
74 __sun4v_1insn_patch_end;
76 struct sun4v_2insn_patch_entry {
77 unsigned int addr;
78 unsigned int insns[2];
80 extern struct sun4v_2insn_patch_entry __sun4v_2insn_patch,
81 __sun4v_2insn_patch_end;
82 extern struct sun4v_2insn_patch_entry __sun_m7_2insn_patch,
83 __sun_m7_2insn_patch_end;
86 #endif /* !(__ASSEMBLY__) */
88 #define TRAP_PER_CPU_THREAD 0x00
89 #define TRAP_PER_CPU_PGD_PADDR 0x08
90 #define TRAP_PER_CPU_CPU_MONDO_PA 0x10
91 #define TRAP_PER_CPU_DEV_MONDO_PA 0x18
92 #define TRAP_PER_CPU_RESUM_MONDO_PA 0x20
93 #define TRAP_PER_CPU_RESUM_KBUF_PA 0x28
94 #define TRAP_PER_CPU_NONRESUM_MONDO_PA 0x30
95 #define TRAP_PER_CPU_NONRESUM_KBUF_PA 0x38
96 #define TRAP_PER_CPU_FAULT_INFO 0x40
97 #define TRAP_PER_CPU_CPU_MONDO_BLOCK_PA 0xc0
98 #define TRAP_PER_CPU_CPU_LIST_PA 0xc8
99 #define TRAP_PER_CPU_TSB_HUGE 0xd0
100 #define TRAP_PER_CPU_TSB_HUGE_TEMP 0xd8
101 #define TRAP_PER_CPU_IRQ_WORKLIST_PA 0xe0
102 #define TRAP_PER_CPU_CPU_MONDO_QMASK 0xe8
103 #define TRAP_PER_CPU_DEV_MONDO_QMASK 0xec
104 #define TRAP_PER_CPU_RESUM_QMASK 0xf0
105 #define TRAP_PER_CPU_NONRESUM_QMASK 0xf4
106 #define TRAP_PER_CPU_PER_CPU_BASE 0xf8
108 #define TRAP_BLOCK_SZ_SHIFT 8
110 #include <asm/scratchpad.h>
112 #define __GET_CPUID(REG) \
113 /* Spitfire implementation (default). */ \
114 661: ldxa [%g0] ASI_UPA_CONFIG, REG; \
115 srlx REG, 17, REG; \
116 and REG, 0x1f, REG; \
117 nop; \
118 .section .cpuid_patch, "ax"; \
119 /* Instruction location. */ \
120 .word 661b; \
121 /* Cheetah Safari implementation. */ \
122 ldxa [%g0] ASI_SAFARI_CONFIG, REG; \
123 srlx REG, 17, REG; \
124 and REG, 0x3ff, REG; \
125 nop; \
126 /* Cheetah JBUS implementation. */ \
127 ldxa [%g0] ASI_JBUS_CONFIG, REG; \
128 srlx REG, 17, REG; \
129 and REG, 0x1f, REG; \
130 nop; \
131 /* Starfire implementation. */ \
132 sethi %hi(0x1fff40000d0 >> 9), REG; \
133 sllx REG, 9, REG; \
134 or REG, 0xd0, REG; \
135 lduwa [REG] ASI_PHYS_BYPASS_EC_E, REG;\
136 /* sun4v implementation. */ \
137 mov SCRATCHPAD_CPUID, REG; \
138 ldxa [REG] ASI_SCRATCHPAD, REG; \
139 nop; \
140 nop; \
141 .previous;
143 #ifdef CONFIG_SMP
145 #define TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
146 __GET_CPUID(TMP) \
147 sethi %hi(trap_block), DEST; \
148 sllx TMP, TRAP_BLOCK_SZ_SHIFT, TMP; \
149 or DEST, %lo(trap_block), DEST; \
150 add DEST, TMP, DEST; \
152 /* Clobbers TMP, current address space PGD phys address into DEST. */
153 #define TRAP_LOAD_PGD_PHYS(DEST, TMP) \
154 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
155 ldx [DEST + TRAP_PER_CPU_PGD_PADDR], DEST;
157 /* Clobbers TMP, loads local processor's IRQ work area into DEST. */
158 #define TRAP_LOAD_IRQ_WORK_PA(DEST, TMP) \
159 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
160 add DEST, TRAP_PER_CPU_IRQ_WORKLIST_PA, DEST;
162 /* Clobbers TMP, loads DEST with current thread info pointer. */
163 #define TRAP_LOAD_THREAD_REG(DEST, TMP) \
164 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
165 ldx [DEST + TRAP_PER_CPU_THREAD], DEST;
167 /* Given the current thread info pointer in THR, load the per-cpu
168 * area base of the current processor into DEST. REG1, REG2, and REG3 are
169 * clobbered.
171 * You absolutely cannot use DEST as a temporary in this code. The
172 * reason is that traps can happen during execution, and return from
173 * trap will load the fully resolved DEST per-cpu base. This can corrupt
174 * the calculations done by the macro mid-stream.
176 #define LOAD_PER_CPU_BASE(DEST, THR, REG1, REG2, REG3) \
177 lduh [THR + TI_CPU], REG1; \
178 sethi %hi(trap_block), REG2; \
179 sllx REG1, TRAP_BLOCK_SZ_SHIFT, REG1; \
180 or REG2, %lo(trap_block), REG2; \
181 add REG2, REG1, REG2; \
182 ldx [REG2 + TRAP_PER_CPU_PER_CPU_BASE], DEST;
184 #else
186 #define TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
187 sethi %hi(trap_block), DEST; \
188 or DEST, %lo(trap_block), DEST; \
190 /* Uniprocessor versions, we know the cpuid is zero. */
191 #define TRAP_LOAD_PGD_PHYS(DEST, TMP) \
192 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
193 ldx [DEST + TRAP_PER_CPU_PGD_PADDR], DEST;
195 /* Clobbers TMP, loads local processor's IRQ work area into DEST. */
196 #define TRAP_LOAD_IRQ_WORK_PA(DEST, TMP) \
197 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
198 add DEST, TRAP_PER_CPU_IRQ_WORKLIST_PA, DEST;
200 #define TRAP_LOAD_THREAD_REG(DEST, TMP) \
201 TRAP_LOAD_TRAP_BLOCK(DEST, TMP) \
202 ldx [DEST + TRAP_PER_CPU_THREAD], DEST;
204 /* No per-cpu areas on uniprocessor, so no need to load DEST. */
205 #define LOAD_PER_CPU_BASE(DEST, THR, REG1, REG2, REG3)
207 #endif /* !(CONFIG_SMP) */
209 #endif /* _SPARC_TRAP_BLOCK_H */