2 * Page fault handler for SH with an MMU.
4 * Copyright (C) 1999 Niibe Yutaka
5 * Copyright (C) 2003 - 2009 Paul Mundt
7 * Based on linux/arch/i386/mm/fault.c:
8 * Copyright (C) 1995 Linus Torvalds
10 * This file is subject to the terms and conditions of the GNU General Public
11 * License. See the file "COPYING" in the main directory of this archive
14 #include <linux/kernel.h>
16 #include <linux/hardirq.h>
17 #include <linux/kprobes.h>
18 #include <linux/perf_event.h>
19 #include <asm/io_trapped.h>
20 #include <asm/system.h>
21 #include <asm/mmu_context.h>
22 #include <asm/tlbflush.h>
24 static inline int notify_page_fault(struct pt_regs
*regs
, int trap
)
28 if (kprobes_built_in() && !user_mode(regs
)) {
30 if (kprobe_running() && kprobe_fault_handler(regs
, trap
))
38 static inline pmd_t
*vmalloc_sync_one(pgd_t
*pgd
, unsigned long address
)
40 unsigned index
= pgd_index(address
);
46 pgd_k
= init_mm
.pgd
+ index
;
48 if (!pgd_present(*pgd_k
))
51 pud
= pud_offset(pgd
, address
);
52 pud_k
= pud_offset(pgd_k
, address
);
53 if (!pud_present(*pud_k
))
56 if (!pud_present(*pud
))
59 pmd
= pmd_offset(pud
, address
);
60 pmd_k
= pmd_offset(pud_k
, address
);
61 if (!pmd_present(*pmd_k
))
64 if (!pmd_present(*pmd
))
68 * The page tables are fully synchronised so there must
69 * be another reason for the fault. Return NULL here to
70 * signal that we have not taken care of the fault.
72 BUG_ON(pmd_page(*pmd
) != pmd_page(*pmd_k
));
80 * Handle a fault on the vmalloc or module mapping area
82 static noinline
int vmalloc_fault(unsigned long address
)
88 /* Make sure we are in vmalloc/module/P3 area: */
89 if (!(address
>= VMALLOC_START
&& address
< P3_ADDR_MAX
))
93 * Synchronize this task's top level page-table
94 * with the 'reference' page table.
96 * Do _not_ use "current" here. We might be inside
97 * an interrupt in the middle of a task switch..
100 pmd_k
= vmalloc_sync_one(pgd_k
, address
);
104 pte_k
= pte_offset_kernel(pmd_k
, address
);
105 if (!pte_present(*pte_k
))
111 static int fault_in_kernel_space(unsigned long address
)
113 return address
>= TASK_SIZE
;
117 * This routine handles page faults. It determines the address,
118 * and the problem, and then passes it off to one of the appropriate
121 asmlinkage
void __kprobes
do_page_fault(struct pt_regs
*regs
,
122 unsigned long writeaccess
,
123 unsigned long address
)
126 struct task_struct
*tsk
;
127 struct mm_struct
*mm
;
128 struct vm_area_struct
* vma
;
135 si_code
= SEGV_MAPERR
;
136 vec
= lookup_exception_vector();
139 * We fault-in kernel-space virtual memory on-demand. The
140 * 'reference' page table is init_mm.pgd.
142 * NOTE! We MUST NOT take any locks for this case. We may
143 * be in an interrupt or a critical region, and should
144 * only copy the information from the master page table,
147 if (unlikely(fault_in_kernel_space(address
))) {
148 if (vmalloc_fault(address
) >= 0)
150 if (notify_page_fault(regs
, vec
))
153 goto bad_area_nosemaphore
;
156 if (unlikely(notify_page_fault(regs
, vec
)))
159 /* Only enable interrupts if they were on before the fault */
160 if ((regs
->sr
& SR_IMASK
) != SR_IMASK
)
163 perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS
, 1, regs
, address
);
166 * If we're in an interrupt, have no user context or are running
167 * in an atomic region then we must not take the fault:
169 if (in_atomic() || !mm
)
172 down_read(&mm
->mmap_sem
);
174 vma
= find_vma(mm
, address
);
177 if (vma
->vm_start
<= address
)
179 if (!(vma
->vm_flags
& VM_GROWSDOWN
))
181 if (expand_stack(vma
, address
))
185 * Ok, we have a good vm_area for this memory access, so
189 si_code
= SEGV_ACCERR
;
191 if (!(vma
->vm_flags
& VM_WRITE
))
194 if (!(vma
->vm_flags
& (VM_READ
| VM_EXEC
| VM_WRITE
)))
199 * If for any reason at all we couldn't handle the fault,
200 * make sure we exit gracefully rather than endlessly redo
203 fault
= handle_mm_fault(mm
, vma
, address
, writeaccess
? FAULT_FLAG_WRITE
: 0);
204 if (unlikely(fault
& VM_FAULT_ERROR
)) {
205 if (fault
& VM_FAULT_OOM
)
207 else if (fault
& VM_FAULT_SIGBUS
)
211 if (fault
& VM_FAULT_MAJOR
) {
213 perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MAJ
, 1,
217 perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MIN
, 1,
221 up_read(&mm
->mmap_sem
);
225 * Something tried to access memory that isn't in our memory map..
226 * Fix it, but check if it's kernel or user first..
229 up_read(&mm
->mmap_sem
);
231 bad_area_nosemaphore
:
232 if (user_mode(regs
)) {
233 info
.si_signo
= SIGSEGV
;
235 info
.si_code
= si_code
;
236 info
.si_addr
= (void *) address
;
237 force_sig_info(SIGSEGV
, &info
, tsk
);
242 /* Are we prepared to handle this kernel fault? */
243 if (fixup_exception(regs
))
246 if (handle_trapped_io(regs
, address
))
249 * Oops. The kernel tried to access some bad page. We'll have to
250 * terminate things with extreme prejudice.
256 if (oops_may_print()) {
259 if (address
< PAGE_SIZE
)
260 printk(KERN_ALERT
"Unable to handle kernel NULL "
261 "pointer dereference");
263 printk(KERN_ALERT
"Unable to handle kernel paging "
265 printk(" at virtual address %08lx\n", address
);
266 printk(KERN_ALERT
"pc = %08lx\n", regs
->pc
);
267 page
= (unsigned long)get_TTB();
269 page
= ((__typeof__(page
) *)page
)[address
>> PGDIR_SHIFT
];
270 printk(KERN_ALERT
"*pde = %08lx\n", page
);
271 if (page
& _PAGE_PRESENT
) {
273 address
&= 0x003ff000;
274 page
= ((__typeof__(page
) *)
275 __va(page
))[address
>>
277 printk(KERN_ALERT
"*pte = %08lx\n", page
);
282 die("Oops", regs
, writeaccess
);
287 * We ran out of memory, or some other thing happened to us that made
288 * us unable to handle the page fault gracefully.
291 up_read(&mm
->mmap_sem
);
292 if (!user_mode(regs
))
294 pagefault_out_of_memory();
298 up_read(&mm
->mmap_sem
);
301 * Send a sigbus, regardless of whether we were in kernel
304 info
.si_signo
= SIGBUS
;
306 info
.si_code
= BUS_ADRERR
;
307 info
.si_addr
= (void *)address
;
308 force_sig_info(SIGBUS
, &info
, tsk
);
310 /* Kernel mode? Handle exceptions or die */
311 if (!user_mode(regs
))
316 * Called with interrupts disabled.
318 asmlinkage
int __kprobes
319 handle_tlbmiss(struct pt_regs
*regs
, unsigned long writeaccess
,
320 unsigned long address
)
329 * We don't take page faults for P1, P2, and parts of P4, these
330 * are always mapped, whether it be due to legacy behaviour in
331 * 29-bit mode, or due to PMB configuration in 32-bit mode.
333 if (address
>= P3SEG
&& address
< P3_ADDR_MAX
) {
334 pgd
= pgd_offset_k(address
);
336 if (unlikely(address
>= TASK_SIZE
|| !current
->mm
))
339 pgd
= pgd_offset(current
->mm
, address
);
342 pud
= pud_offset(pgd
, address
);
343 if (pud_none_or_clear_bad(pud
))
345 pmd
= pmd_offset(pud
, address
);
346 if (pmd_none_or_clear_bad(pmd
))
348 pte
= pte_offset_kernel(pmd
, address
);
350 if (unlikely(pte_none(entry
) || pte_not_present(entry
)))
352 if (unlikely(writeaccess
&& !pte_write(entry
)))
356 entry
= pte_mkdirty(entry
);
357 entry
= pte_mkyoung(entry
);
361 #if defined(CONFIG_CPU_SH4) && !defined(CONFIG_SMP)
363 * SH-4 does not set MMUCR.RC to the corresponding TLB entry in
364 * the case of an initial page write exception, so we need to
365 * flush it in order to avoid potential TLB entry duplication.
367 if (writeaccess
== 2)
368 local_flush_tlb_one(get_asid(), address
& PAGE_MASK
);
371 update_mmu_cache(NULL
, address
, pte
);