blob: b8b3bb4423cf433ca2aab05b449db77e08611104 [file] [log] [blame]
/*
 *  linux/arch/arm/mm/fault.c
 *
 *  Copyright (C) 1995  Linus Torvalds
 *  Modifications for ARM processor (c) 1995-2004 Russell King
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070011#include <linux/module.h>
12#include <linux/signal.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/mm.h>
Russell King67306da2008-12-14 18:01:44 +000014#include <linux/hardirq.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include <linux/init.h>
Nicolas Pitre25ce1dd2007-12-03 15:21:57 -050016#include <linux/kprobes.h>
Russell King33fa9b12008-09-06 11:35:55 +010017#include <linux/uaccess.h>
Nicolas Pitre252d4c22008-09-11 11:52:02 -040018#include <linux/page-flags.h>
Catalin Marinas412bb0a2009-07-24 12:37:09 +010019#include <linux/sched.h>
Russell King65cec8e2009-08-17 20:02:06 +010020#include <linux/highmem.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021
22#include <asm/system.h>
23#include <asm/pgtable.h>
24#include <asm/tlbflush.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025
26#include "fault.h"
27
/*
 * Fault status register encodings
 */
#define FSR_WRITE		(1 << 11)
#define FSR_FS4			(1 << 10)
#define FSR_FS3_0		(15)

/*
 * Build the 5-bit fault status from an FSR value: bits 3..0 are taken
 * as they are, and bit 10 (FSR_FS4) is shifted down to become bit 4.
 * The result is in the range 0..31.
 */
static inline int fsr_fs(unsigned int fsr)
{
	unsigned int low_bits = fsr & FSR_FS3_0;
	unsigned int high_bit = (fsr & FSR_FS4) >> 6;

	return high_bit | low_bits;
}
39
Catalin Marinas09529f72009-07-24 12:34:55 +010040#ifdef CONFIG_MMU
Nicolas Pitre25ce1dd2007-12-03 15:21:57 -050041
#ifdef CONFIG_KPROBES
/*
 * Offer a fault taken outside user mode to kprobes.
 *
 * Returns 1 when a kprobe is running and its fault handler returned
 * non-zero, 0 in every other case (including all user-mode faults).
 */
static inline int notify_page_fault(struct pt_regs *regs, unsigned int fsr)
{
	int claimed;

	if (user_mode(regs))
		return 0;

	/* kprobe_running() needs smp_processor_id() */
	preempt_disable();
	claimed = kprobe_running() && kprobe_fault_handler(regs, fsr);
	preempt_enable();

	return claimed;
}
#else
/* Without kprobes nothing can claim the fault. */
static inline int notify_page_fault(struct pt_regs *regs, unsigned int fsr)
{
	return 0;
}
#endif
63
Linus Torvalds1da177e2005-04-16 15:20:36 -070064/*
65 * This is useful to dump out the page tables associated with
66 * 'addr' in mm 'mm'.
67 */
68void show_pte(struct mm_struct *mm, unsigned long addr)
69{
70 pgd_t *pgd;
71
72 if (!mm)
73 mm = &init_mm;
74
75 printk(KERN_ALERT "pgd = %p\n", mm->pgd);
76 pgd = pgd_offset(mm, addr);
77 printk(KERN_ALERT "[%08lx] *pgd=%08lx", addr, pgd_val(*pgd));
78
79 do {
80 pmd_t *pmd;
81 pte_t *pte;
82
83 if (pgd_none(*pgd))
84 break;
85
86 if (pgd_bad(*pgd)) {
87 printk("(bad)");
88 break;
89 }
90
91 pmd = pmd_offset(pgd, addr);
Nicolas Pitreda46c792008-09-30 16:10:11 +010092 if (PTRS_PER_PMD != 1)
93 printk(", *pmd=%08lx", pmd_val(*pmd));
Linus Torvalds1da177e2005-04-16 15:20:36 -070094
95 if (pmd_none(*pmd))
96 break;
97
98 if (pmd_bad(*pmd)) {
99 printk("(bad)");
100 break;
101 }
102
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103 /* We must not map this if we have highmem enabled */
Nicolas Pitre252d4c22008-09-11 11:52:02 -0400104 if (PageHighMem(pfn_to_page(pmd_val(*pmd) >> PAGE_SHIFT)))
105 break;
106
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 pte = pte_offset_map(pmd, addr);
108 printk(", *pte=%08lx", pte_val(*pte));
109 printk(", *ppte=%08lx", pte_val(pte[-PTRS_PER_PTE]));
110 pte_unmap(pte);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 } while(0);
112
113 printk("\n");
114}
Catalin Marinas09529f72009-07-24 12:34:55 +0100115#else /* CONFIG_MMU */
/* No page tables to dump without an MMU. */
void show_pte(struct mm_struct *mm, unsigned long addr)
{
}
118#endif /* CONFIG_MMU */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
120/*
121 * Oops. The kernel tried to access some page that wasn't present.
122 */
123static void
124__do_kernel_fault(struct mm_struct *mm, unsigned long addr, unsigned int fsr,
125 struct pt_regs *regs)
126{
127 /*
128 * Are we prepared to handle this kernel fault?
129 */
130 if (fixup_exception(regs))
131 return;
132
133 /*
134 * No handler, we'll have to terminate things with extreme prejudice.
135 */
136 bust_spinlocks(1);
137 printk(KERN_ALERT
138 "Unable to handle kernel %s at virtual address %08lx\n",
139 (addr < PAGE_SIZE) ? "NULL pointer dereference" :
140 "paging request", addr);
141
142 show_pte(mm, addr);
143 die("Oops", regs, fsr);
144 bust_spinlocks(0);
145 do_exit(SIGKILL);
146}
147
148/*
149 * Something tried to access memory that isn't in our memory map..
150 * User mode accesses just cause a SIGSEGV
151 */
152static void
153__do_user_fault(struct task_struct *tsk, unsigned long addr,
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700154 unsigned int fsr, unsigned int sig, int code,
155 struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156{
157 struct siginfo si;
158
159#ifdef CONFIG_DEBUG_USER
160 if (user_debug & UDBG_SEGV) {
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700161 printk(KERN_DEBUG "%s: unhandled page fault (%d) at 0x%08lx, code 0x%03x\n",
162 tsk->comm, sig, addr, fsr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 show_pte(tsk->mm, addr);
164 show_regs(regs);
165 }
166#endif
167
168 tsk->thread.address = addr;
169 tsk->thread.error_code = fsr;
170 tsk->thread.trap_no = 14;
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700171 si.si_signo = sig;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 si.si_errno = 0;
173 si.si_code = code;
174 si.si_addr = (void __user *)addr;
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700175 force_sig_info(sig, &si, tsk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176}
177
Russell Kinge5beac32006-09-27 16:13:48 +0100178void do_bad_area(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179{
Russell Kinge5beac32006-09-27 16:13:48 +0100180 struct task_struct *tsk = current;
181 struct mm_struct *mm = tsk->active_mm;
182
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 /*
184 * If we are in kernel mode at this point, we
185 * have no context to handle this fault with.
186 */
187 if (user_mode(regs))
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700188 __do_user_fault(tsk, addr, fsr, SIGSEGV, SEGV_MAPERR, regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700189 else
190 __do_kernel_fault(mm, addr, fsr, regs);
191}
192
Catalin Marinas09529f72009-07-24 12:34:55 +0100193#ifdef CONFIG_MMU
Nick Piggin5c72fc52007-07-20 09:21:06 +0200194#define VM_FAULT_BADMAP 0x010000
195#define VM_FAULT_BADACCESS 0x020000
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196
197static int
198__do_page_fault(struct mm_struct *mm, unsigned long addr, unsigned int fsr,
199 struct task_struct *tsk)
200{
201 struct vm_area_struct *vma;
202 int fault, mask;
203
204 vma = find_vma(mm, addr);
205 fault = VM_FAULT_BADMAP;
206 if (!vma)
207 goto out;
208 if (vma->vm_start > addr)
209 goto check_stack;
210
211 /*
212 * Ok, we have a good vm_area for this
213 * memory access, so we can handle it.
214 */
215good_area:
Russell Kingc88d6aa2009-09-20 12:41:58 +0100216 if (fsr & FSR_WRITE)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 mask = VM_WRITE;
218 else
Jason Barondf67b3d2006-09-29 01:58:58 -0700219 mask = VM_READ|VM_EXEC|VM_WRITE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220
221 fault = VM_FAULT_BADACCESS;
222 if (!(vma->vm_flags & mask))
223 goto out;
224
225 /*
Russell Kingb42c6342009-09-20 12:47:40 +0100226 * If for any reason at all we couldn't handle the fault, make
227 * sure we exit gracefully rather than endlessly redo the fault.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 */
Russell Kingc88d6aa2009-09-20 12:41:58 +0100229 fault = handle_mm_fault(mm, vma, addr & PAGE_MASK, (fsr & FSR_WRITE) ? FAULT_FLAG_WRITE : 0);
Russell Kingb42c6342009-09-20 12:47:40 +0100230 if (unlikely(fault & VM_FAULT_ERROR))
231 return fault;
Nick Piggin83c54072007-07-19 01:47:05 -0700232 if (fault & VM_FAULT_MAJOR)
233 tsk->maj_flt++;
234 else
235 tsk->min_flt++;
236 return fault;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238check_stack:
239 if (vma->vm_flags & VM_GROWSDOWN && !expand_stack(vma, addr))
240 goto good_area;
241out:
242 return fault;
243}
244
Nicolas Pitre785d3cd2007-12-03 15:27:56 -0500245static int __kprobes
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246do_page_fault(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
247{
248 struct task_struct *tsk;
249 struct mm_struct *mm;
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700250 int fault, sig, code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Nicolas Pitre25ce1dd2007-12-03 15:21:57 -0500252 if (notify_page_fault(regs, fsr))
253 return 0;
254
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 tsk = current;
256 mm = tsk->mm;
257
258 /*
259 * If we're in an interrupt or have no user
260 * context, we must not take the fault..
261 */
Peter Zijlstra6edaf682006-12-06 20:32:18 -0800262 if (in_atomic() || !mm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 goto no_context;
264
Russell King840ff6a2005-09-20 17:52:13 +0100265 /*
266 * As per x86, we may deadlock here. However, since the kernel only
267 * validly references user space from well defined areas of the code,
268 * we can bug out early if this is from code which shouldn't.
269 */
270 if (!down_read_trylock(&mm->mmap_sem)) {
271 if (!user_mode(regs) && !search_exception_tables(regs->ARM_pc))
272 goto no_context;
273 down_read(&mm->mmap_sem);
Russell Kingbf456992009-09-20 12:52:19 +0100274 } else {
275 /*
276 * The above down_read_trylock() might have succeeded in
277 * which case, we'll have missed the might_sleep() from
278 * down_read()
279 */
280 might_sleep();
Russell King840ff6a2005-09-20 17:52:13 +0100281 }
282
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283 fault = __do_page_fault(mm, addr, fsr, tsk);
284 up_read(&mm->mmap_sem);
285
286 /*
Russell Kingff2afb92005-08-04 14:17:33 +0100287 * Handle the "normal" case first - VM_FAULT_MAJOR / VM_FAULT_MINOR
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 */
Nick Piggin5c72fc52007-07-20 09:21:06 +0200289 if (likely(!(fault & (VM_FAULT_ERROR | VM_FAULT_BADMAP | VM_FAULT_BADACCESS))))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290 return 0;
291
Russell Kingb42c6342009-09-20 12:47:40 +0100292 if (fault & VM_FAULT_OOM) {
293 /*
294 * We ran out of memory, call the OOM killer, and return to
295 * userspace (which will retry the fault, or kill us if we
296 * got oom-killed)
297 */
298 pagefault_out_of_memory();
299 return 0;
300 }
301
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303 * If we are in kernel mode at this point, we
304 * have no context to handle this fault with.
305 */
306 if (!user_mode(regs))
307 goto no_context;
308
Nick Piggin83c54072007-07-19 01:47:05 -0700309 if (fault & VM_FAULT_SIGBUS) {
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700310 /*
311 * We had some memory, but were unable to
312 * successfully fix up this page fault.
313 */
314 sig = SIGBUS;
315 code = BUS_ADRERR;
Nick Piggin83c54072007-07-19 01:47:05 -0700316 } else {
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700317 /*
318 * Something tried to access memory that
319 * isn't in our memory map..
320 */
321 sig = SIGSEGV;
322 code = fault == VM_FAULT_BADACCESS ?
323 SEGV_ACCERR : SEGV_MAPERR;
akpm@osdl.org2d137c22005-04-16 15:23:55 -0700324 }
325
326 __do_user_fault(tsk, addr, fsr, sig, code, regs);
327 return 0;
328
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329no_context:
330 __do_kernel_fault(mm, addr, fsr, regs);
331 return 0;
332}
Catalin Marinas09529f72009-07-24 12:34:55 +0100333#else /* CONFIG_MMU */
/* Without an MMU there is nothing to fault in; report the abort as handled. */
static int do_page_fault(unsigned long addr, unsigned int fsr,
			 struct pt_regs *regs)
{
	return 0;
}
339#endif /* CONFIG_MMU */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340
/*
 * First Level Translation Fault Handler
 *
 * We enter here because the first level page table doesn't contain
 * a valid entry for the address.
 *
 * If the address is in kernel space (>= TASK_SIZE), then we are
 * probably faulting in the vmalloc() area.
 *
 * If the init_task's first level page tables contain the relevant
 * entry, we copy it to this task.  If not, we send the process
 * a signal, fixup the exception, or oops the kernel.
 *
 * NOTE!  We MUST NOT take any locks for this case.  We may be in an
 * interrupt or a critical region, and should only copy the information
 * from the master page table, nothing more.
 */
#ifdef CONFIG_MMU
static int __kprobes
do_translation_fault(unsigned long addr, unsigned int fsr,
		     struct pt_regs *regs)
{
	unsigned int slot;
	pgd_t *task_pgd, *master_pgd;
	pmd_t *task_pmd, *master_pmd;

	/* Addresses below TASK_SIZE take the ordinary page fault path. */
	if (addr < TASK_SIZE)
		return do_page_fault(addr, fsr, regs);

	slot = pgd_index(addr);

	/*
	 * FIXME: CP15 C1 is write only on ARMv3 architectures.
	 */
	task_pgd = cpu_get_pgd() + slot;
	master_pgd = init_mm.pgd + slot;

	if (!pgd_none(*master_pgd)) {
		if (!pgd_present(*task_pgd))
			set_pgd(task_pgd, *master_pgd);

		master_pmd = pmd_offset(master_pgd, addr);
		task_pmd = pmd_offset(task_pgd, addr);

		if (!pmd_none(*master_pmd)) {
			copy_pmd(task_pmd, master_pmd);
			return 0;
		}
	}

	/* init_mm has no entry for this address either. */
	do_bad_area(addr, fsr, regs);
	return 0;
}
#else					/* CONFIG_MMU */
static int
do_translation_fault(unsigned long addr, unsigned int fsr,
		     struct pt_regs *regs)
{
	return 0;
}
#endif					/* CONFIG_MMU */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700405
/*
 * Some section permission faults need to be handled gracefully.
 * They can happen due to a __{get,put}_user during an oops.
 *
 * The fault is passed to do_bad_area() and then reported as handled.
 */
static int do_sect_fault(unsigned long addr, unsigned int fsr,
			 struct pt_regs *regs)
{
	do_bad_area(addr, fsr, regs);

	return 0;
}
416
/*
 * This abort handler always returns "fault" (non-zero), i.e. it never
 * handles the abort; all of its arguments are ignored.
 */
static int do_bad(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
{
	return 1;
}
425
426static struct fsr_info {
427 int (*fn)(unsigned long addr, unsigned int fsr, struct pt_regs *regs);
428 int sig;
Russell Kingcfb08102005-06-30 11:06:49 +0100429 int code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430 const char *name;
431} fsr_info[] = {
432 /*
433 * The following are the standard ARMv3 and ARMv4 aborts. ARMv5
434 * defines these to be "precise" aborts.
435 */
Russell Kingcfb08102005-06-30 11:06:49 +0100436 { do_bad, SIGSEGV, 0, "vector exception" },
437 { do_bad, SIGILL, BUS_ADRALN, "alignment exception" },
438 { do_bad, SIGKILL, 0, "terminal exception" },
439 { do_bad, SIGILL, BUS_ADRALN, "alignment exception" },
440 { do_bad, SIGBUS, 0, "external abort on linefetch" },
441 { do_translation_fault, SIGSEGV, SEGV_MAPERR, "section translation fault" },
442 { do_bad, SIGBUS, 0, "external abort on linefetch" },
443 { do_page_fault, SIGSEGV, SEGV_MAPERR, "page translation fault" },
444 { do_bad, SIGBUS, 0, "external abort on non-linefetch" },
445 { do_bad, SIGSEGV, SEGV_ACCERR, "section domain fault" },
446 { do_bad, SIGBUS, 0, "external abort on non-linefetch" },
447 { do_bad, SIGSEGV, SEGV_ACCERR, "page domain fault" },
448 { do_bad, SIGBUS, 0, "external abort on translation" },
449 { do_sect_fault, SIGSEGV, SEGV_ACCERR, "section permission fault" },
450 { do_bad, SIGBUS, 0, "external abort on translation" },
451 { do_page_fault, SIGSEGV, SEGV_ACCERR, "page permission fault" },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 /*
453 * The following are "imprecise" aborts, which are signalled by bit
454 * 10 of the FSR, and may not be recoverable. These are only
455 * supported if the CPU abort handler supports bit 10.
456 */
Russell Kingcfb08102005-06-30 11:06:49 +0100457 { do_bad, SIGBUS, 0, "unknown 16" },
458 { do_bad, SIGBUS, 0, "unknown 17" },
459 { do_bad, SIGBUS, 0, "unknown 18" },
460 { do_bad, SIGBUS, 0, "unknown 19" },
461 { do_bad, SIGBUS, 0, "lock abort" }, /* xscale */
462 { do_bad, SIGBUS, 0, "unknown 21" },
463 { do_bad, SIGBUS, BUS_OBJERR, "imprecise external abort" }, /* xscale */
464 { do_bad, SIGBUS, 0, "unknown 23" },
465 { do_bad, SIGBUS, 0, "dcache parity error" }, /* xscale */
466 { do_bad, SIGBUS, 0, "unknown 25" },
467 { do_bad, SIGBUS, 0, "unknown 26" },
468 { do_bad, SIGBUS, 0, "unknown 27" },
469 { do_bad, SIGBUS, 0, "unknown 28" },
470 { do_bad, SIGBUS, 0, "unknown 29" },
471 { do_bad, SIGBUS, 0, "unknown 30" },
472 { do_bad, SIGBUS, 0, "unknown 31" }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473};
474
475void __init
476hook_fault_code(int nr, int (*fn)(unsigned long, unsigned int, struct pt_regs *),
477 int sig, const char *name)
478{
479 if (nr >= 0 && nr < ARRAY_SIZE(fsr_info)) {
480 fsr_info[nr].fn = fn;
481 fsr_info[nr].sig = sig;
482 fsr_info[nr].name = name;
483 }
484}
485
486/*
487 * Dispatch a data abort to the relevant handler.
488 */
Russell King7ab3f8d2007-03-02 15:01:36 +0000489asmlinkage void __exception
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490do_DataAbort(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
491{
Russell Kingc88d6aa2009-09-20 12:41:58 +0100492 const struct fsr_info *inf = fsr_info + fsr_fs(fsr);
Russell Kingcfb08102005-06-30 11:06:49 +0100493 struct siginfo info;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494
495 if (!inf->fn(addr, fsr, regs))
496 return;
497
498 printk(KERN_ALERT "Unhandled fault: %s (0x%03x) at 0x%08lx\n",
499 inf->name, fsr, addr);
Russell Kingcfb08102005-06-30 11:06:49 +0100500
501 info.si_signo = inf->sig;
502 info.si_errno = 0;
503 info.si_code = inf->code;
504 info.si_addr = (void __user *)addr;
Christoph Hellwig1eeb66a2007-05-08 00:27:03 -0700505 arm_notify_die("", regs, &info, fsr, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506}
507
Russell King7ab3f8d2007-03-02 15:01:36 +0000508asmlinkage void __exception
Linus Torvalds1da177e2005-04-16 15:20:36 -0700509do_PrefetchAbort(unsigned long addr, struct pt_regs *regs)
510{
511 do_translation_fault(addr, 0, regs);
512}
513