ARM: Ensure correct might_sleep() check in pagefault path
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / arch / arm / mm / fault.c
CommitLineData
1da177e4
LT
1/*
2 * linux/arch/arm/mm/fault.c
3 *
4 * Copyright (C) 1995 Linus Torvalds
5 * Modifications for ARM processor (c) 1995-2004 Russell King
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
10 */
1da177e4
LT
11#include <linux/module.h>
12#include <linux/signal.h>
1da177e4 13#include <linux/mm.h>
67306da6 14#include <linux/hardirq.h>
1da177e4 15#include <linux/init.h>
25ce1dd7 16#include <linux/kprobes.h>
33fa9b13 17#include <linux/uaccess.h>
252d4c27 18#include <linux/page-flags.h>
412bb0a6 19#include <linux/sched.h>
65cec8e3 20#include <linux/highmem.h>
1da177e4
LT
21
22#include <asm/system.h>
23#include <asm/pgtable.h>
24#include <asm/tlbflush.h>
1da177e4
LT
25
26#include "fault.h"
27
c88d6aa7
RK
/*
 * Fault status register (FSR) bit layout used by this file:
 *   FSR_WRITE  - bit 11, tested by the page-fault code to detect a write
 *   FSR_FS4    - bit 10, the fifth (top) bit of the fault status code
 *   FSR_FS3_0  - bits 3..0, the low four bits of the fault status code
 */
#define FSR_WRITE	(1 << 11)
#define FSR_FS4		(1 << 10)
#define FSR_FS3_0	(15)

/*
 * Fold the split fault-status field of 'fsr' into one contiguous 5-bit
 * value (0..31): bits 3..0 are kept in place and bit 10 is moved down
 * to bit 4.
 */
static inline int fsr_fs(unsigned int fsr)
{
	unsigned int low_bits = fsr & FSR_FS3_0;
	unsigned int high_bit = (fsr & FSR_FS4) >> 6;

	return low_bits | high_bit;
}
39
09529f7a 40#ifdef CONFIG_MMU
25ce1dd7
NP
41
#ifdef CONFIG_KPROBES
/*
 * Offer a kernel-mode fault to kprobes before normal fault handling.
 *
 * Returns 1 when a kprobe is running and its fault handler reports a
 * non-zero result, 0 otherwise.  Faults taken in user mode are never
 * offered and always yield 0.
 */
static inline int notify_page_fault(struct pt_regs *regs, unsigned int fsr)
{
	int handled = 0;

	if (user_mode(regs))
		return 0;

	/* kprobe_running() needs smp_processor_id() */
	preempt_disable();
	if (kprobe_running() && kprobe_fault_handler(regs, fsr))
		handled = 1;
	preempt_enable();

	return handled;
}
#else
/* Without CONFIG_KPROBES there is nobody to notify: always returns 0. */
static inline int notify_page_fault(struct pt_regs *regs, unsigned int fsr)
{
	return 0;
}
#endif
63
1da177e4
LT
64/*
65 * This is useful to dump out the page tables associated with
66 * 'addr' in mm 'mm'.
67 */
68void show_pte(struct mm_struct *mm, unsigned long addr)
69{
70 pgd_t *pgd;
71
72 if (!mm)
73 mm = &init_mm;
74
75 printk(KERN_ALERT "pgd = %p\n", mm->pgd);
76 pgd = pgd_offset(mm, addr);
77 printk(KERN_ALERT "[%08lx] *pgd=%08lx", addr, pgd_val(*pgd));
78
79 do {
80 pmd_t *pmd;
81 pte_t *pte;
82
83 if (pgd_none(*pgd))
84 break;
85
86 if (pgd_bad(*pgd)) {
87 printk("(bad)");
88 break;
89 }
90
91 pmd = pmd_offset(pgd, addr);
da46c79a
NP
92 if (PTRS_PER_PMD != 1)
93 printk(", *pmd=%08lx", pmd_val(*pmd));
1da177e4
LT
94
95 if (pmd_none(*pmd))
96 break;
97
98 if (pmd_bad(*pmd)) {
99 printk("(bad)");
100 break;
101 }
102
1da177e4 103 /* We must not map this if we have highmem enabled */
252d4c27
NP
104 if (PageHighMem(pfn_to_page(pmd_val(*pmd) >> PAGE_SHIFT)))
105 break;
106
1da177e4
LT
107 pte = pte_offset_map(pmd, addr);
108 printk(", *pte=%08lx", pte_val(*pte));
109 printk(", *ppte=%08lx", pte_val(pte[-PTRS_PER_PTE]));
110 pte_unmap(pte);
1da177e4
LT
111 } while(0);
112
113 printk("\n");
114}
09529f7a
CM
115#else /* CONFIG_MMU */
/* Without CONFIG_MMU this variant of show_pte() does nothing. */
void show_pte(struct mm_struct *mm, unsigned long addr)
{
}
118#endif /* CONFIG_MMU */
1da177e4
LT
119
120/*
121 * Oops. The kernel tried to access some page that wasn't present.
122 */
123static void
124__do_kernel_fault(struct mm_struct *mm, unsigned long addr, unsigned int fsr,
125 struct pt_regs *regs)
126{
127 /*
128 * Are we prepared to handle this kernel fault?
129 */
130 if (fixup_exception(regs))
131 return;
132
133 /*
134 * No handler, we'll have to terminate things with extreme prejudice.
135 */
136 bust_spinlocks(1);
137 printk(KERN_ALERT
138 "Unable to handle kernel %s at virtual address %08lx\n",
139 (addr < PAGE_SIZE) ? "NULL pointer dereference" :
140 "paging request", addr);
141
142 show_pte(mm, addr);
143 die("Oops", regs, fsr);
144 bust_spinlocks(0);
145 do_exit(SIGKILL);
146}
147
148/*
149 * Something tried to access memory that isn't in our memory map..
150 * User mode accesses just cause a SIGSEGV
151 */
152static void
153__do_user_fault(struct task_struct *tsk, unsigned long addr,
2d137c24
AM
154 unsigned int fsr, unsigned int sig, int code,
155 struct pt_regs *regs)
1da177e4
LT
156{
157 struct siginfo si;
158
159#ifdef CONFIG_DEBUG_USER
160 if (user_debug & UDBG_SEGV) {
2d137c24
AM
161 printk(KERN_DEBUG "%s: unhandled page fault (%d) at 0x%08lx, code 0x%03x\n",
162 tsk->comm, sig, addr, fsr);
1da177e4
LT
163 show_pte(tsk->mm, addr);
164 show_regs(regs);
165 }
166#endif
167
168 tsk->thread.address = addr;
169 tsk->thread.error_code = fsr;
170 tsk->thread.trap_no = 14;
2d137c24 171 si.si_signo = sig;
1da177e4
LT
172 si.si_errno = 0;
173 si.si_code = code;
174 si.si_addr = (void __user *)addr;
2d137c24 175 force_sig_info(sig, &si, tsk);
1da177e4
LT
176}
177
e5beac37 178void do_bad_area(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
1da177e4 179{
e5beac37
RK
180 struct task_struct *tsk = current;
181 struct mm_struct *mm = tsk->active_mm;
182
1da177e4
LT
183 /*
184 * If we are in kernel mode at this point, we
185 * have no context to handle this fault with.
186 */
187 if (user_mode(regs))
2d137c24 188 __do_user_fault(tsk, addr, fsr, SIGSEGV, SEGV_MAPERR, regs);
1da177e4
LT
189 else
190 __do_kernel_fault(mm, addr, fsr, regs);
191}
192
09529f7a 193#ifdef CONFIG_MMU
5c72fc5c
NP
194#define VM_FAULT_BADMAP 0x010000
195#define VM_FAULT_BADACCESS 0x020000
1da177e4
LT
196
197static int
198__do_page_fault(struct mm_struct *mm, unsigned long addr, unsigned int fsr,
199 struct task_struct *tsk)
200{
201 struct vm_area_struct *vma;
202 int fault, mask;
203
204 vma = find_vma(mm, addr);
205 fault = VM_FAULT_BADMAP;
206 if (!vma)
207 goto out;
208 if (vma->vm_start > addr)
209 goto check_stack;
210
211 /*
212 * Ok, we have a good vm_area for this
213 * memory access, so we can handle it.
214 */
215good_area:
c88d6aa7 216 if (fsr & FSR_WRITE)
1da177e4
LT
217 mask = VM_WRITE;
218 else
df67b3da 219 mask = VM_READ|VM_EXEC|VM_WRITE;
1da177e4
LT
220
221 fault = VM_FAULT_BADACCESS;
222 if (!(vma->vm_flags & mask))
223 goto out;
224
225 /*
b42c6344
RK
226 * If for any reason at all we couldn't handle the fault, make
227 * sure we exit gracefully rather than endlessly redo the fault.
1da177e4 228 */
c88d6aa7 229 fault = handle_mm_fault(mm, vma, addr & PAGE_MASK, (fsr & FSR_WRITE) ? FAULT_FLAG_WRITE : 0);
b42c6344
RK
230 if (unlikely(fault & VM_FAULT_ERROR))
231 return fault;
83c54070 232 if (fault & VM_FAULT_MAJOR)
1da177e4 233 tsk->maj_flt++;
83c54070 234 else
1da177e4 235 tsk->min_flt++;
83c54070 236 return fault;
1da177e4 237
1da177e4
LT
238check_stack:
239 if (vma->vm_flags & VM_GROWSDOWN && !expand_stack(vma, addr))
240 goto good_area;
241out:
242 return fault;
243}
244
785d3cd2 245static int __kprobes
1da177e4
LT
246do_page_fault(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
247{
248 struct task_struct *tsk;
249 struct mm_struct *mm;
2d137c24 250 int fault, sig, code;
1da177e4 251
25ce1dd7
NP
252 if (notify_page_fault(regs, fsr))
253 return 0;
254
1da177e4
LT
255 tsk = current;
256 mm = tsk->mm;
257
258 /*
259 * If we're in an interrupt or have no user
260 * context, we must not take the fault..
261 */
6edaf68a 262 if (in_atomic() || !mm)
1da177e4
LT
263 goto no_context;
264
840ff6a4
RK
265 /*
266 * As per x86, we may deadlock here. However, since the kernel only
267 * validly references user space from well defined areas of the code,
268 * we can bug out early if this is from code which shouldn't.
269 */
270 if (!down_read_trylock(&mm->mmap_sem)) {
271 if (!user_mode(regs) && !search_exception_tables(regs->ARM_pc))
272 goto no_context;
273 down_read(&mm->mmap_sem);
bf456992
RK
274 } else {
275 /*
276 * The above down_read_trylock() might have succeeded in
277 * which case, we'll have missed the might_sleep() from
278 * down_read()
279 */
280 might_sleep();
840ff6a4
RK
281 }
282
1da177e4
LT
283 fault = __do_page_fault(mm, addr, fsr, tsk);
284 up_read(&mm->mmap_sem);
285
286 /*
ff2afb9d 287 * Handle the "normal" case first - VM_FAULT_MAJOR / VM_FAULT_MINOR
1da177e4 288 */
5c72fc5c 289 if (likely(!(fault & (VM_FAULT_ERROR | VM_FAULT_BADMAP | VM_FAULT_BADACCESS))))
1da177e4
LT
290 return 0;
291
b42c6344
RK
292 if (fault & VM_FAULT_OOM) {
293 /*
294 * We ran out of memory, call the OOM killer, and return to
295 * userspace (which will retry the fault, or kill us if we
296 * got oom-killed)
297 */
298 pagefault_out_of_memory();
299 return 0;
300 }
301
1da177e4
LT
302 /*
303 * If we are in kernel mode at this point, we
304 * have no context to handle this fault with.
305 */
306 if (!user_mode(regs))
307 goto no_context;
308
83c54070 309 if (fault & VM_FAULT_SIGBUS) {
2d137c24
AM
310 /*
311 * We had some memory, but were unable to
312 * successfully fix up this page fault.
313 */
314 sig = SIGBUS;
315 code = BUS_ADRERR;
83c54070 316 } else {
2d137c24
AM
317 /*
318 * Something tried to access memory that
319 * isn't in our memory map..
320 */
321 sig = SIGSEGV;
322 code = fault == VM_FAULT_BADACCESS ?
323 SEGV_ACCERR : SEGV_MAPERR;
1da177e4 324 }
1da177e4 325
2d137c24
AM
326 __do_user_fault(tsk, addr, fsr, sig, code, regs);
327 return 0;
1da177e4
LT
328
329no_context:
330 __do_kernel_fault(mm, addr, fsr, regs);
331 return 0;
332}
09529f7a
CM
333#else /* CONFIG_MMU */
/* Without CONFIG_MMU this handler does nothing and always returns 0. */
static int
do_page_fault(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
{
	(void)addr;
	(void)fsr;
	(void)regs;

	return 0;
}
339#endif /* CONFIG_MMU */
1da177e4
LT
340
341/*
342 * First Level Translation Fault Handler
343 *
344 * We enter here because the first level page table doesn't contain
345 * a valid entry for the address.
346 *
347 * If the address is in kernel space (>= TASK_SIZE), then we are
348 * probably faulting in the vmalloc() area.
349 *
350 * If the init_task's first level page tables contain the relevant
351 * entry, we copy it to this task. If not, we send the process
352 * a signal, fixup the exception, or oops the kernel.
353 *
354 * NOTE! We MUST NOT take any locks for this case. We may be in an
355 * interrupt or a critical region, and should only copy the information
356 * from the master page table, nothing more.
357 */
09529f7a 358#ifdef CONFIG_MMU
785d3cd2 359static int __kprobes
1da177e4
LT
360do_translation_fault(unsigned long addr, unsigned int fsr,
361 struct pt_regs *regs)
362{
1da177e4
LT
363 unsigned int index;
364 pgd_t *pgd, *pgd_k;
365 pmd_t *pmd, *pmd_k;
366
367 if (addr < TASK_SIZE)
368 return do_page_fault(addr, fsr, regs);
369
370 index = pgd_index(addr);
371
372 /*
373 * FIXME: CP15 C1 is write only on ARMv3 architectures.
374 */
375 pgd = cpu_get_pgd() + index;
376 pgd_k = init_mm.pgd + index;
377
378 if (pgd_none(*pgd_k))
379 goto bad_area;
380
381 if (!pgd_present(*pgd))
382 set_pgd(pgd, *pgd_k);
383
384 pmd_k = pmd_offset(pgd_k, addr);
385 pmd = pmd_offset(pgd, addr);
386
387 if (pmd_none(*pmd_k))
388 goto bad_area;
389
390 copy_pmd(pmd, pmd_k);
391 return 0;
392
393bad_area:
e5beac37 394 do_bad_area(addr, fsr, regs);
1da177e4
LT
395 return 0;
396}
09529f7a
CM
397#else /* CONFIG_MMU */
/* Without CONFIG_MMU this handler does nothing and always returns 0. */
static int
do_translation_fault(unsigned long addr, unsigned int fsr,
		     struct pt_regs *regs)
{
	(void)addr;
	(void)fsr;
	(void)regs;

	return 0;
}
404#endif /* CONFIG_MMU */
1da177e4
LT
405
/*
 * Section permission fault handler.
 *
 * Some section permission faults need to be handled gracefully; they
 * can happen due to a __{get,put}_user during an oops.  The fault is
 * passed to do_bad_area() and 0 is always returned.
 */
static int
do_sect_fault(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
{
	do_bad_area(addr, fsr, regs);

	return 0;
}
416
/*
 * Default abort handler: it ignores its arguments and always returns 1,
 * i.e. it always reports the abort as a fault.
 */
static int
do_bad(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
{
	(void)addr;
	(void)fsr;
	(void)regs;

	return 1;
}
425
426static struct fsr_info {
427 int (*fn)(unsigned long addr, unsigned int fsr, struct pt_regs *regs);
428 int sig;
cfb0810e 429 int code;
1da177e4
LT
430 const char *name;
431} fsr_info[] = {
432 /*
433 * The following are the standard ARMv3 and ARMv4 aborts. ARMv5
434 * defines these to be "precise" aborts.
435 */
cfb0810e
RK
436 { do_bad, SIGSEGV, 0, "vector exception" },
437 { do_bad, SIGILL, BUS_ADRALN, "alignment exception" },
438 { do_bad, SIGKILL, 0, "terminal exception" },
439 { do_bad, SIGILL, BUS_ADRALN, "alignment exception" },
440 { do_bad, SIGBUS, 0, "external abort on linefetch" },
441 { do_translation_fault, SIGSEGV, SEGV_MAPERR, "section translation fault" },
442 { do_bad, SIGBUS, 0, "external abort on linefetch" },
443 { do_page_fault, SIGSEGV, SEGV_MAPERR, "page translation fault" },
444 { do_bad, SIGBUS, 0, "external abort on non-linefetch" },
445 { do_bad, SIGSEGV, SEGV_ACCERR, "section domain fault" },
446 { do_bad, SIGBUS, 0, "external abort on non-linefetch" },
447 { do_bad, SIGSEGV, SEGV_ACCERR, "page domain fault" },
448 { do_bad, SIGBUS, 0, "external abort on translation" },
449 { do_sect_fault, SIGSEGV, SEGV_ACCERR, "section permission fault" },
450 { do_bad, SIGBUS, 0, "external abort on translation" },
451 { do_page_fault, SIGSEGV, SEGV_ACCERR, "page permission fault" },
1da177e4
LT
452 /*
453 * The following are "imprecise" aborts, which are signalled by bit
454 * 10 of the FSR, and may not be recoverable. These are only
455 * supported if the CPU abort handler supports bit 10.
456 */
cfb0810e
RK
457 { do_bad, SIGBUS, 0, "unknown 16" },
458 { do_bad, SIGBUS, 0, "unknown 17" },
459 { do_bad, SIGBUS, 0, "unknown 18" },
460 { do_bad, SIGBUS, 0, "unknown 19" },
461 { do_bad, SIGBUS, 0, "lock abort" }, /* xscale */
462 { do_bad, SIGBUS, 0, "unknown 21" },
463 { do_bad, SIGBUS, BUS_OBJERR, "imprecise external abort" }, /* xscale */
464 { do_bad, SIGBUS, 0, "unknown 23" },
465 { do_bad, SIGBUS, 0, "dcache parity error" }, /* xscale */
466 { do_bad, SIGBUS, 0, "unknown 25" },
467 { do_bad, SIGBUS, 0, "unknown 26" },
468 { do_bad, SIGBUS, 0, "unknown 27" },
469 { do_bad, SIGBUS, 0, "unknown 28" },
470 { do_bad, SIGBUS, 0, "unknown 29" },
471 { do_bad, SIGBUS, 0, "unknown 30" },
472 { do_bad, SIGBUS, 0, "unknown 31" }
1da177e4
LT
473};
474
475void __init
476hook_fault_code(int nr, int (*fn)(unsigned long, unsigned int, struct pt_regs *),
477 int sig, const char *name)
478{
479 if (nr >= 0 && nr < ARRAY_SIZE(fsr_info)) {
480 fsr_info[nr].fn = fn;
481 fsr_info[nr].sig = sig;
482 fsr_info[nr].name = name;
483 }
484}
485
486/*
487 * Dispatch a data abort to the relevant handler.
488 */
7ab3f8d5 489asmlinkage void __exception
1da177e4
LT
490do_DataAbort(unsigned long addr, unsigned int fsr, struct pt_regs *regs)
491{
c88d6aa7 492 const struct fsr_info *inf = fsr_info + fsr_fs(fsr);
cfb0810e 493 struct siginfo info;
1da177e4
LT
494
495 if (!inf->fn(addr, fsr, regs))
496 return;
497
498 printk(KERN_ALERT "Unhandled fault: %s (0x%03x) at 0x%08lx\n",
499 inf->name, fsr, addr);
cfb0810e
RK
500
501 info.si_signo = inf->sig;
502 info.si_errno = 0;
503 info.si_code = inf->code;
504 info.si_addr = (void __user *)addr;
1eeb66a1 505 arm_notify_die("", regs, &info, fsr, 0);
1da177e4
LT
506}
507
7ab3f8d5 508asmlinkage void __exception
1da177e4
LT
509do_PrefetchAbort(unsigned long addr, struct pt_regs *regs)
510{
511 do_translation_fault(addr, 0, regs);
512}
513