x86/amd-iommu: Workaround for erratum 63
[linux-2.6/verdex.git] / arch / sh / mm / tlbflush_64.c
blob3ce40ea34824914f6ad30ad2abb38a0d8ca9d401
1 /*
2 * arch/sh/mm/tlb-flush_64.c
4 * Copyright (C) 2000, 2001 Paolo Alberelli
5 * Copyright (C) 2003 Richard Curnow (/proc/tlb, bug fixes)
6 * Copyright (C) 2003 - 2009 Paul Mundt
8 * This file is subject to the terms and conditions of the GNU General Public
9 * License. See the file "COPYING" in the main directory of this archive
10 * for more details.
12 #include <linux/signal.h>
13 #include <linux/rwsem.h>
14 #include <linux/sched.h>
15 #include <linux/kernel.h>
16 #include <linux/errno.h>
17 #include <linux/string.h>
18 #include <linux/types.h>
19 #include <linux/ptrace.h>
20 #include <linux/mman.h>
21 #include <linux/mm.h>
22 #include <linux/smp.h>
23 #include <linux/perf_counter.h>
24 #include <linux/interrupt.h>
25 #include <asm/system.h>
26 #include <asm/io.h>
27 #include <asm/tlb.h>
28 #include <asm/uaccess.h>
29 #include <asm/pgalloc.h>
30 #include <asm/mmu_context.h>
32 extern void die(const char *,struct pt_regs *,long);
34 #define PFLAG(val,flag) (( (val) & (flag) ) ? #flag : "" )
35 #define PPROT(flag) PFLAG(pgprot_val(prot),flag)
37 static inline void print_prots(pgprot_t prot)
39 printk("prot is 0x%08lx\n",pgprot_val(prot));
41 printk("%s %s %s %s %s\n",PPROT(_PAGE_SHARED),PPROT(_PAGE_READ),
42 PPROT(_PAGE_EXECUTE),PPROT(_PAGE_WRITE),PPROT(_PAGE_USER));
45 static inline void print_vma(struct vm_area_struct *vma)
47 printk("vma start 0x%08lx\n", vma->vm_start);
48 printk("vma end 0x%08lx\n", vma->vm_end);
50 print_prots(vma->vm_page_prot);
51 printk("vm_flags 0x%08lx\n", vma->vm_flags);
54 static inline void print_task(struct task_struct *tsk)
56 printk("Task pid %d\n", task_pid_nr(tsk));
59 static pte_t *lookup_pte(struct mm_struct *mm, unsigned long address)
61 pgd_t *dir;
62 pud_t *pud;
63 pmd_t *pmd;
64 pte_t *pte;
65 pte_t entry;
67 dir = pgd_offset(mm, address);
68 if (pgd_none(*dir))
69 return NULL;
71 pud = pud_offset(dir, address);
72 if (pud_none(*pud))
73 return NULL;
75 pmd = pmd_offset(pud, address);
76 if (pmd_none(*pmd))
77 return NULL;
79 pte = pte_offset_kernel(pmd, address);
80 entry = *pte;
81 if (pte_none(entry) || !pte_present(entry))
82 return NULL;
84 return pte;
88 * This routine handles page faults. It determines the address,
89 * and the problem, and then passes it off to one of the appropriate
90 * routines.
92 asmlinkage void do_page_fault(struct pt_regs *regs, unsigned long writeaccess,
93 unsigned long textaccess, unsigned long address)
95 struct task_struct *tsk;
96 struct mm_struct *mm;
97 struct vm_area_struct * vma;
98 const struct exception_table_entry *fixup;
99 pte_t *pte;
100 int fault;
102 /* SIM
103 * Note this is now called with interrupts still disabled
104 * This is to cope with being called for a missing IO port
105 * address with interrupts disabled. This should be fixed as
106 * soon as we have a better 'fast path' miss handler.
108 * Plus take care how you try and debug this stuff.
109 * For example, writing debug data to a port which you
110 * have just faulted on is not going to work.
113 tsk = current;
114 mm = tsk->mm;
116 /* Not an IO address, so reenable interrupts */
117 local_irq_enable();
119 perf_swcounter_event(PERF_COUNT_SW_PAGE_FAULTS, 1, 0, regs, address);
122 * If we're in an interrupt or have no user
123 * context, we must not take the fault..
125 if (in_atomic() || !mm)
126 goto no_context;
128 /* TLB misses upon some cache flushes get done under cli() */
129 down_read(&mm->mmap_sem);
131 vma = find_vma(mm, address);
133 if (!vma) {
134 #ifdef DEBUG_FAULT
135 print_task(tsk);
136 printk("%s:%d fault, address is 0x%08x PC %016Lx textaccess %d writeaccess %d\n",
137 __func__, __LINE__,
138 address,regs->pc,textaccess,writeaccess);
139 show_regs(regs);
140 #endif
141 goto bad_area;
143 if (vma->vm_start <= address) {
144 goto good_area;
147 if (!(vma->vm_flags & VM_GROWSDOWN)) {
148 #ifdef DEBUG_FAULT
149 print_task(tsk);
150 printk("%s:%d fault, address is 0x%08x PC %016Lx textaccess %d writeaccess %d\n",
151 __func__, __LINE__,
152 address,regs->pc,textaccess,writeaccess);
153 show_regs(regs);
155 print_vma(vma);
156 #endif
157 goto bad_area;
159 if (expand_stack(vma, address)) {
160 #ifdef DEBUG_FAULT
161 print_task(tsk);
162 printk("%s:%d fault, address is 0x%08x PC %016Lx textaccess %d writeaccess %d\n",
163 __func__, __LINE__,
164 address,regs->pc,textaccess,writeaccess);
165 show_regs(regs);
166 #endif
167 goto bad_area;
170 * Ok, we have a good vm_area for this memory access, so
171 * we can handle it..
173 good_area:
174 if (textaccess) {
175 if (!(vma->vm_flags & VM_EXEC))
176 goto bad_area;
177 } else {
178 if (writeaccess) {
179 if (!(vma->vm_flags & VM_WRITE))
180 goto bad_area;
181 } else {
182 if (!(vma->vm_flags & VM_READ))
183 goto bad_area;
188 * If for any reason at all we couldn't handle the fault,
189 * make sure we exit gracefully rather than endlessly redo
190 * the fault.
192 survive:
193 fault = handle_mm_fault(mm, vma, address, writeaccess ? FAULT_FLAG_WRITE : 0);
194 if (unlikely(fault & VM_FAULT_ERROR)) {
195 if (fault & VM_FAULT_OOM)
196 goto out_of_memory;
197 else if (fault & VM_FAULT_SIGBUS)
198 goto do_sigbus;
199 BUG();
202 if (fault & VM_FAULT_MAJOR) {
203 tsk->maj_flt++;
204 perf_swcounter_event(PERF_COUNT_SW_PAGE_FAULTS_MAJ, 1, 0,
205 regs, address);
206 } else {
207 tsk->min_flt++;
208 perf_swcounter_event(PERF_COUNT_SW_PAGE_FAULTS_MIN, 1, 0,
209 regs, address);
212 /* If we get here, the page fault has been handled. Do the TLB refill
213 now from the newly-setup PTE, to avoid having to fault again right
214 away on the same instruction. */
215 pte = lookup_pte (mm, address);
216 if (!pte) {
217 /* From empirical evidence, we can get here, due to
218 !pte_present(pte). (e.g. if a swap-in occurs, and the page
219 is swapped back out again before the process that wanted it
220 gets rescheduled?) */
221 goto no_pte;
224 __do_tlb_refill(address, textaccess, pte);
226 no_pte:
228 up_read(&mm->mmap_sem);
229 return;
232 * Something tried to access memory that isn't in our memory map..
233 * Fix it, but check if it's kernel or user first..
235 bad_area:
236 #ifdef DEBUG_FAULT
237 printk("fault:bad area\n");
238 #endif
239 up_read(&mm->mmap_sem);
241 if (user_mode(regs)) {
242 static int count=0;
243 siginfo_t info;
244 if (count < 4) {
245 /* This is really to help debug faults when starting
246 * usermode, so only need a few */
247 count++;
248 printk("user mode bad_area address=%08lx pid=%d (%s) pc=%08lx\n",
249 address, task_pid_nr(current), current->comm,
250 (unsigned long) regs->pc);
251 #if 0
252 show_regs(regs);
253 #endif
255 if (is_global_init(tsk)) {
256 panic("INIT had user mode bad_area\n");
258 tsk->thread.address = address;
259 tsk->thread.error_code = writeaccess;
260 info.si_signo = SIGSEGV;
261 info.si_errno = 0;
262 info.si_addr = (void *) address;
263 force_sig_info(SIGSEGV, &info, tsk);
264 return;
267 no_context:
268 #ifdef DEBUG_FAULT
269 printk("fault:No context\n");
270 #endif
271 /* Are we prepared to handle this kernel fault? */
272 fixup = search_exception_tables(regs->pc);
273 if (fixup) {
274 regs->pc = fixup->fixup;
275 return;
279 * Oops. The kernel tried to access some bad page. We'll have to
280 * terminate things with extreme prejudice.
283 if (address < PAGE_SIZE)
284 printk(KERN_ALERT "Unable to handle kernel NULL pointer dereference");
285 else
286 printk(KERN_ALERT "Unable to handle kernel paging request");
287 printk(" at virtual address %08lx\n", address);
288 printk(KERN_ALERT "pc = %08Lx%08Lx\n", regs->pc >> 32, regs->pc & 0xffffffff);
289 die("Oops", regs, writeaccess);
290 do_exit(SIGKILL);
293 * We ran out of memory, or some other thing happened to us that made
294 * us unable to handle the page fault gracefully.
296 out_of_memory:
297 if (is_global_init(current)) {
298 panic("INIT out of memory\n");
299 yield();
300 goto survive;
302 printk("fault:Out of memory\n");
303 up_read(&mm->mmap_sem);
304 if (is_global_init(current)) {
305 yield();
306 down_read(&mm->mmap_sem);
307 goto survive;
309 printk("VM: killing process %s\n", tsk->comm);
310 if (user_mode(regs))
311 do_group_exit(SIGKILL);
312 goto no_context;
314 do_sigbus:
315 printk("fault:Do sigbus\n");
316 up_read(&mm->mmap_sem);
319 * Send a sigbus, regardless of whether we were in kernel
320 * or user mode.
322 tsk->thread.address = address;
323 tsk->thread.error_code = writeaccess;
324 tsk->thread.trap_no = 14;
325 force_sig(SIGBUS, tsk);
327 /* Kernel mode? Handle exceptions or die */
328 if (!user_mode(regs))
329 goto no_context;
332 void update_mmu_cache(struct vm_area_struct * vma,
333 unsigned long address, pte_t pte)
336 * This appears to get called once for every pte entry that gets
337 * established => I don't think it's efficient to try refilling the
338 * TLBs with the pages - some may not get accessed even. Also, for
339 * executable pages, it is impossible to determine reliably here which
340 * TLB they should be mapped into (or both even).
342 * So, just do nothing here and handle faults on demand. In the
343 * TLBMISS handling case, the refill is now done anyway after the pte
344 * has been fixed up, so that deals with most useful cases.
348 void local_flush_tlb_one(unsigned long asid, unsigned long page)
350 unsigned long long match, pteh=0, lpage;
351 unsigned long tlb;
354 * Sign-extend based on neff.
356 lpage = (page & NEFF_SIGN) ? (page | NEFF_MASK) : page;
357 match = (asid << PTEH_ASID_SHIFT) | PTEH_VALID;
358 match |= lpage;
360 for_each_itlb_entry(tlb) {
361 asm volatile ("getcfg %1, 0, %0"
362 : "=r" (pteh)
363 : "r" (tlb) );
365 if (pteh == match) {
366 __flush_tlb_slot(tlb);
367 break;
371 for_each_dtlb_entry(tlb) {
372 asm volatile ("getcfg %1, 0, %0"
373 : "=r" (pteh)
374 : "r" (tlb) );
376 if (pteh == match) {
377 __flush_tlb_slot(tlb);
378 break;
384 void local_flush_tlb_page(struct vm_area_struct *vma, unsigned long page)
386 unsigned long flags;
388 if (vma->vm_mm) {
389 page &= PAGE_MASK;
390 local_irq_save(flags);
391 local_flush_tlb_one(get_asid(), page);
392 local_irq_restore(flags);
396 void local_flush_tlb_range(struct vm_area_struct *vma, unsigned long start,
397 unsigned long end)
399 unsigned long flags;
400 unsigned long long match, pteh=0, pteh_epn, pteh_low;
401 unsigned long tlb;
402 unsigned int cpu = smp_processor_id();
403 struct mm_struct *mm;
405 mm = vma->vm_mm;
406 if (cpu_context(cpu, mm) == NO_CONTEXT)
407 return;
409 local_irq_save(flags);
411 start &= PAGE_MASK;
412 end &= PAGE_MASK;
414 match = (cpu_asid(cpu, mm) << PTEH_ASID_SHIFT) | PTEH_VALID;
416 /* Flush ITLB */
417 for_each_itlb_entry(tlb) {
418 asm volatile ("getcfg %1, 0, %0"
419 : "=r" (pteh)
420 : "r" (tlb) );
422 pteh_epn = pteh & PAGE_MASK;
423 pteh_low = pteh & ~PAGE_MASK;
425 if (pteh_low == match && pteh_epn >= start && pteh_epn <= end)
426 __flush_tlb_slot(tlb);
429 /* Flush DTLB */
430 for_each_dtlb_entry(tlb) {
431 asm volatile ("getcfg %1, 0, %0"
432 : "=r" (pteh)
433 : "r" (tlb) );
435 pteh_epn = pteh & PAGE_MASK;
436 pteh_low = pteh & ~PAGE_MASK;
438 if (pteh_low == match && pteh_epn >= start && pteh_epn <= end)
439 __flush_tlb_slot(tlb);
442 local_irq_restore(flags);
445 void local_flush_tlb_mm(struct mm_struct *mm)
447 unsigned long flags;
448 unsigned int cpu = smp_processor_id();
450 if (cpu_context(cpu, mm) == NO_CONTEXT)
451 return;
453 local_irq_save(flags);
455 cpu_context(cpu, mm) = NO_CONTEXT;
456 if (mm == current->mm)
457 activate_context(mm, cpu);
459 local_irq_restore(flags);
462 void local_flush_tlb_all(void)
464 /* Invalidate all, including shared pages, excluding fixed TLBs */
465 unsigned long flags, tlb;
467 local_irq_save(flags);
469 /* Flush each ITLB entry */
470 for_each_itlb_entry(tlb)
471 __flush_tlb_slot(tlb);
473 /* Flush each DTLB entry */
474 for_each_dtlb_entry(tlb)
475 __flush_tlb_slot(tlb);
477 local_irq_restore(flags);
480 void local_flush_tlb_kernel_range(unsigned long start, unsigned long end)
482 /* FIXME: Optimize this later.. */
483 flush_tlb_all();