[PATCH] mm: init_mm without ptlock
[linux-2.6/btrfs-unstable.git] / arch / ppc / mm / pgtable.c
blob6ea9185fd120fa16c6e8013fe545898ef169960d
1 /*
2 * This file contains the routines setting up the linux page tables.
3 * -- paulus
5 * Derived from arch/ppc/mm/init.c:
6 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
8 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
9 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
10 * Copyright (C) 1996 Paul Mackerras
11 * Amiga/APUS changes by Jesper Skov (jskov@cygnus.co.uk).
13 * Derived from "arch/i386/mm/init.c"
14 * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
16 * This program is free software; you can redistribute it and/or
17 * modify it under the terms of the GNU General Public License
18 * as published by the Free Software Foundation; either version
19 * 2 of the License, or (at your option) any later version.
23 #include <linux/config.h>
24 #include <linux/kernel.h>
25 #include <linux/module.h>
26 #include <linux/types.h>
27 #include <linux/mm.h>
28 #include <linux/vmalloc.h>
29 #include <linux/init.h>
30 #include <linux/highmem.h>
32 #include <asm/pgtable.h>
33 #include <asm/pgalloc.h>
34 #include <asm/io.h>
36 #include "mmu_decl.h"
/*
 * Early ioremap window: before the vmalloc system is running, __ioremap()
 * hands out virtual space going down from ioremap_base, and ioremap_bot
 * records how far it has got.
 */
unsigned long ioremap_base;
unsigned long ioremap_bot;

/* Index of the next BAT that io_block_mapping() will program. */
int io_bat_index;

/* Which block-mapping facilities does this CPU family provide? */
#if defined(CONFIG_6xx) || defined(CONFIG_POWER3)
#define HAVE_BATS	1
#endif

#ifdef CONFIG_FSL_BOOKE
#define HAVE_TLBCAM	1
#endif

/* Bounds of the kernel text, used to pick page protections in mapin_ram(). */
extern char etext[], _stext[];

#ifdef CONFIG_SMP
extern void hash_page_sync(void);
#endif

/*
 * BAT lookups.  Without BATs the lookups collapse to "not mapped" (0UL).
 */
#ifndef HAVE_BATS
#define v_mapped_by_bats(x)	(0UL)
#define p_mapped_by_bats(x)	(0UL)
#else /* HAVE_BATS */
extern unsigned long v_mapped_by_bats(unsigned long va);
extern unsigned long p_mapped_by_bats(unsigned long pa);
void setbat(int index, unsigned long virt, unsigned long phys,
	    unsigned int size, int flags);
#endif /* HAVE_BATS */

/*
 * TLB CAM lookups.  Without a TLB CAM the lookups collapse to
 * "not mapped" (0UL).
 */
#ifndef HAVE_TLBCAM
#define v_mapped_by_tlbcam(x)	(0UL)
#define p_mapped_by_tlbcam(x)	(0UL)
#else /* HAVE_TLBCAM */
extern unsigned int tlbcam_index;
extern unsigned long v_mapped_by_tlbcam(unsigned long va);
extern unsigned long p_mapped_by_tlbcam(unsigned long pa);
#endif /* HAVE_TLBCAM */

/*
 * Allocation order of a page directory.
 * 44x uses an 8kB pgdir because it has 8-byte Linux PTEs.
 */
#ifndef CONFIG_PTE_64BIT
#define PGDIR_ORDER	0
#else
#define PGDIR_ORDER	1
#endif
83 pgd_t *pgd_alloc(struct mm_struct *mm)
85 pgd_t *ret;
87 ret = (pgd_t *)__get_free_pages(GFP_KERNEL|__GFP_ZERO, PGDIR_ORDER);
88 return ret;
91 void pgd_free(pgd_t *pgd)
93 free_pages((unsigned long)pgd, PGDIR_ORDER);
96 pte_t *pte_alloc_one_kernel(struct mm_struct *mm, unsigned long address)
98 pte_t *pte;
99 extern int mem_init_done;
100 extern void *early_get_page(void);
102 if (mem_init_done) {
103 pte = (pte_t *)__get_free_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO);
104 } else {
105 pte = (pte_t *)early_get_page();
106 if (pte)
107 clear_page(pte);
109 return pte;
112 struct page *pte_alloc_one(struct mm_struct *mm, unsigned long address)
114 struct page *ptepage;
116 #ifdef CONFIG_HIGHPTE
117 gfp_t flags = GFP_KERNEL | __GFP_HIGHMEM | __GFP_REPEAT;
118 #else
119 gfp_t flags = GFP_KERNEL | __GFP_REPEAT;
120 #endif
122 ptepage = alloc_pages(flags, 0);
123 if (ptepage)
124 clear_highpage(ptepage);
125 return ptepage;
128 void pte_free_kernel(pte_t *pte)
130 #ifdef CONFIG_SMP
131 hash_page_sync();
132 #endif
133 free_page((unsigned long)pte);
/*
 * Free a PTE page identified by its struct page.
 * Like pte_free_kernel(), SMP kernels call hash_page_sync() before the
 * page is handed back.
 */
void pte_free(struct page *ptepage)
{
#if defined(CONFIG_SMP)
	hash_page_sync();
#endif

	__free_page(ptepage);
}
144 #ifndef CONFIG_PHYS_64BIT
145 void __iomem *
146 ioremap(phys_addr_t addr, unsigned long size)
148 return __ioremap(addr, size, _PAGE_NO_CACHE);
150 #else /* CONFIG_PHYS_64BIT */
151 void __iomem *
152 ioremap64(unsigned long long addr, unsigned long size)
154 return __ioremap(addr, size, _PAGE_NO_CACHE);
157 void __iomem *
158 ioremap(phys_addr_t addr, unsigned long size)
160 phys_addr_t addr64 = fixup_bigphys_addr(addr, size);
162 return ioremap64(addr64, size);
164 #endif /* CONFIG_PHYS_64BIT */
166 void __iomem *
167 __ioremap(phys_addr_t addr, unsigned long size, unsigned long flags)
169 unsigned long v, i;
170 phys_addr_t p;
171 int err;
174 * Choose an address to map it to.
175 * Once the vmalloc system is running, we use it.
176 * Before then, we use space going down from ioremap_base
177 * (ioremap_bot records where we're up to).
179 p = addr & PAGE_MASK;
180 size = PAGE_ALIGN(addr + size) - p;
183 * If the address lies within the first 16 MB, assume it's in ISA
184 * memory space
186 if (p < 16*1024*1024)
187 p += _ISA_MEM_BASE;
190 * Don't allow anybody to remap normal RAM that we're using.
191 * mem_init() sets high_memory so only do the check after that.
193 if ( mem_init_done && (p < virt_to_phys(high_memory)) )
195 printk("__ioremap(): phys addr "PHYS_FMT" is RAM lr %p\n", p,
196 __builtin_return_address(0));
197 return NULL;
200 if (size == 0)
201 return NULL;
204 * Is it already mapped? Perhaps overlapped by a previous
205 * BAT mapping. If the whole area is mapped then we're done,
206 * otherwise remap it since we want to keep the virt addrs for
207 * each request contiguous.
209 * We make the assumption here that if the bottom and top
210 * of the range we want are mapped then it's mapped to the
211 * same virt address (and this is contiguous).
212 * -- Cort
214 if ((v = p_mapped_by_bats(p)) /*&& p_mapped_by_bats(p+size-1)*/ )
215 goto out;
217 if ((v = p_mapped_by_tlbcam(p)))
218 goto out;
220 if (mem_init_done) {
221 struct vm_struct *area;
222 area = get_vm_area(size, VM_IOREMAP);
223 if (area == 0)
224 return NULL;
225 v = (unsigned long) area->addr;
226 } else {
227 v = (ioremap_bot -= size);
230 if ((flags & _PAGE_PRESENT) == 0)
231 flags |= _PAGE_KERNEL;
232 if (flags & _PAGE_NO_CACHE)
233 flags |= _PAGE_GUARDED;
236 * Should check if it is a candidate for a BAT mapping
239 err = 0;
240 for (i = 0; i < size && err == 0; i += PAGE_SIZE)
241 err = map_page(v+i, p+i, flags);
242 if (err) {
243 if (mem_init_done)
244 vunmap((void *)v);
245 return NULL;
248 out:
249 return (void __iomem *) (v + ((unsigned long)addr & ~PAGE_MASK));
252 void iounmap(volatile void __iomem *addr)
255 * If mapped by BATs then there is nothing to do.
256 * Calling vfree() generates a benign warning.
258 if (v_mapped_by_bats((unsigned long)addr)) return;
260 if (addr > high_memory && (unsigned long) addr < ioremap_bot)
261 vunmap((void *) (PAGE_MASK & (unsigned long)addr));
264 void __iomem *ioport_map(unsigned long port, unsigned int len)
266 return (void __iomem *) (port + _IO_BASE);
269 void ioport_unmap(void __iomem *addr)
271 /* Nothing to do */
273 EXPORT_SYMBOL(ioport_map);
274 EXPORT_SYMBOL(ioport_unmap);
277 map_page(unsigned long va, phys_addr_t pa, int flags)
279 pmd_t *pd;
280 pte_t *pg;
281 int err = -ENOMEM;
283 /* Use upper 10 bits of VA to index the first level map */
284 pd = pmd_offset(pgd_offset_k(va), va);
285 /* Use middle 10 bits of VA to index the second-level map */
286 pg = pte_alloc_kernel(pd, va);
287 if (pg != 0) {
288 err = 0;
289 set_pte_at(&init_mm, va, pg, pfn_pte(pa >> PAGE_SHIFT, __pgprot(flags)));
290 if (mem_init_done)
291 flush_HPTE(0, va, pmd_val(*pd));
293 return err;
297 * Map in all of physical memory starting at KERNELBASE.
299 void __init mapin_ram(void)
301 unsigned long v, p, s, f;
303 s = mmu_mapin_ram();
304 v = KERNELBASE + s;
305 p = PPC_MEMSTART + s;
306 for (; s < total_lowmem; s += PAGE_SIZE) {
307 if ((char *) v >= _stext && (char *) v < etext)
308 f = _PAGE_RAM_TEXT;
309 else
310 f = _PAGE_RAM;
311 map_page(v, p, f);
312 v += PAGE_SIZE;
313 p += PAGE_SIZE;
/*
 * is x a power of 2?
 * True when x is non-zero and has exactly one bit set.
 * Note: the argument is evaluated more than once.
 */
#define is_power_of_2(x)	((x) != 0 && (((x) & ((x) - 1)) == 0))

/*
 * is x a power of 4?
 * A power of 2 whose single set bit sits at an even bit position, i.e.
 * ffs() (which counts from 1) returns an odd number.
 * The argument is fully parenthesised so that expression arguments such
 * as "a | b" are handled correctly; it is evaluated more than once.
 */
#define is_power_of_4(x)	(is_power_of_2(x) && (ffs(x) & 1))
324 * Set up a mapping for a block of I/O.
325 * virt, phys, size must all be page-aligned.
326 * This should only be called before ioremap is called.
328 void __init io_block_mapping(unsigned long virt, phys_addr_t phys,
329 unsigned int size, int flags)
331 int i;
333 if (virt > KERNELBASE && virt < ioremap_bot)
334 ioremap_bot = ioremap_base = virt;
336 #ifdef HAVE_BATS
338 * Use a BAT for this if possible...
340 if (io_bat_index < 2 && is_power_of_2(size)
341 && (virt & (size - 1)) == 0 && (phys & (size - 1)) == 0) {
342 setbat(io_bat_index, virt, phys, size, flags);
343 ++io_bat_index;
344 return;
346 #endif /* HAVE_BATS */
348 #ifdef HAVE_TLBCAM
350 * Use a CAM for this if possible...
352 if (tlbcam_index < num_tlbcam_entries && is_power_of_4(size)
353 && (virt & (size - 1)) == 0 && (phys & (size - 1)) == 0) {
354 settlbcam(tlbcam_index, virt, phys, size, flags, 0);
355 ++tlbcam_index;
356 return;
358 #endif /* HAVE_TLBCAM */
360 /* No BATs available, put it in the page tables. */
361 for (i = 0; i < size; i += PAGE_SIZE)
362 map_page(virt + i, phys + i, flags);
365 /* Scan the real Linux page tables and return a PTE pointer for
366 * a virtual address in a context.
367 * Returns true (1) if PTE was found, zero otherwise. The pointer to
368 * the PTE pointer is unmodified if PTE is not found.
371 get_pteptr(struct mm_struct *mm, unsigned long addr, pte_t **ptep)
373 pgd_t *pgd;
374 pmd_t *pmd;
375 pte_t *pte;
376 int retval = 0;
378 pgd = pgd_offset(mm, addr & PAGE_MASK);
379 if (pgd) {
380 pmd = pmd_offset(pgd, addr & PAGE_MASK);
381 if (pmd_present(*pmd)) {
382 pte = pte_offset_map(pmd, addr & PAGE_MASK);
383 if (pte) {
384 retval = 1;
385 *ptep = pte;
386 /* XXX caller needs to do pte_unmap, yuck */
390 return(retval);
393 /* Find physical address for this virtual address. Normally used by
394 * I/O functions, but anyone can call it.
396 unsigned long iopa(unsigned long addr)
398 unsigned long pa;
400 /* I don't know why this won't work on PMacs or CHRP. It
401 * appears there is some bug, or there is some implicit
402 * mapping done not properly represented by BATs or in page
403 * tables.......I am actively working on resolving this, but
404 * can't hold up other stuff. -- Dan
406 pte_t *pte;
407 struct mm_struct *mm;
409 /* Check the BATs */
410 pa = v_mapped_by_bats(addr);
411 if (pa)
412 return pa;
414 /* Allow mapping of user addresses (within the thread)
415 * for DMA if necessary.
417 if (addr < TASK_SIZE)
418 mm = current->mm;
419 else
420 mm = &init_mm;
422 pa = 0;
423 if (get_pteptr(mm, addr, &pte)) {
424 pa = (pte_val(*pte) & PAGE_MASK) | (addr & ~PAGE_MASK);
425 pte_unmap(pte);
428 return(pa);
431 /* This is will find the virtual address for a physical one....
432 * Swiped from APUS, could be dangerous :-).
433 * This is only a placeholder until I really find a way to make this
434 * work. -- Dan
436 unsigned long
437 mm_ptov (unsigned long paddr)
439 unsigned long ret;
440 #if 0
441 if (paddr < 16*1024*1024)
442 ret = ZTWO_VADDR(paddr);
443 else {
444 int i;
446 for (i = 0; i < kmap_chunk_count;){
447 unsigned long phys = kmap_chunks[i++];
448 unsigned long size = kmap_chunks[i++];
449 unsigned long virt = kmap_chunks[i++];
450 if (paddr >= phys
451 && paddr < (phys + size)){
452 ret = virt + paddr - phys;
453 goto exit;
457 ret = (unsigned long) __va(paddr);
459 exit:
460 #ifdef DEBUGPV
461 printk ("PTOV(%lx)=%lx\n", paddr, ret);
462 #endif
463 #else
464 ret = (unsigned long)paddr + KERNELBASE;
465 #endif
466 return ret;