/*
 * This file contains the routines setting up the linux page tables.
 *
 * Derived from arch/ppc/mm/init.c:
 *   Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
 *
 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
 *   Copyright (C) 1996 Paul Mackerras
 *
 * Derived from "arch/i386/mm/init.c"
 *   Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
22 #include <linux/kernel.h>
23 #include <linux/module.h>
24 #include <linux/types.h>
26 #include <linux/vmalloc.h>
27 #include <linux/init.h>
28 #include <linux/highmem.h>
29 #include <linux/memblock.h>
30 #include <linux/slab.h>
32 #include <asm/pgtable.h>
33 #include <asm/pgalloc.h>
34 #include <asm/fixmap.h>
36 #include <asm/setup.h>
/*
 * Before the vmalloc allocator is usable, ioremap space is handed out
 * downwards from ioremap_base; ioremap_bot records the lowest address
 * given out so far.
 */
unsigned long ioremap_base;
unsigned long ioremap_bot;
EXPORT_SYMBOL(ioremap_bot);	/* aka VMALLOC_END */

/*
 * NOTE(review): the "#define HAVE_*" lines, their "#endif"s and the
 * "#ifdef HAVE_*" openers were missing from the damaged listing.  They are
 * restored here from the surviving "#else / #endif" markers - confirm
 * against the reference tree.
 */
#if defined(CONFIG_6xx) || defined(CONFIG_POWER3)
#define HAVE_BATS	1
#endif

#if defined(CONFIG_FSL_BOOKE)
#define HAVE_TLBCAM	1
#endif

/* Bounds of the kernel text, used to pick page protections for lowmem. */
extern char etext[], _stext[];

#ifdef HAVE_BATS
extern phys_addr_t v_mapped_by_bats(unsigned long va);
extern unsigned long p_mapped_by_bats(phys_addr_t pa);
void setbat(int index, unsigned long virt, phys_addr_t phys,
	    unsigned int size, int flags);

#else /* !HAVE_BATS */
/* No BATs: nothing is ever reported as BAT-mapped. */
#define v_mapped_by_bats(x)	(0UL)
#define p_mapped_by_bats(x)	(0UL)
#endif /* HAVE_BATS */

#ifdef HAVE_TLBCAM
extern unsigned int tlbcam_index;
extern phys_addr_t v_mapped_by_tlbcam(unsigned long va);
extern unsigned long p_mapped_by_tlbcam(phys_addr_t pa);
#else /* !HAVE_TLBCAM */
/* No TLB CAM: nothing is ever reported as CAM-mapped. */
#define v_mapped_by_tlbcam(x)	(0UL)
#define p_mapped_by_tlbcam(x)	(0UL)
#endif /* HAVE_TLBCAM */

/* log2 of the size, in bytes, of a page directory (see pgd_alloc()). */
#define PGDIR_ORDER	(32 + PGD_T_LOG2 - PGDIR_SHIFT)
76 pgd_t
*pgd_alloc(struct mm_struct
*mm
)
80 /* pgdir take page or two with 4K pages and a page fraction otherwise */
81 #ifndef CONFIG_PPC_4K_PAGES
82 ret
= kzalloc(1 << PGDIR_ORDER
, GFP_KERNEL
);
84 ret
= (pgd_t
*)__get_free_pages(GFP_KERNEL
|__GFP_ZERO
,
85 PGDIR_ORDER
- PAGE_SHIFT
);
90 void pgd_free(struct mm_struct
*mm
, pgd_t
*pgd
)
92 #ifndef CONFIG_PPC_4K_PAGES
95 free_pages((unsigned long)pgd
, PGDIR_ORDER
- PAGE_SHIFT
);
99 __init_refok pte_t
*pte_alloc_one_kernel(struct mm_struct
*mm
, unsigned long address
)
102 extern int mem_init_done
;
103 extern void *early_get_page(void);
106 pte
= (pte_t
*)__get_free_page(GFP_KERNEL
|__GFP_REPEAT
|__GFP_ZERO
);
108 pte
= (pte_t
*)early_get_page();
115 pgtable_t
pte_alloc_one(struct mm_struct
*mm
, unsigned long address
)
117 struct page
*ptepage
;
119 gfp_t flags
= GFP_KERNEL
| __GFP_REPEAT
| __GFP_ZERO
;
121 ptepage
= alloc_pages(flags
, 0);
124 if (!pgtable_page_ctor(ptepage
)) {
125 __free_page(ptepage
);
132 ioremap(phys_addr_t addr
, unsigned long size
)
134 return __ioremap_caller(addr
, size
, _PAGE_NO_CACHE
| _PAGE_GUARDED
,
135 __builtin_return_address(0));
137 EXPORT_SYMBOL(ioremap
);
140 ioremap_wc(phys_addr_t addr
, unsigned long size
)
142 return __ioremap_caller(addr
, size
, _PAGE_NO_CACHE
,
143 __builtin_return_address(0));
145 EXPORT_SYMBOL(ioremap_wc
);
148 ioremap_prot(phys_addr_t addr
, unsigned long size
, unsigned long flags
)
150 /* writeable implies dirty for kernel addresses */
151 if (flags
& _PAGE_RW
)
152 flags
|= _PAGE_DIRTY
| _PAGE_HWWRITE
;
154 /* we don't want to let _PAGE_USER and _PAGE_EXEC leak out */
155 flags
&= ~(_PAGE_USER
| _PAGE_EXEC
);
158 /* _PAGE_USER contains _PAGE_BAP_SR on BookE using the new PTE format
159 * which means that we just cleared supervisor access... oops ;-) This
162 flags
|= _PAGE_BAP_SR
;
165 return __ioremap_caller(addr
, size
, flags
, __builtin_return_address(0));
167 EXPORT_SYMBOL(ioremap_prot
);
170 __ioremap(phys_addr_t addr
, unsigned long size
, unsigned long flags
)
172 return __ioremap_caller(addr
, size
, flags
, __builtin_return_address(0));
176 __ioremap_caller(phys_addr_t addr
, unsigned long size
, unsigned long flags
,
183 /* Make sure we have the base flags */
184 if ((flags
& _PAGE_PRESENT
) == 0)
185 flags
|= PAGE_KERNEL
;
187 /* Non-cacheable page cannot be coherent */
188 if (flags
& _PAGE_NO_CACHE
)
189 flags
&= ~_PAGE_COHERENT
;
192 * Choose an address to map it to.
193 * Once the vmalloc system is running, we use it.
194 * Before then, we use space going down from ioremap_base
195 * (ioremap_bot records where we're up to).
197 p
= addr
& PAGE_MASK
;
198 size
= PAGE_ALIGN(addr
+ size
) - p
;
201 * If the address lies within the first 16 MB, assume it's in ISA
204 if (p
< 16*1024*1024)
207 #ifndef CONFIG_CRASH_DUMP
209 * Don't allow anybody to remap normal RAM that we're using.
210 * mem_init() sets high_memory so only do the check after that.
212 if (mem_init_done
&& (p
< virt_to_phys(high_memory
)) &&
213 !(__allow_ioremap_reserved
&& memblock_is_region_reserved(p
, size
))) {
214 printk("__ioremap(): phys addr 0x%llx is RAM lr %pf\n",
215 (unsigned long long)p
, __builtin_return_address(0));
224 * Is it already mapped? Perhaps overlapped by a previous
225 * BAT mapping. If the whole area is mapped then we're done,
226 * otherwise remap it since we want to keep the virt addrs for
227 * each request contiguous.
229 * We make the assumption here that if the bottom and top
230 * of the range we want are mapped then it's mapped to the
231 * same virt address (and this is contiguous).
234 if ((v
= p_mapped_by_bats(p
)) /*&& p_mapped_by_bats(p+size-1)*/ )
237 if ((v
= p_mapped_by_tlbcam(p
)))
241 struct vm_struct
*area
;
242 area
= get_vm_area_caller(size
, VM_IOREMAP
, caller
);
246 v
= (unsigned long) area
->addr
;
248 v
= (ioremap_bot
-= size
);
252 * Should check if it is a candidate for a BAT mapping
256 for (i
= 0; i
< size
&& err
== 0; i
+= PAGE_SIZE
)
257 err
= map_page(v
+i
, p
+i
, flags
);
265 return (void __iomem
*) (v
+ ((unsigned long)addr
& ~PAGE_MASK
));
267 EXPORT_SYMBOL(__ioremap
);
269 void iounmap(volatile void __iomem
*addr
)
272 * If mapped by BATs then there is nothing to do.
273 * Calling vfree() generates a benign warning.
275 if (v_mapped_by_bats((unsigned long)addr
)) return;
277 if (addr
> high_memory
&& (unsigned long) addr
< ioremap_bot
)
278 vunmap((void *) (PAGE_MASK
& (unsigned long)addr
));
280 EXPORT_SYMBOL(iounmap
);
282 int map_page(unsigned long va
, phys_addr_t pa
, int flags
)
288 /* Use upper 10 bits of VA to index the first level map */
289 pd
= pmd_offset(pud_offset(pgd_offset_k(va
), va
), va
);
290 /* Use middle 10 bits of VA to index the second-level map */
291 pg
= pte_alloc_kernel(pd
, va
);
294 /* The PTE should never be already set nor present in the
297 BUG_ON((pte_val(*pg
) & (_PAGE_PRESENT
| _PAGE_HASHPTE
)) &&
299 set_pte_at(&init_mm
, va
, pg
, pfn_pte(pa
>> PAGE_SHIFT
,
307 * Map in a chunk of physical memory starting at start.
309 void __init
__mapin_ram_chunk(unsigned long offset
, unsigned long top
)
311 unsigned long v
, s
, f
;
317 p
= memstart_addr
+ s
;
318 for (; s
< top
; s
+= PAGE_SIZE
) {
319 ktext
= ((char *) v
>= _stext
&& (char *) v
< etext
);
320 f
= ktext
? PAGE_KERNEL_TEXT
: PAGE_KERNEL
;
322 #ifdef CONFIG_PPC_STD_MMU_32
324 hash_preload(&init_mm
, v
, 0, 0x300);
331 void __init
mapin_ram(void)
333 unsigned long s
, top
;
337 s
= mmu_mapin_ram(top
);
338 __mapin_ram_chunk(s
, top
);
340 if (!wii_hole_size
) {
341 s
= mmu_mapin_ram(total_lowmem
);
342 __mapin_ram_chunk(s
, total_lowmem
);
344 top
= wii_hole_start
;
345 s
= mmu_mapin_ram(top
);
346 __mapin_ram_chunk(s
, top
);
348 top
= memblock_end_of_DRAM();
349 s
= wii_mmu_mapin_mem2(top
);
350 __mapin_ram_chunk(s
, top
);
355 /* Scan the real Linux page tables and return a PTE pointer for
356 * a virtual address in a context.
357 * Returns true (1) if PTE was found, zero otherwise. The pointer to
358 * the PTE pointer is unmodified if PTE is not found.
361 get_pteptr(struct mm_struct
*mm
, unsigned long addr
, pte_t
**ptep
, pmd_t
**pmdp
)
369 pgd
= pgd_offset(mm
, addr
& PAGE_MASK
);
371 pud
= pud_offset(pgd
, addr
& PAGE_MASK
);
372 if (pud
&& pud_present(*pud
)) {
373 pmd
= pmd_offset(pud
, addr
& PAGE_MASK
);
374 if (pmd_present(*pmd
)) {
375 pte
= pte_offset_map(pmd
, addr
& PAGE_MASK
);
381 /* XXX caller needs to do pte_unmap, yuck */
389 #ifdef CONFIG_DEBUG_PAGEALLOC
391 static int __change_page_attr(struct page
*page
, pgprot_t prot
)
395 unsigned long address
;
397 BUG_ON(PageHighMem(page
));
398 address
= (unsigned long)page_address(page
);
400 if (v_mapped_by_bats(address
) || v_mapped_by_tlbcam(address
))
402 if (!get_pteptr(&init_mm
, address
, &kpte
, &kpmd
))
404 __set_pte_at(&init_mm
, address
, kpte
, mk_pte(page
, prot
), 0);
406 flush_tlb_page(NULL
, address
);
413 * Change the page attributes of an page in the linear mapping.
415 * THIS CONFLICTS WITH BAT MAPPINGS, DEBUG USE ONLY
417 static int change_page_attr(struct page
*page
, int numpages
, pgprot_t prot
)
422 local_irq_save(flags
);
423 for (i
= 0; i
< numpages
; i
++, page
++) {
424 err
= __change_page_attr(page
, prot
);
428 local_irq_restore(flags
);
433 void kernel_map_pages(struct page
*page
, int numpages
, int enable
)
435 if (PageHighMem(page
))
438 change_page_attr(page
, numpages
, enable
? PAGE_KERNEL
: __pgprot(0));
440 #endif /* CONFIG_DEBUG_PAGEALLOC */
444 void __set_fixmap (enum fixed_addresses idx
, phys_addr_t phys
, pgprot_t flags
)
446 unsigned long address
= __fix_to_virt(idx
);
448 if (idx
>= __end_of_fixed_addresses
) {
453 map_page(address
, phys
, pgprot_val(flags
));
457 void __this_fixmap_does_not_exist(void)