/*
 * This file contains the routines setting up the linux page tables.
 *  -- paulus
 *
 * Derived from arch/ppc/mm/init.c:
 *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
 *
 *  Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
 *  and Cort Dougan (PReP) (cort@cs.nmt.edu)
 *    Copyright (C) 1996 Paul Mackerras
 *  Amiga/APUS changes by Jesper Skov (jskov@cygnus.co.uk).
 *
 *  Derived from "arch/i386/mm/init.c"
 *    Copyright (C) 1991, 1992, 1993, 1994  Linus Torvalds
 *
 *  This program is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU General Public License
 *  as published by the Free Software Foundation; either version
 *  2 of the License, or (at your option) any later version.
 *
 */
22
23#include <linux/config.h>
24#include <linux/kernel.h>
25#include <linux/module.h>
26#include <linux/types.h>
27#include <linux/mm.h>
28#include <linux/vmalloc.h>
29#include <linux/init.h>
30#include <linux/highmem.h>
31
32#include <asm/pgtable.h>
33#include <asm/pgalloc.h>
34#include <asm/io.h>
35
36#include "mmu_decl.h"
37
38unsigned long ioremap_base;
39unsigned long ioremap_bot;
40int io_bat_index;
41
Paul Mackerras0a26b132006-03-28 10:22:10 +110042#if defined(CONFIG_6xx)
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#define HAVE_BATS 1
44#endif
45
46#if defined(CONFIG_FSL_BOOKE)
47#define HAVE_TLBCAM 1
48#endif
49
50extern char etext[], _stext[];
51
52#ifdef CONFIG_SMP
53extern void hash_page_sync(void);
54#endif
55
56#ifdef HAVE_BATS
57extern unsigned long v_mapped_by_bats(unsigned long va);
58extern unsigned long p_mapped_by_bats(unsigned long pa);
59void setbat(int index, unsigned long virt, unsigned long phys,
60 unsigned int size, int flags);
61
62#else /* !HAVE_BATS */
63#define v_mapped_by_bats(x) (0UL)
64#define p_mapped_by_bats(x) (0UL)
65#endif /* HAVE_BATS */
66
67#ifdef HAVE_TLBCAM
68extern unsigned int tlbcam_index;
Linus Torvalds1da177e2005-04-16 15:20:36 -070069extern unsigned long v_mapped_by_tlbcam(unsigned long va);
70extern unsigned long p_mapped_by_tlbcam(unsigned long pa);
71#else /* !HAVE_TLBCAM */
72#define v_mapped_by_tlbcam(x) (0UL)
73#define p_mapped_by_tlbcam(x) (0UL)
74#endif /* HAVE_TLBCAM */
75
Kumar Galaa85f6d42005-04-16 15:24:21 -070076#ifdef CONFIG_PTE_64BIT
Linus Torvalds1da177e2005-04-16 15:20:36 -070077/* 44x uses an 8kB pgdir because it has 8-byte Linux PTEs. */
78#define PGDIR_ORDER 1
79#else
80#define PGDIR_ORDER 0
81#endif
82
83pgd_t *pgd_alloc(struct mm_struct *mm)
84{
85 pgd_t *ret;
86
87 ret = (pgd_t *)__get_free_pages(GFP_KERNEL|__GFP_ZERO, PGDIR_ORDER);
88 return ret;
89}
90
91void pgd_free(pgd_t *pgd)
92{
93 free_pages((unsigned long)pgd, PGDIR_ORDER);
94}
95
96pte_t *pte_alloc_one_kernel(struct mm_struct *mm, unsigned long address)
97{
98 pte_t *pte;
99 extern int mem_init_done;
100 extern void *early_get_page(void);
101
102 if (mem_init_done) {
103 pte = (pte_t *)__get_free_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO);
104 } else {
105 pte = (pte_t *)early_get_page();
106 if (pte)
107 clear_page(pte);
108 }
109 return pte;
110}
111
112struct page *pte_alloc_one(struct mm_struct *mm, unsigned long address)
113{
114 struct page *ptepage;
115
116#ifdef CONFIG_HIGHPTE
Al Viro53f9fc92005-10-21 03:22:24 -0400117 gfp_t flags = GFP_KERNEL | __GFP_HIGHMEM | __GFP_REPEAT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118#else
Al Viro53f9fc92005-10-21 03:22:24 -0400119 gfp_t flags = GFP_KERNEL | __GFP_REPEAT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120#endif
121
122 ptepage = alloc_pages(flags, 0);
123 if (ptepage)
124 clear_highpage(ptepage);
125 return ptepage;
126}
127
128void pte_free_kernel(pte_t *pte)
129{
130#ifdef CONFIG_SMP
131 hash_page_sync();
132#endif
133 free_page((unsigned long)pte);
134}
135
136void pte_free(struct page *ptepage)
137{
138#ifdef CONFIG_SMP
139 hash_page_sync();
140#endif
141 __free_page(ptepage);
142}
143
Kumar Galaa85f6d42005-04-16 15:24:21 -0700144#ifndef CONFIG_PHYS_64BIT
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145void __iomem *
146ioremap(phys_addr_t addr, unsigned long size)
147{
148 return __ioremap(addr, size, _PAGE_NO_CACHE);
149}
Kumar Galaa85f6d42005-04-16 15:24:21 -0700150#else /* CONFIG_PHYS_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151void __iomem *
152ioremap64(unsigned long long addr, unsigned long size)
153{
154 return __ioremap(addr, size, _PAGE_NO_CACHE);
155}
156
157void __iomem *
158ioremap(phys_addr_t addr, unsigned long size)
159{
160 phys_addr_t addr64 = fixup_bigphys_addr(addr, size);
161
162 return ioremap64(addr64, size);
163}
Kumar Galaa85f6d42005-04-16 15:24:21 -0700164#endif /* CONFIG_PHYS_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165
166void __iomem *
167__ioremap(phys_addr_t addr, unsigned long size, unsigned long flags)
168{
169 unsigned long v, i;
170 phys_addr_t p;
171 int err;
172
173 /*
174 * Choose an address to map it to.
175 * Once the vmalloc system is running, we use it.
176 * Before then, we use space going down from ioremap_base
177 * (ioremap_bot records where we're up to).
178 */
179 p = addr & PAGE_MASK;
180 size = PAGE_ALIGN(addr + size) - p;
181
182 /*
183 * If the address lies within the first 16 MB, assume it's in ISA
184 * memory space
185 */
186 if (p < 16*1024*1024)
187 p += _ISA_MEM_BASE;
188
189 /*
190 * Don't allow anybody to remap normal RAM that we're using.
191 * mem_init() sets high_memory so only do the check after that.
192 */
193 if ( mem_init_done && (p < virt_to_phys(high_memory)) )
194 {
Kumar Galaa85f6d42005-04-16 15:24:21 -0700195 printk("__ioremap(): phys addr "PHYS_FMT" is RAM lr %p\n", p,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 __builtin_return_address(0));
197 return NULL;
198 }
199
200 if (size == 0)
201 return NULL;
202
203 /*
204 * Is it already mapped? Perhaps overlapped by a previous
205 * BAT mapping. If the whole area is mapped then we're done,
206 * otherwise remap it since we want to keep the virt addrs for
207 * each request contiguous.
208 *
209 * We make the assumption here that if the bottom and top
210 * of the range we want are mapped then it's mapped to the
211 * same virt address (and this is contiguous).
212 * -- Cort
213 */
214 if ((v = p_mapped_by_bats(p)) /*&& p_mapped_by_bats(p+size-1)*/ )
215 goto out;
216
217 if ((v = p_mapped_by_tlbcam(p)))
218 goto out;
219
220 if (mem_init_done) {
221 struct vm_struct *area;
222 area = get_vm_area(size, VM_IOREMAP);
223 if (area == 0)
224 return NULL;
225 v = (unsigned long) area->addr;
226 } else {
227 v = (ioremap_bot -= size);
228 }
229
230 if ((flags & _PAGE_PRESENT) == 0)
231 flags |= _PAGE_KERNEL;
232 if (flags & _PAGE_NO_CACHE)
233 flags |= _PAGE_GUARDED;
234
235 /*
236 * Should check if it is a candidate for a BAT mapping
237 */
238
239 err = 0;
240 for (i = 0; i < size && err == 0; i += PAGE_SIZE)
241 err = map_page(v+i, p+i, flags);
242 if (err) {
243 if (mem_init_done)
244 vunmap((void *)v);
245 return NULL;
246 }
247
248out:
249 return (void __iomem *) (v + ((unsigned long)addr & ~PAGE_MASK));
250}
251
252void iounmap(volatile void __iomem *addr)
253{
254 /*
255 * If mapped by BATs then there is nothing to do.
256 * Calling vfree() generates a benign warning.
257 */
258 if (v_mapped_by_bats((unsigned long)addr)) return;
259
260 if (addr > high_memory && (unsigned long) addr < ioremap_bot)
261 vunmap((void *) (PAGE_MASK & (unsigned long)addr));
262}
263
264void __iomem *ioport_map(unsigned long port, unsigned int len)
265{
266 return (void __iomem *) (port + _IO_BASE);
267}
268
269void ioport_unmap(void __iomem *addr)
270{
271 /* Nothing to do */
272}
273EXPORT_SYMBOL(ioport_map);
274EXPORT_SYMBOL(ioport_unmap);
275
276int
277map_page(unsigned long va, phys_addr_t pa, int flags)
278{
279 pmd_t *pd;
280 pte_t *pg;
281 int err = -ENOMEM;
282
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283 /* Use upper 10 bits of VA to index the first level map */
284 pd = pmd_offset(pgd_offset_k(va), va);
285 /* Use middle 10 bits of VA to index the second-level map */
Hugh Dickins872fec12005-10-29 18:16:21 -0700286 pg = pte_alloc_kernel(pd, va);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287 if (pg != 0) {
288 err = 0;
289 set_pte_at(&init_mm, va, pg, pfn_pte(pa >> PAGE_SHIFT, __pgprot(flags)));
290 if (mem_init_done)
291 flush_HPTE(0, va, pmd_val(*pd));
292 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 return err;
294}
295
296/*
297 * Map in all of physical memory starting at KERNELBASE.
298 */
299void __init mapin_ram(void)
300{
301 unsigned long v, p, s, f;
302
303 s = mmu_mapin_ram();
304 v = KERNELBASE + s;
305 p = PPC_MEMSTART + s;
306 for (; s < total_lowmem; s += PAGE_SIZE) {
307 if ((char *) v >= _stext && (char *) v < etext)
308 f = _PAGE_RAM_TEXT;
309 else
310 f = _PAGE_RAM;
311 map_page(v, p, f);
312 v += PAGE_SIZE;
313 p += PAGE_SIZE;
314 }
315}
316
317/* is x a power of 2? */
318#define is_power_of_2(x) ((x) != 0 && (((x) & ((x) - 1)) == 0))
319
320/* is x a power of 4? */
321#define is_power_of_4(x) ((x) != 0 && (((x) & (x-1)) == 0) && (ffs(x) & 1))
322
323/*
324 * Set up a mapping for a block of I/O.
325 * virt, phys, size must all be page-aligned.
326 * This should only be called before ioremap is called.
327 */
328void __init io_block_mapping(unsigned long virt, phys_addr_t phys,
329 unsigned int size, int flags)
330{
331 int i;
332
333 if (virt > KERNELBASE && virt < ioremap_bot)
334 ioremap_bot = ioremap_base = virt;
335
336#ifdef HAVE_BATS
337 /*
338 * Use a BAT for this if possible...
339 */
340 if (io_bat_index < 2 && is_power_of_2(size)
341 && (virt & (size - 1)) == 0 && (phys & (size - 1)) == 0) {
342 setbat(io_bat_index, virt, phys, size, flags);
343 ++io_bat_index;
344 return;
345 }
346#endif /* HAVE_BATS */
347
348#ifdef HAVE_TLBCAM
349 /*
350 * Use a CAM for this if possible...
351 */
352 if (tlbcam_index < num_tlbcam_entries && is_power_of_4(size)
353 && (virt & (size - 1)) == 0 && (phys & (size - 1)) == 0) {
354 settlbcam(tlbcam_index, virt, phys, size, flags, 0);
355 ++tlbcam_index;
356 return;
357 }
358#endif /* HAVE_TLBCAM */
359
360 /* No BATs available, put it in the page tables. */
361 for (i = 0; i < size; i += PAGE_SIZE)
362 map_page(virt + i, phys + i, flags);
363}
364
365/* Scan the real Linux page tables and return a PTE pointer for
366 * a virtual address in a context.
367 * Returns true (1) if PTE was found, zero otherwise. The pointer to
368 * the PTE pointer is unmodified if PTE is not found.
369 */
370int
371get_pteptr(struct mm_struct *mm, unsigned long addr, pte_t **ptep)
372{
373 pgd_t *pgd;
374 pmd_t *pmd;
375 pte_t *pte;
376 int retval = 0;
377
378 pgd = pgd_offset(mm, addr & PAGE_MASK);
379 if (pgd) {
380 pmd = pmd_offset(pgd, addr & PAGE_MASK);
381 if (pmd_present(*pmd)) {
382 pte = pte_offset_map(pmd, addr & PAGE_MASK);
383 if (pte) {
384 retval = 1;
385 *ptep = pte;
386 /* XXX caller needs to do pte_unmap, yuck */
387 }
388 }
389 }
390 return(retval);
391}
392
393/* Find physical address for this virtual address. Normally used by
394 * I/O functions, but anyone can call it.
395 */
396unsigned long iopa(unsigned long addr)
397{
398 unsigned long pa;
399
400 /* I don't know why this won't work on PMacs or CHRP. It
401 * appears there is some bug, or there is some implicit
402 * mapping done not properly represented by BATs or in page
403 * tables.......I am actively working on resolving this, but
404 * can't hold up other stuff. -- Dan
405 */
406 pte_t *pte;
407 struct mm_struct *mm;
408
409 /* Check the BATs */
410 pa = v_mapped_by_bats(addr);
411 if (pa)
412 return pa;
413
414 /* Allow mapping of user addresses (within the thread)
415 * for DMA if necessary.
416 */
417 if (addr < TASK_SIZE)
418 mm = current->mm;
419 else
420 mm = &init_mm;
421
422 pa = 0;
423 if (get_pteptr(mm, addr, &pte)) {
424 pa = (pte_val(*pte) & PAGE_MASK) | (addr & ~PAGE_MASK);
425 pte_unmap(pte);
426 }
427
428 return(pa);
429}
430
431/* This is will find the virtual address for a physical one....
432 * Swiped from APUS, could be dangerous :-).
433 * This is only a placeholder until I really find a way to make this
434 * work. -- Dan
435 */
436unsigned long
437mm_ptov (unsigned long paddr)
438{
439 unsigned long ret;
440#if 0
441 if (paddr < 16*1024*1024)
442 ret = ZTWO_VADDR(paddr);
443 else {
444 int i;
445
446 for (i = 0; i < kmap_chunk_count;){
447 unsigned long phys = kmap_chunks[i++];
448 unsigned long size = kmap_chunks[i++];
449 unsigned long virt = kmap_chunks[i++];
450 if (paddr >= phys
451 && paddr < (phys + size)){
452 ret = virt + paddr - phys;
453 goto exit;
454 }
455 }
456
457 ret = (unsigned long) __va(paddr);
458 }
459exit:
460#ifdef DEBUGPV
461 printk ("PTOV(%lx)=%lx\n", paddr, ret);
462#endif
463#else
464 ret = (unsigned long)paddr + KERNELBASE;
465#endif
466 return ret;
467}
468