Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
| 2 | * This file is subject to the terms and conditions of the GNU General Public |
| 3 | * License. See the file "COPYING" in the main directory of this archive |
| 4 | * for more details. |
| 5 | * |
| 6 | * Copyright (C) 1994, 95, 96, 97, 98, 99, 2000, 2003 Ralf Baechle |
| 7 | * Copyright (C) 1999, 2000, 2001 Silicon Graphics, Inc. |
| 8 | */ |
| 9 | #ifndef _ASM_PGTABLE_64_H |
| 10 | #define _ASM_PGTABLE_64_H |
| 11 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 12 | #include <linux/linkage.h> |
| 13 | |
| 14 | #include <asm/addrspace.h> |
| 15 | #include <asm/page.h> |
| 16 | #include <asm/cachectl.h> |
Atsushi Nemoto | 656be92 | 2006-10-26 00:08:31 +0900 | [diff] [blame] | 17 | #include <asm/fixmap.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 18 | |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 19 | #include <asm-generic/pgtable-nopud.h> |
| 20 | |
/*
 * Each address space has two 4K pages as its page directory, giving 1024
 * (== PTRS_PER_PGD) 8 byte pointers to pmd tables. Each pmd table is a
 * single 4K page, giving 512 (== PTRS_PER_PMD) 8 byte pointers to page
 * tables. Each page table is also a single 4K page, giving 512 (==
 * PTRS_PER_PTE) 8 byte ptes. Each pud entry is initialized to point to
 * invalid_pmd_table, each pmd entry is initialized to point to
 * invalid_pte_table, each pte is initialized to 0. When memory is low,
 * and a pmd table or a page table allocation fails, empty_bad_pmd_table
 * and empty_bad_page_table are returned to higher layer code, so
 * that the failure is recognized later on. Linux does not seem to
 * handle these failures very well though. The empty_bad_page_table has
 * invalid pte entries in it, to force page faults.
 *
 * Kernel mappings: kernel mappings are held in the swapper_pg_table.
 * The layout is identical to userspace except it's indexed with the
 * fault address - VMALLOC_START.
 */
| 39 | |
/*
 * PMD_SHIFT is log2 of the address range one pmd entry (i.e. one whole
 * pte table) maps: PAGE_SHIFT bits of in-page offset plus the index bits
 * of a pte table.  A table of (PAGE_SIZE << PTE_ORDER) bytes holding
 * 8-byte entries has PAGE_SHIFT + PTE_ORDER - 3 index bits.
 */
#define PMD_SHIFT	(PAGE_SHIFT + (PAGE_SHIFT + PTE_ORDER - 3))
#define PMD_SIZE	(1UL << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE - 1))

/*
 * PGDIR_SHIFT is log2 of the address range one pgd entry (i.e. one whole
 * pmd table) maps: PMD_SHIFT plus the index bits of a pmd table.
 */
#define PGDIR_SHIFT	(PMD_SHIFT + (PAGE_SHIFT + PMD_ORDER - 3))
#define PGDIR_SIZE	(1UL << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE - 1))
| 49 | |
/*
 * For 4kB page size we use a 3 level page tree and an 8kB pgd (the pud
 * level is folded into the pgd), which permits us to map 40 bits of
 * virtual address space.
 *
 * We used to implement 41 bits by having an order 1 pmd level but that seemed
 * rather pointless.
 *
 * For 8kB page size we use a 3 level page tree which permits a total of
 * 8TB of address space. Alternatively a 33-bit / 8GB organization using
 * two levels would be easy to implement.
 *
 * For 16kB page size we use a 2 level page tree which permits a total of
 * 36 bits of virtual address space. We could add a third level but it seems
 * like at the moment there's no need for this.
 *
 * For 64kB page size we use a 2 level page table tree for a total of 42 bits
 * of virtual address space.
 *
 * NOTE(review): the shift and ORDER definitions in this file describe the
 * same three-level scheme for every page size, so the two-level figures
 * quoted for 16kB and 64kB look out of date - confirm.
 */
/*
 * Allocation order (log2 of the number of pages) of each table level,
 * selected by the configured page size.  Only the 4kB configuration uses
 * a two-page pgd; every other size uses one page per table.
 *
 * PUD_ORDER expands to an identifier that is not defined anywhere in this
 * header - presumably on purpose, so that any attempt to allocate a pud
 * fails to build.
 */
#if defined(CONFIG_PAGE_SIZE_4KB)
#define PGD_ORDER		1
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

#if defined(CONFIG_PAGE_SIZE_8KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

#if defined(CONFIG_PAGE_SIZE_16KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

#if defined(CONFIG_PAGE_SIZE_32KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

#if defined(CONFIG_PAGE_SIZE_64KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
| 98 | |
/*
 * Number of entries in one table of each level: the table size in bytes
 * (PAGE_SIZE scaled by the level's allocation order) divided by the size
 * of one entry.
 */
#define PTRS_PER_PGD	((PAGE_SIZE << PGD_ORDER) / sizeof(pgd_t))
#define PTRS_PER_PMD	((PAGE_SIZE << PMD_ORDER) / sizeof(pmd_t))
#define PTRS_PER_PTE	((PAGE_SIZE << PTE_ORDER) / sizeof(pte_t))

/*
 * Number of pgd entries needed to cover user space.  When a single pgd
 * entry already spans at least TASK_SIZE the division would yield zero,
 * so one entry is used instead.
 */
#if PGDIR_SIZE < TASK_SIZE
#define USER_PTRS_PER_PGD	(TASK_SIZE / PGDIR_SIZE)
#else
#define USER_PTRS_PER_PGD	(1)
#endif

/* Lowest user-space virtual address. */
#define FIRST_USER_ADDRESS	0UL
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 109 | |
/*
 * The vmalloc area starts at MAP_BASE.  Its end is the start plus the
 * smaller of
 *   - the span addressable by a full pgd/pmd/pte tree, and
 *   - 2^cpu_vmbits,
 * minus 1UL << 32 (4GB).  The reason for the 4GB gap is not visible in
 * this file.
 */
#define VMALLOC_START		MAP_BASE
#define VMALLOC_END							\
	(VMALLOC_START +						\
	 min(PTRS_PER_PGD * PTRS_PER_PMD * PTRS_PER_PTE * PAGE_SIZE,	\
	     (1UL << cpu_vmbits)) - (1UL << 32))
| 115 | |
/*
 * With modules enabled and KBUILD_64BIT_SYM32 defined, modules get their
 * own range in the 32bit-compatible segment - unless the vmalloc area
 * already starts at CKSSEG.  The range runs from CKSSEG up to two pages
 * below FIXADDR_START.
 */
#if defined(CONFIG_MODULES) && defined(KBUILD_64BIT_SYM32) && \
	(VMALLOC_START != CKSSEG)
#define MODULE_START	CKSSEG
#define MODULE_END	(FIXADDR_START - 2 * PAGE_SIZE)
#endif
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 122 | |
/*
 * Report a corrupt page-table entry of the given level.  Each macro
 * prints the source file and line of the call site followed by the raw
 * entry value as 16 hex digits.
 */
#define pte_ERROR(e)							\
	printk("%s:%d: bad pte %016lx.\n", __FILE__, __LINE__, pte_val(e))

#define pmd_ERROR(e)							\
	printk("%s:%d: bad pmd %016lx.\n", __FILE__, __LINE__, pmd_val(e))

#define pgd_ERROR(e)							\
	printk("%s:%d: bad pgd %016lx.\n", __FILE__, __LINE__, pgd_val(e))
| 129 | |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 130 | extern pte_t invalid_pte_table[PTRS_PER_PTE]; |
| 131 | extern pte_t empty_bad_page_table[PTRS_PER_PTE]; |
| 132 | extern pmd_t invalid_pmd_table[PTRS_PER_PMD]; |
| 133 | extern pmd_t empty_bad_pmd_table[PTRS_PER_PMD]; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 134 | |
| 135 | /* |
Thiemo Seufer | 1b3a6e9 | 2005-04-01 14:07:13 +0000 | [diff] [blame] | 136 | * Empty pgd/pmd entries point to the invalid_pte_table. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 137 | */ |
| 138 | static inline int pmd_none(pmd_t pmd) |
| 139 | { |
| 140 | return pmd_val(pmd) == (unsigned long) invalid_pte_table; |
| 141 | } |
| 142 | |
| 143 | #define pmd_bad(pmd) (pmd_val(pmd) & ~PAGE_MASK) |
| 144 | |
| 145 | static inline int pmd_present(pmd_t pmd) |
| 146 | { |
| 147 | return pmd_val(pmd) != (unsigned long) invalid_pte_table; |
| 148 | } |
| 149 | |
| 150 | static inline void pmd_clear(pmd_t *pmdp) |
| 151 | { |
| 152 | pmd_val(*pmdp) = ((unsigned long) invalid_pte_table); |
| 153 | } |
| 154 | |
| 155 | /* |
Thiemo Seufer | f29244a | 2005-02-21 11:11:32 +0000 | [diff] [blame] | 156 | * Empty pud entries point to the invalid_pmd_table. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 157 | */ |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 158 | static inline int pud_none(pud_t pud) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 159 | { |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 160 | return pud_val(pud) == (unsigned long) invalid_pmd_table; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 161 | } |
| 162 | |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 163 | static inline int pud_bad(pud_t pud) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 164 | { |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 165 | return pud_val(pud) & ~PAGE_MASK; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 166 | } |
| 167 | |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 168 | static inline int pud_present(pud_t pud) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 169 | { |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 170 | return pud_val(pud) != (unsigned long) invalid_pmd_table; |
| 171 | } |
| 172 | |
| 173 | static inline void pud_clear(pud_t *pudp) |
| 174 | { |
| 175 | pud_val(*pudp) = ((unsigned long) invalid_pmd_table); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 176 | } |
| 177 | |
/*
 * Conversions between a pte and the page frame it refers to.
 *
 * pte_page(x)        - struct page for the frame held in pte @x.
 * pte_pfn(x)         - page frame number stored in pte @x.
 * pfn_pte(pfn, prot) - build a pte from frame number @pfn and protection
 *                      bits @prot.
 *
 * On CONFIG_CPU_VR41XX the frame number sits two bits higher in the pte
 * than on other CPUs (the reason is not visible in this file).
 *
 * pfn_pte() widens @pfn to unsigned long before shifting.  Without the
 * cast the shift is done in the argument's own type, so a caller passing
 * a 32-bit pfn would lose the high bits before they reach the 64-bit pte.
 */
#define pte_page(x)		pfn_to_page(pte_pfn(x))

#ifdef CONFIG_CPU_VR41XX
#define pte_pfn(x)		((unsigned long)((x).pte >> (PAGE_SHIFT + 2)))
#define pfn_pte(pfn, prot)						\
	__pte(((unsigned long)(pfn) << (PAGE_SHIFT + 2)) | pgprot_val(prot))
#else
#define pte_pfn(x)		((unsigned long)((x).pte >> PAGE_SHIFT))
#define pfn_pte(pfn, prot)						\
	__pte(((unsigned long)(pfn) << PAGE_SHIFT) | pgprot_val(prot))
#endif
| 187 | |
/*
 * Index of the entry covering @address within a pgd / pmd table: drop the
 * bits mapped below that level, then keep only the table's index bits.
 */
#define pgd_index(address)	(((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
#define pmd_index(address)	(((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))

/* Per-level index helpers under their double-underscore names. */
#define __pgd_offset(address)	pgd_index(address)
#define __pud_offset(address)	(((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
#define __pmd_offset(address)	pmd_index(address)

/* Pointer to the pgd entry for @addr in address space @mm. */
#define pgd_offset(mm, addr)	((mm)->pgd + pgd_index(addr))

/* Same lookup in the kernel's own address space (init_mm). */
#define pgd_offset_k(address)	pgd_offset(&init_mm, address)
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 200 | |
Dave McCracken | 46a82b2 | 2006-09-25 23:31:48 -0700 | [diff] [blame] | 201 | static inline unsigned long pud_page_vaddr(pud_t pud) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 202 | { |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 203 | return pud_val(pud); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 204 | } |
Franck Bui-Huu | c9d0696 | 2007-03-19 17:36:42 +0100 | [diff] [blame] | 205 | #define pud_phys(pud) virt_to_phys((void *)pud_val(pud)) |
Dave McCracken | 46a82b2 | 2006-09-25 23:31:48 -0700 | [diff] [blame] | 206 | #define pud_page(pud) (pfn_to_page(pud_phys(pud) >> PAGE_SHIFT)) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 207 | |
| 208 | /* Find an entry in the second-level page table.. */ |
Ralf Baechle | c6e8b58 | 2005-02-10 12:19:59 +0000 | [diff] [blame] | 209 | static inline pmd_t *pmd_offset(pud_t * pud, unsigned long address) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 210 | { |
Dave McCracken | 46a82b2 | 2006-09-25 23:31:48 -0700 | [diff] [blame] | 211 | return (pmd_t *) pud_page_vaddr(*pud) + pmd_index(address); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 212 | } |
| 213 | |
/* Index of the pte covering @address within its page table. */
#define __pte_offset(address)						\
	(((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))

/*
 * Find the third-level (pte) entry for @address below pmd entry @dir.
 * pte_offset() and pte_offset_kernel() reach the page table through
 * pmd_page_vaddr(); the _map variants reach it through
 * page_address(pmd_page()).
 */
#define pte_offset(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))
#define pte_offset_kernel(dir, address)					\
	pte_offset(dir, address)

#define pte_offset_map(dir, address)					\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))
#define pte_offset_map_nested(dir, address)				\
	pte_offset_map(dir, address)

/* The mappings above need no teardown; just evaluate the argument. */
#define pte_unmap(pte)		((void)(pte))
#define pte_unmap_nested(pte)	((void)(pte))
| 227 | |
/*
 * Fill a freshly allocated pgd / pmd table with invalid pointers.
 * Both are defined outside this header.  @page is presumably the address
 * of the table to fill and @pagetable the value each pmd entry is set to -
 * confirm against the definitions.
 */
void pgd_init(unsigned long page);
void pmd_init(unsigned long page, unsigned long pagetable);
| 233 | |
| 234 | /* |
| 235 | * Non-present pages: high 24 bits are offset, next 8 bits type, |
| 236 | * low 32 bits zero. |
| 237 | */ |
| 238 | static inline pte_t mk_swap_pte(unsigned long type, unsigned long offset) |
| 239 | { pte_t pte; pte_val(pte) = (type << 32) | (offset << 40); return pte; } |
| 240 | |
| 241 | #define __swp_type(x) (((x).val >> 32) & 0xff) |
| 242 | #define __swp_offset(x) ((x).val >> 40) |
Ralf Baechle | 21a151d | 2007-10-11 23:46:15 +0100 | [diff] [blame] | 243 | #define __swp_entry(type, offset) ((swp_entry_t) { pte_val(mk_swap_pte((type), (offset))) }) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 244 | #define __pte_to_swp_entry(pte) ((swp_entry_t) { pte_val(pte) }) |
| 245 | #define __swp_entry_to_pte(x) ((pte_t) { (x).val }) |
| 246 | |
/*
 * File-offset ptes.  Bits 0, 4, 6, and 7 are taken; bits 1, 2, 3, and 5
 * are left alone to make things easier, so the low 8 bits are skipped
 * entirely and only the upper 56 bits carry the page offset.
 */
#define PTE_FILE_MAX_BITS	56

/* Extract the file page offset stored in @_pte. */
#define pte_to_pgoff(_pte)	((_pte).pte >> 8)

/* Build a file pte holding page offset @off, tagged with _PAGE_FILE. */
#define pgoff_to_pte(off)	((pte_t) { ((off) << 8) | _PAGE_FILE })
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 255 | |
| 256 | #endif /* _ASM_PGTABLE_64_H */ |