blob: 55908fd56b1fc66ed5fe99d61bc54b8a243a1159 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * Copyright (C) 1994, 95, 96, 97, 98, 99, 2000, 2003 Ralf Baechle
7 * Copyright (C) 1999, 2000, 2001 Silicon Graphics, Inc.
8 */
9#ifndef _ASM_PGTABLE_64_H
10#define _ASM_PGTABLE_64_H
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/linkage.h>
13
14#include <asm/addrspace.h>
15#include <asm/page.h>
16#include <asm/cachectl.h>
Atsushi Nemoto656be922006-10-26 00:08:31 +090017#include <asm/fixmap.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018
David Daney325f8a02009-12-04 13:52:36 -080019#ifdef CONFIG_PAGE_SIZE_64KB
20#include <asm-generic/pgtable-nopmd.h>
21#else
Ralf Baechlec6e8b582005-02-10 12:19:59 +000022#include <asm-generic/pgtable-nopud.h>
David Daney325f8a02009-12-04 13:52:36 -080023#endif
Ralf Baechlec6e8b582005-02-10 12:19:59 +000024
/*
 * Each address space has 2 4K pages as its page directory, giving 1024
 * (== PTRS_PER_PGD) 8 byte pointers to pmd tables. Each pmd table is a
 * single 4K page, giving 512 (== PTRS_PER_PMD) 8 byte pointers to page
 * tables. Each page table is also a single 4K page, giving 512 (==
 * PTRS_PER_PTE) 8 byte ptes. Each pud entry is initialized to point to
 * invalid_pmd_table, each pmd entry is initialized to point to
 * invalid_pte_table, each pte is initialized to 0. When memory is low,
 * and a pmd table or a page table allocation fails, empty_bad_pmd_table
 * and empty_bad_page_table are returned to the higher-layer code, so
 * that the failure is recognized later on. Linux does not seem to
 * handle these failures very well though. The empty_bad_page_table has
 * invalid pte entries in it, to force page faults.
 *
 * Kernel mappings: kernel mappings are held in the swapper_pg_table.
 * The layout is identical to userspace except it's indexed with the
 * fault address - VMALLOC_START.
 */
43
David Daney325f8a02009-12-04 13:52:36 -080044
/*
 * Shift/size/mask constants for the upper page table levels.
 *
 * Every table level resolves (PAGE_SHIFT + <level>_ORDER - 3) address bits:
 * a table occupies (PAGE_SIZE << order) bytes and each entry is 8 bytes
 * wide, hence the "- 3".
 *
 * PGDIR_SHIFT determines what a third-level page table entry can map.
 */
#ifdef __PAGETABLE_PMD_FOLDED

/* No pmd level: a pgd entry maps exactly what one pte table covers. */
#define PGDIR_SHIFT	(PAGE_SHIFT + (PAGE_SHIFT + PTE_ORDER - 3))

#else /* !__PAGETABLE_PMD_FOLDED */

/* PMD_SHIFT determines the size of the area a second-level page table can map */
#define PMD_SHIFT	(PAGE_SHIFT + (PAGE_SHIFT + PTE_ORDER - 3))
#define PMD_SIZE	(1UL << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE - 1))

/* A pgd entry maps what one full pmd table covers. */
#define PGDIR_SHIFT	(PMD_SHIFT + (PAGE_SHIFT + PMD_ORDER - 3))

#endif /* __PAGETABLE_PMD_FOLDED */

#define PGDIR_SIZE	(1UL << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE - 1))
60
/*
 * For 4kB page size we use a 3 level page tree and an 8kB pgd (the pud
 * level is folded into it), which permits us mapping 40 bits of virtual
 * address space.
 *
 * We used to implement 41 bits by having an order 1 pmd level but that seemed
 * rather pointless.
 *
 * For 8kB page size we use a 3 level page tree which permits a total of
 * 8TB of address space. Alternatively a 33-bit / 8GB organization using
 * two levels would be easy to implement.
 *
 * For 16kB page size we use a 2 level page tree which permits a total of
 * 36 bits of virtual address space. We could add a third level but it seems
 * like at the moment there's no need for this.
 *
 * NOTE(review): only CONFIG_PAGE_SIZE_64KB selects pgtable-nopmd.h in this
 * file, so the 16kB configuration appears to get a pmd level as well; the
 * "2 level / 36 bits" statement above looks stale - confirm and update.
 *
 * For 64kB page size we use a 2 level page table tree for a total of 42 bits
 * of virtual address space.
 */
/*
 * Allocation order (log2 of the number of pages) of each page table level,
 * selected by the configured page size.
 *
 * A level that must never be allocated has its order defined to an
 * identifier that is not declared in this file (aieeee_attempt_to_allocate_*),
 * presumably so that any attempt to use it fails at build time.
 */
#if defined(CONFIG_PAGE_SIZE_4KB)
#define PGD_ORDER		1	/* two pages for the pgd */
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

/* 8kB, 16kB and 32kB pages share the same settings. */
#if defined(CONFIG_PAGE_SIZE_8KB) || defined(CONFIG_PAGE_SIZE_16KB) || \
    defined(CONFIG_PAGE_SIZE_32KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif

#if defined(CONFIG_PAGE_SIZE_64KB)
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		aieeee_attempt_to_allocate_pmd
#define PTE_ORDER		0
#endif
109
/*
 * Number of entries in one table of each level: the table size in bytes
 * (PAGE_SIZE << order) divided by the size of one entry.
 * PTRS_PER_PMD is only defined here when the pmd level is not folded.
 */
#define PTRS_PER_PGD	((PAGE_SIZE << PGD_ORDER) / sizeof(pgd_t))

#ifndef __PAGETABLE_PMD_FOLDED
#define PTRS_PER_PMD	((PAGE_SIZE << PMD_ORDER) / sizeof(pmd_t))
#endif

#define PTRS_PER_PTE	((PAGE_SIZE << PTE_ORDER) / sizeof(pte_t))
115
/*
 * Number of pgd entries needed to cover the user address range
 * [0, TASK_SIZE64). When a single pgd entry already spans at least
 * TASK_SIZE64, one entry is used.
 */
#if PGDIR_SIZE < TASK_SIZE64
#define USER_PTRS_PER_PGD	(TASK_SIZE64 / PGDIR_SIZE)
#else
#define USER_PTRS_PER_PGD	(1)
#endif

#define FIRST_USER_ADDRESS	0UL
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122
/*
 * Bounds of the vmalloc area.
 *
 * TLB refill handlers also map the vmalloc area into xuseg. Avoid
 * the first couple of pages so NULL pointer dereferences will still
 * reliably trap.
 *
 * VMALLOC_END is MAP_BASE plus the smaller of the span reachable through
 * the page tables and 2^cpu_vmbits, with 4GB (1UL << 32) taken off the top.
 */
#define VMALLOC_START	(MAP_BASE + (2 * PAGE_SIZE))

#define VMALLOC_END							\
	(MAP_BASE +							\
	 min(PTRS_PER_PGD * PTRS_PER_PMD * PTRS_PER_PTE * PAGE_SIZE,	\
	     (1UL << cpu_vmbits)) - (1UL << 32))
133
/*
 * Load modules into 32bit-compatible segment.
 *
 * Only done when modules are enabled, the kernel is built with
 * KBUILD_64BIT_SYM32, and the vmalloc area does not itself start at CKSSEG.
 * The module area then runs from CKSSEG up to two pages below FIXADDR_START.
 */
#if defined(CONFIG_MODULES) && defined(KBUILD_64BIT_SYM32) && \
	VMALLOC_START != CKSSEG
#define MODULE_START	CKSSEG
#define MODULE_END	(FIXADDR_START - 2 * PAGE_SIZE)
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140
/*
 * Report a corrupt page table entry: print the source location of the
 * caller together with the raw entry value as 16 hex digits.
 * pmd_ERROR only exists when the pmd level is not folded.
 */
#define pte_ERROR(e)							\
	printk("%s:%d: bad pte %016lx.\n", __FILE__, __LINE__, pte_val(e))

#ifndef __PAGETABLE_PMD_FOLDED
#define pmd_ERROR(e)							\
	printk("%s:%d: bad pmd %016lx.\n", __FILE__, __LINE__, pmd_val(e))
#endif

#define pgd_ERROR(e)							\
	printk("%s:%d: bad pgd %016lx.\n", __FILE__, __LINE__, pgd_val(e))
149
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000150extern pte_t invalid_pte_table[PTRS_PER_PTE];
151extern pte_t empty_bad_page_table[PTRS_PER_PTE];
David Daney325f8a02009-12-04 13:52:36 -0800152
153
154#ifndef __PAGETABLE_PMD_FOLDED
155/*
156 * For 3-level pagetables we defines these ourselves, for 2-level the
157 * definitions are supplied by <asm-generic/pgtable-nopmd.h>.
158 */
159typedef struct { unsigned long pmd; } pmd_t;
160#define pmd_val(x) ((x).pmd)
161#define __pmd(x) ((pmd_t) { (x) } )
162
163
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000164extern pmd_t invalid_pmd_table[PTRS_PER_PMD];
165extern pmd_t empty_bad_pmd_table[PTRS_PER_PMD];
David Daney325f8a02009-12-04 13:52:36 -0800166#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
168/*
Thiemo Seufer1b3a6e92005-04-01 14:07:13 +0000169 * Empty pgd/pmd entries point to the invalid_pte_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170 */
171static inline int pmd_none(pmd_t pmd)
172{
173 return pmd_val(pmd) == (unsigned long) invalid_pte_table;
174}
175
/* Non-zero when the pmd entry has any bit set outside PAGE_MASK. */
#define pmd_bad(pmd)		(pmd_val(pmd) & ~PAGE_MASK)
177
178static inline int pmd_present(pmd_t pmd)
179{
180 return pmd_val(pmd) != (unsigned long) invalid_pte_table;
181}
182
183static inline void pmd_clear(pmd_t *pmdp)
184{
185 pmd_val(*pmdp) = ((unsigned long) invalid_pte_table);
186}
David Daney325f8a02009-12-04 13:52:36 -0800187#ifndef __PAGETABLE_PMD_FOLDED
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188
189/*
Thiemo Seuferf29244a2005-02-21 11:11:32 +0000190 * Empty pud entries point to the invalid_pmd_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700191 */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000192static inline int pud_none(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000194 return pud_val(pud) == (unsigned long) invalid_pmd_table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195}
196
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000197static inline int pud_bad(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000199 return pud_val(pud) & ~PAGE_MASK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200}
201
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000202static inline int pud_present(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000204 return pud_val(pud) != (unsigned long) invalid_pmd_table;
205}
206
207static inline void pud_clear(pud_t *pudp)
208{
209 pud_val(*pudp) = ((unsigned long) invalid_pmd_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210}
David Daney325f8a02009-12-04 13:52:36 -0800211#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212
/*
 * Conversions between a pte and the page frame number (pfn) it holds.
 * The pfn sits above (PAGE_SHIFT + 2) bits on VR41xx CPUs and above
 * _PFN_SHIFT bits on everything else; the protection bits are OR-ed in
 * below it.
 */
#ifdef CONFIG_CPU_VR41XX
#define pte_pfn(x)		((unsigned long)((x).pte >> (PAGE_SHIFT + 2)))
#define pfn_pte(pfn, prot)	__pte(((pfn) << (PAGE_SHIFT + 2)) | pgprot_val(prot))
#else
#define pte_pfn(x)		((unsigned long)((x).pte >> _PFN_SHIFT))
#define pfn_pte(pfn, prot)	__pte(((pfn) << _PFN_SHIFT) | pgprot_val(prot))
#endif

/* Page descriptor for the frame a pte refers to, via pfn_to_page(). */
#define pte_page(x)		pfn_to_page(pte_pfn(x))
222
/*
 * Index of the entry that covers @address within a table of the given
 * level: shift away the bits handled by lower levels, then mask to the
 * number of entries in the table.
 */
#define pgd_index(address)	(((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
#define pmd_index(address)	(((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))

/* Alternative spellings of the per-level index helpers. */
#define __pgd_offset(address)	pgd_index(address)
#define __pud_offset(address)	(((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
#define __pmd_offset(address)	pmd_index(address)

/* to find an entry in a page-table-directory */
#define pgd_offset(mm, addr)	((mm)->pgd + pgd_index(addr))

/* to find an entry in a kernel page-table-directory */
#define pgd_offset_k(address)	pgd_offset(&init_mm, address)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235
David Daney325f8a02009-12-04 13:52:36 -0800236#ifndef __PAGETABLE_PMD_FOLDED
Dave McCracken46a82b22006-09-25 23:31:48 -0700237static inline unsigned long pud_page_vaddr(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000239 return pud_val(pud);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240}
/* Result of virt_to_phys() on the address stored in a pud entry. */
#define pud_phys(pud)		virt_to_phys((void *)pud_val(pud))
/* Page descriptor for that table: pfn_to_page() of pud_phys() >> PAGE_SHIFT. */
#define pud_page(pud)		(pfn_to_page(pud_phys(pud) >> PAGE_SHIFT))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243
244/* Find an entry in the second-level page table.. */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000245static inline pmd_t *pmd_offset(pud_t * pud, unsigned long address)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246{
Dave McCracken46a82b22006-09-25 23:31:48 -0700247 return (pmd_t *) pud_page_vaddr(*pud) + pmd_index(address);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248}
David Daney325f8a02009-12-04 13:52:36 -0800249#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250
/*
 * Find an entry in the third-level page table.
 *
 * __pte_offset() is the index of the pte covering @address within its
 * table. The pte_offset*() variants add that index to the start of the
 * pte table that the pmd entry *@dir refers to; pte_offset_map() gets the
 * table start from page_address(pmd_page()) rather than pmd_page_vaddr().
 */
#define __pte_offset(address)						\
	(((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))

#define pte_offset(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))

#define pte_offset_kernel(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))

#define pte_offset_map(dir, address)					\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))

/* Nothing to undo here; the argument is only evaluated. */
#define pte_unmap(pte)		((void)(pte))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261
/*
 * Initialize a new pgd / pmd table with invalid pointers.
 *
 * @page is the table to initialize; for pmd_init(), @pagetable is
 * presumably the value stored in every slot - confirm against the
 * definitions, which are not part of this header.
 */
extern void pgd_init(unsigned long page);
extern void pmd_init(unsigned long page, unsigned long pagetable);
267
268/*
269 * Non-present pages: high 24 bits are offset, next 8 bits type,
270 * low 32 bits zero.
271 */
272static inline pte_t mk_swap_pte(unsigned long type, unsigned long offset)
273{ pte_t pte; pte_val(pte) = (type << 32) | (offset << 40); return pte; }
274
/*
 * Swap entry <-> pte conversions. A swap entry carries the same bit
 * layout as the pte built by mk_swap_pte(): type in bits 32..39, offset
 * from bit 40 upwards.
 */
#define __swp_type(x)		(((x).val >> 32) & 0xff)
#define __swp_offset(x)		((x).val >> 40)
#define __swp_entry(type, offset)					\
	((swp_entry_t) { pte_val(mk_swap_pte((type), (offset))) })

/* Reinterpret the raw value; no bits are moved in either direction. */
#define __pte_to_swp_entry(pte)	((swp_entry_t) { pte_val(pte) })
#define __swp_entry_to_pte(x)	((pte_t) { (x).val })
280
/*
 * Encoding of a file page offset in a pte.
 *
 * Bits 0, 4, 6, and 7 are taken. Let's leave bits 1, 2, 3, and 5 alone to
 * make things easier, and only use the upper 56 bits for the page offset...
 */
#define PTE_FILE_MAX_BITS	56

/* Extract the file page offset stored above the low 8 bits. */
#define pte_to_pgoff(_pte)	((_pte).pte >> 8)
/* Store @off above the low 8 bits and tag the pte with _PAGE_FILE. */
#define pgoff_to_pte(off)	((pte_t) { ((off) << 8) | _PAGE_FILE })
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289
290#endif /* _ASM_PGTABLE_64_H */