blob: 8eda30b467da60705265dac71fee27377562b0cc [file] [log] [blame]
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License. See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1994, 95, 96, 97, 98, 99, 2000, 2003 Ralf Baechle
 * Copyright (C) 1999, 2000, 2001 Silicon Graphics, Inc.
 */
9#ifndef _ASM_PGTABLE_64_H
10#define _ASM_PGTABLE_64_H
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/linkage.h>
13
14#include <asm/addrspace.h>
15#include <asm/page.h>
16#include <asm/cachectl.h>
Atsushi Nemoto656be922006-10-26 00:08:31 +090017#include <asm/fixmap.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018
Ralf Baechlec6e8b582005-02-10 12:19:59 +000019#include <asm-generic/pgtable-nopud.h>
20
/*
 * Each address space has 2 4K pages as its page directory, giving 1024
 * (== PTRS_PER_PGD) 8 byte pointers to pmd tables. Each pmd table is a
 * single 4K page, giving 512 (== PTRS_PER_PMD) 8 byte pointers to page
 * tables. Each page table is also a single 4K page, giving 512 (==
 * PTRS_PER_PTE) 8 byte ptes. Each pud entry is initialized to point to
 * invalid_pmd_table, each pmd entry is initialized to point to
 * invalid_pte_table, each pte is initialized to 0. When memory is low,
 * and a pmd table or a page table allocation fails, empty_bad_pmd_table
 * and empty_bad_page_table is returned back to higher layer code, so
 * that the failure is recognized later on. Linux does not seem to
 * handle these failures very well though. The empty_bad_page_table has
 * invalid pte entries in it, to force page faults.
 *
 * Kernel mappings: kernel mappings are held in the swapper_pg_table.
 * The layout is identical to userspace except it's indexed with the
 * fault address - VMALLOC_START.
 */
39
/*
 * Each table level resolves (PAGE_SHIFT + <order> - 3) address bits: a table
 * occupies (PAGE_SIZE << order) bytes and the "- 3" matches the 8 byte
 * entries described in the layout comment of this file.
 */

/* PMD_SHIFT determines the size of the area a second-level page table can map */
#define PMD_SHIFT	(PAGE_SHIFT + (PAGE_SHIFT + PTE_ORDER - 3))
#define PMD_SIZE	(1UL << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE-1))

/* PGDIR_SHIFT determines what a third-level page table entry can map */
#define PGDIR_SHIFT	(PMD_SHIFT + (PAGE_SHIFT + PMD_ORDER - 3))
#define PGDIR_SIZE	(1UL << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE-1))
49
/*
 * For 4kB page size we use a 3 level page tree and an 8kB pud, which
 * permits us mapping 40 bits of virtual address space.
 *
 * We used to implement 41 bits by having an order 1 pmd level but that seemed
 * rather pointless.
 *
 * For 8kB page size we use a 3 level page tree which permits a total of
 * 8TB of address space. Alternatively a 33-bit / 8GB organization using
 * two levels would be easy to implement.
 *
 * For 16kB page size we use a 2 level page tree which permits a total of
 * 36 bits of virtual address space. We could add a third level but it seems
 * like at the moment there's no need for this.
 *
 * For 64kB page size we use a 2 level page table tree for a total of 42 bits
 * of virtual address space.
 */
/*
 * Allocation order (log2 of the number of pages) of each page-table level,
 * selected by the configured page size.  Only the 4kB configuration uses a
 * two-page (order 1) pgd; every other table is a single page.
 *
 * PUD_ORDER expands to the identifier aieeee_attempt_to_allocate_pud, which
 * is not declared in this header, so any code that actually tries to use it
 * presumably fails to build -- NOTE(review): looks intentional given that
 * <asm-generic/pgtable-nopud.h> is included; confirm.
 */
#ifdef CONFIG_PAGE_SIZE_4KB
#define PGD_ORDER		1
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_8KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_16KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_32KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_64KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
98
/*
 * Number of entries held by one table at each level: the table size in
 * bytes (PAGE_SIZE << order) divided by the size of one entry.
 */
#define PTRS_PER_PGD	((PAGE_SIZE << PGD_ORDER) / sizeof(pgd_t))
#define PTRS_PER_PMD	((PAGE_SIZE << PMD_ORDER) / sizeof(pmd_t))
#define PTRS_PER_PTE	((PAGE_SIZE << PTE_ORDER) / sizeof(pte_t))
102
/*
 * Number of pgd entries needed to cover user space (TASK_SIZE).  When a
 * single pgd entry already spans TASK_SIZE or more, the division below
 * would yield 0, so one entry is used instead.
 */
#if PGDIR_SIZE >= TASK_SIZE
#define USER_PTRS_PER_PGD	(1)
#else
#define USER_PTRS_PER_PGD	(TASK_SIZE / PGDIR_SIZE)
#endif
/* Lowest user address. */
#define FIRST_USER_ADDRESS	0UL
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
/*
 * The vmalloc area starts at MAP_BASE.  Its end is the start plus the
 * smaller of
 *   - the span one full page-table tree can map
 *     (PTRS_PER_PGD * PTRS_PER_PMD * PTRS_PER_PTE * PAGE_SIZE), and
 *   - 2^cpu_vmbits,
 * minus 4GB (1UL << 32).
 */
#define VMALLOC_START		MAP_BASE
#define VMALLOC_END	\
	(VMALLOC_START + \
	 min(PTRS_PER_PGD * PTRS_PER_PMD * PTRS_PER_PTE * PAGE_SIZE, \
	     (1UL << cpu_vmbits)) - (1UL << 32))
115
/*
 * A dedicated module area is only defined when modules are enabled, the
 * build uses KBUILD_64BIT_SYM32, and the vmalloc area does not already
 * start at CKSSEG.
 */
#if defined(CONFIG_MODULES) && defined(KBUILD_64BIT_SYM32) && \
	VMALLOC_START != CKSSEG
/* Load modules into 32bit-compatible segment. */
#define MODULE_START	CKSSEG
#define MODULE_END	(FIXADDR_START-2*PAGE_SIZE)
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122
/*
 * Report a bad page-table entry through printk: source file, line number
 * and the raw entry value printed as 16 hex digits.
 */
#define pte_ERROR(e) \
	printk("%s:%d: bad pte %016lx.\n", __FILE__, __LINE__, pte_val(e))
#define pmd_ERROR(e) \
	printk("%s:%d: bad pmd %016lx.\n", __FILE__, __LINE__, pmd_val(e))
#define pgd_ERROR(e) \
	printk("%s:%d: bad pgd %016lx.\n", __FILE__, __LINE__, pgd_val(e))
129
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000130extern pte_t invalid_pte_table[PTRS_PER_PTE];
131extern pte_t empty_bad_page_table[PTRS_PER_PTE];
132extern pmd_t invalid_pmd_table[PTRS_PER_PMD];
133extern pmd_t empty_bad_pmd_table[PTRS_PER_PMD];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134
135/*
Thiemo Seufer1b3a6e92005-04-01 14:07:13 +0000136 * Empty pgd/pmd entries point to the invalid_pte_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 */
138static inline int pmd_none(pmd_t pmd)
139{
140 return pmd_val(pmd) == (unsigned long) invalid_pte_table;
141}
142
/* Non-zero when the pmd value has any bit set that PAGE_MASK clears. */
#define pmd_bad(pmd)		(pmd_val(pmd) & ~PAGE_MASK)
144
145static inline int pmd_present(pmd_t pmd)
146{
147 return pmd_val(pmd) != (unsigned long) invalid_pte_table;
148}
149
150static inline void pmd_clear(pmd_t *pmdp)
151{
152 pmd_val(*pmdp) = ((unsigned long) invalid_pte_table);
153}
154
155/*
Thiemo Seuferf29244a2005-02-21 11:11:32 +0000156 * Empty pud entries point to the invalid_pmd_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000158static inline int pud_none(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000160 return pud_val(pud) == (unsigned long) invalid_pmd_table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161}
162
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000163static inline int pud_bad(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000165 return pud_val(pud) & ~PAGE_MASK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166}
167
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000168static inline int pud_present(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000170 return pud_val(pud) != (unsigned long) invalid_pmd_table;
171}
172
173static inline void pud_clear(pud_t *pudp)
174{
175 pud_val(*pudp) = ((unsigned long) invalid_pmd_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176}
177
/* struct page for the frame a pte refers to. */
#define pte_page(x)		pfn_to_page(pte_pfn(x))

/*
 * Conversion between a pte and a page frame number.  The pfn sits above
 * bit PAGE_SHIFT of the pte, except on VR41XX CPUs where it is placed two
 * bits higher (PAGE_SHIFT + 2).
 */
#ifdef CONFIG_CPU_VR41XX
#define pte_pfn(x)		((unsigned long)((x).pte >> (PAGE_SHIFT + 2)))
#define pfn_pte(pfn, prot)	__pte(((pfn) << (PAGE_SHIFT + 2)) | pgprot_val(prot))
#else
#define pte_pfn(x)		((unsigned long)((x).pte >> PAGE_SHIFT))
#define pfn_pte(pfn, prot)	__pte(((pfn) << PAGE_SHIFT) | pgprot_val(prot))
#endif
187
/* Index of @address within the table of the respective level. */
#define __pgd_offset(address)	pgd_index(address)
#define __pud_offset(address)	(((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
#define __pmd_offset(address)	pmd_index(address)

/* to find an entry in a kernel page-table-directory */
#define pgd_offset_k(address) pgd_offset(&init_mm, address)

/*
 * Shift out the bits resolved by lower levels, then mask to the number of
 * entries in the table (PTRS_PER_* - 1 is used as a bit mask).
 */
#define pgd_index(address)	(((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
#define pmd_index(address)	(((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))

/* to find an entry in a page-table-directory */
#define pgd_offset(mm, addr)	((mm)->pgd + pgd_index(addr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
Dave McCracken46a82b22006-09-25 23:31:48 -0700201static inline unsigned long pud_page_vaddr(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000203 return pud_val(pud);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204}
Franck Bui-Huuc9d06962007-03-19 17:36:42 +0100205#define pud_phys(pud) virt_to_phys((void *)pud_val(pud))
Dave McCracken46a82b22006-09-25 23:31:48 -0700206#define pud_page(pud) (pfn_to_page(pud_phys(pud) >> PAGE_SHIFT))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207
208/* Find an entry in the second-level page table.. */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000209static inline pmd_t *pmd_offset(pud_t * pud, unsigned long address)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210{
Dave McCracken46a82b22006-09-25 23:31:48 -0700211 return (pmd_t *) pud_page_vaddr(*pud) + pmd_index(address);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212}
213
/* Find an entry in the third-level page table.. */
#define __pte_offset(address)						\
	(((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))
/* pte_offset() and pte_offset_kernel() expand to the same expression. */
#define pte_offset(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))
#define pte_offset_kernel(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))
/* The *_map variants locate the table via page_address(pmd_page()). */
#define pte_offset_map(dir, address)					\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))
#define pte_offset_map_nested(dir, address)				\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))
/* Nothing to undo here: the argument is evaluated and discarded. */
#define pte_unmap(pte) ((void)(pte))
#define pte_unmap_nested(pte) ((void)(pte))
227
/*
 * Initialize a new pgd / pmd table with invalid pointers.
 * Both routines are implemented outside this header.
 */
extern void pgd_init(unsigned long page);
extern void pmd_init(unsigned long page, unsigned long pagetable);
233
234/*
235 * Non-present pages: high 24 bits are offset, next 8 bits type,
236 * low 32 bits zero.
237 */
238static inline pte_t mk_swap_pte(unsigned long type, unsigned long offset)
239{ pte_t pte; pte_val(pte) = (type << 32) | (offset << 40); return pte; }
240
/*
 * Swap entry accessors: the type is the 8 bits starting at bit 32 and the
 * offset is everything from bit 40 upwards.  A swap entry and a swap pte
 * carry the same raw value, so the conversions just rewrap it.
 */
#define __swp_type(x)		(((x).val >> 32) & 0xff)
#define __swp_offset(x)		((x).val >> 40)
#define __swp_entry(type, offset) ((swp_entry_t) { pte_val(mk_swap_pte((type), (offset))) })
#define __pte_to_swp_entry(pte)	((swp_entry_t) { pte_val(pte) })
#define __swp_entry_to_pte(x)	((pte_t) { (x).val })
246
/*
 * Bits 0, 4, 6, and 7 are taken. Let's leave bits 1, 2, 3, and 5 alone to
 * make things easier, and only use the upper 56 bits for the page offset...
 */
#define PTE_FILE_MAX_BITS	56

/* The file offset lives above the low 8 bits; _PAGE_FILE tags the pte. */
#define pte_to_pgoff(_pte)	((_pte).pte >> 8)
#define pgoff_to_pte(off)	((pte_t) { ((off) << 8) | _PAGE_FILE })
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
256#endif /* _ASM_PGTABLE_64_H */