blob: 4ed9d1bba2ba7d10244bd6a7884651f0cbeea076 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * Copyright (C) 1994, 95, 96, 97, 98, 99, 2000, 2003 Ralf Baechle
7 * Copyright (C) 1999, 2000, 2001 Silicon Graphics, Inc.
8 */
9#ifndef _ASM_PGTABLE_64_H
10#define _ASM_PGTABLE_64_H
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/linkage.h>
13
14#include <asm/addrspace.h>
15#include <asm/page.h>
16#include <asm/cachectl.h>
Atsushi Nemoto656be922006-10-26 00:08:31 +090017#include <asm/fixmap.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018
Ralf Baechlec6e8b582005-02-10 12:19:59 +000019#include <asm-generic/pgtable-nopud.h>
20
/*
 * With 4kB pages, each address space has 2 4K pages as its page directory,
 * giving 1024 (== PTRS_PER_PGD) 8 byte pointers to pmd tables.  Each pmd
 * table is a single 4K page, giving 512 (== PTRS_PER_PMD) 8 byte pointers
 * to page tables.  Each page table is also a single 4K page, giving 512
 * (== PTRS_PER_PTE) 8 byte ptes.  Each pud entry is initialized to point to
 * invalid_pmd_table, each pmd entry is initialized to point to
 * invalid_pte_table, each pte is initialized to 0.  When memory is low,
 * and a pmd table or a page table allocation fails, empty_bad_pmd_table
 * and empty_bad_page_table are returned back to higher layer code, so
 * that the failure is recognized later on.  Linux does not seem to
 * handle these failures very well though.  The empty_bad_page_table has
 * invalid pte entries in it, to force page faults.
 *
 * Kernel mappings: kernel mappings are held in the swapper_pg_table.
 * The layout is identical to userspace except it's indexed with the
 * fault address - VMALLOC_START.
 */
39
/*
 * PMD_SHIFT determines the size of the area a second-level page table can
 * map.  A page table occupies (PAGE_SIZE << PTE_ORDER) bytes and its entries
 * are 8 bytes wide (hence the "- 3"), so it maps
 * 2^(PAGE_SHIFT + PTE_ORDER - 3) pages of 2^PAGE_SHIFT bytes each.
 */
#define PMD_SHIFT	(PAGE_SHIFT + (PAGE_SHIFT + PTE_ORDER - 3))
#define PMD_SIZE	(1UL << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE-1))

/*
 * PGDIR_SHIFT determines the size of the area a single page-directory entry
 * can map: one full pmd table of (PAGE_SIZE << PMD_ORDER) / 8 entries, each
 * covering PMD_SIZE bytes.
 */
#define PGDIR_SHIFT	(PMD_SHIFT + (PAGE_SHIFT + PMD_ORDER - 3))
#define PGDIR_SIZE	(1UL << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE-1))
49
/*
 * For 4kB page size we use a 3 level page tree and an 8kB pgd, which
 * permits us mapping 40 bits of virtual address space.
 *
 * We used to implement 41 bits by having an order 1 pmd level but that seemed
 * rather pointless.
 *
 * For 8kB page size we use a 3 level page tree which permits a total of
 * 8TB of address space.  Alternatively a 33-bit / 8GB organization using
 * two levels would be easy to implement.
 *
 * For 16kB page size we use a 2 level page tree which permits a total of
 * 36 bits of virtual address space.  We could add a third level but it seems
 * like at the moment there's no need for this.
 *
 * For 64kB page size we use a 2 level page table tree for a total of 42 bits
 * of virtual address space.
 *
 * NOTE(review): the 16kB and 64kB paragraphs describe a 2 level layout, yet
 * the PGD/PMD/PTE orders defined below are the same for the 8kB through 64kB
 * configurations; confirm whether those two paragraphs are still accurate.
 */
/*
 * Allocation order (log2 of the number of pages) of each page-table level,
 * selected by the configured page size.  Only the 4kB configuration uses a
 * two-page (order 1) pgd; every other level is a single page.
 *
 * PUD_ORDER expands to an identifier that is not declared anywhere in this
 * header, presumably so that any attempt to allocate a pud fails to build
 * (the pud level comes from <asm-generic/pgtable-nopud.h>) -- TODO confirm.
 */
#ifdef CONFIG_PAGE_SIZE_4KB
#define PGD_ORDER		1
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_8KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_16KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_32KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
#ifdef CONFIG_PAGE_SIZE_64KB
#define PGD_ORDER		0
#define PUD_ORDER		aieeee_attempt_to_allocate_pud
#define PMD_ORDER		0
#define PTE_ORDER		0
#endif
98
/* Number of entries held by one table at each level of the page tree. */
#define PTRS_PER_PGD	((PAGE_SIZE << PGD_ORDER) / sizeof(pgd_t))
#define PTRS_PER_PMD	((PAGE_SIZE << PMD_ORDER) / sizeof(pmd_t))
#define PTRS_PER_PTE	((PAGE_SIZE << PTE_ORDER) / sizeof(pte_t))

/*
 * Number of pgd entries needed to cover user space.  When a single pgd
 * entry already spans TASK_SIZE the division below would yield 0, so use
 * one entry in that case.
 */
#if PGDIR_SIZE >= TASK_SIZE
#define USER_PTRS_PER_PGD	(1)
#else
#define USER_PTRS_PER_PGD	(TASK_SIZE / PGDIR_SIZE)
#endif
#define FIRST_USER_ADDRESS	0UL
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
/*
 * The vmalloc area starts at MAP_BASE and spans exactly what one complete
 * pgd -> pmd -> pte tree can map.
 */
#define VMALLOC_START		MAP_BASE
#define VMALLOC_END	\
	(VMALLOC_START + PTRS_PER_PGD * PTRS_PER_PMD * PTRS_PER_PTE * PAGE_SIZE)
#if defined(CONFIG_MODULES) && defined(KBUILD_64BIT_SYM32) && \
	VMALLOC_START != CKSSEG
/* Load modules into 32bit-compatible segment. */
#define MODULE_START	CKSSEG
#define MODULE_END	(FIXADDR_START-2*PAGE_SIZE)
/* Separate page directory used for the module area (see pgd_offset_k()). */
extern pgd_t module_pg_dir[PTRS_PER_PGD];
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
/*
 * Report a corrupt page-table entry: print the source location of the
 * caller together with the raw 64-bit value of entry @e.
 */
#define pte_ERROR(e) \
	printk("%s:%d: bad pte %016lx.\n", __FILE__, __LINE__, pte_val(e))
#define pmd_ERROR(e) \
	printk("%s:%d: bad pmd %016lx.\n", __FILE__, __LINE__, pmd_val(e))
#define pgd_ERROR(e) \
	printk("%s:%d: bad pgd %016lx.\n", __FILE__, __LINE__, pgd_val(e))
127
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000128extern pte_t invalid_pte_table[PTRS_PER_PTE];
129extern pte_t empty_bad_page_table[PTRS_PER_PTE];
130extern pmd_t invalid_pmd_table[PTRS_PER_PMD];
131extern pmd_t empty_bad_pmd_table[PTRS_PER_PMD];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132
133/*
Thiemo Seufer1b3a6e92005-04-01 14:07:13 +0000134 * Empty pgd/pmd entries point to the invalid_pte_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 */
136static inline int pmd_none(pmd_t pmd)
137{
138 return pmd_val(pmd) == (unsigned long) invalid_pte_table;
139}
140
/*
 * A pmd entry is bad when any bit outside PAGE_MASK is set, i.e. when the
 * address it holds is not page aligned.
 */
#define pmd_bad(pmd)		(pmd_val(pmd) & ~PAGE_MASK)
142
143static inline int pmd_present(pmd_t pmd)
144{
145 return pmd_val(pmd) != (unsigned long) invalid_pte_table;
146}
147
148static inline void pmd_clear(pmd_t *pmdp)
149{
150 pmd_val(*pmdp) = ((unsigned long) invalid_pte_table);
151}
152
153/*
Thiemo Seuferf29244a2005-02-21 11:11:32 +0000154 * Empty pud entries point to the invalid_pmd_table.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000156static inline int pud_none(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000158 return pud_val(pud) == (unsigned long) invalid_pmd_table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159}
160
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000161static inline int pud_bad(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000163 return pud_val(pud) & ~PAGE_MASK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164}
165
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000166static inline int pud_present(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000168 return pud_val(pud) != (unsigned long) invalid_pmd_table;
169}
170
171static inline void pud_clear(pud_t *pudp)
172{
173 pud_val(*pudp) = ((unsigned long) invalid_pmd_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174}
175
/* struct page of the frame referenced by pte @x. */
#define pte_page(x)		pfn_to_page(pte_pfn(x))

/*
 * Conversion between a page frame number and a pte.  The pfn is stored
 * shifted left by PAGE_SHIFT (PAGE_SHIFT + 2 when CONFIG_CPU_VR41XX is set)
 * and ORed with the protection bits from pgprot_val(prot).
 */
#ifdef CONFIG_CPU_VR41XX
#define pte_pfn(x)		((unsigned long)((x).pte >> (PAGE_SHIFT + 2)))
#define pfn_pte(pfn, prot)	__pte(((pfn) << (PAGE_SHIFT + 2)) | pgprot_val(prot))
#else
#define pte_pfn(x)		((unsigned long)((x).pte >> PAGE_SHIFT))
#define pfn_pte(pfn, prot)	__pte(((pfn) << PAGE_SHIFT) | pgprot_val(prot))
#endif
185
/* Index of the entry covering @address within a table of each level. */
#define __pgd_offset(address)	pgd_index(address)
#define __pud_offset(address)	(((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
#define __pmd_offset(address)	pmd_index(address)

/*
 * to find an entry in a kernel page-table-directory
 *
 * Note that the init_mm lookup is always done for address 0, so it yields
 * the first entry of init_mm's pgd regardless of @address.  When
 * MODULE_START is defined, addresses at or above it select module_pg_dir
 * instead.
 */
#ifdef MODULE_START
#define pgd_offset_k(address) \
	((address) >= MODULE_START ? module_pg_dir : pgd_offset(&init_mm, 0UL))
#else
#define pgd_offset_k(address)	pgd_offset(&init_mm, 0UL)
#endif

#define pgd_index(address)	(((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
#define pmd_index(address)	(((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))

/* to find an entry in a page-table-directory */
#define pgd_offset(mm, addr)	((mm)->pgd + pgd_index(addr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Dave McCracken46a82b22006-09-25 23:31:48 -0700204static inline unsigned long pud_page_vaddr(pud_t pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205{
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000206 return pud_val(pud);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207}
Franck Bui-Huuc9d06962007-03-19 17:36:42 +0100208#define pud_phys(pud) virt_to_phys((void *)pud_val(pud))
Dave McCracken46a82b22006-09-25 23:31:48 -0700209#define pud_page(pud) (pfn_to_page(pud_phys(pud) >> PAGE_SHIFT))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
211/* Find an entry in the second-level page table.. */
Ralf Baechlec6e8b582005-02-10 12:19:59 +0000212static inline pmd_t *pmd_offset(pud_t * pud, unsigned long address)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213{
Dave McCracken46a82b22006-09-25 23:31:48 -0700214 return (pmd_t *) pud_page_vaddr(*pud) + pmd_index(address);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215}
216
/*
 * Find an entry in the third-level page table.
 *
 * __pte_offset() is the index of the pte covering @address within its page
 * table.  The pte_offset*() variants return a pointer to that pte inside
 * the table referenced by the pmd entry *@dir; the _map variants locate the
 * table through page_address(pmd_page()) rather than pmd_page_vaddr().
 * pte_unmap() and pte_unmap_nested() only evaluate their argument.
 */
#define __pte_offset(address)						\
	(((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))
#define pte_offset(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))
#define pte_offset_kernel(dir, address)					\
	((pte_t *) pmd_page_vaddr(*(dir)) + __pte_offset(address))
#define pte_offset_map(dir, address)					\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))
#define pte_offset_map_nested(dir, address)				\
	((pte_t *)page_address(pmd_page(*(dir))) + __pte_offset(address))
#define pte_unmap(pte) ((void)(pte))
#define pte_unmap_nested(pte) ((void)(pte))
230
/*
 * Initialize a new pgd / pmd table with invalid pointers.
 *
 * Both are defined elsewhere.  @page is presumably the address of the table
 * to fill and @pagetable the value stored in each pmd slot -- TODO confirm
 * against the definitions.
 */
extern void pgd_init(unsigned long page);
extern void pmd_init(unsigned long page, unsigned long pagetable);
236
237/*
238 * Non-present pages: high 24 bits are offset, next 8 bits type,
239 * low 32 bits zero.
240 */
241static inline pte_t mk_swap_pte(unsigned long type, unsigned long offset)
242{ pte_t pte; pte_val(pte) = (type << 32) | (offset << 40); return pte; }
243
244#define __swp_type(x) (((x).val >> 32) & 0xff)
245#define __swp_offset(x) ((x).val >> 40)
Ralf Baechle21a151d2007-10-11 23:46:15 +0100246#define __swp_entry(type, offset) ((swp_entry_t) { pte_val(mk_swap_pte((type), (offset))) })
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247#define __pte_to_swp_entry(pte) ((swp_entry_t) { pte_val(pte) })
248#define __swp_entry_to_pte(x) ((pte_t) { (x).val })
249
/*
 * Bits 0, 4, 6, and 7 are taken. Let's leave bits 1, 2, 3, and 5 alone to
 * make things easier, and only use the upper 56 bits for the page offset...
 */
#define PTE_FILE_MAX_BITS	56

/*
 * A file pte keeps the page offset in bits 8 and up, with _PAGE_FILE set
 * in the low byte.
 */
#define pte_to_pgoff(_pte)	((_pte).pte >> 8)
#define pgoff_to_pte(off)	((pte_t) { ((off) << 8) | _PAGE_FILE })
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
259#endif /* _ASM_PGTABLE_64_H */