// SPDX-License-Identifier: GPL-2.0
/*
 * IA-32 Huge TLB Page Support for Kernel.
 *
 * Copyright (C) 2002, Rohit Seth <rohit.seth@intel.com>
 */

#include <linux/init.h>
#include <linux/fs.h>
#include <linux/mm.h>
#include <linux/sched/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/err.h>
#include <linux/sysctl.h>
#include <linux/compat.h>
#include <asm/mman.h>
#include <asm/tlb.h>
#include <asm/tlbflush.h>
#include <asm/pgalloc.h>
#include <asm/elf.h>
#include <asm/mpx.h>

#if 0	/* This is just for testing */
struct page *
follow_huge_addr(struct mm_struct *mm, unsigned long address, int write)
{
	unsigned long vpfn = address >> PAGE_SHIFT;
	pte_t *pte;
	struct page *page;
	struct vm_area_struct *vma;

	vma = find_vma(mm, address);
	if (!vma || !is_vm_hugetlb_page(vma))
		return ERR_PTR(-EINVAL);

	pte = huge_pte_offset(mm, address, vma_mmu_pagesize(vma));

	/* hugetlb should be locked, and hence, prefaulted */
	WARN_ON(!pte || pte_none(*pte));

	/* Index into the huge page's tail pages by small-page offset. */
	page = &pte_page(*pte)[vpfn % (HPAGE_SIZE / PAGE_SIZE)];

	WARN_ON(!PageHead(page));

	return page;
}

int pmd_huge(pmd_t pmd)
{
	return 0;
}

int pud_huge(pud_t pud)
{
	return 0;
}

#else

/*
 * pmd_huge() returns 1 if @pmd is a hugetlb related entry, that is, a normal
 * hugetlb entry or a non-present (migration or hwpoisoned) hugetlb entry.
 * Otherwise it returns 0.
 */
int pmd_huge(pmd_t pmd)
{
	return !pmd_none(pmd) &&
		(pmd_val(pmd) & (_PAGE_PRESENT|_PAGE_PSE)) != _PAGE_PRESENT;
}

int pud_huge(pud_t pud)
{
	return !!(pud_val(pud) & _PAGE_PSE);
}
#endif
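
/*
 * Illustrative only: a minimal sketch (kept out of the build, like the
 * testing block above) of how a page-table walker can use pmd_huge() and
 * pud_huge() to stop descending once it reaches a huge mapping.  The helper
 * name huge_level_of() is hypothetical, not a kernel API.
 */
#if 0
static int huge_level_of(struct mm_struct *mm, unsigned long addr)
{
	pgd_t *pgd = pgd_offset(mm, addr);
	p4d_t *p4d;
	pud_t *pud;
	pmd_t *pmd;

	if (pgd_none(*pgd))
		return 0;
	p4d = p4d_offset(pgd, addr);
	if (p4d_none(*p4d))
		return 0;
	pud = pud_offset(p4d, addr);
	if (pud_huge(*pud))	/* 1 GB mapping: there is no pmd level below */
		return PUD_SHIFT;
	if (pud_none(*pud))
		return 0;
	pmd = pmd_offset(pud, addr);
	if (pmd_huge(*pmd))	/* 2 MB mapping: there is no pte level below */
		return PMD_SHIFT;
	if (pmd_none(*pmd))
		return 0;
	return PAGE_SHIFT;
}
#endif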

#ifdef CONFIG_HUGETLB_PAGE
static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *file,
		unsigned long addr, unsigned long len,
		unsigned long pgoff, unsigned long flags)
{
	struct hstate *h = hstate_file(file);
	struct vm_unmapped_area_info info;

	info.flags = 0;
	info.length = len;
	info.low_limit = get_mmap_base(1);

	/*
	 * If hint address is above DEFAULT_MAP_WINDOW, look for unmapped area
	 * in the full address space.
	 */
	info.high_limit = in_compat_syscall() ?
		task_size_32bit() : task_size_64bit(addr > DEFAULT_MAP_WINDOW);

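	/*
	 * Example (illustrative): with 2 MB huge pages, huge_page_mask(h) is
	 * ~0x1fffff, so the align_mask below is 0x1ff000 and
	 * vm_unmapped_area() must return a 2 MB aligned address.
	 */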
	info.align_mask = PAGE_MASK & ~huge_page_mask(h);
	info.align_offset = 0;
	return vm_unmapped_area(&info);
}

static unsigned long hugetlb_get_unmapped_area_topdown(struct file *file,
		unsigned long addr, unsigned long len,
		unsigned long pgoff, unsigned long flags)
{
	struct hstate *h = hstate_file(file);
	struct vm_unmapped_area_info info;

	info.flags = VM_UNMAPPED_AREA_TOPDOWN;
	info.length = len;
	info.low_limit = PAGE_SIZE;
	info.high_limit = get_mmap_base(0);

	/*
	 * If hint address is above DEFAULT_MAP_WINDOW, look for unmapped area
	 * in the full address space.
	 */
	if (addr > DEFAULT_MAP_WINDOW && !in_compat_syscall())
		info.high_limit += TASK_SIZE_MAX - DEFAULT_MAP_WINDOW;

	info.align_mask = PAGE_MASK & ~huge_page_mask(h);
	info.align_offset = 0;
	addr = vm_unmapped_area(&info);

	/*
	 * A failed mmap() very likely causes application failure,
	 * so fall back to the bottom-up function here.  This scenario
	 * can happen with large stack limits and large mmap()
	 * allocations.
	 */
	if (addr & ~PAGE_MASK) {
		VM_BUG_ON(addr != -ENOMEM);
		info.flags = 0;
		info.low_limit = TASK_UNMAPPED_BASE;
		info.high_limit = TASK_SIZE_LOW;
		addr = vm_unmapped_area(&info);
	}

	return addr;
}

unsigned long
hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
		unsigned long len, unsigned long pgoff, unsigned long flags)
{
	struct hstate *h = hstate_file(file);
	struct mm_struct *mm = current->mm;
	struct vm_area_struct *vma;

	if (len & ~huge_page_mask(h))
		return -EINVAL;

	addr = mpx_unmapped_area_check(addr, len, flags);
	if (IS_ERR_VALUE(addr))
		return addr;

	if (len > TASK_SIZE)
		return -ENOMEM;

	if (flags & MAP_FIXED) {
		if (prepare_hugepage_range(file, addr, len))
			return -EINVAL;
		return addr;
	}

	if (addr) {
		addr = ALIGN(addr, huge_page_size(h));
		vma = find_vma(mm, addr);
		if (TASK_SIZE - len >= addr &&
		    (!vma || addr + len <= vm_start_gap(vma)))
			return addr;
	}
	if (mm->get_unmapped_area == arch_get_unmapped_area)
		return hugetlb_get_unmapped_area_bottomup(file, addr, len,
				pgoff, flags);
	else
		return hugetlb_get_unmapped_area_topdown(file, addr, len,
				pgoff, flags);
}
#endif /* CONFIG_HUGETLB_PAGE */
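
/*
 * Illustrative only: a minimal userspace sketch of the path above.  An
 * anonymous MAP_HUGETLB mapping with no hint address ends up in
 * hugetlb_get_unmapped_area(), which picks the bottom-up or top-down search
 * depending on the mm layout.  map_one_huge_page() is a hypothetical helper,
 * not part of the kernel build.
 */
#if 0
#include <sys/mman.h>

static void *map_one_huge_page(size_t huge_sz)
{
	/* len must be a multiple of the huge page size, see -EINVAL above. */
	void *p = mmap(NULL, huge_sz, PROT_READ | PROT_WRITE,
		       MAP_PRIVATE | MAP_ANONYMOUS | MAP_HUGETLB, -1, 0);
	return p == MAP_FAILED ? NULL : p;
}
#endif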

#ifdef CONFIG_X86_64
static __init int setup_hugepagesz(char *opt)
{
	unsigned long ps = memparse(opt, &opt);

	if (ps == PMD_SIZE) {
		hugetlb_add_hstate(PMD_SHIFT - PAGE_SHIFT);
	} else if (ps == PUD_SIZE && boot_cpu_has(X86_FEATURE_GBPAGES)) {
		hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
	} else {
		hugetlb_bad_size();
		printk(KERN_ERR "hugepagesz: Unsupported page size %lu M\n",
			ps >> 20);
		return 0;
	}
	return 1;
}
__setup("hugepagesz=", setup_hugepagesz);
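
/*
 * Example (illustrative): booting with "hugepagesz=1G hugepages=4" first
 * registers the 1 GB hstate here (if the CPU has GBPAGES) and then reserves
 * four such pages; "hugepagesz=2M" selects the PMD-sized hstate instead.
 */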
Kirill A. Shutemovece84b32015-02-10 14:08:19 -0800200
Vlastimil Babka080fe202016-02-05 15:36:41 -0800201#if (defined(CONFIG_MEMORY_ISOLATION) && defined(CONFIG_COMPACTION)) || defined(CONFIG_CMA)
Kirill A. Shutemovece84b32015-02-10 14:08:19 -0800202static __init int gigantic_pages_init(void)
203{
Vlastimil Babka080fe202016-02-05 15:36:41 -0800204 /* With compaction or CMA we can allocate gigantic pages at runtime */
Borislav Petkovb8291adc2016-03-29 17:41:58 +0200205 if (boot_cpu_has(X86_FEATURE_GBPAGES) && !size_to_hstate(1UL << PUD_SHIFT))
Kirill A. Shutemovece84b32015-02-10 14:08:19 -0800206 hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
207 return 0;
208}
209arch_initcall(gigantic_pages_init);
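
/*
 * Example (illustrative): once the 1 GB hstate is registered, gigantic pages
 * can be allocated after boot, e.g.:
 *   echo 4 > /sys/kernel/mm/hugepages/hugepages-1048576kB/nr_hugepages
 */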
#endif /* CONFIG_MEMORY_ISOLATION && CONFIG_COMPACTION || CONFIG_CMA */
#endif /* CONFIG_X86_64 */