blob: d8abfcf524d102573a53e456fec24592cf933a01 [file] [log] [blame]
H. Peter Anvin1965aae2008-10-22 22:26:29 -07001#ifndef _ASM_X86_MMU_CONTEXT_H
2#define _ASM_X86_MMU_CONTEXT_H
Jeremy Fitzhardingec3c2fee2008-06-25 00:19:07 -04003
4#include <asm/desc.h>
Arun Sharma600634972011-07-26 16:09:06 -07005#include <linux/atomic.h>
Dave Hansend17d8f92014-07-31 08:40:59 -07006#include <linux/mm_types.h>
7
8#include <trace/events/tlb.h>
9
Jeremy Fitzhardingec3c2fee2008-06-25 00:19:07 -040010#include <asm/pgalloc.h>
11#include <asm/tlbflush.h>
12#include <asm/paravirt.h>
Dave Hansenfe3d1972014-11-14 07:18:29 -080013#include <asm/mpx.h>
Jeremy Fitzhardingec3c2fee2008-06-25 00:19:07 -040014#ifndef CONFIG_PARAVIRT
/*
 * No-op fallback used when CONFIG_PARAVIRT is not set, so that
 * activate_mm() can call paravirt_activate_mm() unconditionally.
 */
static inline void paravirt_activate_mm(struct mm_struct *prev,
					struct mm_struct *next)
{
}
19#endif /* !CONFIG_PARAVIRT */
20
#ifdef CONFIG_PERF_EVENTS
extern struct static_key rdpmc_always_available;

/*
 * Bring CR4.PCE in line with @mm: the bit is set when the
 * rdpmc_always_available static key is on or when @mm's
 * perf_rdpmc_allowed counter is non-zero, and cleared otherwise.
 */
static inline void load_mm_cr4(struct mm_struct *mm)
{
	if (static_key_false(&rdpmc_always_available) ||
	    atomic_read(&mm->context.perf_rdpmc_allowed)) {
		cr4_set_bits(X86_CR4_PCE);
		return;
	}

	cr4_clear_bits(X86_CR4_PCE);
}
#else
/* Without CONFIG_PERF_EVENTS there is nothing to update. */
static inline void load_mm_cr4(struct mm_struct *mm)
{
}
#endif
35
Andy Lutomirskia5b9e5a2015-07-30 14:31:34 -070036#ifdef CONFIG_MODIFY_LDT_SYSCALL
/*
 * An ldt_struct may be allocated, used, and freed, but it is never
 * modified while it is live.
 */
struct ldt_struct {
	/*
	 * The descriptor table lives in its own allocation: Xen requires
	 * page-aligned LDTs with special permissions, which is what stops
	 * us from installing evil descriptors such as call gates.  On
	 * native hardware the ldt_struct and the LDT could share one
	 * allocation, but that is not worth optimizing.
	 */
	struct desc_struct *entries;
	/* Passed to set_ldt() together with @entries. */
	int size;
};
51
Andy Lutomirskia5b9e5a2015-07-30 14:31:34 -070052/*
53 * Used for LDT copy/destruction.
54 */
Dave Hansen39a05262016-02-12 13:02:34 -080055int init_new_context_ldt(struct task_struct *tsk, struct mm_struct *mm);
56void destroy_context_ldt(struct mm_struct *mm);
Andy Lutomirskia5b9e5a2015-07-30 14:31:34 -070057#else /* CONFIG_MODIFY_LDT_SYSCALL */
/*
 * Stub for kernels built without CONFIG_MODIFY_LDT_SYSCALL: there is
 * no LDT state to set up, so this always reports success (0).
 */
static inline int init_new_context_ldt(struct task_struct *tsk,
				       struct mm_struct *mm)
{
	return 0;
}
/* Stub for !CONFIG_MODIFY_LDT_SYSCALL: nothing to tear down. */
static inline void destroy_context_ldt(struct mm_struct *mm)
{
}
Andy Lutomirskia5b9e5a2015-07-30 14:31:34 -070064#endif
65
/*
 * Install the LDT described by @mm->context.ldt, or clear the LDT when
 * @mm has none.  Kernels built without CONFIG_MODIFY_LDT_SYSCALL always
 * clear it.  The debug check at the end warns if the caller was
 * preemptible.
 */
static inline void load_mm_ldt(struct mm_struct *mm)
{
#ifdef CONFIG_MODIFY_LDT_SYSCALL
	/* lockless_dereference synchronizes with smp_store_release */
	struct ldt_struct *cur_ldt = lockless_dereference(mm->context.ldt);

	/*
	 * Any change to mm->context.ldt is followed by an IPI to all
	 * CPUs with the mm active.  The LDT will not be freed until
	 * after the IPI is handled by all such CPUs.  This means that,
	 * if the ldt_struct changes before we return, the values we see
	 * will be safe, and the new values will be loaded before we run
	 * any user code.
	 *
	 * NB: don't try to convert this to use RCU without extreme care.
	 * We would still need IRQs off, because we don't want to change
	 * the local LDT after an IPI loaded a newer value than the one
	 * that we can see.
	 */
	if (likely(!cur_ldt))
		clear_LDT();
	else
		set_ldt(cur_ldt->entries, cur_ldt->size);
#else
	clear_LDT();
#endif

	DEBUG_LOCKS_WARN_ON(preemptible());
}
98
/*
 * On SMP, move this CPU's TLB state from TLBSTATE_OK to TLBSTATE_LAZY.
 * Any other state is left untouched; on !SMP this is a no-op.
 */
static inline void enter_lazy_tlb(struct mm_struct *mm, struct task_struct *tsk)
{
#ifdef CONFIG_SMP
	if (this_cpu_read(cpu_tlbstate.state) != TLBSTATE_OK)
		return;

	this_cpu_write(cpu_tlbstate.state, TLBSTATE_LAZY);
#endif
}
106
/*
 * Set up the architecture-specific context of a new @mm for @tsk.
 *
 * Returns 0 on success or the error reported by init_new_context_ldt().
 * The result must be propagated: if LDT setup fails and we still claim
 * success, the caller carries on with an mm whose LDT state was never
 * properly initialized.
 */
static inline int init_new_context(struct task_struct *tsk,
				   struct mm_struct *mm)
{
	return init_new_context_ldt(tsk, mm);
}
/*
 * Release the architecture-specific context of @mm; the only state
 * handled here is the LDT, via destroy_context_ldt().
 */
static inline void destroy_context(struct mm_struct *mm)
{
	destroy_context_ldt(mm);
}
117
Andy Lutomirski69c03192016-04-26 09:39:08 -0700118extern void switch_mm(struct mm_struct *prev, struct mm_struct *next,
119 struct task_struct *tsk);
Brian Gerst6826c8f2009-01-21 17:26:06 +0900120
Andy Lutomirski078194f2016-04-26 09:39:09 -0700121extern void switch_mm_irqs_off(struct mm_struct *prev, struct mm_struct *next,
122 struct task_struct *tsk);
123#define switch_mm_irqs_off switch_mm_irqs_off
Jeremy Fitzhardingec3c2fee2008-06-25 00:19:07 -0400124
/*
 * Activate @next in place of @prev: run the paravirt hook, then switch
 * to the new mm with no task (NULL) passed to switch_mm().
 *
 * The expansion deliberately has no trailing semicolon so that
 * "activate_mm(a, b);" is exactly one statement and is safe inside an
 * unbraced if/else.
 */
#define activate_mm(prev, next)			\
do {						\
	paravirt_activate_mm((prev), (next));	\
	switch_mm((prev), (next), NULL);	\
} while (0)
130
/*
 * deactivate_mm(): reset segment state when an mm is dropped.
 * 32-bit passes 0 to lazy_load_gs(); 64-bit passes 0 to load_gs_index()
 * and then loads 0 into fs.  Neither @tsk nor @mm is used.
 */
#ifdef CONFIG_X86_32
#define deactivate_mm(tsk, mm)			\
do {						\
	lazy_load_gs(0);			\
} while (0)
#else
#define deactivate_mm(tsk, mm)			\
do {						\
	load_gs_index(0);			\
	loadsegment(fs, 0);			\
} while (0)
#endif
Jeremy Fitzhardingec3c2fee2008-06-25 00:19:07 -0400143
/*
 * Architecture hook taking the old and the new mm; on x86 it only
 * forwards both to paravirt_arch_dup_mmap().
 */
static inline void arch_dup_mmap(struct mm_struct *oldmm,
				 struct mm_struct *mm)
{
	paravirt_arch_dup_mmap(oldmm, mm);
}
149
/* Architecture hook for @mm; forwards to paravirt_arch_exit_mmap(). */
static inline void arch_exit_mmap(struct mm_struct *mm)
{
	paravirt_arch_exit_mmap(mm);
}
154
#ifdef CONFIG_X86_64
/*
 * Report whether @mm is a 64-bit address space.  Without
 * CONFIG_IA32_EMULATION every mm is 64-bit; otherwise an mm whose
 * ia32_compat field equals TIF_IA32 is not.
 */
static inline bool is_64bit_mm(struct mm_struct *mm)
{
	if (!IS_ENABLED(CONFIG_IA32_EMULATION))
		return true;

	return mm->context.ia32_compat != TIF_IA32;
}
#else
/* On kernels that are not CONFIG_X86_64 no mm is ever 64-bit. */
static inline bool is_64bit_mm(struct mm_struct *mm)
{
	return false;
}
#endif
167
/*
 * Architecture hook taking a new @mm and a @vma; x86 only initializes
 * the MPX state of @mm and does not look at @vma.
 */
static inline void arch_bprm_mm_init(struct mm_struct *mm,
				     struct vm_area_struct *vma)
{
	mpx_mm_init(mm);
}
173
Dave Hansen1de4fa12014-11-14 07:18:31 -0800174static inline void arch_unmap(struct mm_struct *mm, struct vm_area_struct *vma,
175 unsigned long start, unsigned long end)
176{
Dave Hansenc9222282015-01-08 14:30:21 -0800177 /*
178 * mpx_notify_unmap() goes and reads a rarely-hot
179 * cacheline in the mm_struct. That can be expensive
180 * enough to be seen in profiles.
181 *
182 * The mpx_notify_unmap() call and its contents have been
183 * observed to affect munmap() performance on hardware
184 * where MPX is not present.
185 *
186 * The unlikely() optimizes for the fast case: no MPX
187 * in the CPU, or no MPX use in the process. Even if
188 * we get this wrong (in the unlikely event that MPX
189 * is widely enabled on some system) the overhead of
190 * MPX itself (reading bounds tables) is expected to
191 * overwhelm the overhead of getting this unlikely()
192 * consistently wrong.
193 */
194 if (unlikely(cpu_feature_enabled(X86_FEATURE_MPX)))
195 mpx_notify_unmap(mm, vma, start, end);
Dave Hansen1de4fa12014-11-14 07:18:31 -0800196}
197
/*
 * Return the protection key stored in @vma's vm_flags (the four
 * VM_PKEY_BIT* bits shifted down by VM_PKEY_SHIFT), or 0 when the
 * kernel is built without CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS.
 */
static inline int vma_pkey(struct vm_area_struct *vma)
{
#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS
	unsigned long pkey_bits = VM_PKEY_BIT0 | VM_PKEY_BIT1 |
				  VM_PKEY_BIT2 | VM_PKEY_BIT3;
	u16 key = (vma->vm_flags & pkey_bits) >> VM_PKEY_SHIFT;

	return key;
#else
	return 0;
#endif
}
208
Dave Hansen33a709b2016-02-12 13:02:19 -0800209static inline bool __pkru_allows_pkey(u16 pkey, bool write)
210{
211 u32 pkru = read_pkru();
212
213 if (!__pkru_allows_read(pkru, pkey))
214 return false;
215 if (write && !__pkru_allows_write(pkru, pkey))
216 return false;
217
218 return true;
219}
220
221/*
222 * We only want to enforce protection keys on the current process
223 * because we effectively have no access to PKRU for other
224 * processes or any way to tell *which * PKRU in a threaded
225 * process we could use.
226 *
227 * So do not enforce things if the VMA is not from the current
228 * mm, or if we are in a kernel thread.
229 */
230static inline bool vma_is_foreign(struct vm_area_struct *vma)
231{
232 if (!current->mm)
233 return true;
234 /*
235 * Should PKRU be enforced on the access to this VMA? If
236 * the VMA is from another process, then PKRU has no
237 * relevance and should not be enforced.
238 */
239 if (current->mm != vma->vm_mm)
240 return true;
241
242 return false;
243}
244
/*
 * Decide whether protection keys permit the described access to @vma.
 *
 * Returns true without consulting PKRU when:
 *  - @execute is set (pkeys never affect instruction fetches), or
 *  - the access is @foreign or the VMA is not one from this process.
 * Otherwise the VMA's pkey is checked against PKRU for a read, and
 * also for a write when @write is set.
 */
static inline bool arch_vma_access_permitted(struct vm_area_struct *vma,
		bool write, bool execute, bool foreign)
{
	if (execute || foreign || vma_is_foreign(vma))
		return true;

	return __pkru_allows_pkey(vma_pkey(vma), write);
}
256
257static inline bool arch_pte_access_permitted(pte_t pte, bool write)
258{
259 return __pkru_allows_pkey(pte_flags_pkey(pte_flags(pte)), write);
260}
261
H. Peter Anvin1965aae2008-10-22 22:26:29 -0700262#endif /* _ASM_X86_MMU_CONTEXT_H */