blob: b37a58e1c92da8bfa9092828f6d3a92126da29d9 [file] [log] [blame]
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +00001/*
2 * This file contains the routines for TLB flushing.
3 * On machines where the MMU does not use a hash table to store virtual to
4 * physical translations (ie, SW loaded TLBs or Book3E compilant processors,
5 * this does -not- include 603 however which shares the implementation with
6 * hash based processors)
7 *
8 * -- BenH
9 *
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +000010 * Copyright 2008,2009 Ben Herrenschmidt <benh@kernel.crashing.org>
11 * IBM Corp.
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +000012 *
13 * Derived from arch/ppc/mm/init.c:
14 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
15 *
16 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
17 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
18 * Copyright (C) 1996 Paul Mackerras
19 *
20 * Derived from "arch/i386/mm/init.c"
21 * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
22 *
23 * This program is free software; you can redistribute it and/or
24 * modify it under the terms of the GNU General Public License
25 * as published by the Free Software Foundation; either version
26 * 2 of the License, or (at your option) any later version.
27 *
28 */
29
30#include <linux/kernel.h>
Paul Gortmaker93087942011-07-29 16:19:31 +100031#include <linux/export.h>
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +000032#include <linux/mm.h>
33#include <linux/init.h>
34#include <linux/highmem.h>
35#include <linux/pagemap.h>
36#include <linux/preempt.h>
37#include <linux/spinlock.h>
Yinghai Lu95f72d12010-07-12 14:36:09 +100038#include <linux/memblock.h>
Dave Kleikamp91b191c2011-07-04 18:38:03 +000039#include <linux/of_fdt.h>
Becky Bruce41151e72011-06-28 09:54:48 +000040#include <linux/hugetlb.h>
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +000041
42#include <asm/tlbflush.h>
43#include <asm/tlb.h>
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +000044#include <asm/code-patching.h>
Becky Bruce41151e72011-06-28 09:54:48 +000045#include <asm/hugetlb.h>
Scott Wood28efc352013-10-11 19:22:38 -050046#include <asm/paca.h>
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +000047
48#include "mmu_decl.h"
49
Becky Bruce41151e72011-06-28 09:54:48 +000050/*
51 * This struct lists the sw-supported page sizes. The hardawre MMU may support
52 * other sizes not listed here. The .ind field is only used on MMUs that have
53 * indirect page table entries.
54 */
55#ifdef CONFIG_PPC_BOOK3E_MMU
Becky Bruce881fde12011-10-10 10:50:40 +000056#ifdef CONFIG_PPC_FSL_BOOK3E
Becky Bruce41151e72011-06-28 09:54:48 +000057struct mmu_psize_def mmu_psize_defs[MMU_PAGE_COUNT] = {
58 [MMU_PAGE_4K] = {
59 .shift = 12,
60 .enc = BOOK3E_PAGESZ_4K,
61 },
Scott Wood28efc352013-10-11 19:22:38 -050062 [MMU_PAGE_2M] = {
63 .shift = 21,
64 .enc = BOOK3E_PAGESZ_2M,
65 },
Becky Bruce41151e72011-06-28 09:54:48 +000066 [MMU_PAGE_4M] = {
67 .shift = 22,
68 .enc = BOOK3E_PAGESZ_4M,
69 },
70 [MMU_PAGE_16M] = {
71 .shift = 24,
72 .enc = BOOK3E_PAGESZ_16M,
73 },
74 [MMU_PAGE_64M] = {
75 .shift = 26,
76 .enc = BOOK3E_PAGESZ_64M,
77 },
78 [MMU_PAGE_256M] = {
79 .shift = 28,
80 .enc = BOOK3E_PAGESZ_256M,
81 },
82 [MMU_PAGE_1G] = {
83 .shift = 30,
84 .enc = BOOK3E_PAGESZ_1GB,
85 },
86};
87#else
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +000088struct mmu_psize_def mmu_psize_defs[MMU_PAGE_COUNT] = {
89 [MMU_PAGE_4K] = {
90 .shift = 12,
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +100091 .ind = 20,
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +000092 .enc = BOOK3E_PAGESZ_4K,
93 },
94 [MMU_PAGE_16K] = {
95 .shift = 14,
96 .enc = BOOK3E_PAGESZ_16K,
97 },
98 [MMU_PAGE_64K] = {
99 .shift = 16,
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000100 .ind = 28,
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000101 .enc = BOOK3E_PAGESZ_64K,
102 },
103 [MMU_PAGE_1M] = {
104 .shift = 20,
105 .enc = BOOK3E_PAGESZ_1M,
106 },
107 [MMU_PAGE_16M] = {
108 .shift = 24,
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000109 .ind = 36,
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000110 .enc = BOOK3E_PAGESZ_16M,
111 },
112 [MMU_PAGE_256M] = {
113 .shift = 28,
114 .enc = BOOK3E_PAGESZ_256M,
115 },
116 [MMU_PAGE_1G] = {
117 .shift = 30,
118 .enc = BOOK3E_PAGESZ_1GB,
119 },
120};
Becky Bruce41151e72011-06-28 09:54:48 +0000121#endif /* CONFIG_FSL_BOOKE */
122
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000123static inline int mmu_get_tsize(int psize)
124{
125 return mmu_psize_defs[psize].enc;
126}
127#else
128static inline int mmu_get_tsize(int psize)
129{
130 /* This isn't used on !Book3E for now */
131 return 0;
132}
Becky Bruce41151e72011-06-28 09:54:48 +0000133#endif /* CONFIG_PPC_BOOK3E_MMU */
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000134
135/* The variables below are currently only used on 64-bit Book3E
136 * though this will probably be made common with other nohash
137 * implementations at some point
138 */
139#ifdef CONFIG_PPC64
140
141int mmu_linear_psize; /* Page size used for the linear mapping */
142int mmu_pte_psize; /* Page size used for PTE pages */
Benjamin Herrenschmidt32a74942009-07-23 23:15:58 +0000143int mmu_vmemmap_psize; /* Page size used for the virtual mem map */
Scott Wood28efc352013-10-11 19:22:38 -0500144int book3e_htw_mode; /* HW tablewalk? Value is PPC_HTW_* */
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000145unsigned long linear_map_top; /* Top of linear mapping */
146
147#endif /* CONFIG_PPC64 */
148
Becky Bruce3160b092011-06-28 14:54:47 -0500149#ifdef CONFIG_PPC_FSL_BOOK3E
150/* next_tlbcam_idx is used to round-robin tlbcam entry assignment */
151DEFINE_PER_CPU(int, next_tlbcam_idx);
152EXPORT_PER_CPU_SYMBOL(next_tlbcam_idx);
153#endif
154
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000155/*
156 * Base TLB flushing operations:
157 *
158 * - flush_tlb_mm(mm) flushes the specified mm context TLB's
159 * - flush_tlb_page(vma, vmaddr) flushes one page
160 * - flush_tlb_range(vma, start, end) flushes a range of pages
161 * - flush_tlb_kernel_range(start, end) flushes kernel pages
162 *
163 * - local_* variants of page and mm only apply to the current
164 * processor
165 */
166
167/*
168 * These are the base non-SMP variants of page and mm flushing
169 */
170void local_flush_tlb_mm(struct mm_struct *mm)
171{
172 unsigned int pid;
173
174 preempt_disable();
175 pid = mm->context.id;
176 if (pid != MMU_NO_CONTEXT)
177 _tlbil_pid(pid);
178 preempt_enable();
179}
180EXPORT_SYMBOL(local_flush_tlb_mm);
181
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000182void __local_flush_tlb_page(struct mm_struct *mm, unsigned long vmaddr,
183 int tsize, int ind)
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000184{
185 unsigned int pid;
186
187 preempt_disable();
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000188 pid = mm ? mm->context.id : 0;
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000189 if (pid != MMU_NO_CONTEXT)
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000190 _tlbil_va(vmaddr, pid, tsize, ind);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000191 preempt_enable();
192}
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000193
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000194void local_flush_tlb_page(struct vm_area_struct *vma, unsigned long vmaddr)
195{
196 __local_flush_tlb_page(vma ? vma->vm_mm : NULL, vmaddr,
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000197 mmu_get_tsize(mmu_virtual_psize), 0);
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000198}
199EXPORT_SYMBOL(local_flush_tlb_page);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000200
201/*
202 * And here are the SMP non-local implementations
203 */
204#ifdef CONFIG_SMP
205
Thomas Gleixner3eb93c52010-02-18 02:22:44 +0000206static DEFINE_RAW_SPINLOCK(tlbivax_lock);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000207
Benjamin Herrenschmidtfcce8102009-07-23 23:15:10 +0000208static int mm_is_core_local(struct mm_struct *mm)
209{
210 return cpumask_subset(mm_cpumask(mm),
211 topology_thread_cpumask(smp_processor_id()));
212}
213
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000214struct tlb_flush_param {
215 unsigned long addr;
216 unsigned int pid;
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000217 unsigned int tsize;
218 unsigned int ind;
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000219};
220
221static void do_flush_tlb_mm_ipi(void *param)
222{
223 struct tlb_flush_param *p = param;
224
225 _tlbil_pid(p ? p->pid : 0);
226}
227
228static void do_flush_tlb_page_ipi(void *param)
229{
230 struct tlb_flush_param *p = param;
231
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000232 _tlbil_va(p->addr, p->pid, p->tsize, p->ind);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000233}
234
235
236/* Note on invalidations and PID:
237 *
238 * We snapshot the PID with preempt disabled. At this point, it can still
239 * change either because:
240 * - our context is being stolen (PID -> NO_CONTEXT) on another CPU
241 * - we are invaliating some target that isn't currently running here
242 * and is concurrently acquiring a new PID on another CPU
243 * - some other CPU is re-acquiring a lost PID for this mm
244 * etc...
245 *
246 * However, this shouldn't be a problem as we only guarantee
247 * invalidation of TLB entries present prior to this call, so we
248 * don't care about the PID changing, and invalidating a stale PID
249 * is generally harmless.
250 */
251
252void flush_tlb_mm(struct mm_struct *mm)
253{
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000254 unsigned int pid;
255
256 preempt_disable();
257 pid = mm->context.id;
258 if (unlikely(pid == MMU_NO_CONTEXT))
259 goto no_context;
Benjamin Herrenschmidtfcce8102009-07-23 23:15:10 +0000260 if (!mm_is_core_local(mm)) {
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000261 struct tlb_flush_param p = { .pid = pid };
Rusty Russell56aa4122009-03-15 18:16:43 +0000262 /* Ignores smp_processor_id() even if set. */
263 smp_call_function_many(mm_cpumask(mm),
264 do_flush_tlb_mm_ipi, &p, 1);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000265 }
266 _tlbil_pid(pid);
267 no_context:
268 preempt_enable();
269}
270EXPORT_SYMBOL(flush_tlb_mm);
271
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000272void __flush_tlb_page(struct mm_struct *mm, unsigned long vmaddr,
273 int tsize, int ind)
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000274{
Rusty Russell56aa4122009-03-15 18:16:43 +0000275 struct cpumask *cpu_mask;
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000276 unsigned int pid;
277
278 preempt_disable();
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000279 pid = mm ? mm->context.id : 0;
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000280 if (unlikely(pid == MMU_NO_CONTEXT))
281 goto bail;
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000282 cpu_mask = mm_cpumask(mm);
Benjamin Herrenschmidtfcce8102009-07-23 23:15:10 +0000283 if (!mm_is_core_local(mm)) {
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000284 /* If broadcast tlbivax is supported, use it */
285 if (mmu_has_feature(MMU_FTR_USE_TLBIVAX_BCAST)) {
286 int lock = mmu_has_feature(MMU_FTR_LOCK_BCAST_INVAL);
287 if (lock)
Thomas Gleixner3eb93c52010-02-18 02:22:44 +0000288 raw_spin_lock(&tlbivax_lock);
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000289 _tlbivax_bcast(vmaddr, pid, tsize, ind);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000290 if (lock)
Thomas Gleixner3eb93c52010-02-18 02:22:44 +0000291 raw_spin_unlock(&tlbivax_lock);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000292 goto bail;
293 } else {
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000294 struct tlb_flush_param p = {
295 .pid = pid,
296 .addr = vmaddr,
297 .tsize = tsize,
298 .ind = ind,
299 };
Rusty Russell56aa4122009-03-15 18:16:43 +0000300 /* Ignores smp_processor_id() even if set in cpu_mask */
301 smp_call_function_many(cpu_mask,
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000302 do_flush_tlb_page_ipi, &p, 1);
303 }
304 }
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000305 _tlbil_va(vmaddr, pid, tsize, ind);
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000306 bail:
307 preempt_enable();
308}
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000309
310void flush_tlb_page(struct vm_area_struct *vma, unsigned long vmaddr)
311{
Becky Bruce41151e72011-06-28 09:54:48 +0000312#ifdef CONFIG_HUGETLB_PAGE
Scott Woodd742aa12013-11-21 18:26:42 -0600313 if (vma && is_vm_hugetlb_page(vma))
Becky Bruce41151e72011-06-28 09:54:48 +0000314 flush_hugetlb_page(vma, vmaddr);
315#endif
316
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000317 __flush_tlb_page(vma ? vma->vm_mm : NULL, vmaddr,
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000318 mmu_get_tsize(mmu_virtual_psize), 0);
Benjamin Herrenschmidtd4e167d2009-07-23 23:15:24 +0000319}
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000320EXPORT_SYMBOL(flush_tlb_page);
321
322#endif /* CONFIG_SMP */
323
Dave Kleikamp91b191c2011-07-04 18:38:03 +0000324#ifdef CONFIG_PPC_47x
325void __init early_init_mmu_47x(void)
326{
327#ifdef CONFIG_SMP
328 unsigned long root = of_get_flat_dt_root();
329 if (of_get_flat_dt_prop(root, "cooperative-partition", NULL))
330 mmu_clear_feature(MMU_FTR_USE_TLBIVAX_BCAST);
331#endif /* CONFIG_SMP */
332}
333#endif /* CONFIG_PPC_47x */
334
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000335/*
336 * Flush kernel TLB entries in the given range
337 */
338void flush_tlb_kernel_range(unsigned long start, unsigned long end)
339{
340#ifdef CONFIG_SMP
341 preempt_disable();
342 smp_call_function(do_flush_tlb_mm_ipi, NULL, 1);
343 _tlbil_pid(0);
344 preempt_enable();
Dave Liud6a09e02008-12-30 23:42:55 +0000345#else
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000346 _tlbil_pid(0);
Dave Liud6a09e02008-12-30 23:42:55 +0000347#endif
Benjamin Herrenschmidtf048aac2008-12-18 19:13:38 +0000348}
349EXPORT_SYMBOL(flush_tlb_kernel_range);
350
351/*
352 * Currently, for range flushing, we just do a full mm flush. This should
353 * be optimized based on a threshold on the size of the range, since
354 * some implementation can stack multiple tlbivax before a tlbsync but
355 * for now, we keep it that way
356 */
357void flush_tlb_range(struct vm_area_struct *vma, unsigned long start,
358 unsigned long end)
359
360{
361 flush_tlb_mm(vma->vm_mm);
362}
363EXPORT_SYMBOL(flush_tlb_range);
Benjamin Herrenschmidtc7cc58a12009-07-23 23:15:28 +0000364
365void tlb_flush(struct mmu_gather *tlb)
366{
367 flush_tlb_mm(tlb->mm);
Benjamin Herrenschmidtc7cc58a12009-07-23 23:15:28 +0000368}
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000369
370/*
371 * Below are functions specific to the 64-bit variant of Book3E though that
372 * may change in the future
373 */
374
375#ifdef CONFIG_PPC64
376
377/*
378 * Handling of virtual linear page tables or indirect TLB entries
379 * flushing when PTE pages are freed
380 */
381void tlb_flush_pgtable(struct mmu_gather *tlb, unsigned long address)
382{
383 int tsize = mmu_psize_defs[mmu_pte_psize].enc;
384
Scott Wood28efc352013-10-11 19:22:38 -0500385 if (book3e_htw_mode != PPC_HTW_NONE) {
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000386 unsigned long start = address & PMD_MASK;
387 unsigned long end = address + PMD_SIZE;
388 unsigned long size = 1UL << mmu_psize_defs[mmu_pte_psize].shift;
389
390 /* This isn't the most optimal, ideally we would factor out the
391 * while preempt & CPU mask mucking around, or even the IPI but
392 * it will do for now
393 */
394 while (start < end) {
395 __flush_tlb_page(tlb->mm, start, tsize, 1);
396 start += size;
397 }
398 } else {
399 unsigned long rmask = 0xf000000000000000ul;
400 unsigned long rid = (address & rmask) | 0x1000000000000000ul;
401 unsigned long vpte = address & ~rmask;
402
403#ifdef CONFIG_PPC_64K_PAGES
404 vpte = (vpte >> (PAGE_SHIFT - 4)) & ~0xfffful;
405#else
406 vpte = (vpte >> (PAGE_SHIFT - 3)) & ~0xffful;
407#endif
408 vpte |= rid;
409 __flush_tlb_page(tlb->mm, vpte, tsize, 0);
410 }
411}
412
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000413static void setup_page_sizes(void)
414{
Kumar Gala988cf862010-10-08 02:13:25 -0500415 unsigned int tlb0cfg;
416 unsigned int tlb0ps;
417 unsigned int eptcfg;
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000418 int i, psize;
419
Kumar Gala988cf862010-10-08 02:13:25 -0500420#ifdef CONFIG_PPC_FSL_BOOK3E
421 unsigned int mmucfg = mfspr(SPRN_MMUCFG);
Kumar Gala1b291872013-03-05 12:08:32 -0600422 int fsl_mmu = mmu_has_feature(MMU_FTR_TYPE_FSL_E);
Kumar Gala988cf862010-10-08 02:13:25 -0500423
Kumar Gala1b291872013-03-05 12:08:32 -0600424 if (fsl_mmu && (mmucfg & MMUCFG_MAVN) == MMUCFG_MAVN_V1) {
Kumar Gala988cf862010-10-08 02:13:25 -0500425 unsigned int tlb1cfg = mfspr(SPRN_TLB1CFG);
426 unsigned int min_pg, max_pg;
427
428 min_pg = (tlb1cfg & TLBnCFG_MINSIZE) >> TLBnCFG_MINSIZE_SHIFT;
429 max_pg = (tlb1cfg & TLBnCFG_MAXSIZE) >> TLBnCFG_MAXSIZE_SHIFT;
430
431 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) {
432 struct mmu_psize_def *def;
433 unsigned int shift;
434
435 def = &mmu_psize_defs[psize];
436 shift = def->shift;
437
Scott Wood28efc352013-10-11 19:22:38 -0500438 if (shift == 0 || shift & 1)
Kumar Gala988cf862010-10-08 02:13:25 -0500439 continue;
440
441 /* adjust to be in terms of 4^shift Kb */
442 shift = (shift - 10) >> 1;
443
444 if ((shift >= min_pg) && (shift <= max_pg))
445 def->flags |= MMU_PAGE_SIZE_DIRECT;
446 }
447
Scott Wood28efc352013-10-11 19:22:38 -0500448 goto out;
Kumar Gala988cf862010-10-08 02:13:25 -0500449 }
Kumar Gala1b291872013-03-05 12:08:32 -0600450
451 if (fsl_mmu && (mmucfg & MMUCFG_MAVN) == MMUCFG_MAVN_V2) {
Scott Wood28efc352013-10-11 19:22:38 -0500452 u32 tlb1cfg, tlb1ps;
453
454 tlb0cfg = mfspr(SPRN_TLB0CFG);
455 tlb1cfg = mfspr(SPRN_TLB1CFG);
456 tlb1ps = mfspr(SPRN_TLB1PS);
457 eptcfg = mfspr(SPRN_EPTCFG);
458
459 if ((tlb1cfg & TLBnCFG_IND) && (tlb0cfg & TLBnCFG_PT))
460 book3e_htw_mode = PPC_HTW_E6500;
461
462 /*
463 * We expect 4K subpage size and unrestricted indirect size.
464 * The lack of a restriction on indirect size is a Freescale
465 * extension, indicated by PSn = 0 but SPSn != 0.
466 */
467 if (eptcfg != 2)
468 book3e_htw_mode = PPC_HTW_NONE;
Kumar Gala1b291872013-03-05 12:08:32 -0600469
470 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) {
471 struct mmu_psize_def *def = &mmu_psize_defs[psize];
472
473 if (tlb1ps & (1U << (def->shift - 10))) {
474 def->flags |= MMU_PAGE_SIZE_DIRECT;
Scott Wood28efc352013-10-11 19:22:38 -0500475
476 if (book3e_htw_mode && psize == MMU_PAGE_2M)
477 def->flags |= MMU_PAGE_SIZE_INDIRECT;
Kumar Gala1b291872013-03-05 12:08:32 -0600478 }
479 }
480
Scott Wood28efc352013-10-11 19:22:38 -0500481 goto out;
Kumar Gala1b291872013-03-05 12:08:32 -0600482 }
Kumar Gala988cf862010-10-08 02:13:25 -0500483#endif
484
485 tlb0cfg = mfspr(SPRN_TLB0CFG);
486 tlb0ps = mfspr(SPRN_TLB0PS);
487 eptcfg = mfspr(SPRN_EPTCFG);
488
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000489 /* Look for supported direct sizes */
490 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) {
491 struct mmu_psize_def *def = &mmu_psize_defs[psize];
492
493 if (tlb0ps & (1U << (def->shift - 10)))
494 def->flags |= MMU_PAGE_SIZE_DIRECT;
495 }
496
497 /* Indirect page sizes supported ? */
Scott Wood28efc352013-10-11 19:22:38 -0500498 if ((tlb0cfg & TLBnCFG_IND) == 0 ||
499 (tlb0cfg & TLBnCFG_PT) == 0)
500 goto out;
501
502 book3e_htw_mode = PPC_HTW_IBM;
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000503
504 /* Now, we only deal with one IND page size for each
505 * direct size. Hopefully all implementations today are
506 * unambiguous, but we might want to be careful in the
507 * future.
508 */
509 for (i = 0; i < 3; i++) {
510 unsigned int ps, sps;
511
512 sps = eptcfg & 0x1f;
513 eptcfg >>= 5;
514 ps = eptcfg & 0x1f;
515 eptcfg >>= 5;
516 if (!ps || !sps)
517 continue;
518 for (psize = 0; psize < MMU_PAGE_COUNT; psize++) {
519 struct mmu_psize_def *def = &mmu_psize_defs[psize];
520
521 if (ps == (def->shift - 10))
522 def->flags |= MMU_PAGE_SIZE_INDIRECT;
523 if (sps == (def->shift - 10))
524 def->ind = ps + 10;
525 }
526 }
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000527
Scott Wood28efc352013-10-11 19:22:38 -0500528out:
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000529 /* Cleanup array and print summary */
530 pr_info("MMU: Supported page sizes\n");
531 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) {
532 struct mmu_psize_def *def = &mmu_psize_defs[psize];
533 const char *__page_type_names[] = {
534 "unsupported",
535 "direct",
536 "indirect",
537 "direct & indirect"
538 };
539 if (def->flags == 0) {
540 def->shift = 0;
541 continue;
542 }
543 pr_info(" %8ld KB as %s\n", 1ul << (def->shift - 10),
544 __page_type_names[def->flags & 0x3]);
545 }
546}
547
Scott Woodf67f4ef2011-06-22 11:25:42 +0000548static void setup_mmu_htw(void)
549{
Scott Wood28efc352013-10-11 19:22:38 -0500550 /*
551 * If we want to use HW tablewalk, enable it by patching the TLB miss
552 * handlers to branch to the one dedicated to it.
553 */
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000554
Scott Wood28efc352013-10-11 19:22:38 -0500555 switch (book3e_htw_mode) {
556 case PPC_HTW_IBM:
Scott Woodf67f4ef2011-06-22 11:25:42 +0000557 patch_exception(0x1c0, exc_data_tlb_miss_htw_book3e);
558 patch_exception(0x1e0, exc_instruction_tlb_miss_htw_book3e);
Scott Wood28efc352013-10-11 19:22:38 -0500559 break;
Scott Wood9841c792014-01-17 18:36:38 -0600560#ifdef CONFIG_PPC_FSL_BOOK3E
Scott Wood28efc352013-10-11 19:22:38 -0500561 case PPC_HTW_E6500:
562 patch_exception(0x1c0, exc_data_tlb_miss_e6500_book3e);
563 patch_exception(0x1e0, exc_instruction_tlb_miss_e6500_book3e);
564 break;
Scott Wood9841c792014-01-17 18:36:38 -0600565#endif
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000566 }
Kumar Gala32d206e2011-05-19 20:09:28 +0000567 pr_info("MMU: Book3E HW tablewalk %s\n",
Scott Wood28efc352013-10-11 19:22:38 -0500568 book3e_htw_mode != PPC_HTW_NONE ? "enabled" : "not supported");
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000569}
570
571/*
572 * Early initialization of the MMU TLB code
573 */
574static void __early_init_mmu(int boot_cpu)
575{
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000576 unsigned int mas4;
577
578 /* XXX This will have to be decided at runtime, but right
Benjamin Herrenschmidt32a74942009-07-23 23:15:58 +0000579 * now our boot and TLB miss code hard wires it. Ideally
580 * we should find out a suitable page size and patch the
581 * TLB miss code (either that or use the PACA to store
582 * the value we want)
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000583 */
584 mmu_linear_psize = MMU_PAGE_1G;
585
Benjamin Herrenschmidt32a74942009-07-23 23:15:58 +0000586 /* XXX This should be decided at runtime based on supported
587 * page sizes in the TLB, but for now let's assume 16M is
588 * always there and a good fit (which it probably is)
589 */
590 mmu_vmemmap_psize = MMU_PAGE_16M;
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000591
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000592 /* XXX This code only checks for TLB 0 capabilities and doesn't
593 * check what page size combos are supported by the HW. It
594 * also doesn't handle the case where a separate array holds
595 * the IND entries from the array loaded by the PT.
596 */
597 if (boot_cpu) {
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000598 /* Look for supported page sizes */
599 setup_page_sizes();
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000600
Benjamin Herrenschmidtf2b26c92010-07-09 14:57:43 +1000601 /* Look for HW tablewalk support */
602 setup_mmu_htw();
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000603 }
604
605 /* Set MAS4 based on page table setting */
606
607 mas4 = 0x4 << MAS4_WIMGED_SHIFT;
Scott Wood28efc352013-10-11 19:22:38 -0500608 switch (book3e_htw_mode) {
609 case PPC_HTW_E6500:
610 mas4 |= MAS4_INDD;
611 mas4 |= BOOK3E_PAGESZ_2M << MAS4_TSIZED_SHIFT;
612 mas4 |= MAS4_TLBSELD(1);
613 mmu_pte_psize = MMU_PAGE_2M;
614 break;
615
616 case PPC_HTW_IBM:
617 mas4 |= MAS4_INDD;
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000618#ifdef CONFIG_PPC_64K_PAGES
619 mas4 |= BOOK3E_PAGESZ_256M << MAS4_TSIZED_SHIFT;
620 mmu_pte_psize = MMU_PAGE_256M;
621#else
622 mas4 |= BOOK3E_PAGESZ_1M << MAS4_TSIZED_SHIFT;
623 mmu_pte_psize = MMU_PAGE_1M;
624#endif
Scott Wood28efc352013-10-11 19:22:38 -0500625 break;
626
627 case PPC_HTW_NONE:
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000628#ifdef CONFIG_PPC_64K_PAGES
629 mas4 |= BOOK3E_PAGESZ_64K << MAS4_TSIZED_SHIFT;
630#else
631 mas4 |= BOOK3E_PAGESZ_4K << MAS4_TSIZED_SHIFT;
632#endif
633 mmu_pte_psize = mmu_virtual_psize;
Scott Wood28efc352013-10-11 19:22:38 -0500634 break;
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000635 }
636 mtspr(SPRN_MAS4, mas4);
637
638 /* Set the global containing the top of the linear mapping
639 * for use by the TLB miss code
640 */
Yinghai Lu95f72d12010-07-12 14:36:09 +1000641 linear_map_top = memblock_end_of_DRAM();
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000642
Kumar Gala55fd7662009-10-16 18:48:40 -0500643#ifdef CONFIG_PPC_FSL_BOOK3E
644 if (mmu_has_feature(MMU_FTR_TYPE_FSL_E)) {
645 unsigned int num_cams;
646
647 /* use a quarter of the TLBCAM for bolted linear map */
648 num_cams = (mfspr(SPRN_TLB1CFG) & TLBnCFG_N_ENTRY) / 4;
649 linear_map_top = map_mem_in_cams(linear_map_top, num_cams);
650
651 /* limit memory so we dont have linear faults */
652 memblock_enforce_memory_limit(linear_map_top);
Scott Woodf67f4ef2011-06-22 11:25:42 +0000653
Scott Wood28efc352013-10-11 19:22:38 -0500654 if (book3e_htw_mode == PPC_HTW_NONE) {
655 patch_exception(0x1c0, exc_data_tlb_miss_bolted_book3e);
656 patch_exception(0x1e0,
657 exc_instruction_tlb_miss_bolted_book3e);
658 }
Kumar Gala55fd7662009-10-16 18:48:40 -0500659 }
660#endif
661
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000662 /* A sync won't hurt us after mucking around with
663 * the MMU configuration
664 */
665 mb();
Benjamin Herrenschmidte63075a2010-07-06 15:39:01 -0700666
667 memblock_set_current_limit(linear_map_top);
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000668}
669
670void __init early_init_mmu(void)
671{
672 __early_init_mmu(1);
673}
674
Paul Gortmaker061d19f2013-06-24 15:30:09 -0400675void early_init_mmu_secondary(void)
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000676{
677 __early_init_mmu(0);
678}
679
Benjamin Herrenschmidtcd3db0c2010-07-06 15:39:02 -0700680void setup_initial_memory_limit(phys_addr_t first_memblock_base,
681 phys_addr_t first_memblock_size)
682{
Kumar Gala1dc91c32011-09-16 10:39:59 -0500683 /* On non-FSL Embedded 64-bit, we adjust the RMA size to match
Benjamin Herrenschmidtcd3db0c2010-07-06 15:39:02 -0700684 * the bolted TLB entry. We know for now that only 1G
685 * entries are supported though that may eventually
Kumar Gala1dc91c32011-09-16 10:39:59 -0500686 * change.
687 *
688 * on FSL Embedded 64-bit, we adjust the RMA size to match the
689 * first bolted TLB entry size. We still limit max to 1G even if
690 * the TLB could cover more. This is due to what the early init
691 * code is setup to do.
692 *
693 * We crop it to the size of the first MEMBLOCK to
Benjamin Herrenschmidtcd3db0c2010-07-06 15:39:02 -0700694 * avoid going over total available memory just in case...
695 */
Kumar Gala1dc91c32011-09-16 10:39:59 -0500696#ifdef CONFIG_PPC_FSL_BOOK3E
697 if (mmu_has_feature(MMU_FTR_TYPE_FSL_E)) {
698 unsigned long linear_sz;
699 linear_sz = calc_cam_sz(first_memblock_size, PAGE_OFFSET,
700 first_memblock_base);
701 ppc64_rma_size = min_t(u64, linear_sz, 0x40000000);
702 } else
703#endif
704 ppc64_rma_size = min_t(u64, first_memblock_size, 0x40000000);
Benjamin Herrenschmidtcd3db0c2010-07-06 15:39:02 -0700705
706 /* Finally limit subsequent allocations */
Kumar Gala4a892612010-11-10 12:29:49 +0000707 memblock_set_current_limit(first_memblock_base + ppc64_rma_size);
Benjamin Herrenschmidtcd3db0c2010-07-06 15:39:02 -0700708}
Dave Kleikamp91b191c2011-07-04 18:38:03 +0000709#else /* ! CONFIG_PPC64 */
710void __init early_init_mmu(void)
711{
712#ifdef CONFIG_PPC_47x
713 early_init_mmu_47x();
714#endif
715}
Benjamin Herrenschmidt25d21ad2009-07-23 23:15:47 +0000716#endif /* CONFIG_PPC64 */