blob: 2add0b7b9f6d19bc076eb7b8458db849b204d532 [file] [log] [blame]
Paul Mackerras14cf11a2005-09-26 16:04:21 +10001/*
2 * PowerPC version
3 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
4 *
5 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
6 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
7 * Copyright (C) 1996 Paul Mackerras
Paul Mackerras14cf11a2005-09-26 16:04:21 +10008 * PPC44x/36-bit changes by Matt Porter (mporter@mvista.com)
9 *
10 * Derived from "arch/i386/mm/init.c"
11 * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
12 *
13 * This program is free software; you can redistribute it and/or
14 * modify it under the terms of the GNU General Public License
15 * as published by the Free Software Foundation; either version
16 * 2 of the License, or (at your option) any later version.
17 *
18 */
19
Paul Gortmaker4b16f8e2011-07-22 18:24:23 -040020#include <linux/export.h>
Paul Mackerras14cf11a2005-09-26 16:04:21 +100021#include <linux/sched.h>
22#include <linux/kernel.h>
23#include <linux/errno.h>
24#include <linux/string.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090025#include <linux/gfp.h>
Paul Mackerras14cf11a2005-09-26 16:04:21 +100026#include <linux/types.h>
27#include <linux/mm.h>
28#include <linux/stddef.h>
29#include <linux/init.h>
30#include <linux/bootmem.h>
31#include <linux/highmem.h>
32#include <linux/initrd.h>
33#include <linux/pagemap.h>
Johannes Berg4e8ad3e2007-05-08 19:25:00 +100034#include <linux/suspend.h>
Yinghai Lu95f72d12010-07-12 14:36:09 +100035#include <linux/memblock.h>
David Gibson0895ecd2009-10-26 19:24:31 +000036#include <linux/hugetlb.h>
Anton Blanchardc40dd2f2011-11-02 14:56:12 +000037#include <linux/slab.h>
Anton Blanchard16d0f5c2014-10-14 22:17:47 +110038#include <linux/vmalloc.h>
Paul Mackerras14cf11a2005-09-26 16:04:21 +100039
40#include <asm/pgalloc.h>
41#include <asm/prom.h>
42#include <asm/io.h>
43#include <asm/mmu_context.h>
44#include <asm/pgtable.h>
45#include <asm/mmu.h>
46#include <asm/smp.h>
47#include <asm/machdep.h>
48#include <asm/btext.h>
49#include <asm/tlb.h>
Paul Mackerras7c8c6b92005-10-06 12:23:33 +100050#include <asm/sections.h>
Tony Breedsdb7f37d2008-07-01 11:30:06 +100051#include <asm/sparsemem.h>
Paul Mackerrasab1f9da2005-10-10 21:58:35 +100052#include <asm/vdso.h>
Kumar Gala2c419bd2008-04-23 23:05:20 +100053#include <asm/fixmap.h>
FUJITA Tomonoria9327292010-03-16 13:16:25 +000054#include <asm/swiotlb.h>
sukadev@linux.vnet.ibm.com8a3e3d32011-12-02 12:26:23 +000055#include <asm/rtas.h>
Paul Mackerras14cf11a2005-09-26 16:04:21 +100056
Paul Mackerras14cf11a2005-09-26 16:04:21 +100057#include "mmu_decl.h"
58
/*
 * Fallbacks: when CPU_FTR_COHERENT_ICACHE is not already defined, both it
 * and CPU_FTR_NOEXECUTE are defined as 0 for this file.
 */
#ifndef CPU_FTR_COHERENT_ICACHE
#define CPU_FTR_COHERENT_ICACHE	0	/* XXX for now */
#define CPU_FTR_NOEXECUTE	0
#endif
63
/* Set to 1 as the last step of the do_init_bootmem() defined in this file. */
int init_bootmem_done;
/* Set to 1 as the last step of mem_init(). */
int mem_init_done;
/*
 * Not written anywhere in this file.
 * NOTE(review): presumably a boot-time cap on usable memory -- confirm.
 */
unsigned long long memory_limit;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +100067
#ifdef CONFIG_HIGHMEM
/*
 * kmap_pte is pointed at the PTE of the FIX_KMAP_BEGIN fixmap slot and
 * kmap_prot is set to PAGE_KERNEL by paging_init().
 */
pte_t *kmap_pte;
EXPORT_SYMBOL(kmap_pte);
pgprot_t kmap_prot;
EXPORT_SYMBOL(kmap_prot);

/* Walk the kernel page tables down to the PTE entry that maps @vaddr. */
static inline pte_t *virt_to_kpte(unsigned long vaddr)
{
	pgd_t *pgd = pgd_offset_k(vaddr);
	pud_t *pud = pud_offset(pgd, vaddr);
	pmd_t *pmd = pmd_offset(pud, vaddr);

	return pte_offset_kernel(pmd, vaddr);
}
#endif
80
Paul Mackerras14cf11a2005-09-26 16:04:21 +100081int page_is_ram(unsigned long pfn)
82{
Paul Mackerras14cf11a2005-09-26 16:04:21 +100083#ifndef CONFIG_PPC64 /* XXX for now */
Roland Dreiera880e762008-09-15 10:43:35 +000084 return pfn < max_pfn;
Paul Mackerras14cf11a2005-09-26 16:04:21 +100085#else
Roland Dreiera880e762008-09-15 10:43:35 +000086 unsigned long paddr = (pfn << PAGE_SHIFT);
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +100087 struct memblock_region *reg;
Paul Mackerras14cf11a2005-09-26 16:04:21 +100088
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +100089 for_each_memblock(memory, reg)
90 if (paddr >= reg->base && paddr < (reg->base + reg->size))
Paul Mackerras14cf11a2005-09-26 16:04:21 +100091 return 1;
Paul Mackerras14cf11a2005-09-26 16:04:21 +100092 return 0;
93#endif
94}
Paul Mackerras14cf11a2005-09-26 16:04:21 +100095
Roland Dreier8b150472005-10-28 17:46:18 -070096pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
Paul Mackerras14cf11a2005-09-26 16:04:21 +100097 unsigned long size, pgprot_t vma_prot)
98{
99 if (ppc_md.phys_mem_access_prot)
Roland Dreier8b150472005-10-28 17:46:18 -0700100 return ppc_md.phys_mem_access_prot(file, pfn, size, vma_prot);
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000101
Roland Dreier8b150472005-10-28 17:46:18 -0700102 if (!page_is_ram(pfn))
Benjamin Herrenschmidt64b3d0e2008-12-18 19:13:51 +0000103 vma_prot = pgprot_noncached(vma_prot);
104
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000105 return vma_prot;
106}
107EXPORT_SYMBOL(phys_mem_access_prot);
108
Paul Mackerras23fd0772005-10-31 13:37:12 +1100109#ifdef CONFIG_MEMORY_HOTPLUG
110
Yasunori Gotobc02af92006-06-27 02:53:30 -0700111#ifdef CONFIG_NUMA
112int memory_add_physaddr_to_nid(u64 start)
113{
114 return hot_add_scn_to_nid(start);
115}
116#endif
117
Geert Uytterhoevenfa90f702008-03-29 03:10:50 +1100118int arch_add_memory(int nid, u64 start, u64 size)
Paul Mackerras23fd0772005-10-31 13:37:12 +1100119{
Mike Kravetz237a0982005-12-05 12:06:42 -0800120 struct pglist_data *pgdata;
Paul Mackerras23fd0772005-10-31 13:37:12 +1100121 struct zone *zone;
122 unsigned long start_pfn = start >> PAGE_SHIFT;
123 unsigned long nr_pages = size >> PAGE_SHIFT;
124
Mike Kravetz237a0982005-12-05 12:06:42 -0800125 pgdata = NODE_DATA(nid);
126
Andrew Morton2d0eee12006-03-21 23:00:05 -0800127 start = (unsigned long)__va(start);
Anton Blancharda1194092011-08-10 20:44:24 +0000128 if (create_section_mapping(start, start + size))
129 return -EINVAL;
Mike Kravetz54b79242005-11-07 16:25:48 -0800130
Paul Mackerras23fd0772005-10-31 13:37:12 +1100131 /* this should work for most non-highmem platforms */
Wang Nanf51202d2014-08-06 16:07:45 -0700132 zone = pgdata->node_zones +
133 zone_for_memory(nid, start, size, 0);
Paul Mackerras23fd0772005-10-31 13:37:12 +1100134
Gary Hadec04fc582009-01-06 14:39:14 -0800135 return __add_pages(nid, zone, start_pfn, nr_pages);
Paul Mackerras23fd0772005-10-31 13:37:12 +1100136}
Wen Congyang24d335c2013-02-22 16:32:58 -0800137
138#ifdef CONFIG_MEMORY_HOTREMOVE
139int arch_remove_memory(u64 start, u64 size)
140{
141 unsigned long start_pfn = start >> PAGE_SHIFT;
142 unsigned long nr_pages = size >> PAGE_SHIFT;
143 struct zone *zone;
Nathan Fontenot9ac8cde2014-01-27 10:54:06 -0600144 int ret;
Wen Congyang24d335c2013-02-22 16:32:58 -0800145
146 zone = page_zone(pfn_to_page(start_pfn));
Nathan Fontenot9ac8cde2014-01-27 10:54:06 -0600147 ret = __remove_pages(zone, start_pfn, nr_pages);
Anton Blanchard16d0f5c2014-10-14 22:17:47 +1100148 if (ret)
149 return ret;
150
151 /* Remove htab bolted mappings for this section of memory */
152 start = (unsigned long)__va(start);
153 ret = remove_section_mapping(start, start + size);
154
155 /* Ensure all vmalloc mappings are flushed in case they also
156 * hit that section of memory
157 */
158 vm_unmap_aliases();
Nathan Fontenot9ac8cde2014-01-27 10:54:06 -0600159
160 return ret;
Wen Congyang24d335c2013-02-22 16:32:58 -0800161}
162#endif
Nathan Lynch0d579942008-06-04 08:30:54 +1000163#endif /* CONFIG_MEMORY_HOTPLUG */
Badari Pulavartya99824f2008-02-05 00:10:18 -0800164
165/*
166 * walk_memory_resource() needs to make sure there is no holes in a given
Badari Pulavarty9d88a2e2008-04-18 13:33:53 -0700167 * memory range. PPC64 does not maintain the memory layout in /proc/iomem.
Yinghai Lu95f72d12010-07-12 14:36:09 +1000168 * Instead it maintains it in memblock.memory structures. Walk through the
Badari Pulavarty9d88a2e2008-04-18 13:33:53 -0700169 * memory regions, find holes and callback for contiguous regions.
Badari Pulavartya99824f2008-02-05 00:10:18 -0800170 */
171int
KAMEZAWA Hiroyuki908eedc2009-09-22 16:45:46 -0700172walk_system_ram_range(unsigned long start_pfn, unsigned long nr_pages,
173 void *arg, int (*func)(unsigned long, unsigned long, void *))
Badari Pulavartya99824f2008-02-05 00:10:18 -0800174{
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000175 struct memblock_region *reg;
176 unsigned long end_pfn = start_pfn + nr_pages;
177 unsigned long tstart, tend;
Badari Pulavarty9d88a2e2008-04-18 13:33:53 -0700178 int ret = -1;
179
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000180 for_each_memblock(memory, reg) {
Yinghai Luc7fc2de2010-10-12 14:07:09 -0700181 tstart = max(start_pfn, memblock_region_memory_base_pfn(reg));
182 tend = min(end_pfn, memblock_region_memory_end_pfn(reg));
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000183 if (tstart >= tend)
184 continue;
185 ret = (*func)(tstart, tend - tstart, arg);
Badari Pulavarty9d88a2e2008-04-18 13:33:53 -0700186 if (ret)
187 break;
Badari Pulavarty9d88a2e2008-04-18 13:33:53 -0700188 }
189 return ret;
Badari Pulavartya99824f2008-02-05 00:10:18 -0800190}
KAMEZAWA Hiroyuki908eedc2009-09-22 16:45:46 -0700191EXPORT_SYMBOL_GPL(walk_system_ram_range);
Badari Pulavartya99824f2008-02-05 00:10:18 -0800192
/*
 * Initialize the bootmem system and give it all the memory we
 * have available.  If we are using highmem, we only put the
 * lowmem into the bootmem system.
 */
198#ifndef CONFIG_NEED_MULTIPLE_NODES
199void __init do_init_bootmem(void)
200{
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000201 unsigned long start, bootmap_pages;
202 unsigned long total_pages;
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000203 struct memblock_region *reg;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000204 int boot_mapsize;
205
Yinghai Lu95f72d12010-07-12 14:36:09 +1000206 max_low_pfn = max_pfn = memblock_end_of_DRAM() >> PAGE_SHIFT;
207 total_pages = (memblock_end_of_DRAM() - memstart_addr) >> PAGE_SHIFT;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000208#ifdef CONFIG_HIGHMEM
209 total_pages = total_lowmem >> PAGE_SHIFT;
Kumar Galad7917ba2008-04-16 05:52:22 +1000210 max_low_pfn = lowmem_end_addr >> PAGE_SHIFT;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000211#endif
212
213 /*
214 * Find an area to use for the bootmem bitmap. Calculate the size of
215 * bitmap required as (Total Memory) / PAGE_SIZE / BITS_PER_BYTE.
216 * Add 1 additional page in case the address isn't page-aligned.
217 */
218 bootmap_pages = bootmem_bootmap_pages(total_pages);
219
Yinghai Lu95f72d12010-07-12 14:36:09 +1000220 start = memblock_alloc(bootmap_pages << PAGE_SHIFT, PAGE_SIZE);
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000221
Kumar Gala37dd2ba2008-04-22 04:22:34 +1000222 min_low_pfn = MEMORY_START >> PAGE_SHIFT;
223 boot_mapsize = init_bootmem_node(NODE_DATA(0), start >> PAGE_SHIFT, min_low_pfn, max_low_pfn);
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000224
Cody P Schafer4e8309b2013-01-09 12:40:18 +0000225 /* Place all memblock_regions in the same node and merge contiguous
226 * memblock_regions
227 */
Tang Chene7e8de52014-01-21 15:49:26 -0800228 memblock_set_node(0, (phys_addr_t)ULLONG_MAX, &memblock.memory, 0);
Mel Gormanc67c3cb2006-09-27 01:49:49 -0700229
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000230 /* Add all physical memory to the bootmem map, mark each area
231 * present.
232 */
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000233#ifdef CONFIG_HIGHMEM
Kumar Galad7917ba2008-04-16 05:52:22 +1000234 free_bootmem_with_active_regions(0, lowmem_end_addr >> PAGE_SHIFT);
Kumar Galaf98eeb42008-01-09 11:27:23 -0600235
236 /* reserve the sections we're already using */
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000237 for_each_memblock(reserved, reg) {
238 unsigned long top = reg->base + reg->size - 1;
239 if (top < lowmem_end_addr)
240 reserve_bootmem(reg->base, reg->size, BOOTMEM_DEFAULT);
241 else if (reg->base < lowmem_end_addr) {
242 unsigned long trunc_size = lowmem_end_addr - reg->base;
243 reserve_bootmem(reg->base, trunc_size, BOOTMEM_DEFAULT);
Kumar Galaf98eeb42008-01-09 11:27:23 -0600244 }
245 }
Mel Gormanc67c3cb2006-09-27 01:49:49 -0700246#else
247 free_bootmem_with_active_regions(0, max_pfn);
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000248
249 /* reserve the sections we're already using */
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000250 for_each_memblock(reserved, reg)
251 reserve_bootmem(reg->base, reg->size, BOOTMEM_DEFAULT);
Kumar Galaf98eeb42008-01-09 11:27:23 -0600252#endif
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000253 /* XXX need to clip this if using highmem? */
Mel Gormanc67c3cb2006-09-27 01:49:49 -0700254 sparse_memory_present_with_active_regions(0);
255
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000256 init_bootmem_done = 1;
257}
258
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000259/* mark pages that don't exist as nosave */
260static int __init mark_nonram_nosave(void)
261{
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000262 struct memblock_region *reg, *prev = NULL;
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000263
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000264 for_each_memblock(memory, reg) {
265 if (prev &&
Yinghai Luc7fc2de2010-10-12 14:07:09 -0700266 memblock_region_memory_end_pfn(prev) < memblock_region_memory_base_pfn(reg))
267 register_nosave_region(memblock_region_memory_end_pfn(prev),
268 memblock_region_memory_base_pfn(reg));
Benjamin Herrenschmidt28be7072010-08-04 13:43:53 +1000269 prev = reg;
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000270 }
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000271 return 0;
272}
Scott Wood6db35ad2014-09-18 14:05:02 -0500273#else /* CONFIG_NEED_MULTIPLE_NODES */
274static int __init mark_nonram_nosave(void)
275{
276 return 0;
277}
278#endif
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000279
Scott Wood1c980252014-08-08 18:40:42 -0500280static bool zone_limits_final;
281
282static unsigned long max_zone_pfns[MAX_NR_ZONES] = {
283 [0 ... MAX_NR_ZONES - 1] = ~0UL
284};
285
286/*
287 * Restrict the specified zone and all more restrictive zones
288 * to be below the specified pfn. May not be called after
289 * paging_init().
290 */
291void __init limit_zone_pfn(enum zone_type zone, unsigned long pfn_limit)
292{
293 int i;
294
295 if (WARN_ON(zone_limits_final))
296 return;
297
298 for (i = zone; i >= 0; i--) {
299 if (max_zone_pfns[i] > pfn_limit)
300 max_zone_pfns[i] = pfn_limit;
301 }
302}
303
304/*
305 * Find the least restrictive zone that is entirely below the
306 * specified pfn limit. Returns < 0 if no suitable zone is found.
307 *
308 * pfn_limit must be u64 because it can exceed 32 bits even on 32-bit
309 * systems -- the DMA limit can be higher than any possible real pfn.
310 */
311int dma_pfn_limit_to_zone(u64 pfn_limit)
312{
313 enum zone_type top_zone = ZONE_NORMAL;
314 int i;
315
316#ifdef CONFIG_HIGHMEM
317 top_zone = ZONE_HIGHMEM;
318#endif
319
320 for (i = top_zone; i >= 0; i--) {
321 if (max_zone_pfns[i] <= pfn_limit)
322 return i;
323 }
324
325 return -EPERM;
326}
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000327
328/*
329 * paging_init() sets up the page tables - in fact we've already done this.
330 */
331void __init paging_init(void)
332{
Tony Breedsf7ba2992011-07-04 18:44:19 +0000333 unsigned long long total_ram = memblock_phys_mem_size();
Yinghai Lu95f72d12010-07-12 14:36:09 +1000334 phys_addr_t top_of_ram = memblock_end_of_DRAM();
Scott Wood1c980252014-08-08 18:40:42 -0500335 enum zone_type top_zone;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000336
Kumar Gala2c419bd2008-04-23 23:05:20 +1000337#ifdef CONFIG_PPC32
338 unsigned long v = __fix_to_virt(__end_of_fixed_addresses - 1);
339 unsigned long end = __fix_to_virt(FIX_HOLE);
340
341 for (; v < end; v += PAGE_SIZE)
342 map_page(v, 0, 0); /* XXX gross */
343#endif
344
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000345#ifdef CONFIG_HIGHMEM
346 map_page(PKMAP_BASE, 0, 0); /* XXX gross */
Kumar Gala2c419bd2008-04-23 23:05:20 +1000347 pkmap_page_table = virt_to_kpte(PKMAP_BASE);
348
349 kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN));
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000350 kmap_prot = PAGE_KERNEL;
351#endif /* CONFIG_HIGHMEM */
352
Tony Breedsf7ba2992011-07-04 18:44:19 +0000353 printk(KERN_DEBUG "Top of RAM: 0x%llx, Total RAM: 0x%llx\n",
Tony Breedsfb610632008-07-31 13:51:42 +1000354 (unsigned long long)top_of_ram, total_ram);
Olof Johanssone110b282006-04-12 15:25:01 -0500355 printk(KERN_DEBUG "Memory hole size: %ldMB\n",
Stefan Roese2bf30162008-07-10 01:09:23 +1000356 (long int)((top_of_ram - total_ram) >> 20));
Scott Wood1c980252014-08-08 18:40:42 -0500357
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000358#ifdef CONFIG_HIGHMEM
Scott Wood1c980252014-08-08 18:40:42 -0500359 top_zone = ZONE_HIGHMEM;
360 limit_zone_pfn(ZONE_NORMAL, lowmem_end_addr >> PAGE_SHIFT);
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000361#else
Scott Wood1c980252014-08-08 18:40:42 -0500362 top_zone = ZONE_NORMAL;
Mel Gormanc67c3cb2006-09-27 01:49:49 -0700363#endif
Scott Wood1c980252014-08-08 18:40:42 -0500364
365 limit_zone_pfn(top_zone, top_of_ram >> PAGE_SHIFT);
366 zone_limits_final = true;
Mel Gormanc67c3cb2006-09-27 01:49:49 -0700367 free_area_init_nodes(max_zone_pfns);
Johannes Berg4e8ad3e2007-05-08 19:25:00 +1000368
369 mark_nonram_nosave();
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000370}
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000371
Nathan Fontenotf7e33342013-09-27 10:18:09 -0500372static void __init register_page_bootmem_info(void)
373{
374 int i;
375
376 for_each_online_node(i)
377 register_page_bootmem_info_node(NODE_DATA(i));
378}
379
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000380void __init mem_init(void)
381{
Scott Wood28efc352013-10-11 19:22:38 -0500382 /*
383 * book3s is limited to 16 page sizes due to encoding this in
384 * a 4-bit field for slices.
385 */
386 BUILD_BUG_ON(MMU_PAGE_COUNT > 16);
387
FUJITA Tomonoria9327292010-03-16 13:16:25 +0000388#ifdef CONFIG_SWIOTLB
Jia Hongtao688ba1d2012-08-03 18:14:10 +0800389 swiotlb_init(0);
FUJITA Tomonoria9327292010-03-16 13:16:25 +0000390#endif
391
Nathan Fontenotf7e33342013-09-27 10:18:09 -0500392 register_page_bootmem_info();
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000393 high_memory = (void *) __va(max_low_pfn * PAGE_SIZE);
Jiang Liu602ddc72013-07-03 15:04:32 -0700394 set_max_mapnr(max_pfn);
Jiang Liu0c988532013-07-03 15:03:24 -0700395 free_all_bootmem();
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000396
397#ifdef CONFIG_HIGHMEM
398 {
399 unsigned long pfn, highmem_mapnr;
400
Kumar Galad7917ba2008-04-16 05:52:22 +1000401 highmem_mapnr = lowmem_end_addr >> PAGE_SHIFT;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000402 for (pfn = highmem_mapnr; pfn < max_mapnr; ++pfn) {
Becky Bruce3d41e0f2011-06-28 09:54:46 +0000403 phys_addr_t paddr = (phys_addr_t)pfn << PAGE_SHIFT;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000404 struct page *page = pfn_to_page(pfn);
Jiang Liu369a9d82013-07-03 15:04:09 -0700405 if (!memblock_is_reserved(paddr))
406 free_highmem_page(page);
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000407 }
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000408 }
409#endif /* CONFIG_HIGHMEM */
410
Becky Bruce3160b092011-06-28 14:54:47 -0500411#if defined(CONFIG_PPC_FSL_BOOK3E) && !defined(CONFIG_SMP)
412 /*
413 * If smp is enabled, next_tlbcam_idx is initialized in the cpu up
414 * functions.... do it here for the non-smp case.
415 */
416 per_cpu(next_tlbcam_idx, smp_processor_id()) =
417 (mfspr(SPRN_TLB1CFG) & TLBnCFG_N_ENTRY) - 1;
418#endif
419
Jiang Liu369a9d82013-07-03 15:04:09 -0700420 mem_init_print_info(NULL);
Benjamin Herrenschmidtf637a492009-05-27 13:44:50 +1000421#ifdef CONFIG_PPC32
422 pr_info("Kernel virtual memory layout:\n");
423 pr_info(" * 0x%08lx..0x%08lx : fixmap\n", FIXADDR_START, FIXADDR_TOP);
424#ifdef CONFIG_HIGHMEM
425 pr_info(" * 0x%08lx..0x%08lx : highmem PTEs\n",
426 PKMAP_BASE, PKMAP_ADDR(LAST_PKMAP));
427#endif /* CONFIG_HIGHMEM */
Benjamin Herrenschmidt8b31e492009-05-27 13:50:33 +1000428#ifdef CONFIG_NOT_COHERENT_CACHE
429 pr_info(" * 0x%08lx..0x%08lx : consistent mem\n",
430 IOREMAP_TOP, IOREMAP_TOP + CONFIG_CONSISTENT_SIZE);
431#endif /* CONFIG_NOT_COHERENT_CACHE */
Benjamin Herrenschmidtf637a492009-05-27 13:44:50 +1000432 pr_info(" * 0x%08lx..0x%08lx : early ioremap\n",
433 ioremap_bot, IOREMAP_TOP);
434 pr_info(" * 0x%08lx..0x%08lx : vmalloc & ioremap\n",
435 VMALLOC_START, VMALLOC_END);
436#endif /* CONFIG_PPC32 */
437
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000438 mem_init_done = 1;
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000439}
440
Dave Carroll2773fcc2011-06-18 07:36:39 +0000441void free_initmem(void)
442{
Dave Carrolla9c0f412011-06-18 07:36:40 +0000443 ppc_md.progress = ppc_printk_progress;
Jiang Liu5d585e52013-04-29 15:06:47 -0700444 free_initmem_default(POISON_FREE_INITMEM);
Dave Carroll2773fcc2011-06-18 07:36:39 +0000445}
446
Benjamin Herrenschmidt307cfe72011-06-09 16:52:38 +1000447#ifdef CONFIG_BLK_DEV_INITRD
448void __init free_initrd_mem(unsigned long start, unsigned long end)
449{
Jiang Liudbe67df2013-07-03 15:02:51 -0700450 free_reserved_area((void *)start, (void *)end, -1, "initrd");
Benjamin Herrenschmidt307cfe72011-06-09 16:52:38 +1000451}
452#endif
453
Paul Mackerras7c8c6b92005-10-06 12:23:33 +1000454/*
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000455 * This is called when a page has been modified by the kernel.
456 * It just marks the page as not i-cache clean. We do the i-cache
457 * flush later when the page is given to a user process, if necessary.
458 */
459void flush_dcache_page(struct page *page)
460{
461 if (cpu_has_feature(CPU_FTR_COHERENT_ICACHE))
462 return;
463 /* avoid an atomic op if possible */
464 if (test_bit(PG_arch_1, &page->flags))
465 clear_bit(PG_arch_1, &page->flags);
466}
467EXPORT_SYMBOL(flush_dcache_page);
468
469void flush_dcache_icache_page(struct page *page)
470{
David Gibson0895ecd2009-10-26 19:24:31 +0000471#ifdef CONFIG_HUGETLB_PAGE
472 if (PageCompound(page)) {
473 flush_dcache_icache_hugepage(page);
474 return;
475 }
476#endif
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000477#ifdef CONFIG_BOOKE
David Gibson0895ecd2009-10-26 19:24:31 +0000478 {
Cong Wang2480b202011-11-25 23:14:16 +0800479 void *start = kmap_atomic(page);
David Gibson0895ecd2009-10-26 19:24:31 +0000480 __flush_dcache_icache(start);
Cong Wang2480b202011-11-25 23:14:16 +0800481 kunmap_atomic(start);
David Gibson0895ecd2009-10-26 19:24:31 +0000482 }
Paul Mackerrasab1f9da2005-10-10 21:58:35 +1000483#elif defined(CONFIG_8xx) || defined(CONFIG_PPC64)
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000484 /* On 8xx there is no need to kmap since highmem is not supported */
485 __flush_dcache_icache(page_address(page));
486#else
487 __flush_dcache_icache_phys(page_to_pfn(page) << PAGE_SHIFT);
488#endif
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000489}
Alexander Graf249ba1e2012-08-03 13:56:33 +0200490EXPORT_SYMBOL(flush_dcache_icache_page);
David Gibson0895ecd2009-10-26 19:24:31 +0000491
/*
 * Zero the page at kernel address @page, then run flush_dcache_page() on
 * its struct page @pg.  @vaddr is not used.
 */
void clear_user_page(void *page, unsigned long vaddr, struct page *pg)
{
	clear_page(page);

	/*
	 * We shouldn't have to do this, but some versions of glibc
	 * require it (ld.so assumes zero filled pages are icache clean)
	 * - Anton
	 */
	flush_dcache_page(pg);
}
EXPORT_SYMBOL(clear_user_page);
504
/*
 * Copy one page from @vfrom to @vto, then run flush_dcache_page() on the
 * destination's struct page @pg.  @vaddr is not used.
 */
void copy_user_page(void *vto, void *vfrom, unsigned long vaddr,
		    struct page *pg)
{
	copy_page(vto, vfrom);

	/*
	 * We should be able to use the following optimisation, however
	 * there are two problems.
	 * Firstly a bug in some versions of binutils meant PLT sections
	 * were not marked executable.
	 * Secondly the first word in the GOT section is blrl, used
	 * to establish the GOT address. Until recently the GOT was
	 * not marked executable.
	 * - Anton
	 */
#if 0
	if (!vma->vm_file && ((vma->vm_flags & VM_EXEC) == 0))
		return;
#endif

	flush_dcache_page(pg);
}
527
528void flush_icache_user_range(struct vm_area_struct *vma, struct page *page,
529 unsigned long addr, int len)
530{
531 unsigned long maddr;
532
533 maddr = (unsigned long) kmap(page) + (addr & ~PAGE_MASK);
534 flush_icache_range(maddr, maddr + len);
535 kunmap(page);
536}
537EXPORT_SYMBOL(flush_icache_user_range);
538
539/*
540 * This is called at the end of handling a user page fault, when the
541 * fault has been handled by updating a PTE in the linux page tables.
542 * We use it to preload an HPTE into the hash table corresponding to
543 * the updated linux PTE.
544 *
Hugh Dickins01edcd82005-11-23 13:37:39 -0800545 * This must always be called with the pte lock held.
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000546 */
547void update_mmu_cache(struct vm_area_struct *vma, unsigned long address,
Russell King4b3073e2009-12-18 16:40:18 +0000548 pte_t *ptep)
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000549{
Benjamin Herrenschmidt3c726f82005-11-07 11:06:55 +1100550#ifdef CONFIG_PPC_STD_MMU
Aneesh Kumar K.V0ac52dd2013-06-20 14:30:22 +0530551 /*
552 * We don't need to worry about _PAGE_PRESENT here because we are
553 * called with either mm->page_table_lock held or ptl lock held
554 */
Benjamin Herrenschmidt3c726f82005-11-07 11:06:55 +1100555 unsigned long access = 0, trap;
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000556
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000557 /* We only want HPTEs for linux PTEs that have _PAGE_ACCESSED set */
Russell King4b3073e2009-12-18 16:40:18 +0000558 if (!pte_young(*ptep) || address >= TASK_SIZE)
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000559 return;
Benjamin Herrenschmidt3c726f82005-11-07 11:06:55 +1100560
561 /* We try to figure out if we are coming from an instruction
562 * access fault and pass that down to __hash_page so we avoid
563 * double-faulting on execution of fresh text. We have to test
564 * for regs NULL since init will get here first thing at boot
565 *
566 * We also avoid filling the hash if not coming from a fault
567 */
568 if (current->thread.regs == NULL)
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000569 return;
Benjamin Herrenschmidt3c726f82005-11-07 11:06:55 +1100570 trap = TRAP(current->thread.regs);
571 if (trap == 0x400)
572 access |= _PAGE_EXEC;
573 else if (trap != 0x300)
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000574 return;
Benjamin Herrenschmidt3c726f82005-11-07 11:06:55 +1100575 hash_preload(vma->vm_mm, address, access, trap);
576#endif /* CONFIG_PPC_STD_MMU */
Becky Bruce41151e72011-06-28 09:54:48 +0000577#if (defined(CONFIG_PPC_BOOK3E_64) || defined(CONFIG_PPC_FSL_BOOK3E)) \
578 && defined(CONFIG_HUGETLB_PAGE)
579 if (is_vm_hugetlb_page(vma))
Becky Bruced93e4d72011-11-28 14:43:33 +0000580 book3e_hugetlb_preload(vma, address, *ptep);
Becky Bruce41151e72011-06-28 09:54:48 +0000581#endif
Paul Mackerras14cf11a2005-09-26 16:04:21 +1000582}
Anton Blanchardc40dd2f2011-11-02 14:56:12 +0000583
584/*
585 * System memory should not be in /proc/iomem but various tools expect it
586 * (eg kdump).
587 */
Geert Uytterhoeven4f770922013-09-15 11:39:36 +0200588static int __init add_system_ram_resources(void)
Anton Blanchardc40dd2f2011-11-02 14:56:12 +0000589{
590 struct memblock_region *reg;
591
592 for_each_memblock(memory, reg) {
593 struct resource *res;
594 unsigned long base = reg->base;
595 unsigned long size = reg->size;
596
597 res = kzalloc(sizeof(struct resource), GFP_KERNEL);
598 WARN_ON(!res);
599
600 if (res) {
601 res->name = "System RAM";
602 res->start = base;
603 res->end = base + size - 1;
Nathan Fontenotf748eda2013-08-19 21:52:20 -0500604 res->flags = IORESOURCE_MEM | IORESOURCE_BUSY;
Anton Blanchardc40dd2f2011-11-02 14:56:12 +0000605 WARN_ON(request_resource(&iomem_resource, res) < 0);
606 }
607 }
608
609 return 0;
610}
611subsys_initcall(add_system_ram_resources);
sukadev@linux.vnet.ibm.com1d54cf22011-08-30 09:19:17 +0000612
613#ifdef CONFIG_STRICT_DEVMEM
614/*
615 * devmem_is_allowed(): check to see if /dev/mem access to a certain address
616 * is valid. The argument is a physical page number.
617 *
618 * Access has to be given to non-kernel-ram areas as well, these contain the
619 * PCI mmio resources as well as potential bios/acpi data regions.
620 */
621int devmem_is_allowed(unsigned long pfn)
622{
623 if (iomem_is_exclusive(pfn << PAGE_SHIFT))
624 return 0;
625 if (!page_is_ram(pfn))
626 return 1;
sukadev@linux.vnet.ibm.com8a3e3d32011-12-02 12:26:23 +0000627 if (page_is_rtas_user_buf(pfn))
628 return 1;
sukadev@linux.vnet.ibm.com1d54cf22011-08-30 09:19:17 +0000629 return 0;
630}
631#endif /* CONFIG_STRICT_DEVMEM */