powerpc: Move free_initmem to common code
[linux-block.git] / arch / powerpc / mm / mem.c
CommitLineData
14cf11af
PM
1/*
2 * PowerPC version
3 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
4 *
5 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
6 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
7 * Copyright (C) 1996 Paul Mackerras
14cf11af
PM
8 * PPC44x/36-bit changes by Matt Porter (mporter@mvista.com)
9 *
10 * Derived from "arch/i386/mm/init.c"
11 * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
12 *
13 * This program is free software; you can redistribute it and/or
14 * modify it under the terms of the GNU General Public License
15 * as published by the Free Software Foundation; either version
16 * 2 of the License, or (at your option) any later version.
17 *
18 */
19
14cf11af
PM
20#include <linux/module.h>
21#include <linux/sched.h>
22#include <linux/kernel.h>
23#include <linux/errno.h>
24#include <linux/string.h>
5a0e3ad6 25#include <linux/gfp.h>
14cf11af
PM
26#include <linux/types.h>
27#include <linux/mm.h>
28#include <linux/stddef.h>
29#include <linux/init.h>
30#include <linux/bootmem.h>
31#include <linux/highmem.h>
32#include <linux/initrd.h>
33#include <linux/pagemap.h>
4e8ad3e8 34#include <linux/suspend.h>
95f72d1e 35#include <linux/memblock.h>
0895ecda 36#include <linux/hugetlb.h>
14cf11af
PM
37
38#include <asm/pgalloc.h>
39#include <asm/prom.h>
40#include <asm/io.h>
41#include <asm/mmu_context.h>
42#include <asm/pgtable.h>
43#include <asm/mmu.h>
44#include <asm/smp.h>
45#include <asm/machdep.h>
46#include <asm/btext.h>
47#include <asm/tlb.h>
7c8c6b97 48#include <asm/sections.h>
db7f37de 49#include <asm/sparsemem.h>
ab1f9dac 50#include <asm/vdso.h>
2c419bde 51#include <asm/fixmap.h>
a9327296 52#include <asm/swiotlb.h>
14cf11af 53
14cf11af
PM
54#include "mmu_decl.h"
55
/*
 * Fallbacks used only when CPU_FTR_COHERENT_ICACHE has not been defined by
 * an earlier header: both feature bits then evaluate to 0.
 */
#ifndef CPU_FTR_COHERENT_ICACHE
#define CPU_FTR_COHERENT_ICACHE	0	/* XXX for now */
#define CPU_FTR_NOEXECUTE	0
#endif
60
7c8c6b97
PM
61int init_bootmem_done;
62int mem_init_done;
49a84965 63phys_addr_t memory_limit;
7c8c6b97 64
2c419bde
KG
65#ifdef CONFIG_HIGHMEM
66pte_t *kmap_pte;
67pgprot_t kmap_prot;
68
69EXPORT_SYMBOL(kmap_prot);
70EXPORT_SYMBOL(kmap_pte);
71
72static inline pte_t *virt_to_kpte(unsigned long vaddr)
73{
74 return pte_offset_kernel(pmd_offset(pud_offset(pgd_offset_k(vaddr),
75 vaddr), vaddr), vaddr);
76}
77#endif
78
14cf11af
PM
79int page_is_ram(unsigned long pfn)
80{
14cf11af 81#ifndef CONFIG_PPC64 /* XXX for now */
a880e762 82 return pfn < max_pfn;
14cf11af 83#else
a880e762 84 unsigned long paddr = (pfn << PAGE_SHIFT);
28be7072 85 struct memblock_region *reg;
14cf11af 86
28be7072
BH
87 for_each_memblock(memory, reg)
88 if (paddr >= reg->base && paddr < (reg->base + reg->size))
14cf11af 89 return 1;
14cf11af
PM
90 return 0;
91#endif
92}
14cf11af 93
8b150478 94pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
14cf11af
PM
95 unsigned long size, pgprot_t vma_prot)
96{
97 if (ppc_md.phys_mem_access_prot)
8b150478 98 return ppc_md.phys_mem_access_prot(file, pfn, size, vma_prot);
14cf11af 99
8b150478 100 if (!page_is_ram(pfn))
64b3d0e8
BH
101 vma_prot = pgprot_noncached(vma_prot);
102
14cf11af
PM
103 return vma_prot;
104}
105EXPORT_SYMBOL(phys_mem_access_prot);
106
23fd0775
PM
107#ifdef CONFIG_MEMORY_HOTPLUG
108
bc02af93
YG
109#ifdef CONFIG_NUMA
110int memory_add_physaddr_to_nid(u64 start)
111{
112 return hot_add_scn_to_nid(start);
113}
114#endif
115
fa90f70a 116int arch_add_memory(int nid, u64 start, u64 size)
23fd0775 117{
237a0989 118 struct pglist_data *pgdata;
23fd0775
PM
119 struct zone *zone;
120 unsigned long start_pfn = start >> PAGE_SHIFT;
121 unsigned long nr_pages = size >> PAGE_SHIFT;
122
237a0989
MK
123 pgdata = NODE_DATA(nid);
124
2d0eee14 125 start = (unsigned long)__va(start);
54b79248
MK
126 create_section_mapping(start, start + size);
127
23fd0775
PM
128 /* this should work for most non-highmem platforms */
129 zone = pgdata->node_zones;
130
c04fc586 131 return __add_pages(nid, zone, start_pfn, nr_pages);
23fd0775 132}
0d579944 133#endif /* CONFIG_MEMORY_HOTPLUG */
a99824f3
BP
134
135/*
136 * walk_memory_resource() needs to make sure there is no holes in a given
9d88a2eb 137 * memory range. PPC64 does not maintain the memory layout in /proc/iomem.
95f72d1e 138 * Instead it maintains it in memblock.memory structures. Walk through the
9d88a2eb 139 * memory regions, find holes and callback for contiguous regions.
a99824f3
BP
140 */
141int
908eedc6
KH
142walk_system_ram_range(unsigned long start_pfn, unsigned long nr_pages,
143 void *arg, int (*func)(unsigned long, unsigned long, void *))
a99824f3 144{
28be7072
BH
145 struct memblock_region *reg;
146 unsigned long end_pfn = start_pfn + nr_pages;
147 unsigned long tstart, tend;
9d88a2eb
BP
148 int ret = -1;
149
28be7072 150 for_each_memblock(memory, reg) {
c7fc2de0
YL
151 tstart = max(start_pfn, memblock_region_memory_base_pfn(reg));
152 tend = min(end_pfn, memblock_region_memory_end_pfn(reg));
28be7072
BH
153 if (tstart >= tend)
154 continue;
155 ret = (*func)(tstart, tend - tstart, arg);
9d88a2eb
BP
156 if (ret)
157 break;
9d88a2eb
BP
158 }
159 return ret;
a99824f3 160}
908eedc6 161EXPORT_SYMBOL_GPL(walk_system_ram_range);
a99824f3 162
7c8c6b97
PM
163/*
164 * Initialize the bootmem system and give it all the memory we
165 * have available. If we are using highmem, we only put the
166 * lowmem into the bootmem system.
167 */
168#ifndef CONFIG_NEED_MULTIPLE_NODES
169void __init do_init_bootmem(void)
170{
7c8c6b97
PM
171 unsigned long start, bootmap_pages;
172 unsigned long total_pages;
28be7072 173 struct memblock_region *reg;
7c8c6b97
PM
174 int boot_mapsize;
175
95f72d1e
YL
176 max_low_pfn = max_pfn = memblock_end_of_DRAM() >> PAGE_SHIFT;
177 total_pages = (memblock_end_of_DRAM() - memstart_addr) >> PAGE_SHIFT;
7c8c6b97
PM
178#ifdef CONFIG_HIGHMEM
179 total_pages = total_lowmem >> PAGE_SHIFT;
d7917ba7 180 max_low_pfn = lowmem_end_addr >> PAGE_SHIFT;
7c8c6b97
PM
181#endif
182
183 /*
184 * Find an area to use for the bootmem bitmap. Calculate the size of
185 * bitmap required as (Total Memory) / PAGE_SIZE / BITS_PER_BYTE.
186 * Add 1 additional page in case the address isn't page-aligned.
187 */
188 bootmap_pages = bootmem_bootmap_pages(total_pages);
189
95f72d1e 190 start = memblock_alloc(bootmap_pages << PAGE_SHIFT, PAGE_SIZE);
7c8c6b97 191
37dd2bad
KG
192 min_low_pfn = MEMORY_START >> PAGE_SHIFT;
193 boot_mapsize = init_bootmem_node(NODE_DATA(0), start >> PAGE_SHIFT, min_low_pfn, max_low_pfn);
7c8c6b97 194
c67c3cb4 195 /* Add active regions with valid PFNs */
28be7072 196 for_each_memblock(memory, reg) {
c67c3cb4 197 unsigned long start_pfn, end_pfn;
c7fc2de0
YL
198 start_pfn = memblock_region_memory_base_pfn(reg);
199 end_pfn = memblock_region_memory_end_pfn(reg);
c67c3cb4
MG
200 add_active_range(0, start_pfn, end_pfn);
201 }
202
7c8c6b97
PM
203 /* Add all physical memory to the bootmem map, mark each area
204 * present.
205 */
7c8c6b97 206#ifdef CONFIG_HIGHMEM
d7917ba7 207 free_bootmem_with_active_regions(0, lowmem_end_addr >> PAGE_SHIFT);
f98eeb4e
KG
208
209 /* reserve the sections we're already using */
28be7072
BH
210 for_each_memblock(reserved, reg) {
211 unsigned long top = reg->base + reg->size - 1;
212 if (top < lowmem_end_addr)
213 reserve_bootmem(reg->base, reg->size, BOOTMEM_DEFAULT);
214 else if (reg->base < lowmem_end_addr) {
215 unsigned long trunc_size = lowmem_end_addr - reg->base;
216 reserve_bootmem(reg->base, trunc_size, BOOTMEM_DEFAULT);
f98eeb4e
KG
217 }
218 }
c67c3cb4
MG
219#else
220 free_bootmem_with_active_regions(0, max_pfn);
7c8c6b97
PM
221
222 /* reserve the sections we're already using */
28be7072
BH
223 for_each_memblock(reserved, reg)
224 reserve_bootmem(reg->base, reg->size, BOOTMEM_DEFAULT);
f98eeb4e 225#endif
7c8c6b97 226 /* XXX need to clip this if using highmem? */
c67c3cb4
MG
227 sparse_memory_present_with_active_regions(0);
228
7c8c6b97
PM
229 init_bootmem_done = 1;
230}
231
4e8ad3e8
JB
232/* mark pages that don't exist as nosave */
233static int __init mark_nonram_nosave(void)
234{
28be7072
BH
235 struct memblock_region *reg, *prev = NULL;
236
237 for_each_memblock(memory, reg) {
238 if (prev &&
c7fc2de0
YL
239 memblock_region_memory_end_pfn(prev) < memblock_region_memory_base_pfn(reg))
240 register_nosave_region(memblock_region_memory_end_pfn(prev),
241 memblock_region_memory_base_pfn(reg));
28be7072 242 prev = reg;
4e8ad3e8 243 }
4e8ad3e8
JB
244 return 0;
245}
246
7c8c6b97
PM
247/*
248 * paging_init() sets up the page tables - in fact we've already done this.
249 */
250void __init paging_init(void)
251{
95f72d1e
YL
252 unsigned long total_ram = memblock_phys_mem_size();
253 phys_addr_t top_of_ram = memblock_end_of_DRAM();
c67c3cb4 254 unsigned long max_zone_pfns[MAX_NR_ZONES];
7c8c6b97 255
2c419bde
KG
256#ifdef CONFIG_PPC32
257 unsigned long v = __fix_to_virt(__end_of_fixed_addresses - 1);
258 unsigned long end = __fix_to_virt(FIX_HOLE);
259
260 for (; v < end; v += PAGE_SIZE)
261 map_page(v, 0, 0); /* XXX gross */
262#endif
263
7c8c6b97
PM
264#ifdef CONFIG_HIGHMEM
265 map_page(PKMAP_BASE, 0, 0); /* XXX gross */
2c419bde
KG
266 pkmap_page_table = virt_to_kpte(PKMAP_BASE);
267
268 kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN));
7c8c6b97
PM
269 kmap_prot = PAGE_KERNEL;
270#endif /* CONFIG_HIGHMEM */
271
2bf3016f 272 printk(KERN_DEBUG "Top of RAM: 0x%llx, Total RAM: 0x%lx\n",
fb610635 273 (unsigned long long)top_of_ram, total_ram);
e110b281 274 printk(KERN_DEBUG "Memory hole size: %ldMB\n",
2bf3016f 275 (long int)((top_of_ram - total_ram) >> 20));
6391af17 276 memset(max_zone_pfns, 0, sizeof(max_zone_pfns));
7c8c6b97 277#ifdef CONFIG_HIGHMEM
d7917ba7 278 max_zone_pfns[ZONE_DMA] = lowmem_end_addr >> PAGE_SHIFT;
6391af17 279 max_zone_pfns[ZONE_HIGHMEM] = top_of_ram >> PAGE_SHIFT;
7c8c6b97 280#else
6391af17 281 max_zone_pfns[ZONE_DMA] = top_of_ram >> PAGE_SHIFT;
c67c3cb4
MG
282#endif
283 free_area_init_nodes(max_zone_pfns);
4e8ad3e8
JB
284
285 mark_nonram_nosave();
7c8c6b97
PM
286}
287#endif /* ! CONFIG_NEED_MULTIPLE_NODES */
288
289void __init mem_init(void)
290{
291#ifdef CONFIG_NEED_MULTIPLE_NODES
292 int nid;
293#endif
294 pg_data_t *pgdat;
295 unsigned long i;
296 struct page *page;
297 unsigned long reservedpages = 0, codesize, initsize, datasize, bsssize;
298
a9327296
FT
299#ifdef CONFIG_SWIOTLB
300 if (ppc_swiotlb_enable)
301 swiotlb_init(1);
302#endif
303
4734b594 304 num_physpages = memblock_phys_mem_size() >> PAGE_SHIFT;
7c8c6b97
PM
305 high_memory = (void *) __va(max_low_pfn * PAGE_SIZE);
306
307#ifdef CONFIG_NEED_MULTIPLE_NODES
308 for_each_online_node(nid) {
309 if (NODE_DATA(nid)->node_spanned_pages != 0) {
c258dd40 310 printk("freeing bootmem node %d\n", nid);
7c8c6b97
PM
311 totalram_pages +=
312 free_all_bootmem_node(NODE_DATA(nid));
313 }
314 }
315#else
fb6d73d3 316 max_mapnr = max_pfn;
7c8c6b97
PM
317 totalram_pages += free_all_bootmem();
318#endif
ec936fc5 319 for_each_online_pgdat(pgdat) {
7c8c6b97 320 for (i = 0; i < pgdat->node_spanned_pages; i++) {
fb6d73d3
PM
321 if (!pfn_valid(pgdat->node_start_pfn + i))
322 continue;
7c8c6b97
PM
323 page = pgdat_page_nr(pgdat, i);
324 if (PageReserved(page))
325 reservedpages++;
326 }
327 }
328
329 codesize = (unsigned long)&_sdata - (unsigned long)&_stext;
bcb35576 330 datasize = (unsigned long)&_edata - (unsigned long)&_sdata;
7c8c6b97
PM
331 initsize = (unsigned long)&__init_end - (unsigned long)&__init_begin;
332 bsssize = (unsigned long)&__bss_stop - (unsigned long)&__bss_start;
333
334#ifdef CONFIG_HIGHMEM
335 {
336 unsigned long pfn, highmem_mapnr;
337
d7917ba7 338 highmem_mapnr = lowmem_end_addr >> PAGE_SHIFT;
7c8c6b97 339 for (pfn = highmem_mapnr; pfn < max_mapnr; ++pfn) {
3d41e0f6 340 phys_addr_t paddr = (phys_addr_t)pfn << PAGE_SHIFT;
7c8c6b97 341 struct page *page = pfn_to_page(pfn);
3d41e0f6 342 if (memblock_is_reserved(paddr))
f98eeb4e 343 continue;
7c8c6b97 344 ClearPageReserved(page);
7835e98b 345 init_page_count(page);
7c8c6b97
PM
346 __free_page(page);
347 totalhigh_pages++;
f98eeb4e 348 reservedpages--;
7c8c6b97
PM
349 }
350 totalram_pages += totalhigh_pages;
e110b281 351 printk(KERN_DEBUG "High memory: %luk\n",
7c8c6b97
PM
352 totalhigh_pages << (PAGE_SHIFT-10));
353 }
354#endif /* CONFIG_HIGHMEM */
355
356 printk(KERN_INFO "Memory: %luk/%luk available (%luk kernel code, "
357 "%luk reserved, %luk data, %luk bss, %luk init)\n",
cc013a88 358 nr_free_pages() << (PAGE_SHIFT-10),
7c8c6b97
PM
359 num_physpages << (PAGE_SHIFT-10),
360 codesize >> 10,
361 reservedpages << (PAGE_SHIFT-10),
362 datasize >> 10,
363 bsssize >> 10,
364 initsize >> 10);
365
f637a49e
BH
366#ifdef CONFIG_PPC32
367 pr_info("Kernel virtual memory layout:\n");
368 pr_info(" * 0x%08lx..0x%08lx : fixmap\n", FIXADDR_START, FIXADDR_TOP);
369#ifdef CONFIG_HIGHMEM
370 pr_info(" * 0x%08lx..0x%08lx : highmem PTEs\n",
371 PKMAP_BASE, PKMAP_ADDR(LAST_PKMAP));
372#endif /* CONFIG_HIGHMEM */
8b31e49d
BH
373#ifdef CONFIG_NOT_COHERENT_CACHE
374 pr_info(" * 0x%08lx..0x%08lx : consistent mem\n",
375 IOREMAP_TOP, IOREMAP_TOP + CONFIG_CONSISTENT_SIZE);
376#endif /* CONFIG_NOT_COHERENT_CACHE */
f637a49e
BH
377 pr_info(" * 0x%08lx..0x%08lx : early ioremap\n",
378 ioremap_bot, IOREMAP_TOP);
379 pr_info(" * 0x%08lx..0x%08lx : vmalloc & ioremap\n",
380 VMALLOC_START, VMALLOC_END);
381#endif /* CONFIG_PPC32 */
382
7c8c6b97 383 mem_init_done = 1;
7c8c6b97
PM
384}
385
2773fcc8
DC
386void free_initmem(void)
387{
388 unsigned long addr;
389
390 ppc_md.progress = NULL;
391
392 addr = (unsigned long)__init_begin;
393 for (; addr < (unsigned long)__init_end; addr += PAGE_SIZE) {
394 memset((void *)addr, POISON_FREE_INITMEM, PAGE_SIZE);
395 ClearPageReserved(virt_to_page(addr));
396 init_page_count(virt_to_page(addr));
397 free_page(addr);
398 totalram_pages++;
399 }
400 pr_info("Freeing unused kernel memory: %luk freed\n",
401 ((unsigned long)__init_end -
402 (unsigned long)__init_begin) >> 10);
403}
404
307cfe71
BH
405#ifdef CONFIG_BLK_DEV_INITRD
406void __init free_initrd_mem(unsigned long start, unsigned long end)
407{
408 if (start >= end)
409 return;
410
411 start = _ALIGN_DOWN(start, PAGE_SIZE);
412 end = _ALIGN_UP(end, PAGE_SIZE);
413 pr_info("Freeing initrd memory: %ldk freed\n", (end - start) >> 10);
414
415 for (; start < end; start += PAGE_SIZE) {
416 ClearPageReserved(virt_to_page(start));
417 init_page_count(virt_to_page(start));
418 free_page(start);
419 totalram_pages++;
420 }
421}
422#endif
423
14cf11af
PM
424/*
425 * This is called when a page has been modified by the kernel.
426 * It just marks the page as not i-cache clean. We do the i-cache
427 * flush later when the page is given to a user process, if necessary.
428 */
429void flush_dcache_page(struct page *page)
430{
431 if (cpu_has_feature(CPU_FTR_COHERENT_ICACHE))
432 return;
433 /* avoid an atomic op if possible */
434 if (test_bit(PG_arch_1, &page->flags))
435 clear_bit(PG_arch_1, &page->flags);
436}
437EXPORT_SYMBOL(flush_dcache_page);
438
439void flush_dcache_icache_page(struct page *page)
440{
0895ecda
DG
441#ifdef CONFIG_HUGETLB_PAGE
442 if (PageCompound(page)) {
443 flush_dcache_icache_hugepage(page);
444 return;
445 }
446#endif
14cf11af 447#ifdef CONFIG_BOOKE
0895ecda
DG
448 {
449 void *start = kmap_atomic(page, KM_PPC_SYNC_ICACHE);
450 __flush_dcache_icache(start);
451 kunmap_atomic(start, KM_PPC_SYNC_ICACHE);
452 }
ab1f9dac 453#elif defined(CONFIG_8xx) || defined(CONFIG_PPC64)
14cf11af
PM
454 /* On 8xx there is no need to kmap since highmem is not supported */
455 __flush_dcache_icache(page_address(page));
456#else
457 __flush_dcache_icache_phys(page_to_pfn(page) << PAGE_SHIFT);
458#endif
14cf11af 459}
0895ecda 460
14cf11af
PM
/*
 * Zero the page mapped at kernel address @page, then run
 * flush_dcache_page() on its struct page @pg.  @vaddr is not used.
 */
void clear_user_page(void *page, unsigned long vaddr, struct page *pg)
{
	clear_page(page);

	/*
	 * The flush below should not be needed, but some versions of glibc
	 * require it (ld.so assumes zero filled pages are icache clean)
	 * - Anton
	 */
	flush_dcache_page(pg);
}
472EXPORT_SYMBOL(clear_user_page);
473
/*
 * Copy one page from @vfrom to @vto, then run flush_dcache_page() on the
 * destination's struct page @pg.  @vaddr is not used.
 */
void copy_user_page(void *vto, void *vfrom, unsigned long vaddr,
		    struct page *pg)
{
	copy_page(vto, vfrom);

	/*
	 * We should be able to skip the flush for anonymous, non-executable
	 * mappings (!vma->vm_file && !(vma->vm_flags & VM_EXEC)), however
	 * there are two problems with that optimisation.
	 * Firstly a bug in some versions of binutils meant PLT sections
	 * were not marked executable.
	 * Secondly the first word in the GOT section is blrl, used
	 * to establish the GOT address. Until recently the GOT was
	 * not marked executable.
	 * - Anton
	 */
	flush_dcache_page(pg);
}
496
497void flush_icache_user_range(struct vm_area_struct *vma, struct page *page,
498 unsigned long addr, int len)
499{
500 unsigned long maddr;
501
502 maddr = (unsigned long) kmap(page) + (addr & ~PAGE_MASK);
503 flush_icache_range(maddr, maddr + len);
504 kunmap(page);
505}
506EXPORT_SYMBOL(flush_icache_user_range);
507
508/*
509 * This is called at the end of handling a user page fault, when the
510 * fault has been handled by updating a PTE in the linux page tables.
511 * We use it to preload an HPTE into the hash table corresponding to
512 * the updated linux PTE.
513 *
01edcd89 514 * This must always be called with the pte lock held.
14cf11af
PM
515 */
516void update_mmu_cache(struct vm_area_struct *vma, unsigned long address,
4b3073e1 517 pte_t *ptep)
14cf11af 518{
3c726f8d
BH
519#ifdef CONFIG_PPC_STD_MMU
520 unsigned long access = 0, trap;
14cf11af 521
14cf11af 522 /* We only want HPTEs for linux PTEs that have _PAGE_ACCESSED set */
4b3073e1 523 if (!pte_young(*ptep) || address >= TASK_SIZE)
14cf11af 524 return;
14cf11af 525
3c726f8d
BH
526 /* We try to figure out if we are coming from an instruction
527 * access fault and pass that down to __hash_page so we avoid
528 * double-faulting on execution of fresh text. We have to test
529 * for regs NULL since init will get here first thing at boot
530 *
531 * We also avoid filling the hash if not coming from a fault
532 */
533 if (current->thread.regs == NULL)
14cf11af 534 return;
3c726f8d
BH
535 trap = TRAP(current->thread.regs);
536 if (trap == 0x400)
537 access |= _PAGE_EXEC;
538 else if (trap != 0x300)
539 return;
540 hash_preload(vma->vm_mm, address, access, trap);
541#endif /* CONFIG_PPC_STD_MMU */
14cf11af 542}