Commit | Line | Data |
---|---|---|
9b6b563c PM |
1 | /* |
2 | * Procedures for creating, accessing and interpreting the device tree. | |
3 | * | |
4 | * Paul Mackerras August 1996. | |
5 | * Copyright (C) 1996-2005 Paul Mackerras. | |
6 | * | |
7 | * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner. | |
8 | * {engebret|bergner}@us.ibm.com | |
9 | * | |
10 | * This program is free software; you can redistribute it and/or | |
11 | * modify it under the terms of the GNU General Public License | |
12 | * as published by the Free Software Foundation; either version | |
13 | * 2 of the License, or (at your option) any later version. | |
14 | */ | |
15 | ||
16 | #undef DEBUG | |
17 | ||
18 | #include <stdarg.h> | |
9b6b563c PM |
19 | #include <linux/kernel.h> |
20 | #include <linux/string.h> | |
21 | #include <linux/init.h> | |
22 | #include <linux/threads.h> | |
23 | #include <linux/spinlock.h> | |
24 | #include <linux/types.h> | |
25 | #include <linux/pci.h> | |
26 | #include <linux/stringify.h> | |
27 | #include <linux/delay.h> | |
28 | #include <linux/initrd.h> | |
29 | #include <linux/bitops.h> | |
30 | #include <linux/module.h> | |
dcee3036 | 31 | #include <linux/kexec.h> |
7a4571ae | 32 | #include <linux/debugfs.h> |
0ebfff14 | 33 | #include <linux/irq.h> |
95f72d1e | 34 | #include <linux/memblock.h> |
9b6b563c PM |
35 | |
36 | #include <asm/prom.h> | |
37 | #include <asm/rtas.h> | |
9b6b563c PM |
38 | #include <asm/page.h> |
39 | #include <asm/processor.h> | |
40 | #include <asm/irq.h> | |
41 | #include <asm/io.h> | |
0cc4746c | 42 | #include <asm/kdump.h> |
9b6b563c PM |
43 | #include <asm/smp.h> |
44 | #include <asm/system.h> | |
45 | #include <asm/mmu.h> | |
1426d5a3 | 46 | #include <asm/paca.h> |
9b6b563c PM |
47 | #include <asm/pgtable.h> |
48 | #include <asm/pci.h> | |
49 | #include <asm/iommu.h> | |
50 | #include <asm/btext.h> | |
51 | #include <asm/sections.h> | |
52 | #include <asm/machdep.h> | |
53 | #include <asm/pSeries_reconfig.h> | |
40ef8cbc | 54 | #include <asm/pci-bridge.h> |
6ac26c8a | 55 | #include <asm/phyp_dump.h> |
2babf5c2 | 56 | #include <asm/kexec.h> |
37dd2bad | 57 | #include <mm/mmu_decl.h> |
9b6b563c PM |
58 | |
59 | #ifdef DEBUG | |
60 | #define DBG(fmt...) printk(KERN_ERR fmt) | |
61 | #else | |
62 | #define DBG(fmt...) | |
63 | #endif | |
64 | ||
9b6b563c | 65 | #ifdef CONFIG_PPC64 |
28897731 | 66 | int __initdata iommu_is_off; |
9b6b563c | 67 | int __initdata iommu_force_on; |
cf00a8d1 | 68 | unsigned long tce_alloc_start, tce_alloc_end; |
cd3db0c4 | 69 | u64 ppc64_rma_size; |
9b6b563c | 70 | #endif |
03bf469a | 71 | static phys_addr_t first_memblock_size; |
7ac87abb | 72 | static int __initdata boot_cpu_count; |
9b6b563c | 73 | |
2babf5c2 ME |
74 | static int __init early_parse_mem(char *p) |
75 | { | |
76 | if (!p) | |
77 | return 1; | |
78 | ||
79 | memory_limit = PAGE_ALIGN(memparse(p, &p)); | |
49a84965 | 80 | DBG("memory limit = 0x%llx\n", (unsigned long long)memory_limit); |
2babf5c2 ME |
81 | |
82 | return 0; | |
83 | } | |
84 | early_param("mem", early_parse_mem); | |
85 | ||
307cfe71 BH |
86 | /* |
87 | * overlaps_initrd - check for overlap with page aligned extension of | |
88 | * initrd. | |
89 | */ | |
90 | static inline int overlaps_initrd(unsigned long start, unsigned long size) | |
91 | { | |
92 | #ifdef CONFIG_BLK_DEV_INITRD | |
93 | if (!initrd_start) | |
94 | return 0; | |
95 | ||
96 | return (start + size) > _ALIGN_DOWN(initrd_start, PAGE_SIZE) && | |
97 | start <= _ALIGN_UP(initrd_end, PAGE_SIZE); | |
98 | #else | |
99 | return 0; | |
100 | #endif | |
101 | } | |
102 | ||
3c607ce2 LV |
103 | /** |
104 | * move_device_tree - move tree to an unused area, if needed. | |
105 | * | |
106 | * The device tree may be allocated beyond our memory limit, or inside the | |
307cfe71 BH |
107 | * crash kernel region for kdump, or within the page aligned range of initrd. |
108 | * If so, move it out of the way. | |
2babf5c2 | 109 | */ |
18f032cb | 110 | static void __init move_device_tree(void) |
2babf5c2 ME |
111 | { |
112 | unsigned long start, size; | |
113 | void *p; | |
114 | ||
115 | DBG("-> move_device_tree\n"); | |
116 | ||
117 | start = __pa(initial_boot_params); | |
087f79c4 | 118 | size = be32_to_cpu(initial_boot_params->totalsize); |
2babf5c2 | 119 | |
6dd22700 | 120 | if ((memory_limit && (start + size) > PHYSICAL_START + memory_limit) || |
307cfe71 BH |
121 | overlaps_crashkernel(start, size) || |
122 | overlaps_initrd(start, size)) { | |
e63075a3 | 123 | p = __va(memblock_alloc(size, PAGE_SIZE)); |
2babf5c2 ME |
124 | memcpy(p, initial_boot_params, size); |
125 | initial_boot_params = (struct boot_param_header *)p; | |
126 | DBG("Moved device tree to 0x%p\n", p); | |
127 | } | |
128 | ||
129 | DBG("<- move_device_tree\n"); | |
130 | } | |
9b6b563c | 131 | |
d205819e PM |
132 | /* |
133 | * ibm,pa-features is a per-cpu property that contains a string of | |
134 | * attribute descriptors, each of which has a 2 byte header plus up | |
135 | * to 254 bytes worth of processor attribute bits. First header | |
136 | * byte specifies the number of bytes following the header. | |
137 | * Second header byte is an "attribute-specifier" type, of which | |
138 | * zero is the only currently-defined value. | |
139 | * Implementation: Pass in the byte and bit offset for the feature | |
140 | * that we are interested in. The function will return -1 if the | |
141 | * pa-features property is missing, or a 1/0 to indicate if the feature | |
142 | * is supported/not supported. Note that the bit numbers are | |
143 | * big-endian to match the definition in PAPR. | |
144 | */ | |
145 | static struct ibm_pa_feature { | |
146 | unsigned long cpu_features; /* CPU_FTR_xxx bit */ | |
44ae3ab3 | 147 | unsigned long mmu_features; /* MMU_FTR_xxx bit */ |
d205819e PM |
148 | unsigned int cpu_user_ftrs; /* PPC_FEATURE_xxx bit */ |
149 | unsigned char pabyte; /* byte number in ibm,pa-features */ | |
150 | unsigned char pabit; /* bit number (big-endian) */ | |
151 | unsigned char invert; /* if 1, pa bit set => clear feature */ | |
152 | } ibm_pa_features[] __initdata = { | |
44ae3ab3 ME |
153 | {0, 0, PPC_FEATURE_HAS_MMU, 0, 0, 0}, |
154 | {0, 0, PPC_FEATURE_HAS_FPU, 0, 1, 0}, | |
155 | {0, MMU_FTR_SLB, 0, 0, 2, 0}, | |
156 | {CPU_FTR_CTRL, 0, 0, 0, 3, 0}, | |
157 | {CPU_FTR_NOEXECUTE, 0, 0, 0, 6, 0}, | |
158 | {CPU_FTR_NODSISRALIGN, 0, 0, 1, 1, 1}, | |
159 | {0, MMU_FTR_CI_LARGE_PAGE, 0, 1, 2, 0}, | |
339d76c5 | 160 | {CPU_FTR_REAL_LE, PPC_FEATURE_TRUE_LE, 5, 0, 0}, |
d205819e PM |
161 | }; |
162 | ||
974a76f5 PM |
163 | static void __init scan_features(unsigned long node, unsigned char *ftrs, |
164 | unsigned long tablelen, | |
165 | struct ibm_pa_feature *fp, | |
166 | unsigned long ft_size) | |
d205819e | 167 | { |
974a76f5 | 168 | unsigned long i, len, bit; |
d205819e PM |
169 | |
170 | /* find descriptor with type == 0 */ | |
171 | for (;;) { | |
172 | if (tablelen < 3) | |
173 | return; | |
974a76f5 | 174 | len = 2 + ftrs[0]; |
d205819e PM |
175 | if (tablelen < len) |
176 | return; /* descriptor 0 not found */ | |
974a76f5 | 177 | if (ftrs[1] == 0) |
d205819e PM |
178 | break; |
179 | tablelen -= len; | |
974a76f5 | 180 | ftrs += len; |
d205819e PM |
181 | } |
182 | ||
183 | /* loop over bits we know about */ | |
974a76f5 PM |
184 | for (i = 0; i < ft_size; ++i, ++fp) { |
185 | if (fp->pabyte >= ftrs[0]) | |
d205819e | 186 | continue; |
974a76f5 | 187 | bit = (ftrs[2 + fp->pabyte] >> (7 - fp->pabit)) & 1; |
d205819e PM |
188 | if (bit ^ fp->invert) { |
189 | cur_cpu_spec->cpu_features |= fp->cpu_features; | |
190 | cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftrs; | |
44ae3ab3 | 191 | cur_cpu_spec->mmu_features |= fp->mmu_features; |
d205819e PM |
192 | } else { |
193 | cur_cpu_spec->cpu_features &= ~fp->cpu_features; | |
194 | cur_cpu_spec->cpu_user_features &= ~fp->cpu_user_ftrs; | |
44ae3ab3 | 195 | cur_cpu_spec->mmu_features &= ~fp->mmu_features; |
d205819e PM |
196 | } |
197 | } | |
198 | } | |
199 | ||
974a76f5 PM |
200 | static void __init check_cpu_pa_features(unsigned long node) |
201 | { | |
202 | unsigned char *pa_ftrs; | |
203 | unsigned long tablelen; | |
204 | ||
205 | pa_ftrs = of_get_flat_dt_prop(node, "ibm,pa-features", &tablelen); | |
206 | if (pa_ftrs == NULL) | |
207 | return; | |
208 | ||
209 | scan_features(node, pa_ftrs, tablelen, | |
210 | ibm_pa_features, ARRAY_SIZE(ibm_pa_features)); | |
211 | } | |
212 | ||
94491685 | 213 | #ifdef CONFIG_PPC_STD_MMU_64 |
584f8b71 MN |
214 | static void __init check_cpu_slb_size(unsigned long node) |
215 | { | |
216 | u32 *slb_size_ptr; | |
217 | ||
b60c31d8 MN |
218 | slb_size_ptr = of_get_flat_dt_prop(node, "slb-size", NULL); |
219 | if (slb_size_ptr != NULL) { | |
220 | mmu_slb_size = *slb_size_ptr; | |
221 | return; | |
222 | } | |
584f8b71 MN |
223 | slb_size_ptr = of_get_flat_dt_prop(node, "ibm,slb-size", NULL); |
224 | if (slb_size_ptr != NULL) { | |
225 | mmu_slb_size = *slb_size_ptr; | |
226 | } | |
227 | } | |
228 | #else | |
229 | #define check_cpu_slb_size(node) do { } while(0) | |
230 | #endif | |
231 | ||
974a76f5 PM |
232 | static struct feature_property { |
233 | const char *name; | |
234 | u32 min_value; | |
235 | unsigned long cpu_feature; | |
236 | unsigned long cpu_user_ftr; | |
237 | } feature_properties[] __initdata = { | |
238 | #ifdef CONFIG_ALTIVEC | |
239 | {"altivec", 0, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC}, | |
240 | {"ibm,vmx", 1, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC}, | |
241 | #endif /* CONFIG_ALTIVEC */ | |
b962ce9d MN |
242 | #ifdef CONFIG_VSX |
243 | /* Yes, this _really_ is ibm,vmx == 2 to enable VSX */ | |
244 | {"ibm,vmx", 2, CPU_FTR_VSX, PPC_FEATURE_HAS_VSX}, | |
245 | #endif /* CONFIG_VSX */ | |
974a76f5 PM |
246 | #ifdef CONFIG_PPC64 |
247 | {"ibm,dfp", 1, 0, PPC_FEATURE_HAS_DFP}, | |
248 | {"ibm,purr", 1, CPU_FTR_PURR, 0}, | |
249 | {"ibm,spurr", 1, CPU_FTR_SPURR, 0}, | |
250 | #endif /* CONFIG_PPC64 */ | |
251 | }; | |
252 | ||
14b3d926 VB |
253 | #if defined(CONFIG_44x) && defined(CONFIG_PPC_FPU) |
254 | static inline void identical_pvr_fixup(unsigned long node) | |
255 | { | |
256 | unsigned int pvr; | |
257 | char *model = of_get_flat_dt_prop(node, "model", NULL); | |
258 | ||
259 | /* | |
260 | * Since 440GR(x)/440EP(x) processors have the same pvr, | |
261 | * we check the node path and set bit 28 in the cur_cpu_spec | |
262 | * pvr for EP(x) processor version. This bit is always 0 in | |
263 | * the "real" pvr. Then we call identify_cpu again with | |
264 | * the new logical pvr to enable FPU support. | |
265 | */ | |
266 | if (model && strstr(model, "440EP")) { | |
267 | pvr = cur_cpu_spec->pvr_value | 0x8; | |
268 | identify_cpu(0, pvr); | |
269 | DBG("Using logical pvr %x for %s\n", pvr, model); | |
270 | } | |
271 | } | |
272 | #else | |
273 | #define identical_pvr_fixup(node) do { } while(0) | |
274 | #endif | |
275 | ||
974a76f5 PM |
276 | static void __init check_cpu_feature_properties(unsigned long node) |
277 | { | |
278 | unsigned long i; | |
279 | struct feature_property *fp = feature_properties; | |
280 | const u32 *prop; | |
281 | ||
282 | for (i = 0; i < ARRAY_SIZE(feature_properties); ++i, ++fp) { | |
283 | prop = of_get_flat_dt_prop(node, fp->name, NULL); | |
284 | if (prop && *prop >= fp->min_value) { | |
285 | cur_cpu_spec->cpu_features |= fp->cpu_feature; | |
286 | cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftr; | |
287 | } | |
288 | } | |
289 | } | |
290 | ||
9b6b563c | 291 | static int __init early_init_dt_scan_cpus(unsigned long node, |
4df20460 AB |
292 | const char *uname, int depth, |
293 | void *data) | |
9b6b563c | 294 | { |
4df20460 | 295 | char *type = of_get_flat_dt_prop(node, "device_type", NULL); |
974a76f5 PM |
296 | const u32 *prop; |
297 | const u32 *intserv; | |
4df20460 AB |
298 | int i, nthreads; |
299 | unsigned long len; | |
9d07bc84 | 300 | int found = -1; |
208b3a4c | 301 | int found_thread = 0; |
9b6b563c PM |
302 | |
303 | /* We are scanning "cpu" nodes only */ | |
304 | if (type == NULL || strcmp(type, "cpu") != 0) | |
305 | return 0; | |
306 | ||
4df20460 AB |
307 | /* Get physical cpuid */ |
308 | intserv = of_get_flat_dt_prop(node, "ibm,ppc-interrupt-server#s", &len); | |
309 | if (intserv) { | |
310 | nthreads = len / sizeof(int); | |
9b6b563c | 311 | } else { |
4df20460 AB |
312 | intserv = of_get_flat_dt_prop(node, "reg", NULL); |
313 | nthreads = 1; | |
314 | } | |
315 | ||
316 | /* | |
317 | * Now see if any of these threads match our boot cpu. | |
318 | * NOTE: This must match the parsing done in smp_setup_cpu_maps. | |
319 | */ | |
320 | for (i = 0; i < nthreads; i++) { | |
321 | /* | |
322 | * version 2 of the kexec param format adds the phys cpuid of | |
323 | * booted proc. | |
324 | */ | |
208b3a4c BH |
325 | if (initial_boot_params->version >= 2) { |
326 | if (intserv[i] == initial_boot_params->boot_cpuid_phys) { | |
9d07bc84 | 327 | found = boot_cpu_count; |
208b3a4c BH |
328 | found_thread = i; |
329 | } | |
4df20460 AB |
330 | } else { |
331 | /* | |
332 | * Check if it's the boot-cpu, set it's hw index now, | |
333 | * unfortunately this format did not support booting | |
334 | * off secondary threads. | |
335 | */ | |
336 | if (of_get_flat_dt_prop(node, | |
9d07bc84 BH |
337 | "linux,boot-cpu", NULL) != NULL) |
338 | found = boot_cpu_count; | |
9b6b563c | 339 | } |
4df20460 AB |
340 | #ifdef CONFIG_SMP |
341 | /* logical cpu id is always 0 on UP kernels */ | |
9d07bc84 | 342 | boot_cpu_count++; |
4df20460 AB |
343 | #endif |
344 | } | |
345 | ||
9d07bc84 BH |
346 | if (found >= 0) { |
347 | DBG("boot cpu: logical %d physical %d\n", found, | |
208b3a4c | 348 | intserv[found_thread]); |
9d07bc84 | 349 | boot_cpuid = found; |
208b3a4c | 350 | set_hard_smp_processor_id(found, intserv[found_thread]); |
9b6b563c | 351 | |
974a76f5 PM |
352 | /* |
353 | * PAPR defines "logical" PVR values for cpus that | |
354 | * meet various levels of the architecture: | |
355 | * 0x0f000001 Architecture version 2.04 | |
356 | * 0x0f000002 Architecture version 2.05 | |
357 | * If the cpu-version property in the cpu node contains | |
358 | * such a value, we call identify_cpu again with the | |
359 | * logical PVR value in order to use the cpu feature | |
360 | * bits appropriate for the architecture level. | |
361 | * | |
362 | * A POWER6 partition in "POWER6 architected" mode | |
363 | * uses the 0x0f000002 PVR value; in POWER5+ mode | |
364 | * it uses 0x0f000001. | |
365 | */ | |
366 | prop = of_get_flat_dt_prop(node, "cpu-version", NULL); | |
367 | if (prop && (*prop & 0xff000000) == 0x0f000000) | |
368 | identify_cpu(0, *prop); | |
14b3d926 VB |
369 | |
370 | identical_pvr_fixup(node); | |
9b6b563c | 371 | } |
9b6b563c | 372 | |
974a76f5 | 373 | check_cpu_feature_properties(node); |
d205819e | 374 | check_cpu_pa_features(node); |
584f8b71 | 375 | check_cpu_slb_size(node); |
d205819e | 376 | |
9b6b563c | 377 | #ifdef CONFIG_PPC_PSERIES |
4df20460 | 378 | if (nthreads > 1) |
9b6b563c | 379 | cur_cpu_spec->cpu_features |= CPU_FTR_SMT; |
4df20460 AB |
380 | else |
381 | cur_cpu_spec->cpu_features &= ~CPU_FTR_SMT; | |
9b6b563c PM |
382 | #endif |
383 | ||
384 | return 0; | |
385 | } | |
386 | ||
32c97689 GL |
387 | int __init early_init_dt_scan_chosen_ppc(unsigned long node, const char *uname, |
388 | int depth, void *data) | |
9b6b563c | 389 | { |
9b6b563c | 390 | unsigned long *lprop; |
9b6b563c | 391 | |
32c97689 GL |
392 | /* Use common scan routine to determine if this is the chosen node */ |
393 | if (early_init_dt_scan_chosen(node, uname, depth, data) == 0) | |
394 | return 0; | |
395 | ||
9b6b563c PM |
396 | #ifdef CONFIG_PPC64 |
397 | /* check if iommu is forced on or off */ | |
3c726f8d | 398 | if (of_get_flat_dt_prop(node, "linux,iommu-off", NULL) != NULL) |
9b6b563c | 399 | iommu_is_off = 1; |
3c726f8d | 400 | if (of_get_flat_dt_prop(node, "linux,iommu-force-on", NULL) != NULL) |
9b6b563c PM |
401 | iommu_force_on = 1; |
402 | #endif | |
403 | ||
2babf5c2 | 404 | /* mem=x on the command line is the preferred mechanism */ |
86e03221 GL |
405 | lprop = of_get_flat_dt_prop(node, "linux,memory-limit", NULL); |
406 | if (lprop) | |
407 | memory_limit = *lprop; | |
9b6b563c PM |
408 | |
409 | #ifdef CONFIG_PPC64 | |
86e03221 GL |
410 | lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-start", NULL); |
411 | if (lprop) | |
412 | tce_alloc_start = *lprop; | |
413 | lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-end", NULL); | |
414 | if (lprop) | |
415 | tce_alloc_end = *lprop; | |
9b6b563c PM |
416 | #endif |
417 | ||
dcee3036 | 418 | #ifdef CONFIG_KEXEC |
63277161 | 419 | lprop = of_get_flat_dt_prop(node, "linux,crashkernel-base", NULL); |
70c6cc37 LV |
420 | if (lprop) |
421 | crashk_res.start = *lprop; | |
dcee3036 | 422 | |
63277161 | 423 | lprop = of_get_flat_dt_prop(node, "linux,crashkernel-size", NULL); |
70c6cc37 LV |
424 | if (lprop) |
425 | crashk_res.end = crashk_res.start + *lprop - 1; | |
dcee3036 | 426 | #endif |
32c97689 GL |
427 | |
428 | /* break now */ | |
429 | return 1; | |
9b6b563c PM |
430 | } |
431 | ||
0204568a PM |
432 | #ifdef CONFIG_PPC_PSERIES |
433 | /* | |
434 | * Interpret the ibm,dynamic-memory property in the | |
435 | * /ibm,dynamic-reconfiguration-memory node. | |
436 | * This contains a list of memory blocks along with NUMA affinity | |
437 | * information. | |
438 | */ | |
439 | static int __init early_init_dt_scan_drconf_memory(unsigned long node) | |
440 | { | |
0f0b56c3 | 441 | __be32 *dm, *ls, *usm; |
abe76885 | 442 | unsigned long l, n, flags; |
95f72d1e | 443 | u64 base, size, memblock_size; |
cf00085d | 444 | unsigned int is_kexec_kdump = 0, rngs; |
0204568a | 445 | |
3fdfd990 | 446 | ls = of_get_flat_dt_prop(node, "ibm,lmb-size", &l); |
0f0b56c3 | 447 | if (ls == NULL || l < dt_root_size_cells * sizeof(__be32)) |
0204568a | 448 | return 0; |
95f72d1e | 449 | memblock_size = dt_mem_next_cell(dt_root_size_cells, &ls); |
0204568a | 450 | |
63277161 | 451 | dm = of_get_flat_dt_prop(node, "ibm,dynamic-memory", &l); |
0f0b56c3 | 452 | if (dm == NULL || l < sizeof(__be32)) |
0204568a PM |
453 | return 0; |
454 | ||
455 | n = *dm++; /* number of entries */ | |
0f0b56c3 | 456 | if (l < (n * (dt_root_addr_cells + 4) + 1) * sizeof(__be32)) |
0204568a PM |
457 | return 0; |
458 | ||
cf00085d | 459 | /* check if this is a kexec/kdump kernel. */ |
63277161 | 460 | usm = of_get_flat_dt_prop(node, "linux,drconf-usable-memory", |
cf00085d C |
461 | &l); |
462 | if (usm != NULL) | |
463 | is_kexec_kdump = 1; | |
464 | ||
0204568a PM |
465 | for (; n != 0; --n) { |
466 | base = dt_mem_next_cell(dt_root_addr_cells, &dm); | |
467 | flags = dm[3]; | |
468 | /* skip DRC index, pad, assoc. list index, flags */ | |
469 | dm += 4; | |
470 | /* skip this block if the reserved bit is set in flags (0x80) | |
471 | or if the block is not assigned to this partition (0x8) */ | |
472 | if ((flags & 0x80) || !(flags & 0x8)) | |
473 | continue; | |
95f72d1e | 474 | size = memblock_size; |
cf00085d C |
475 | rngs = 1; |
476 | if (is_kexec_kdump) { | |
477 | /* | |
95f72d1e | 478 | * For each memblock in ibm,dynamic-memory, a corresponding |
cf00085d C |
479 | * entry in linux,drconf-usable-memory property contains |
480 | * a counter 'p' followed by 'p' (base, size) duple. | |
481 | * Now read the counter from | |
482 | * linux,drconf-usable-memory property | |
483 | */ | |
484 | rngs = dt_mem_next_cell(dt_root_size_cells, &usm); | |
485 | if (!rngs) /* there are no (base, size) duple */ | |
0204568a | 486 | continue; |
0204568a | 487 | } |
cf00085d C |
488 | do { |
489 | if (is_kexec_kdump) { | |
490 | base = dt_mem_next_cell(dt_root_addr_cells, | |
491 | &usm); | |
492 | size = dt_mem_next_cell(dt_root_size_cells, | |
493 | &usm); | |
494 | } | |
495 | if (iommu_is_off) { | |
496 | if (base >= 0x80000000ul) | |
497 | continue; | |
498 | if ((base + size) > 0x80000000ul) | |
499 | size = 0x80000000ul - base; | |
500 | } | |
95f72d1e | 501 | memblock_add(base, size); |
cf00085d | 502 | } while (--rngs); |
0204568a | 503 | } |
95f72d1e | 504 | memblock_dump_all(); |
0204568a PM |
505 | return 0; |
506 | } | |
507 | #else | |
508 | #define early_init_dt_scan_drconf_memory(node) 0 | |
509 | #endif /* CONFIG_PPC_PSERIES */ | |
9b6b563c | 510 | |
51975db0 GL |
511 | static int __init early_init_dt_scan_memory_ppc(unsigned long node, |
512 | const char *uname, | |
513 | int depth, void *data) | |
9b6b563c | 514 | { |
0204568a PM |
515 | if (depth == 1 && |
516 | strcmp(uname, "ibm,dynamic-reconfiguration-memory") == 0) | |
517 | return early_init_dt_scan_drconf_memory(node); | |
51975db0 GL |
518 | |
519 | return early_init_dt_scan_memory(node, uname, depth, data); | |
520 | } | |
0204568a | 521 | |
51975db0 GL |
522 | void __init early_init_dt_add_memory_arch(u64 base, u64 size) |
523 | { | |
cd3db0c4 | 524 | #ifdef CONFIG_PPC64 |
51975db0 GL |
525 | if (iommu_is_off) { |
526 | if (base >= 0x80000000ul) | |
527 | return; | |
528 | if ((base + size) > 0x80000000ul) | |
529 | size = 0x80000000ul - base; | |
530 | } | |
9b6b563c | 531 | #endif |
03bf469a BH |
532 | /* Keep track of the beginning of memory -and- the size of |
533 | * the very first block in the device-tree as it represents | |
534 | * the RMA on ppc64 server | |
535 | */ | |
536 | if (base < memstart_addr) { | |
537 | memstart_addr = base; | |
538 | first_memblock_size = size; | |
539 | } | |
cd3db0c4 BH |
540 | |
541 | /* Add the chunk to the MEMBLOCK list */ | |
542 | memblock_add(base, size); | |
9b6b563c PM |
543 | } |
544 | ||
672c5446 | 545 | void * __init early_init_dt_alloc_memory_arch(u64 size, u64 align) |
4ef7b373 | 546 | { |
672c5446 | 547 | return __va(memblock_alloc(size, align)); |
4ef7b373 JK |
548 | } |
549 | ||
1406bc2f JK |
550 | #ifdef CONFIG_BLK_DEV_INITRD |
551 | void __init early_init_dt_setup_initrd_arch(unsigned long start, | |
552 | unsigned long end) | |
553 | { | |
554 | initrd_start = (unsigned long)__va(start); | |
555 | initrd_end = (unsigned long)__va(end); | |
556 | initrd_below_start_ok = 1; | |
557 | } | |
558 | #endif | |
559 | ||
9b6b563c PM |
560 | static void __init early_reserve_mem(void) |
561 | { | |
cbbcf340 KG |
562 | u64 base, size; |
563 | u64 *reserve_map; | |
8a300887 JL |
564 | unsigned long self_base; |
565 | unsigned long self_size; | |
9b6b563c | 566 | |
cbbcf340 | 567 | reserve_map = (u64 *)(((unsigned long)initial_boot_params) + |
9b6b563c | 568 | initial_boot_params->off_mem_rsvmap); |
4d1f3f25 JX |
569 | |
570 | /* before we do anything, lets reserve the dt blob */ | |
8a300887 JL |
571 | self_base = __pa((unsigned long)initial_boot_params); |
572 | self_size = initial_boot_params->totalsize; | |
95f72d1e | 573 | memblock_reserve(self_base, self_size); |
4d1f3f25 | 574 | |
30437b3e DG |
575 | #ifdef CONFIG_BLK_DEV_INITRD |
576 | /* then reserve the initrd, if any */ | |
577 | if (initrd_start && (initrd_end > initrd_start)) | |
307cfe71 BH |
578 | memblock_reserve(_ALIGN_DOWN(__pa(initrd_start), PAGE_SIZE), |
579 | _ALIGN_UP(initrd_end, PAGE_SIZE) - | |
580 | _ALIGN_DOWN(initrd_start, PAGE_SIZE)); | |
30437b3e DG |
581 | #endif /* CONFIG_BLK_DEV_INITRD */ |
582 | ||
cbbcf340 KG |
583 | #ifdef CONFIG_PPC32 |
584 | /* | |
585 | * Handle the case where we might be booting from an old kexec | |
586 | * image that setup the mem_rsvmap as pairs of 32-bit values | |
587 | */ | |
588 | if (*reserve_map > 0xffffffffull) { | |
589 | u32 base_32, size_32; | |
590 | u32 *reserve_map_32 = (u32 *)reserve_map; | |
591 | ||
592 | while (1) { | |
593 | base_32 = *(reserve_map_32++); | |
594 | size_32 = *(reserve_map_32++); | |
595 | if (size_32 == 0) | |
596 | break; | |
8a300887 JL |
597 | /* skip if the reservation is for the blob */ |
598 | if (base_32 == self_base && size_32 == self_size) | |
599 | continue; | |
329dda08 | 600 | DBG("reserving: %x -> %x\n", base_32, size_32); |
95f72d1e | 601 | memblock_reserve(base_32, size_32); |
cbbcf340 KG |
602 | } |
603 | return; | |
604 | } | |
605 | #endif | |
9b6b563c PM |
606 | while (1) { |
607 | base = *(reserve_map++); | |
608 | size = *(reserve_map++); | |
609 | if (size == 0) | |
610 | break; | |
cbbcf340 | 611 | DBG("reserving: %llx -> %llx\n", base, size); |
95f72d1e | 612 | memblock_reserve(base, size); |
9b6b563c | 613 | } |
9b6b563c PM |
614 | } |
615 | ||
6ac26c8a | 616 | #ifdef CONFIG_PHYP_DUMP |
37ddd5d0 MA |
617 | /** |
618 | * phyp_dump_calculate_reserve_size() - reserve variable boot area 5% or arg | |
619 | * | |
620 | * Function to find the largest size we need to reserve | |
621 | * during early boot process. | |
622 | * | |
623 | * It either looks for boot param and returns that OR | |
624 | * returns larger of 256 or 5% rounded down to multiples of 256MB. | |
625 | * | |
626 | */ | |
627 | static inline unsigned long phyp_dump_calculate_reserve_size(void) | |
628 | { | |
629 | unsigned long tmp; | |
630 | ||
631 | if (phyp_dump_info->reserve_bootvar) | |
632 | return phyp_dump_info->reserve_bootvar; | |
633 | ||
634 | /* divide by 20 to get 5% of value */ | |
95f72d1e | 635 | tmp = memblock_end_of_DRAM(); |
37ddd5d0 MA |
636 | do_div(tmp, 20); |
637 | ||
638 | /* round it down in multiples of 256 */ | |
639 | tmp = tmp & ~0x0FFFFFFFUL; | |
640 | ||
641 | return (tmp > PHYP_DUMP_RMR_END ? tmp : PHYP_DUMP_RMR_END); | |
642 | } | |
643 | ||
6ac26c8a MA |
644 | /** |
645 | * phyp_dump_reserve_mem() - reserve all not-yet-dumped mmemory | |
646 | * | |
647 | * This routine may reserve memory regions in the kernel only | |
648 | * if the system is supported and a dump was taken in last | |
649 | * boot instance or if the hardware is supported and the | |
650 | * scratch area needs to be setup. In other instances it returns | |
651 | * without reserving anything. The memory in case of dump being | |
652 | * active is freed when the dump is collected (by userland tools). | |
653 | */ | |
654 | static void __init phyp_dump_reserve_mem(void) | |
655 | { | |
656 | unsigned long base, size; | |
37ddd5d0 MA |
657 | unsigned long variable_reserve_size; |
658 | ||
6ac26c8a MA |
659 | if (!phyp_dump_info->phyp_dump_configured) { |
660 | printk(KERN_ERR "Phyp-dump not supported on this hardware\n"); | |
661 | return; | |
662 | } | |
663 | ||
654f596d MA |
664 | if (!phyp_dump_info->phyp_dump_at_boot) { |
665 | printk(KERN_INFO "Phyp-dump disabled at boot time\n"); | |
666 | return; | |
667 | } | |
668 | ||
37ddd5d0 MA |
669 | variable_reserve_size = phyp_dump_calculate_reserve_size(); |
670 | ||
6ac26c8a MA |
671 | if (phyp_dump_info->phyp_dump_is_active) { |
672 | /* Reserve *everything* above RMR.Area freed by userland tools*/ | |
37ddd5d0 | 673 | base = variable_reserve_size; |
95f72d1e | 674 | size = memblock_end_of_DRAM() - base; |
6ac26c8a MA |
675 | |
676 | /* XXX crashed_ram_end is wrong, since it may be beyond | |
677 | * the memory_limit, it will need to be adjusted. */ | |
95f72d1e | 678 | memblock_reserve(base, size); |
6ac26c8a MA |
679 | |
680 | phyp_dump_info->init_reserve_start = base; | |
681 | phyp_dump_info->init_reserve_size = size; | |
682 | } else { | |
683 | size = phyp_dump_info->cpu_state_size + | |
684 | phyp_dump_info->hpte_region_size + | |
37ddd5d0 | 685 | variable_reserve_size; |
95f72d1e YL |
686 | base = memblock_end_of_DRAM() - size; |
687 | memblock_reserve(base, size); | |
6ac26c8a MA |
688 | phyp_dump_info->init_reserve_start = base; |
689 | phyp_dump_info->init_reserve_size = size; | |
690 | } | |
691 | } | |
692 | #else | |
693 | static inline void __init phyp_dump_reserve_mem(void) {} | |
694 | #endif /* CONFIG_PHYP_DUMP && CONFIG_PPC_RTAS */ | |
695 | ||
9b6b563c PM |
696 | void __init early_init_devtree(void *params) |
697 | { | |
49a84965 | 698 | phys_addr_t limit; |
6ca4f749 | 699 | |
44348105 | 700 | DBG(" -> early_init_devtree(%p)\n", params); |
9b6b563c PM |
701 | |
702 | /* Setup flat device-tree pointer */ | |
703 | initial_boot_params = params; | |
704 | ||
458148c0 ME |
705 | #ifdef CONFIG_PPC_RTAS |
706 | /* Some machines might need RTAS info for debugging, grab it now. */ | |
707 | of_scan_flat_dt(early_init_dt_scan_rtas, NULL); | |
708 | #endif | |
709 | ||
6ac26c8a | 710 | #ifdef CONFIG_PHYP_DUMP |
25985edc | 711 | /* scan tree to see if dump occurred during last boot */ |
6ac26c8a MA |
712 | of_scan_flat_dt(early_init_dt_scan_phyp_dump, NULL); |
713 | #endif | |
714 | ||
817c21ad BH |
715 | /* Pre-initialize the cmd_line with the content of boot_commmand_line, |
716 | * which will be empty except when the content of the variable has | |
717 | * been overriden by a bootloading mechanism. This happens typically | |
718 | * with HAL takeover | |
719 | */ | |
720 | strlcpy(cmd_line, boot_command_line, COMMAND_LINE_SIZE); | |
721 | ||
9b6b563c PM |
722 | /* Retrieve various informations from the /chosen node of the |
723 | * device-tree, including the platform type, initrd location and | |
724 | * size, TCE reserve, and more ... | |
725 | */ | |
85f60ae4 | 726 | of_scan_flat_dt(early_init_dt_scan_chosen_ppc, cmd_line); |
9b6b563c | 727 | |
95f72d1e YL |
728 | /* Scan memory nodes and rebuild MEMBLOCKs */ |
729 | memblock_init(); | |
e63075a3 | 730 | |
3c726f8d | 731 | of_scan_flat_dt(early_init_dt_scan_root, NULL); |
51975db0 | 732 | of_scan_flat_dt(early_init_dt_scan_memory_ppc, NULL); |
03bf469a | 733 | setup_initial_memory_limit(memstart_addr, first_memblock_size); |
846f77b0 ME |
734 | |
735 | /* Save command line for /proc/cmdline and then parse parameters */ | |
b8757b21 | 736 | strlcpy(boot_command_line, cmd_line, COMMAND_LINE_SIZE); |
846f77b0 ME |
737 | parse_early_param(); |
738 | ||
95f72d1e YL |
739 | /* Reserve MEMBLOCK regions used by kernel, initrd, dt, etc... */ |
740 | memblock_reserve(PHYSICAL_START, __pa(klimit) - PHYSICAL_START); | |
549e8152 PM |
741 | /* If relocatable, reserve first 32k for interrupt vectors etc. */ |
742 | if (PHYSICAL_START > MEMORY_START) | |
95f72d1e | 743 | memblock_reserve(MEMORY_START, 0x8000); |
47310413 | 744 | reserve_kdump_trampoline(); |
35dd5432 | 745 | reserve_crashkernel(); |
9b6b563c | 746 | early_reserve_mem(); |
6ac26c8a | 747 | phyp_dump_reserve_mem(); |
9b6b563c | 748 | |
6ca4f749 HB |
749 | limit = memory_limit; |
750 | if (! limit) { | |
49a84965 | 751 | phys_addr_t memsize; |
6ca4f749 HB |
752 | |
753 | /* Ensure that total memory size is page-aligned, because | |
754 | * otherwise mark_bootmem() gets upset. */ | |
95f72d1e YL |
755 | memblock_analyze(); |
756 | memsize = memblock_phys_mem_size(); | |
6ca4f749 HB |
757 | if ((memsize & PAGE_MASK) != memsize) |
758 | limit = memsize & PAGE_MASK; | |
759 | } | |
95f72d1e | 760 | memblock_enforce_memory_limit(limit); |
6ca4f749 | 761 | |
95f72d1e YL |
762 | memblock_analyze(); |
763 | memblock_dump_all(); | |
2babf5c2 | 764 | |
95f72d1e | 765 | DBG("Phys. mem: %llx\n", memblock_phys_mem_size()); |
2babf5c2 ME |
766 | |
767 | /* We may need to relocate the flat tree, do it now. | |
768 | * FIXME .. and the initrd too? */ | |
769 | move_device_tree(); | |
770 | ||
1426d5a3 ME |
771 | allocate_pacas(); |
772 | ||
9b6b563c PM |
773 | DBG("Scanning CPUs ...\n"); |
774 | ||
25985edc | 775 | /* Retrieve CPU related informations from the flat tree |
3c726f8d | 776 | * (altivec support, boot CPU ID, ...) |
9b6b563c | 777 | */ |
3c726f8d | 778 | of_scan_flat_dt(early_init_dt_scan_cpus, NULL); |
9b6b563c | 779 | |
7ac87abb ME |
780 | #if defined(CONFIG_SMP) && defined(CONFIG_PPC64) |
781 | /* We'll later wait for secondaries to check in; there are | |
782 | * NCPUS-1 non-boot CPUs :-) | |
783 | */ | |
784 | spinning_secondaries = boot_cpu_count - 1; | |
785 | #endif | |
786 | ||
9b6b563c PM |
787 | DBG(" <- early_init_devtree()\n"); |
788 | } | |
789 | ||
9b6b563c PM |
790 | /******* |
791 | * | |
792 | * New implementation of the OF "find" APIs, return a refcounted | |
793 | * object, call of_node_put() when done. The device tree and list | |
794 | * are protected by a rw_lock. | |
795 | * | |
796 | * Note that property management will need some locking as well, | |
797 | * this isn't dealt with yet. | |
798 | * | |
799 | *******/ | |
800 | ||
e523f723 NL |
801 | /** |
802 | * of_find_next_cache_node - Find a node's subsidiary cache | |
803 | * @np: node of type "cpu" or "cache" | |
804 | * | |
805 | * Returns a node pointer with refcount incremented, use | |
806 | * of_node_put() on it when done. Caller should hold a reference | |
807 | * to np. | |
808 | */ | |
809 | struct device_node *of_find_next_cache_node(struct device_node *np) | |
810 | { | |
811 | struct device_node *child; | |
812 | const phandle *handle; | |
813 | ||
814 | handle = of_get_property(np, "l2-cache", NULL); | |
815 | if (!handle) | |
816 | handle = of_get_property(np, "next-level-cache", NULL); | |
817 | ||
818 | if (handle) | |
819 | return of_find_node_by_phandle(*handle); | |
820 | ||
821 | /* OF on pmac has nodes instead of properties named "l2-cache" | |
822 | * beneath CPU nodes. | |
823 | */ | |
824 | if (!strcmp(np->type, "cpu")) | |
825 | for_each_child_of_node(np, child) | |
826 | if (!strcmp(child->type, "cache")) | |
827 | return child; | |
828 | ||
829 | return NULL; | |
830 | } | |
831 | ||
9b6b563c PM |
832 | #ifdef CONFIG_PPC_PSERIES |
833 | /* | |
834 | * Fix up the uninitialized fields in a new device node: | |
0ebfff14 | 835 | * name, type and pci-specific fields |
9b6b563c PM |
836 | */ |
837 | ||
cc5d0189 | 838 | static int of_finish_dynamic_node(struct device_node *node) |
9b6b563c PM |
839 | { |
840 | struct device_node *parent = of_get_parent(node); | |
841 | int err = 0; | |
a7f67bdf | 842 | const phandle *ibm_phandle; |
9b6b563c | 843 | |
0e56efc7 SR |
844 | node->name = of_get_property(node, "name", NULL); |
845 | node->type = of_get_property(node, "device_type", NULL); | |
9b6b563c | 846 | |
847f5976 BH |
847 | if (!node->name) |
848 | node->name = "<NULL>"; | |
849 | if (!node->type) | |
850 | node->type = "<NULL>"; | |
851 | ||
9b6b563c PM |
852 | if (!parent) { |
853 | err = -ENODEV; | |
854 | goto out; | |
855 | } | |
856 | ||
857 | /* We don't support that function on PowerMac, at least | |
858 | * not yet | |
859 | */ | |
e8222502 | 860 | if (machine_is(powermac)) |
9b6b563c PM |
861 | return -ENODEV; |
862 | ||
6016a363 | 863 | /* fix up new node's phandle field */ |
0e56efc7 | 864 | if ((ibm_phandle = of_get_property(node, "ibm,phandle", NULL))) |
6016a363 | 865 | node->phandle = *ibm_phandle; |
9b6b563c PM |
866 | |
867 | out: | |
868 | of_node_put(parent); | |
869 | return err; | |
870 | } | |
871 | ||
872 | static int prom_reconfig_notifier(struct notifier_block *nb, | |
873 | unsigned long action, void *node) | |
874 | { | |
875 | int err; | |
876 | ||
877 | switch (action) { | |
878 | case PSERIES_RECONFIG_ADD: | |
cc5d0189 | 879 | err = of_finish_dynamic_node(node); |
de2780a3 | 880 | if (err < 0) |
9b6b563c | 881 | printk(KERN_ERR "finish_node returned %d\n", err); |
9b6b563c PM |
882 | break; |
883 | default: | |
de2780a3 | 884 | err = 0; |
9b6b563c PM |
885 | break; |
886 | } | |
de2780a3 | 887 | return notifier_from_errno(err); |
9b6b563c PM |
888 | } |
889 | ||
890 | static struct notifier_block prom_reconfig_nb = { | |
891 | .notifier_call = prom_reconfig_notifier, | |
892 | .priority = 10, /* This one needs to run first */ | |
893 | }; | |
894 | ||
895 | static int __init prom_reconfig_setup(void) | |
896 | { | |
897 | return pSeries_reconfig_notifier_register(&prom_reconfig_nb); | |
898 | } | |
899 | __initcall(prom_reconfig_setup); | |
900 | #endif | |
901 | ||
acf7d768 BH |
902 | /* Find the device node for a given logical cpu number, also returns the cpu |
903 | * local thread number (index in ibm,interrupt-server#s) if relevant and | |
904 | * asked for (non NULL) | |
905 | */ | |
906 | struct device_node *of_get_cpu_node(int cpu, unsigned int *thread) | |
907 | { | |
908 | int hardid; | |
909 | struct device_node *np; | |
910 | ||
911 | hardid = get_hard_smp_processor_id(cpu); | |
912 | ||
913 | for_each_node_by_type(np, "cpu") { | |
a7f67bdf | 914 | const u32 *intserv; |
acf7d768 BH |
915 | unsigned int plen, t; |
916 | ||
917 | /* Check for ibm,ppc-interrupt-server#s. If it doesn't exist | |
918 | * fallback to "reg" property and assume no threads | |
919 | */ | |
0e56efc7 | 920 | intserv = of_get_property(np, "ibm,ppc-interrupt-server#s", |
a7f67bdf | 921 | &plen); |
acf7d768 | 922 | if (intserv == NULL) { |
0e56efc7 | 923 | const u32 *reg = of_get_property(np, "reg", NULL); |
acf7d768 BH |
924 | if (reg == NULL) |
925 | continue; | |
926 | if (*reg == hardid) { | |
927 | if (thread) | |
928 | *thread = 0; | |
929 | return np; | |
930 | } | |
931 | } else { | |
932 | plen /= sizeof(u32); | |
933 | for (t = 0; t < plen; t++) { | |
934 | if (hardid == intserv[t]) { | |
935 | if (thread) | |
936 | *thread = t; | |
937 | return np; | |
938 | } | |
939 | } | |
940 | } | |
941 | } | |
942 | return NULL; | |
943 | } | |
36ca4ba4 | 944 | EXPORT_SYMBOL(of_get_cpu_node); |
7a4571ae | 945 | |
94a3807c | 946 | #if defined(CONFIG_DEBUG_FS) && defined(DEBUG) |
7a4571ae ME |
947 | static struct debugfs_blob_wrapper flat_dt_blob; |
948 | ||
949 | static int __init export_flat_device_tree(void) | |
950 | { | |
951 | struct dentry *d; | |
952 | ||
7a4571ae ME |
953 | flat_dt_blob.data = initial_boot_params; |
954 | flat_dt_blob.size = initial_boot_params->totalsize; | |
955 | ||
956 | d = debugfs_create_blob("flat-device-tree", S_IFREG | S_IRUSR, | |
94a3807c | 957 | powerpc_debugfs_root, &flat_dt_blob); |
7a4571ae ME |
958 | if (!d) |
959 | return 1; | |
960 | ||
961 | return 0; | |
962 | } | |
963 | __initcall(export_flat_device_tree); | |
964 | #endif |