xref: /linux/arch/powerpc/kernel/prom.c (revision 5499b45190237ca90dd2ac86395cf464fe1f4cc7)
1 /*
2  * Procedures for creating, accessing and interpreting the device tree.
3  *
4  * Paul Mackerras	August 1996.
5  * Copyright (C) 1996-2005 Paul Mackerras.
6  *
7  *  Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
8  *    {engebret|bergner}@us.ibm.com
9  *
10  *      This program is free software; you can redistribute it and/or
11  *      modify it under the terms of the GNU General Public License
12  *      as published by the Free Software Foundation; either version
13  *      2 of the License, or (at your option) any later version.
14  */
15 
16 #undef DEBUG
17 
18 #include <stdarg.h>
19 #include <linux/kernel.h>
20 #include <linux/string.h>
21 #include <linux/init.h>
22 #include <linux/threads.h>
23 #include <linux/spinlock.h>
24 #include <linux/types.h>
25 #include <linux/pci.h>
26 #include <linux/stringify.h>
27 #include <linux/delay.h>
28 #include <linux/initrd.h>
29 #include <linux/bitops.h>
30 #include <linux/module.h>
31 #include <linux/kexec.h>
32 #include <linux/debugfs.h>
33 #include <linux/irq.h>
34 #include <linux/lmb.h>
35 
36 #include <asm/prom.h>
37 #include <asm/rtas.h>
38 #include <asm/page.h>
39 #include <asm/processor.h>
40 #include <asm/irq.h>
41 #include <asm/io.h>
42 #include <asm/kdump.h>
43 #include <asm/smp.h>
44 #include <asm/system.h>
45 #include <asm/mmu.h>
46 #include <asm/pgtable.h>
47 #include <asm/pci.h>
48 #include <asm/iommu.h>
49 #include <asm/btext.h>
50 #include <asm/sections.h>
51 #include <asm/machdep.h>
52 #include <asm/pSeries_reconfig.h>
53 #include <asm/pci-bridge.h>
54 #include <asm/phyp_dump.h>
55 #include <asm/kexec.h>
56 #include <mm/mmu_decl.h>
57 
58 #ifdef DEBUG
59 #define DBG(fmt...) printk(KERN_ERR fmt)
60 #else
61 #define DBG(fmt...)
62 #endif
63 
64 #ifdef CONFIG_PPC64
65 int __initdata iommu_is_off;
66 int __initdata iommu_force_on;
67 unsigned long tce_alloc_start, tce_alloc_end;
68 #endif
69 
70 static int __init early_parse_mem(char *p)
71 {
72 	if (!p)
73 		return 1;
74 
75 	memory_limit = PAGE_ALIGN(memparse(p, &p));
76 	DBG("memory limit = 0x%llx\n", (unsigned long long)memory_limit);
77 
78 	return 0;
79 }
80 early_param("mem", early_parse_mem);
81 
82 /**
83  * move_device_tree - move tree to an unused area, if needed.
84  *
85  * The device tree may be allocated beyond our memory limit, or inside the
86  * crash kernel region for kdump. If so, move it out of the way.
87  */
88 static void __init move_device_tree(void)
89 {
90 	unsigned long start, size;
91 	void *p;
92 
93 	DBG("-> move_device_tree\n");
94 
95 	start = __pa(initial_boot_params);
96 	size = be32_to_cpu(initial_boot_params->totalsize);
97 
98 	if ((memory_limit && (start + size) > memory_limit) ||
99 			overlaps_crashkernel(start, size)) {
100 		p = __va(lmb_alloc_base(size, PAGE_SIZE, lmb.rmo_size));
101 		memcpy(p, initial_boot_params, size);
102 		initial_boot_params = (struct boot_param_header *)p;
103 		DBG("Moved device tree to 0x%p\n", p);
104 	}
105 
106 	DBG("<- move_device_tree\n");
107 }
108 
109 /*
110  * ibm,pa-features is a per-cpu property that contains a string of
111  * attribute descriptors, each of which has a 2 byte header plus up
112  * to 254 bytes worth of processor attribute bits.  First header
113  * byte specifies the number of bytes following the header.
114  * Second header byte is an "attribute-specifier" type, of which
115  * zero is the only currently-defined value.
116  * Implementation:  Pass in the byte and bit offset for the feature
117  * that we are interested in.  The function will return -1 if the
118  * pa-features property is missing, or a 1/0 to indicate if the feature
119  * is supported/not supported.  Note that the bit numbers are
120  * big-endian to match the definition in PAPR.
121  */
122 static struct ibm_pa_feature {
123 	unsigned long	cpu_features;	/* CPU_FTR_xxx bit */
124 	unsigned int	cpu_user_ftrs;	/* PPC_FEATURE_xxx bit */
125 	unsigned char	pabyte;		/* byte number in ibm,pa-features */
126 	unsigned char	pabit;		/* bit number (big-endian) */
127 	unsigned char	invert;		/* if 1, pa bit set => clear feature */
128 } ibm_pa_features[] __initdata = {
129 	{0, PPC_FEATURE_HAS_MMU,	0, 0, 0},
130 	{0, PPC_FEATURE_HAS_FPU,	0, 1, 0},
131 	{CPU_FTR_SLB, 0,		0, 2, 0},
132 	{CPU_FTR_CTRL, 0,		0, 3, 0},
133 	{CPU_FTR_NOEXECUTE, 0,		0, 6, 0},
134 	{CPU_FTR_NODSISRALIGN, 0,	1, 1, 1},
135 	{CPU_FTR_CI_LARGE_PAGE, 0,	1, 2, 0},
136 	{CPU_FTR_REAL_LE, PPC_FEATURE_TRUE_LE, 5, 0, 0},
137 };
138 
139 static void __init scan_features(unsigned long node, unsigned char *ftrs,
140 				 unsigned long tablelen,
141 				 struct ibm_pa_feature *fp,
142 				 unsigned long ft_size)
143 {
144 	unsigned long i, len, bit;
145 
146 	/* find descriptor with type == 0 */
147 	for (;;) {
148 		if (tablelen < 3)
149 			return;
150 		len = 2 + ftrs[0];
151 		if (tablelen < len)
152 			return;		/* descriptor 0 not found */
153 		if (ftrs[1] == 0)
154 			break;
155 		tablelen -= len;
156 		ftrs += len;
157 	}
158 
159 	/* loop over bits we know about */
160 	for (i = 0; i < ft_size; ++i, ++fp) {
161 		if (fp->pabyte >= ftrs[0])
162 			continue;
163 		bit = (ftrs[2 + fp->pabyte] >> (7 - fp->pabit)) & 1;
164 		if (bit ^ fp->invert) {
165 			cur_cpu_spec->cpu_features |= fp->cpu_features;
166 			cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftrs;
167 		} else {
168 			cur_cpu_spec->cpu_features &= ~fp->cpu_features;
169 			cur_cpu_spec->cpu_user_features &= ~fp->cpu_user_ftrs;
170 		}
171 	}
172 }
173 
174 static void __init check_cpu_pa_features(unsigned long node)
175 {
176 	unsigned char *pa_ftrs;
177 	unsigned long tablelen;
178 
179 	pa_ftrs = of_get_flat_dt_prop(node, "ibm,pa-features", &tablelen);
180 	if (pa_ftrs == NULL)
181 		return;
182 
183 	scan_features(node, pa_ftrs, tablelen,
184 		      ibm_pa_features, ARRAY_SIZE(ibm_pa_features));
185 }
186 
187 #ifdef CONFIG_PPC_STD_MMU_64
188 static void __init check_cpu_slb_size(unsigned long node)
189 {
190 	u32 *slb_size_ptr;
191 
192 	slb_size_ptr = of_get_flat_dt_prop(node, "slb-size", NULL);
193 	if (slb_size_ptr != NULL) {
194 		mmu_slb_size = *slb_size_ptr;
195 		return;
196 	}
197 	slb_size_ptr = of_get_flat_dt_prop(node, "ibm,slb-size", NULL);
198 	if (slb_size_ptr != NULL) {
199 		mmu_slb_size = *slb_size_ptr;
200 	}
201 }
202 #else
203 #define check_cpu_slb_size(node) do { } while(0)
204 #endif
205 
206 static struct feature_property {
207 	const char *name;
208 	u32 min_value;
209 	unsigned long cpu_feature;
210 	unsigned long cpu_user_ftr;
211 } feature_properties[] __initdata = {
212 #ifdef CONFIG_ALTIVEC
213 	{"altivec", 0, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
214 	{"ibm,vmx", 1, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
215 #endif /* CONFIG_ALTIVEC */
216 #ifdef CONFIG_VSX
217 	/* Yes, this _really_ is ibm,vmx == 2 to enable VSX */
218 	{"ibm,vmx", 2, CPU_FTR_VSX, PPC_FEATURE_HAS_VSX},
219 #endif /* CONFIG_VSX */
220 #ifdef CONFIG_PPC64
221 	{"ibm,dfp", 1, 0, PPC_FEATURE_HAS_DFP},
222 	{"ibm,purr", 1, CPU_FTR_PURR, 0},
223 	{"ibm,spurr", 1, CPU_FTR_SPURR, 0},
224 #endif /* CONFIG_PPC64 */
225 };
226 
227 #if defined(CONFIG_44x) && defined(CONFIG_PPC_FPU)
228 static inline void identical_pvr_fixup(unsigned long node)
229 {
230 	unsigned int pvr;
231 	char *model = of_get_flat_dt_prop(node, "model", NULL);
232 
233 	/*
234 	 * Since 440GR(x)/440EP(x) processors have the same pvr,
235 	 * we check the node path and set bit 28 in the cur_cpu_spec
236 	 * pvr for EP(x) processor version. This bit is always 0 in
237 	 * the "real" pvr. Then we call identify_cpu again with
238 	 * the new logical pvr to enable FPU support.
239 	 */
240 	if (model && strstr(model, "440EP")) {
241 		pvr = cur_cpu_spec->pvr_value | 0x8;
242 		identify_cpu(0, pvr);
243 		DBG("Using logical pvr %x for %s\n", pvr, model);
244 	}
245 }
246 #else
247 #define identical_pvr_fixup(node) do { } while(0)
248 #endif
249 
250 static void __init check_cpu_feature_properties(unsigned long node)
251 {
252 	unsigned long i;
253 	struct feature_property *fp = feature_properties;
254 	const u32 *prop;
255 
256 	for (i = 0; i < ARRAY_SIZE(feature_properties); ++i, ++fp) {
257 		prop = of_get_flat_dt_prop(node, fp->name, NULL);
258 		if (prop && *prop >= fp->min_value) {
259 			cur_cpu_spec->cpu_features |= fp->cpu_feature;
260 			cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftr;
261 		}
262 	}
263 }
264 
265 static int __init early_init_dt_scan_cpus(unsigned long node,
266 					  const char *uname, int depth,
267 					  void *data)
268 {
269 	static int logical_cpuid = 0;
270 	char *type = of_get_flat_dt_prop(node, "device_type", NULL);
271 	const u32 *prop;
272 	const u32 *intserv;
273 	int i, nthreads;
274 	unsigned long len;
275 	int found = 0;
276 
277 	/* We are scanning "cpu" nodes only */
278 	if (type == NULL || strcmp(type, "cpu") != 0)
279 		return 0;
280 
281 	/* Get physical cpuid */
282 	intserv = of_get_flat_dt_prop(node, "ibm,ppc-interrupt-server#s", &len);
283 	if (intserv) {
284 		nthreads = len / sizeof(int);
285 	} else {
286 		intserv = of_get_flat_dt_prop(node, "reg", NULL);
287 		nthreads = 1;
288 	}
289 
290 	/*
291 	 * Now see if any of these threads match our boot cpu.
292 	 * NOTE: This must match the parsing done in smp_setup_cpu_maps.
293 	 */
294 	for (i = 0; i < nthreads; i++) {
295 		/*
296 		 * version 2 of the kexec param format adds the phys cpuid of
297 		 * booted proc.
298 		 */
299 		if (initial_boot_params && initial_boot_params->version >= 2) {
300 			if (intserv[i] ==
301 					initial_boot_params->boot_cpuid_phys) {
302 				found = 1;
303 				break;
304 			}
305 		} else {
306 			/*
307 			 * Check if it's the boot-cpu, set it's hw index now,
308 			 * unfortunately this format did not support booting
309 			 * off secondary threads.
310 			 */
311 			if (of_get_flat_dt_prop(node,
312 					"linux,boot-cpu", NULL) != NULL) {
313 				found = 1;
314 				break;
315 			}
316 		}
317 
318 #ifdef CONFIG_SMP
319 		/* logical cpu id is always 0 on UP kernels */
320 		logical_cpuid++;
321 #endif
322 	}
323 
324 	if (found) {
325 		DBG("boot cpu: logical %d physical %d\n", logical_cpuid,
326 			intserv[i]);
327 		boot_cpuid = logical_cpuid;
328 		set_hard_smp_processor_id(boot_cpuid, intserv[i]);
329 
330 		/*
331 		 * PAPR defines "logical" PVR values for cpus that
332 		 * meet various levels of the architecture:
333 		 * 0x0f000001	Architecture version 2.04
334 		 * 0x0f000002	Architecture version 2.05
335 		 * If the cpu-version property in the cpu node contains
336 		 * such a value, we call identify_cpu again with the
337 		 * logical PVR value in order to use the cpu feature
338 		 * bits appropriate for the architecture level.
339 		 *
340 		 * A POWER6 partition in "POWER6 architected" mode
341 		 * uses the 0x0f000002 PVR value; in POWER5+ mode
342 		 * it uses 0x0f000001.
343 		 */
344 		prop = of_get_flat_dt_prop(node, "cpu-version", NULL);
345 		if (prop && (*prop & 0xff000000) == 0x0f000000)
346 			identify_cpu(0, *prop);
347 
348 		identical_pvr_fixup(node);
349 	}
350 
351 	check_cpu_feature_properties(node);
352 	check_cpu_pa_features(node);
353 	check_cpu_slb_size(node);
354 
355 #ifdef CONFIG_PPC_PSERIES
356 	if (nthreads > 1)
357 		cur_cpu_spec->cpu_features |= CPU_FTR_SMT;
358 	else
359 		cur_cpu_spec->cpu_features &= ~CPU_FTR_SMT;
360 #endif
361 
362 	return 0;
363 }
364 
365 void __init early_init_dt_scan_chosen_arch(unsigned long node)
366 {
367 	unsigned long *lprop;
368 
369 #ifdef CONFIG_PPC64
370 	/* check if iommu is forced on or off */
371 	if (of_get_flat_dt_prop(node, "linux,iommu-off", NULL) != NULL)
372 		iommu_is_off = 1;
373 	if (of_get_flat_dt_prop(node, "linux,iommu-force-on", NULL) != NULL)
374 		iommu_force_on = 1;
375 #endif
376 
377 	/* mem=x on the command line is the preferred mechanism */
378 	lprop = of_get_flat_dt_prop(node, "linux,memory-limit", NULL);
379 	if (lprop)
380 		memory_limit = *lprop;
381 
382 #ifdef CONFIG_PPC64
383 	lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-start", NULL);
384 	if (lprop)
385 		tce_alloc_start = *lprop;
386 	lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-end", NULL);
387 	if (lprop)
388 		tce_alloc_end = *lprop;
389 #endif
390 
391 #ifdef CONFIG_KEXEC
392 	lprop = of_get_flat_dt_prop(node, "linux,crashkernel-base", NULL);
393 	if (lprop)
394 		crashk_res.start = *lprop;
395 
396 	lprop = of_get_flat_dt_prop(node, "linux,crashkernel-size", NULL);
397 	if (lprop)
398 		crashk_res.end = crashk_res.start + *lprop - 1;
399 #endif
400 }
401 
402 #ifdef CONFIG_PPC_PSERIES
403 /*
404  * Interpret the ibm,dynamic-memory property in the
405  * /ibm,dynamic-reconfiguration-memory node.
406  * This contains a list of memory blocks along with NUMA affinity
407  * information.
408  */
409 static int __init early_init_dt_scan_drconf_memory(unsigned long node)
410 {
411 	__be32 *dm, *ls, *usm;
412 	unsigned long l, n, flags;
413 	u64 base, size, lmb_size;
414 	unsigned int is_kexec_kdump = 0, rngs;
415 
416 	ls = of_get_flat_dt_prop(node, "ibm,lmb-size", &l);
417 	if (ls == NULL || l < dt_root_size_cells * sizeof(__be32))
418 		return 0;
419 	lmb_size = dt_mem_next_cell(dt_root_size_cells, &ls);
420 
421 	dm = of_get_flat_dt_prop(node, "ibm,dynamic-memory", &l);
422 	if (dm == NULL || l < sizeof(__be32))
423 		return 0;
424 
425 	n = *dm++;	/* number of entries */
426 	if (l < (n * (dt_root_addr_cells + 4) + 1) * sizeof(__be32))
427 		return 0;
428 
429 	/* check if this is a kexec/kdump kernel. */
430 	usm = of_get_flat_dt_prop(node, "linux,drconf-usable-memory",
431 						 &l);
432 	if (usm != NULL)
433 		is_kexec_kdump = 1;
434 
435 	for (; n != 0; --n) {
436 		base = dt_mem_next_cell(dt_root_addr_cells, &dm);
437 		flags = dm[3];
438 		/* skip DRC index, pad, assoc. list index, flags */
439 		dm += 4;
440 		/* skip this block if the reserved bit is set in flags (0x80)
441 		   or if the block is not assigned to this partition (0x8) */
442 		if ((flags & 0x80) || !(flags & 0x8))
443 			continue;
444 		size = lmb_size;
445 		rngs = 1;
446 		if (is_kexec_kdump) {
447 			/*
448 			 * For each lmb in ibm,dynamic-memory, a corresponding
449 			 * entry in linux,drconf-usable-memory property contains
450 			 * a counter 'p' followed by 'p' (base, size) duple.
451 			 * Now read the counter from
452 			 * linux,drconf-usable-memory property
453 			 */
454 			rngs = dt_mem_next_cell(dt_root_size_cells, &usm);
455 			if (!rngs) /* there are no (base, size) duple */
456 				continue;
457 		}
458 		do {
459 			if (is_kexec_kdump) {
460 				base = dt_mem_next_cell(dt_root_addr_cells,
461 							 &usm);
462 				size = dt_mem_next_cell(dt_root_size_cells,
463 							 &usm);
464 			}
465 			if (iommu_is_off) {
466 				if (base >= 0x80000000ul)
467 					continue;
468 				if ((base + size) > 0x80000000ul)
469 					size = 0x80000000ul - base;
470 			}
471 			lmb_add(base, size);
472 		} while (--rngs);
473 	}
474 	lmb_dump_all();
475 	return 0;
476 }
477 #else
478 #define early_init_dt_scan_drconf_memory(node)	0
479 #endif /* CONFIG_PPC_PSERIES */
480 
481 static int __init early_init_dt_scan_memory_ppc(unsigned long node,
482 						const char *uname,
483 						int depth, void *data)
484 {
485 	if (depth == 1 &&
486 	    strcmp(uname, "ibm,dynamic-reconfiguration-memory") == 0)
487 		return early_init_dt_scan_drconf_memory(node);
488 
489 	return early_init_dt_scan_memory(node, uname, depth, data);
490 }
491 
492 void __init early_init_dt_add_memory_arch(u64 base, u64 size)
493 {
494 #if defined(CONFIG_PPC64)
495 	if (iommu_is_off) {
496 		if (base >= 0x80000000ul)
497 			return;
498 		if ((base + size) > 0x80000000ul)
499 			size = 0x80000000ul - base;
500 	}
501 #endif
502 
503 	lmb_add(base, size);
504 
505 	memstart_addr = min((u64)memstart_addr, base);
506 }
507 
508 u64 __init early_init_dt_alloc_memory_arch(u64 size, u64 align)
509 {
510 	return lmb_alloc(size, align);
511 }
512 
513 #ifdef CONFIG_BLK_DEV_INITRD
514 void __init early_init_dt_setup_initrd_arch(unsigned long start,
515 		unsigned long end)
516 {
517 	initrd_start = (unsigned long)__va(start);
518 	initrd_end = (unsigned long)__va(end);
519 	initrd_below_start_ok = 1;
520 }
521 #endif
522 
523 static void __init early_reserve_mem(void)
524 {
525 	u64 base, size;
526 	u64 *reserve_map;
527 	unsigned long self_base;
528 	unsigned long self_size;
529 
530 	reserve_map = (u64 *)(((unsigned long)initial_boot_params) +
531 					initial_boot_params->off_mem_rsvmap);
532 
533 	/* before we do anything, lets reserve the dt blob */
534 	self_base = __pa((unsigned long)initial_boot_params);
535 	self_size = initial_boot_params->totalsize;
536 	lmb_reserve(self_base, self_size);
537 
538 #ifdef CONFIG_BLK_DEV_INITRD
539 	/* then reserve the initrd, if any */
540 	if (initrd_start && (initrd_end > initrd_start))
541 		lmb_reserve(__pa(initrd_start), initrd_end - initrd_start);
542 #endif /* CONFIG_BLK_DEV_INITRD */
543 
544 #ifdef CONFIG_PPC32
545 	/*
546 	 * Handle the case where we might be booting from an old kexec
547 	 * image that setup the mem_rsvmap as pairs of 32-bit values
548 	 */
549 	if (*reserve_map > 0xffffffffull) {
550 		u32 base_32, size_32;
551 		u32 *reserve_map_32 = (u32 *)reserve_map;
552 
553 		while (1) {
554 			base_32 = *(reserve_map_32++);
555 			size_32 = *(reserve_map_32++);
556 			if (size_32 == 0)
557 				break;
558 			/* skip if the reservation is for the blob */
559 			if (base_32 == self_base && size_32 == self_size)
560 				continue;
561 			DBG("reserving: %x -> %x\n", base_32, size_32);
562 			lmb_reserve(base_32, size_32);
563 		}
564 		return;
565 	}
566 #endif
567 	while (1) {
568 		base = *(reserve_map++);
569 		size = *(reserve_map++);
570 		if (size == 0)
571 			break;
572 		DBG("reserving: %llx -> %llx\n", base, size);
573 		lmb_reserve(base, size);
574 	}
575 }
576 
577 #ifdef CONFIG_PHYP_DUMP
578 /**
579  * phyp_dump_calculate_reserve_size() - reserve variable boot area 5% or arg
580  *
581  * Function to find the largest size we need to reserve
582  * during early boot process.
583  *
584  * It either looks for boot param and returns that OR
585  * returns larger of 256 or 5% rounded down to multiples of 256MB.
586  *
587  */
588 static inline unsigned long phyp_dump_calculate_reserve_size(void)
589 {
590 	unsigned long tmp;
591 
592 	if (phyp_dump_info->reserve_bootvar)
593 		return phyp_dump_info->reserve_bootvar;
594 
595 	/* divide by 20 to get 5% of value */
596 	tmp = lmb_end_of_DRAM();
597 	do_div(tmp, 20);
598 
599 	/* round it down in multiples of 256 */
600 	tmp = tmp & ~0x0FFFFFFFUL;
601 
602 	return (tmp > PHYP_DUMP_RMR_END ? tmp : PHYP_DUMP_RMR_END);
603 }
604 
605 /**
606  * phyp_dump_reserve_mem() - reserve all not-yet-dumped mmemory
607  *
608  * This routine may reserve memory regions in the kernel only
609  * if the system is supported and a dump was taken in last
610  * boot instance or if the hardware is supported and the
611  * scratch area needs to be setup. In other instances it returns
612  * without reserving anything. The memory in case of dump being
613  * active is freed when the dump is collected (by userland tools).
614  */
615 static void __init phyp_dump_reserve_mem(void)
616 {
617 	unsigned long base, size;
618 	unsigned long variable_reserve_size;
619 
620 	if (!phyp_dump_info->phyp_dump_configured) {
621 		printk(KERN_ERR "Phyp-dump not supported on this hardware\n");
622 		return;
623 	}
624 
625 	if (!phyp_dump_info->phyp_dump_at_boot) {
626 		printk(KERN_INFO "Phyp-dump disabled at boot time\n");
627 		return;
628 	}
629 
630 	variable_reserve_size = phyp_dump_calculate_reserve_size();
631 
632 	if (phyp_dump_info->phyp_dump_is_active) {
633 		/* Reserve *everything* above RMR.Area freed by userland tools*/
634 		base = variable_reserve_size;
635 		size = lmb_end_of_DRAM() - base;
636 
637 		/* XXX crashed_ram_end is wrong, since it may be beyond
638 		 * the memory_limit, it will need to be adjusted. */
639 		lmb_reserve(base, size);
640 
641 		phyp_dump_info->init_reserve_start = base;
642 		phyp_dump_info->init_reserve_size = size;
643 	} else {
644 		size = phyp_dump_info->cpu_state_size +
645 			phyp_dump_info->hpte_region_size +
646 			variable_reserve_size;
647 		base = lmb_end_of_DRAM() - size;
648 		lmb_reserve(base, size);
649 		phyp_dump_info->init_reserve_start = base;
650 		phyp_dump_info->init_reserve_size = size;
651 	}
652 }
653 #else
654 static inline void __init phyp_dump_reserve_mem(void) {}
655 #endif /* CONFIG_PHYP_DUMP  && CONFIG_PPC_RTAS */
656 
657 
658 void __init early_init_devtree(void *params)
659 {
660 	phys_addr_t limit;
661 
662 	DBG(" -> early_init_devtree(%p)\n", params);
663 
664 	/* Setup flat device-tree pointer */
665 	initial_boot_params = params;
666 
667 #ifdef CONFIG_PPC_RTAS
668 	/* Some machines might need RTAS info for debugging, grab it now. */
669 	of_scan_flat_dt(early_init_dt_scan_rtas, NULL);
670 #endif
671 
672 #ifdef CONFIG_PHYP_DUMP
673 	/* scan tree to see if dump occured during last boot */
674 	of_scan_flat_dt(early_init_dt_scan_phyp_dump, NULL);
675 #endif
676 
677 	/* Retrieve various informations from the /chosen node of the
678 	 * device-tree, including the platform type, initrd location and
679 	 * size, TCE reserve, and more ...
680 	 */
681 	of_scan_flat_dt(early_init_dt_scan_chosen, NULL);
682 
683 	/* Scan memory nodes and rebuild LMBs */
684 	lmb_init();
685 	of_scan_flat_dt(early_init_dt_scan_root, NULL);
686 	of_scan_flat_dt(early_init_dt_scan_memory_ppc, NULL);
687 
688 	/* Save command line for /proc/cmdline and then parse parameters */
689 	strlcpy(boot_command_line, cmd_line, COMMAND_LINE_SIZE);
690 	parse_early_param();
691 
692 	/* Reserve LMB regions used by kernel, initrd, dt, etc... */
693 	lmb_reserve(PHYSICAL_START, __pa(klimit) - PHYSICAL_START);
694 	/* If relocatable, reserve first 32k for interrupt vectors etc. */
695 	if (PHYSICAL_START > MEMORY_START)
696 		lmb_reserve(MEMORY_START, 0x8000);
697 	reserve_kdump_trampoline();
698 	reserve_crashkernel();
699 	early_reserve_mem();
700 	phyp_dump_reserve_mem();
701 
702 	limit = memory_limit;
703 	if (! limit) {
704 		phys_addr_t memsize;
705 
706 		/* Ensure that total memory size is page-aligned, because
707 		 * otherwise mark_bootmem() gets upset. */
708 		lmb_analyze();
709 		memsize = lmb_phys_mem_size();
710 		if ((memsize & PAGE_MASK) != memsize)
711 			limit = memsize & PAGE_MASK;
712 	}
713 	lmb_enforce_memory_limit(limit);
714 
715 	lmb_analyze();
716 	lmb_dump_all();
717 
718 	DBG("Phys. mem: %llx\n", lmb_phys_mem_size());
719 
720 	/* We may need to relocate the flat tree, do it now.
721 	 * FIXME .. and the initrd too? */
722 	move_device_tree();
723 
724 	DBG("Scanning CPUs ...\n");
725 
726 	/* Retreive CPU related informations from the flat tree
727 	 * (altivec support, boot CPU ID, ...)
728 	 */
729 	of_scan_flat_dt(early_init_dt_scan_cpus, NULL);
730 
731 	DBG(" <- early_init_devtree()\n");
732 }
733 
734 /*******
735  *
736  * New implementation of the OF "find" APIs, return a refcounted
737  * object, call of_node_put() when done.  The device tree and list
738  * are protected by a rw_lock.
739  *
740  * Note that property management will need some locking as well,
741  * this isn't dealt with yet.
742  *
743  *******/
744 
745 /**
746  *	of_find_next_cache_node - Find a node's subsidiary cache
747  *	@np:	node of type "cpu" or "cache"
748  *
749  *	Returns a node pointer with refcount incremented, use
750  *	of_node_put() on it when done.  Caller should hold a reference
751  *	to np.
752  */
753 struct device_node *of_find_next_cache_node(struct device_node *np)
754 {
755 	struct device_node *child;
756 	const phandle *handle;
757 
758 	handle = of_get_property(np, "l2-cache", NULL);
759 	if (!handle)
760 		handle = of_get_property(np, "next-level-cache", NULL);
761 
762 	if (handle)
763 		return of_find_node_by_phandle(*handle);
764 
765 	/* OF on pmac has nodes instead of properties named "l2-cache"
766 	 * beneath CPU nodes.
767 	 */
768 	if (!strcmp(np->type, "cpu"))
769 		for_each_child_of_node(np, child)
770 			if (!strcmp(child->type, "cache"))
771 				return child;
772 
773 	return NULL;
774 }
775 
776 #ifdef CONFIG_PPC_PSERIES
777 /*
778  * Fix up the uninitialized fields in a new device node:
779  * name, type and pci-specific fields
780  */
781 
782 static int of_finish_dynamic_node(struct device_node *node)
783 {
784 	struct device_node *parent = of_get_parent(node);
785 	int err = 0;
786 	const phandle *ibm_phandle;
787 
788 	node->name = of_get_property(node, "name", NULL);
789 	node->type = of_get_property(node, "device_type", NULL);
790 
791 	if (!node->name)
792 		node->name = "<NULL>";
793 	if (!node->type)
794 		node->type = "<NULL>";
795 
796 	if (!parent) {
797 		err = -ENODEV;
798 		goto out;
799 	}
800 
801 	/* We don't support that function on PowerMac, at least
802 	 * not yet
803 	 */
804 	if (machine_is(powermac))
805 		return -ENODEV;
806 
807 	/* fix up new node's phandle field */
808 	if ((ibm_phandle = of_get_property(node, "ibm,phandle", NULL)))
809 		node->phandle = *ibm_phandle;
810 
811 out:
812 	of_node_put(parent);
813 	return err;
814 }
815 
816 static int prom_reconfig_notifier(struct notifier_block *nb,
817 				  unsigned long action, void *node)
818 {
819 	int err;
820 
821 	switch (action) {
822 	case PSERIES_RECONFIG_ADD:
823 		err = of_finish_dynamic_node(node);
824 		if (err < 0) {
825 			printk(KERN_ERR "finish_node returned %d\n", err);
826 			err = NOTIFY_BAD;
827 		}
828 		break;
829 	default:
830 		err = NOTIFY_DONE;
831 		break;
832 	}
833 	return err;
834 }
835 
836 static struct notifier_block prom_reconfig_nb = {
837 	.notifier_call = prom_reconfig_notifier,
838 	.priority = 10, /* This one needs to run first */
839 };
840 
841 static int __init prom_reconfig_setup(void)
842 {
843 	return pSeries_reconfig_notifier_register(&prom_reconfig_nb);
844 }
845 __initcall(prom_reconfig_setup);
846 #endif
847 
848 /* Find the device node for a given logical cpu number, also returns the cpu
849  * local thread number (index in ibm,interrupt-server#s) if relevant and
850  * asked for (non NULL)
851  */
852 struct device_node *of_get_cpu_node(int cpu, unsigned int *thread)
853 {
854 	int hardid;
855 	struct device_node *np;
856 
857 	hardid = get_hard_smp_processor_id(cpu);
858 
859 	for_each_node_by_type(np, "cpu") {
860 		const u32 *intserv;
861 		unsigned int plen, t;
862 
863 		/* Check for ibm,ppc-interrupt-server#s. If it doesn't exist
864 		 * fallback to "reg" property and assume no threads
865 		 */
866 		intserv = of_get_property(np, "ibm,ppc-interrupt-server#s",
867 				&plen);
868 		if (intserv == NULL) {
869 			const u32 *reg = of_get_property(np, "reg", NULL);
870 			if (reg == NULL)
871 				continue;
872 			if (*reg == hardid) {
873 				if (thread)
874 					*thread = 0;
875 				return np;
876 			}
877 		} else {
878 			plen /= sizeof(u32);
879 			for (t = 0; t < plen; t++) {
880 				if (hardid == intserv[t]) {
881 					if (thread)
882 						*thread = t;
883 					return np;
884 				}
885 			}
886 		}
887 	}
888 	return NULL;
889 }
890 EXPORT_SYMBOL(of_get_cpu_node);
891 
892 #if defined(CONFIG_DEBUG_FS) && defined(DEBUG)
893 static struct debugfs_blob_wrapper flat_dt_blob;
894 
895 static int __init export_flat_device_tree(void)
896 {
897 	struct dentry *d;
898 
899 	flat_dt_blob.data = initial_boot_params;
900 	flat_dt_blob.size = initial_boot_params->totalsize;
901 
902 	d = debugfs_create_blob("flat-device-tree", S_IFREG | S_IRUSR,
903 				powerpc_debugfs_root, &flat_dt_blob);
904 	if (!d)
905 		return 1;
906 
907 	return 0;
908 }
909 __initcall(export_flat_device_tree);
910 #endif
911