1 /* 2 * Procedures for creating, accessing and interpreting the device tree. 3 * 4 * Paul Mackerras August 1996. 5 * Copyright (C) 1996-2005 Paul Mackerras. 6 * 7 * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner. 8 * {engebret|bergner}@us.ibm.com 9 * 10 * This program is free software; you can redistribute it and/or 11 * modify it under the terms of the GNU General Public License 12 * as published by the Free Software Foundation; either version 13 * 2 of the License, or (at your option) any later version. 14 */ 15 16 #undef DEBUG 17 18 #include <stdarg.h> 19 #include <linux/kernel.h> 20 #include <linux/string.h> 21 #include <linux/init.h> 22 #include <linux/threads.h> 23 #include <linux/spinlock.h> 24 #include <linux/types.h> 25 #include <linux/pci.h> 26 #include <linux/stringify.h> 27 #include <linux/delay.h> 28 #include <linux/initrd.h> 29 #include <linux/bitops.h> 30 #include <linux/module.h> 31 #include <linux/kexec.h> 32 #include <linux/debugfs.h> 33 #include <linux/irq.h> 34 #include <linux/memblock.h> 35 36 #include <asm/prom.h> 37 #include <asm/rtas.h> 38 #include <asm/page.h> 39 #include <asm/processor.h> 40 #include <asm/irq.h> 41 #include <asm/io.h> 42 #include <asm/kdump.h> 43 #include <asm/smp.h> 44 #include <asm/system.h> 45 #include <asm/mmu.h> 46 #include <asm/paca.h> 47 #include <asm/pgtable.h> 48 #include <asm/pci.h> 49 #include <asm/iommu.h> 50 #include <asm/btext.h> 51 #include <asm/sections.h> 52 #include <asm/machdep.h> 53 #include <asm/pSeries_reconfig.h> 54 #include <asm/pci-bridge.h> 55 #include <asm/phyp_dump.h> 56 #include <asm/kexec.h> 57 #include <mm/mmu_decl.h> 58 59 #ifdef DEBUG 60 #define DBG(fmt...) printk(KERN_ERR fmt) 61 #else 62 #define DBG(fmt...) 63 #endif 64 65 #ifdef CONFIG_PPC64 66 int __initdata iommu_is_off; 67 int __initdata iommu_force_on; 68 unsigned long tce_alloc_start, tce_alloc_end; 69 u64 ppc64_rma_size; 70 #endif 71 72 static int __init early_parse_mem(char *p) 73 { 74 if (!p) 75 return 1; 76 77 memory_limit = PAGE_ALIGN(memparse(p, &p)); 78 DBG("memory limit = 0x%llx\n", (unsigned long long)memory_limit); 79 80 return 0; 81 } 82 early_param("mem", early_parse_mem); 83 84 /** 85 * move_device_tree - move tree to an unused area, if needed. 86 * 87 * The device tree may be allocated beyond our memory limit, or inside the 88 * crash kernel region for kdump. If so, move it out of the way. 89 */ 90 static void __init move_device_tree(void) 91 { 92 unsigned long start, size; 93 void *p; 94 95 DBG("-> move_device_tree\n"); 96 97 start = __pa(initial_boot_params); 98 size = be32_to_cpu(initial_boot_params->totalsize); 99 100 if ((memory_limit && (start + size) > memory_limit) || 101 overlaps_crashkernel(start, size)) { 102 p = __va(memblock_alloc(size, PAGE_SIZE)); 103 memcpy(p, initial_boot_params, size); 104 initial_boot_params = (struct boot_param_header *)p; 105 DBG("Moved device tree to 0x%p\n", p); 106 } 107 108 DBG("<- move_device_tree\n"); 109 } 110 111 /* 112 * ibm,pa-features is a per-cpu property that contains a string of 113 * attribute descriptors, each of which has a 2 byte header plus up 114 * to 254 bytes worth of processor attribute bits. First header 115 * byte specifies the number of bytes following the header. 116 * Second header byte is an "attribute-specifier" type, of which 117 * zero is the only currently-defined value. 118 * Implementation: Pass in the byte and bit offset for the feature 119 * that we are interested in. The function will return -1 if the 120 * pa-features property is missing, or a 1/0 to indicate if the feature 121 * is supported/not supported. Note that the bit numbers are 122 * big-endian to match the definition in PAPR. 123 */ 124 static struct ibm_pa_feature { 125 unsigned long cpu_features; /* CPU_FTR_xxx bit */ 126 unsigned int cpu_user_ftrs; /* PPC_FEATURE_xxx bit */ 127 unsigned char pabyte; /* byte number in ibm,pa-features */ 128 unsigned char pabit; /* bit number (big-endian) */ 129 unsigned char invert; /* if 1, pa bit set => clear feature */ 130 } ibm_pa_features[] __initdata = { 131 {0, PPC_FEATURE_HAS_MMU, 0, 0, 0}, 132 {0, PPC_FEATURE_HAS_FPU, 0, 1, 0}, 133 {CPU_FTR_SLB, 0, 0, 2, 0}, 134 {CPU_FTR_CTRL, 0, 0, 3, 0}, 135 {CPU_FTR_NOEXECUTE, 0, 0, 6, 0}, 136 {CPU_FTR_NODSISRALIGN, 0, 1, 1, 1}, 137 {CPU_FTR_CI_LARGE_PAGE, 0, 1, 2, 0}, 138 {CPU_FTR_REAL_LE, PPC_FEATURE_TRUE_LE, 5, 0, 0}, 139 }; 140 141 static void __init scan_features(unsigned long node, unsigned char *ftrs, 142 unsigned long tablelen, 143 struct ibm_pa_feature *fp, 144 unsigned long ft_size) 145 { 146 unsigned long i, len, bit; 147 148 /* find descriptor with type == 0 */ 149 for (;;) { 150 if (tablelen < 3) 151 return; 152 len = 2 + ftrs[0]; 153 if (tablelen < len) 154 return; /* descriptor 0 not found */ 155 if (ftrs[1] == 0) 156 break; 157 tablelen -= len; 158 ftrs += len; 159 } 160 161 /* loop over bits we know about */ 162 for (i = 0; i < ft_size; ++i, ++fp) { 163 if (fp->pabyte >= ftrs[0]) 164 continue; 165 bit = (ftrs[2 + fp->pabyte] >> (7 - fp->pabit)) & 1; 166 if (bit ^ fp->invert) { 167 cur_cpu_spec->cpu_features |= fp->cpu_features; 168 cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftrs; 169 } else { 170 cur_cpu_spec->cpu_features &= ~fp->cpu_features; 171 cur_cpu_spec->cpu_user_features &= ~fp->cpu_user_ftrs; 172 } 173 } 174 } 175 176 static void __init check_cpu_pa_features(unsigned long node) 177 { 178 unsigned char *pa_ftrs; 179 unsigned long tablelen; 180 181 pa_ftrs = of_get_flat_dt_prop(node, "ibm,pa-features", &tablelen); 182 if (pa_ftrs == NULL) 183 return; 184 185 scan_features(node, pa_ftrs, tablelen, 186 ibm_pa_features, ARRAY_SIZE(ibm_pa_features)); 187 } 188 189 #ifdef CONFIG_PPC_STD_MMU_64 190 static void __init check_cpu_slb_size(unsigned long node) 191 { 192 u32 *slb_size_ptr; 193 194 slb_size_ptr = of_get_flat_dt_prop(node, "slb-size", NULL); 195 if (slb_size_ptr != NULL) { 196 mmu_slb_size = *slb_size_ptr; 197 return; 198 } 199 slb_size_ptr = of_get_flat_dt_prop(node, "ibm,slb-size", NULL); 200 if (slb_size_ptr != NULL) { 201 mmu_slb_size = *slb_size_ptr; 202 } 203 } 204 #else 205 #define check_cpu_slb_size(node) do { } while(0) 206 #endif 207 208 static struct feature_property { 209 const char *name; 210 u32 min_value; 211 unsigned long cpu_feature; 212 unsigned long cpu_user_ftr; 213 } feature_properties[] __initdata = { 214 #ifdef CONFIG_ALTIVEC 215 {"altivec", 0, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC}, 216 {"ibm,vmx", 1, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC}, 217 #endif /* CONFIG_ALTIVEC */ 218 #ifdef CONFIG_VSX 219 /* Yes, this _really_ is ibm,vmx == 2 to enable VSX */ 220 {"ibm,vmx", 2, CPU_FTR_VSX, PPC_FEATURE_HAS_VSX}, 221 #endif /* CONFIG_VSX */ 222 #ifdef CONFIG_PPC64 223 {"ibm,dfp", 1, 0, PPC_FEATURE_HAS_DFP}, 224 {"ibm,purr", 1, CPU_FTR_PURR, 0}, 225 {"ibm,spurr", 1, CPU_FTR_SPURR, 0}, 226 #endif /* CONFIG_PPC64 */ 227 }; 228 229 #if defined(CONFIG_44x) && defined(CONFIG_PPC_FPU) 230 static inline void identical_pvr_fixup(unsigned long node) 231 { 232 unsigned int pvr; 233 char *model = of_get_flat_dt_prop(node, "model", NULL); 234 235 /* 236 * Since 440GR(x)/440EP(x) processors have the same pvr, 237 * we check the node path and set bit 28 in the cur_cpu_spec 238 * pvr for EP(x) processor version. This bit is always 0 in 239 * the "real" pvr. Then we call identify_cpu again with 240 * the new logical pvr to enable FPU support. 241 */ 242 if (model && strstr(model, "440EP")) { 243 pvr = cur_cpu_spec->pvr_value | 0x8; 244 identify_cpu(0, pvr); 245 DBG("Using logical pvr %x for %s\n", pvr, model); 246 } 247 } 248 #else 249 #define identical_pvr_fixup(node) do { } while(0) 250 #endif 251 252 static void __init check_cpu_feature_properties(unsigned long node) 253 { 254 unsigned long i; 255 struct feature_property *fp = feature_properties; 256 const u32 *prop; 257 258 for (i = 0; i < ARRAY_SIZE(feature_properties); ++i, ++fp) { 259 prop = of_get_flat_dt_prop(node, fp->name, NULL); 260 if (prop && *prop >= fp->min_value) { 261 cur_cpu_spec->cpu_features |= fp->cpu_feature; 262 cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftr; 263 } 264 } 265 } 266 267 static int __init early_init_dt_scan_cpus(unsigned long node, 268 const char *uname, int depth, 269 void *data) 270 { 271 static int logical_cpuid = 0; 272 char *type = of_get_flat_dt_prop(node, "device_type", NULL); 273 const u32 *prop; 274 const u32 *intserv; 275 int i, nthreads; 276 unsigned long len; 277 int found = 0; 278 279 /* We are scanning "cpu" nodes only */ 280 if (type == NULL || strcmp(type, "cpu") != 0) 281 return 0; 282 283 /* Get physical cpuid */ 284 intserv = of_get_flat_dt_prop(node, "ibm,ppc-interrupt-server#s", &len); 285 if (intserv) { 286 nthreads = len / sizeof(int); 287 } else { 288 intserv = of_get_flat_dt_prop(node, "reg", NULL); 289 nthreads = 1; 290 } 291 292 /* 293 * Now see if any of these threads match our boot cpu. 294 * NOTE: This must match the parsing done in smp_setup_cpu_maps. 295 */ 296 for (i = 0; i < nthreads; i++) { 297 /* 298 * version 2 of the kexec param format adds the phys cpuid of 299 * booted proc. 300 */ 301 if (initial_boot_params && initial_boot_params->version >= 2) { 302 if (intserv[i] == 303 initial_boot_params->boot_cpuid_phys) { 304 found = 1; 305 break; 306 } 307 } else { 308 /* 309 * Check if it's the boot-cpu, set it's hw index now, 310 * unfortunately this format did not support booting 311 * off secondary threads. 312 */ 313 if (of_get_flat_dt_prop(node, 314 "linux,boot-cpu", NULL) != NULL) { 315 found = 1; 316 break; 317 } 318 } 319 320 #ifdef CONFIG_SMP 321 /* logical cpu id is always 0 on UP kernels */ 322 logical_cpuid++; 323 #endif 324 } 325 326 if (found) { 327 DBG("boot cpu: logical %d physical %d\n", logical_cpuid, 328 intserv[i]); 329 boot_cpuid = logical_cpuid; 330 set_hard_smp_processor_id(boot_cpuid, intserv[i]); 331 332 /* 333 * PAPR defines "logical" PVR values for cpus that 334 * meet various levels of the architecture: 335 * 0x0f000001 Architecture version 2.04 336 * 0x0f000002 Architecture version 2.05 337 * If the cpu-version property in the cpu node contains 338 * such a value, we call identify_cpu again with the 339 * logical PVR value in order to use the cpu feature 340 * bits appropriate for the architecture level. 341 * 342 * A POWER6 partition in "POWER6 architected" mode 343 * uses the 0x0f000002 PVR value; in POWER5+ mode 344 * it uses 0x0f000001. 345 */ 346 prop = of_get_flat_dt_prop(node, "cpu-version", NULL); 347 if (prop && (*prop & 0xff000000) == 0x0f000000) 348 identify_cpu(0, *prop); 349 350 identical_pvr_fixup(node); 351 } 352 353 check_cpu_feature_properties(node); 354 check_cpu_pa_features(node); 355 check_cpu_slb_size(node); 356 357 #ifdef CONFIG_PPC_PSERIES 358 if (nthreads > 1) 359 cur_cpu_spec->cpu_features |= CPU_FTR_SMT; 360 else 361 cur_cpu_spec->cpu_features &= ~CPU_FTR_SMT; 362 #endif 363 364 return 0; 365 } 366 367 void __init early_init_dt_scan_chosen_arch(unsigned long node) 368 { 369 unsigned long *lprop; 370 371 #ifdef CONFIG_PPC64 372 /* check if iommu is forced on or off */ 373 if (of_get_flat_dt_prop(node, "linux,iommu-off", NULL) != NULL) 374 iommu_is_off = 1; 375 if (of_get_flat_dt_prop(node, "linux,iommu-force-on", NULL) != NULL) 376 iommu_force_on = 1; 377 #endif 378 379 /* mem=x on the command line is the preferred mechanism */ 380 lprop = of_get_flat_dt_prop(node, "linux,memory-limit", NULL); 381 if (lprop) 382 memory_limit = *lprop; 383 384 #ifdef CONFIG_PPC64 385 lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-start", NULL); 386 if (lprop) 387 tce_alloc_start = *lprop; 388 lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-end", NULL); 389 if (lprop) 390 tce_alloc_end = *lprop; 391 #endif 392 393 #ifdef CONFIG_KEXEC 394 lprop = of_get_flat_dt_prop(node, "linux,crashkernel-base", NULL); 395 if (lprop) 396 crashk_res.start = *lprop; 397 398 lprop = of_get_flat_dt_prop(node, "linux,crashkernel-size", NULL); 399 if (lprop) 400 crashk_res.end = crashk_res.start + *lprop - 1; 401 #endif 402 } 403 404 #ifdef CONFIG_PPC_PSERIES 405 /* 406 * Interpret the ibm,dynamic-memory property in the 407 * /ibm,dynamic-reconfiguration-memory node. 408 * This contains a list of memory blocks along with NUMA affinity 409 * information. 410 */ 411 static int __init early_init_dt_scan_drconf_memory(unsigned long node) 412 { 413 __be32 *dm, *ls, *usm; 414 unsigned long l, n, flags; 415 u64 base, size, memblock_size; 416 unsigned int is_kexec_kdump = 0, rngs; 417 418 ls = of_get_flat_dt_prop(node, "ibm,lmb-size", &l); 419 if (ls == NULL || l < dt_root_size_cells * sizeof(__be32)) 420 return 0; 421 memblock_size = dt_mem_next_cell(dt_root_size_cells, &ls); 422 423 dm = of_get_flat_dt_prop(node, "ibm,dynamic-memory", &l); 424 if (dm == NULL || l < sizeof(__be32)) 425 return 0; 426 427 n = *dm++; /* number of entries */ 428 if (l < (n * (dt_root_addr_cells + 4) + 1) * sizeof(__be32)) 429 return 0; 430 431 /* check if this is a kexec/kdump kernel. */ 432 usm = of_get_flat_dt_prop(node, "linux,drconf-usable-memory", 433 &l); 434 if (usm != NULL) 435 is_kexec_kdump = 1; 436 437 for (; n != 0; --n) { 438 base = dt_mem_next_cell(dt_root_addr_cells, &dm); 439 flags = dm[3]; 440 /* skip DRC index, pad, assoc. list index, flags */ 441 dm += 4; 442 /* skip this block if the reserved bit is set in flags (0x80) 443 or if the block is not assigned to this partition (0x8) */ 444 if ((flags & 0x80) || !(flags & 0x8)) 445 continue; 446 size = memblock_size; 447 rngs = 1; 448 if (is_kexec_kdump) { 449 /* 450 * For each memblock in ibm,dynamic-memory, a corresponding 451 * entry in linux,drconf-usable-memory property contains 452 * a counter 'p' followed by 'p' (base, size) duple. 453 * Now read the counter from 454 * linux,drconf-usable-memory property 455 */ 456 rngs = dt_mem_next_cell(dt_root_size_cells, &usm); 457 if (!rngs) /* there are no (base, size) duple */ 458 continue; 459 } 460 do { 461 if (is_kexec_kdump) { 462 base = dt_mem_next_cell(dt_root_addr_cells, 463 &usm); 464 size = dt_mem_next_cell(dt_root_size_cells, 465 &usm); 466 } 467 if (iommu_is_off) { 468 if (base >= 0x80000000ul) 469 continue; 470 if ((base + size) > 0x80000000ul) 471 size = 0x80000000ul - base; 472 } 473 memblock_add(base, size); 474 } while (--rngs); 475 } 476 memblock_dump_all(); 477 return 0; 478 } 479 #else 480 #define early_init_dt_scan_drconf_memory(node) 0 481 #endif /* CONFIG_PPC_PSERIES */ 482 483 static int __init early_init_dt_scan_memory_ppc(unsigned long node, 484 const char *uname, 485 int depth, void *data) 486 { 487 if (depth == 1 && 488 strcmp(uname, "ibm,dynamic-reconfiguration-memory") == 0) 489 return early_init_dt_scan_drconf_memory(node); 490 491 return early_init_dt_scan_memory(node, uname, depth, data); 492 } 493 494 void __init early_init_dt_add_memory_arch(u64 base, u64 size) 495 { 496 #ifdef CONFIG_PPC64 497 if (iommu_is_off) { 498 if (base >= 0x80000000ul) 499 return; 500 if ((base + size) > 0x80000000ul) 501 size = 0x80000000ul - base; 502 } 503 #endif 504 505 /* First MEMBLOCK added, do some special initializations */ 506 if (memstart_addr == ~(phys_addr_t)0) 507 setup_initial_memory_limit(base, size); 508 memstart_addr = min((u64)memstart_addr, base); 509 510 /* Add the chunk to the MEMBLOCK list */ 511 memblock_add(base, size); 512 } 513 514 u64 __init early_init_dt_alloc_memory_arch(u64 size, u64 align) 515 { 516 return memblock_alloc(size, align); 517 } 518 519 #ifdef CONFIG_BLK_DEV_INITRD 520 void __init early_init_dt_setup_initrd_arch(unsigned long start, 521 unsigned long end) 522 { 523 initrd_start = (unsigned long)__va(start); 524 initrd_end = (unsigned long)__va(end); 525 initrd_below_start_ok = 1; 526 } 527 #endif 528 529 static void __init early_reserve_mem(void) 530 { 531 u64 base, size; 532 u64 *reserve_map; 533 unsigned long self_base; 534 unsigned long self_size; 535 536 reserve_map = (u64 *)(((unsigned long)initial_boot_params) + 537 initial_boot_params->off_mem_rsvmap); 538 539 /* before we do anything, lets reserve the dt blob */ 540 self_base = __pa((unsigned long)initial_boot_params); 541 self_size = initial_boot_params->totalsize; 542 memblock_reserve(self_base, self_size); 543 544 #ifdef CONFIG_BLK_DEV_INITRD 545 /* then reserve the initrd, if any */ 546 if (initrd_start && (initrd_end > initrd_start)) 547 memblock_reserve(__pa(initrd_start), initrd_end - initrd_start); 548 #endif /* CONFIG_BLK_DEV_INITRD */ 549 550 #ifdef CONFIG_PPC32 551 /* 552 * Handle the case where we might be booting from an old kexec 553 * image that setup the mem_rsvmap as pairs of 32-bit values 554 */ 555 if (*reserve_map > 0xffffffffull) { 556 u32 base_32, size_32; 557 u32 *reserve_map_32 = (u32 *)reserve_map; 558 559 while (1) { 560 base_32 = *(reserve_map_32++); 561 size_32 = *(reserve_map_32++); 562 if (size_32 == 0) 563 break; 564 /* skip if the reservation is for the blob */ 565 if (base_32 == self_base && size_32 == self_size) 566 continue; 567 DBG("reserving: %x -> %x\n", base_32, size_32); 568 memblock_reserve(base_32, size_32); 569 } 570 return; 571 } 572 #endif 573 while (1) { 574 base = *(reserve_map++); 575 size = *(reserve_map++); 576 if (size == 0) 577 break; 578 DBG("reserving: %llx -> %llx\n", base, size); 579 memblock_reserve(base, size); 580 } 581 } 582 583 #ifdef CONFIG_PHYP_DUMP 584 /** 585 * phyp_dump_calculate_reserve_size() - reserve variable boot area 5% or arg 586 * 587 * Function to find the largest size we need to reserve 588 * during early boot process. 589 * 590 * It either looks for boot param and returns that OR 591 * returns larger of 256 or 5% rounded down to multiples of 256MB. 592 * 593 */ 594 static inline unsigned long phyp_dump_calculate_reserve_size(void) 595 { 596 unsigned long tmp; 597 598 if (phyp_dump_info->reserve_bootvar) 599 return phyp_dump_info->reserve_bootvar; 600 601 /* divide by 20 to get 5% of value */ 602 tmp = memblock_end_of_DRAM(); 603 do_div(tmp, 20); 604 605 /* round it down in multiples of 256 */ 606 tmp = tmp & ~0x0FFFFFFFUL; 607 608 return (tmp > PHYP_DUMP_RMR_END ? tmp : PHYP_DUMP_RMR_END); 609 } 610 611 /** 612 * phyp_dump_reserve_mem() - reserve all not-yet-dumped mmemory 613 * 614 * This routine may reserve memory regions in the kernel only 615 * if the system is supported and a dump was taken in last 616 * boot instance or if the hardware is supported and the 617 * scratch area needs to be setup. In other instances it returns 618 * without reserving anything. The memory in case of dump being 619 * active is freed when the dump is collected (by userland tools). 620 */ 621 static void __init phyp_dump_reserve_mem(void) 622 { 623 unsigned long base, size; 624 unsigned long variable_reserve_size; 625 626 if (!phyp_dump_info->phyp_dump_configured) { 627 printk(KERN_ERR "Phyp-dump not supported on this hardware\n"); 628 return; 629 } 630 631 if (!phyp_dump_info->phyp_dump_at_boot) { 632 printk(KERN_INFO "Phyp-dump disabled at boot time\n"); 633 return; 634 } 635 636 variable_reserve_size = phyp_dump_calculate_reserve_size(); 637 638 if (phyp_dump_info->phyp_dump_is_active) { 639 /* Reserve *everything* above RMR.Area freed by userland tools*/ 640 base = variable_reserve_size; 641 size = memblock_end_of_DRAM() - base; 642 643 /* XXX crashed_ram_end is wrong, since it may be beyond 644 * the memory_limit, it will need to be adjusted. */ 645 memblock_reserve(base, size); 646 647 phyp_dump_info->init_reserve_start = base; 648 phyp_dump_info->init_reserve_size = size; 649 } else { 650 size = phyp_dump_info->cpu_state_size + 651 phyp_dump_info->hpte_region_size + 652 variable_reserve_size; 653 base = memblock_end_of_DRAM() - size; 654 memblock_reserve(base, size); 655 phyp_dump_info->init_reserve_start = base; 656 phyp_dump_info->init_reserve_size = size; 657 } 658 } 659 #else 660 static inline void __init phyp_dump_reserve_mem(void) {} 661 #endif /* CONFIG_PHYP_DUMP && CONFIG_PPC_RTAS */ 662 663 void __init early_init_devtree(void *params) 664 { 665 phys_addr_t limit; 666 667 DBG(" -> early_init_devtree(%p)\n", params); 668 669 /* Setup flat device-tree pointer */ 670 initial_boot_params = params; 671 672 #ifdef CONFIG_PPC_RTAS 673 /* Some machines might need RTAS info for debugging, grab it now. */ 674 of_scan_flat_dt(early_init_dt_scan_rtas, NULL); 675 #endif 676 677 #ifdef CONFIG_PHYP_DUMP 678 /* scan tree to see if dump occured during last boot */ 679 of_scan_flat_dt(early_init_dt_scan_phyp_dump, NULL); 680 #endif 681 682 /* Retrieve various informations from the /chosen node of the 683 * device-tree, including the platform type, initrd location and 684 * size, TCE reserve, and more ... 685 */ 686 of_scan_flat_dt(early_init_dt_scan_chosen, NULL); 687 688 /* Scan memory nodes and rebuild MEMBLOCKs */ 689 memblock_init(); 690 691 of_scan_flat_dt(early_init_dt_scan_root, NULL); 692 of_scan_flat_dt(early_init_dt_scan_memory_ppc, NULL); 693 694 /* Save command line for /proc/cmdline and then parse parameters */ 695 strlcpy(boot_command_line, cmd_line, COMMAND_LINE_SIZE); 696 parse_early_param(); 697 698 /* Reserve MEMBLOCK regions used by kernel, initrd, dt, etc... */ 699 memblock_reserve(PHYSICAL_START, __pa(klimit) - PHYSICAL_START); 700 /* If relocatable, reserve first 32k for interrupt vectors etc. */ 701 if (PHYSICAL_START > MEMORY_START) 702 memblock_reserve(MEMORY_START, 0x8000); 703 reserve_kdump_trampoline(); 704 reserve_crashkernel(); 705 early_reserve_mem(); 706 phyp_dump_reserve_mem(); 707 708 limit = memory_limit; 709 if (! limit) { 710 phys_addr_t memsize; 711 712 /* Ensure that total memory size is page-aligned, because 713 * otherwise mark_bootmem() gets upset. */ 714 memblock_analyze(); 715 memsize = memblock_phys_mem_size(); 716 if ((memsize & PAGE_MASK) != memsize) 717 limit = memsize & PAGE_MASK; 718 } 719 memblock_enforce_memory_limit(limit); 720 721 memblock_analyze(); 722 memblock_dump_all(); 723 724 DBG("Phys. mem: %llx\n", memblock_phys_mem_size()); 725 726 /* We may need to relocate the flat tree, do it now. 727 * FIXME .. and the initrd too? */ 728 move_device_tree(); 729 730 allocate_pacas(); 731 732 DBG("Scanning CPUs ...\n"); 733 734 /* Retreive CPU related informations from the flat tree 735 * (altivec support, boot CPU ID, ...) 736 */ 737 of_scan_flat_dt(early_init_dt_scan_cpus, NULL); 738 739 DBG(" <- early_init_devtree()\n"); 740 } 741 742 /******* 743 * 744 * New implementation of the OF "find" APIs, return a refcounted 745 * object, call of_node_put() when done. The device tree and list 746 * are protected by a rw_lock. 747 * 748 * Note that property management will need some locking as well, 749 * this isn't dealt with yet. 750 * 751 *******/ 752 753 /** 754 * of_find_next_cache_node - Find a node's subsidiary cache 755 * @np: node of type "cpu" or "cache" 756 * 757 * Returns a node pointer with refcount incremented, use 758 * of_node_put() on it when done. Caller should hold a reference 759 * to np. 760 */ 761 struct device_node *of_find_next_cache_node(struct device_node *np) 762 { 763 struct device_node *child; 764 const phandle *handle; 765 766 handle = of_get_property(np, "l2-cache", NULL); 767 if (!handle) 768 handle = of_get_property(np, "next-level-cache", NULL); 769 770 if (handle) 771 return of_find_node_by_phandle(*handle); 772 773 /* OF on pmac has nodes instead of properties named "l2-cache" 774 * beneath CPU nodes. 775 */ 776 if (!strcmp(np->type, "cpu")) 777 for_each_child_of_node(np, child) 778 if (!strcmp(child->type, "cache")) 779 return child; 780 781 return NULL; 782 } 783 784 #ifdef CONFIG_PPC_PSERIES 785 /* 786 * Fix up the uninitialized fields in a new device node: 787 * name, type and pci-specific fields 788 */ 789 790 static int of_finish_dynamic_node(struct device_node *node) 791 { 792 struct device_node *parent = of_get_parent(node); 793 int err = 0; 794 const phandle *ibm_phandle; 795 796 node->name = of_get_property(node, "name", NULL); 797 node->type = of_get_property(node, "device_type", NULL); 798 799 if (!node->name) 800 node->name = "<NULL>"; 801 if (!node->type) 802 node->type = "<NULL>"; 803 804 if (!parent) { 805 err = -ENODEV; 806 goto out; 807 } 808 809 /* We don't support that function on PowerMac, at least 810 * not yet 811 */ 812 if (machine_is(powermac)) 813 return -ENODEV; 814 815 /* fix up new node's phandle field */ 816 if ((ibm_phandle = of_get_property(node, "ibm,phandle", NULL))) 817 node->phandle = *ibm_phandle; 818 819 out: 820 of_node_put(parent); 821 return err; 822 } 823 824 static int prom_reconfig_notifier(struct notifier_block *nb, 825 unsigned long action, void *node) 826 { 827 int err; 828 829 switch (action) { 830 case PSERIES_RECONFIG_ADD: 831 err = of_finish_dynamic_node(node); 832 if (err < 0) { 833 printk(KERN_ERR "finish_node returned %d\n", err); 834 err = NOTIFY_BAD; 835 } 836 break; 837 default: 838 err = NOTIFY_DONE; 839 break; 840 } 841 return err; 842 } 843 844 static struct notifier_block prom_reconfig_nb = { 845 .notifier_call = prom_reconfig_notifier, 846 .priority = 10, /* This one needs to run first */ 847 }; 848 849 static int __init prom_reconfig_setup(void) 850 { 851 return pSeries_reconfig_notifier_register(&prom_reconfig_nb); 852 } 853 __initcall(prom_reconfig_setup); 854 #endif 855 856 /* Find the device node for a given logical cpu number, also returns the cpu 857 * local thread number (index in ibm,interrupt-server#s) if relevant and 858 * asked for (non NULL) 859 */ 860 struct device_node *of_get_cpu_node(int cpu, unsigned int *thread) 861 { 862 int hardid; 863 struct device_node *np; 864 865 hardid = get_hard_smp_processor_id(cpu); 866 867 for_each_node_by_type(np, "cpu") { 868 const u32 *intserv; 869 unsigned int plen, t; 870 871 /* Check for ibm,ppc-interrupt-server#s. If it doesn't exist 872 * fallback to "reg" property and assume no threads 873 */ 874 intserv = of_get_property(np, "ibm,ppc-interrupt-server#s", 875 &plen); 876 if (intserv == NULL) { 877 const u32 *reg = of_get_property(np, "reg", NULL); 878 if (reg == NULL) 879 continue; 880 if (*reg == hardid) { 881 if (thread) 882 *thread = 0; 883 return np; 884 } 885 } else { 886 plen /= sizeof(u32); 887 for (t = 0; t < plen; t++) { 888 if (hardid == intserv[t]) { 889 if (thread) 890 *thread = t; 891 return np; 892 } 893 } 894 } 895 } 896 return NULL; 897 } 898 EXPORT_SYMBOL(of_get_cpu_node); 899 900 #if defined(CONFIG_DEBUG_FS) && defined(DEBUG) 901 static struct debugfs_blob_wrapper flat_dt_blob; 902 903 static int __init export_flat_device_tree(void) 904 { 905 struct dentry *d; 906 907 flat_dt_blob.data = initial_boot_params; 908 flat_dt_blob.size = initial_boot_params->totalsize; 909 910 d = debugfs_create_blob("flat-device-tree", S_IFREG | S_IRUSR, 911 powerpc_debugfs_root, &flat_dt_blob); 912 if (!d) 913 return 1; 914 915 return 0; 916 } 917 __initcall(export_flat_device_tree); 918 #endif 919