1 /* 2 * Copyright (C) 2004, 2005 MIPS Technologies, Inc. All rights reserved. 3 * 4 * This program is free software; you can distribute it and/or modify it 5 * under the terms of the GNU General Public License (Version 2) as 6 * published by the Free Software Foundation. 7 * 8 * This program is distributed in the hope it will be useful, but WITHOUT 9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 11 * for more details. 12 * 13 * You should have received a copy of the GNU General Public License along 14 * with this program; if not, write to the Free Software Foundation, Inc., 15 * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA. 16 */ 17 18 /* 19 * VPE support module 20 * 21 * Provides support for loading a MIPS SP program on VPE1. 22 * The SP enviroment is rather simple, no tlb's. It needs to be relocatable 23 * (or partially linked). You should initialise your stack in the startup 24 * code. This loader looks for the symbol __start and sets up 25 * execution to resume from there. The MIPS SDE kit contains suitable examples. 26 * 27 * To load and run, simply cat a SP 'program file' to /dev/vpe1. 28 * i.e cat spapp >/dev/vpe1. 29 */ 30 #include <linux/kernel.h> 31 #include <linux/device.h> 32 #include <linux/module.h> 33 #include <linux/fs.h> 34 #include <linux/init.h> 35 #include <asm/uaccess.h> 36 #include <linux/slab.h> 37 #include <linux/list.h> 38 #include <linux/vmalloc.h> 39 #include <linux/elf.h> 40 #include <linux/seq_file.h> 41 #include <linux/syscalls.h> 42 #include <linux/moduleloader.h> 43 #include <linux/interrupt.h> 44 #include <linux/poll.h> 45 #include <linux/bootmem.h> 46 #include <asm/mipsregs.h> 47 #include <asm/mipsmtregs.h> 48 #include <asm/cacheflush.h> 49 #include <asm/atomic.h> 50 #include <asm/cpu.h> 51 #include <asm/mips_mt.h> 52 #include <asm/processor.h> 53 #include <asm/system.h> 54 #include <asm/vpe.h> 55 #include <asm/kspd.h> 56 57 typedef void *vpe_handle; 58 59 #ifndef ARCH_SHF_SMALL 60 #define ARCH_SHF_SMALL 0 61 #endif 62 63 /* If this is set, the section belongs in the init part of the module */ 64 #define INIT_OFFSET_MASK (1UL << (BITS_PER_LONG-1)) 65 66 /* 67 * The number of TCs and VPEs physically available on the core 68 */ 69 static int hw_tcs, hw_vpes; 70 static char module_name[] = "vpe"; 71 static int major; 72 static const int minor = 1; /* fixed for now */ 73 74 #ifdef CONFIG_MIPS_APSP_KSPD 75 static struct kspd_notifications kspd_events; 76 static int kspd_events_reqd; 77 #endif 78 79 /* grab the likely amount of memory we will need. */ 80 #ifdef CONFIG_MIPS_VPE_LOADER_TOM 81 #define P_SIZE (2 * 1024 * 1024) 82 #else 83 /* add an overhead to the max kmalloc size for non-striped symbols/etc */ 84 #define P_SIZE (256 * 1024) 85 #endif 86 87 extern unsigned long physical_memsize; 88 89 #define MAX_VPES 16 90 #define VPE_PATH_MAX 256 91 92 enum vpe_state { 93 VPE_STATE_UNUSED = 0, 94 VPE_STATE_INUSE, 95 VPE_STATE_RUNNING 96 }; 97 98 enum tc_state { 99 TC_STATE_UNUSED = 0, 100 TC_STATE_INUSE, 101 TC_STATE_RUNNING, 102 TC_STATE_DYNAMIC 103 }; 104 105 struct vpe { 106 enum vpe_state state; 107 108 /* (device) minor associated with this vpe */ 109 int minor; 110 111 /* elfloader stuff */ 112 void *load_addr; 113 unsigned long len; 114 char *pbuffer; 115 unsigned long plen; 116 unsigned int uid, gid; 117 char cwd[VPE_PATH_MAX]; 118 119 unsigned long __start; 120 121 /* tc's associated with this vpe */ 122 struct list_head tc; 123 124 /* The list of vpe's */ 125 struct list_head list; 126 127 /* shared symbol address */ 128 void *shared_ptr; 129 130 /* the list of who wants to know when something major happens */ 131 struct list_head notify; 132 133 unsigned int ntcs; 134 }; 135 136 struct tc { 137 enum tc_state state; 138 int index; 139 140 struct vpe *pvpe; /* parent VPE */ 141 struct list_head tc; /* The list of TC's with this VPE */ 142 struct list_head list; /* The global list of tc's */ 143 }; 144 145 struct { 146 spinlock_t vpe_list_lock; 147 struct list_head vpe_list; /* Virtual processing elements */ 148 spinlock_t tc_list_lock; 149 struct list_head tc_list; /* Thread contexts */ 150 } vpecontrol = { 151 .vpe_list_lock = SPIN_LOCK_UNLOCKED, 152 .vpe_list = LIST_HEAD_INIT(vpecontrol.vpe_list), 153 .tc_list_lock = SPIN_LOCK_UNLOCKED, 154 .tc_list = LIST_HEAD_INIT(vpecontrol.tc_list) 155 }; 156 157 static void release_progmem(void *ptr); 158 159 /* get the vpe associated with this minor */ 160 static struct vpe *get_vpe(int minor) 161 { 162 struct vpe *res, *v; 163 164 if (!cpu_has_mipsmt) 165 return NULL; 166 167 res = NULL; 168 spin_lock(&vpecontrol.vpe_list_lock); 169 list_for_each_entry(v, &vpecontrol.vpe_list, list) { 170 if (v->minor == minor) { 171 res = v; 172 break; 173 } 174 } 175 spin_unlock(&vpecontrol.vpe_list_lock); 176 177 return res; 178 } 179 180 /* get the vpe associated with this minor */ 181 static struct tc *get_tc(int index) 182 { 183 struct tc *res, *t; 184 185 res = NULL; 186 spin_lock(&vpecontrol.tc_list_lock); 187 list_for_each_entry(t, &vpecontrol.tc_list, list) { 188 if (t->index == index) { 189 res = t; 190 break; 191 } 192 } 193 spin_unlock(&vpecontrol.tc_list_lock); 194 195 return NULL; 196 } 197 198 /* allocate a vpe and associate it with this minor (or index) */ 199 static struct vpe *alloc_vpe(int minor) 200 { 201 struct vpe *v; 202 203 if ((v = kzalloc(sizeof(struct vpe), GFP_KERNEL)) == NULL) 204 return NULL; 205 206 INIT_LIST_HEAD(&v->tc); 207 spin_lock(&vpecontrol.vpe_list_lock); 208 list_add_tail(&v->list, &vpecontrol.vpe_list); 209 spin_unlock(&vpecontrol.vpe_list_lock); 210 211 INIT_LIST_HEAD(&v->notify); 212 v->minor = minor; 213 214 return v; 215 } 216 217 /* allocate a tc. At startup only tc0 is running, all other can be halted. */ 218 static struct tc *alloc_tc(int index) 219 { 220 struct tc *tc; 221 222 if ((tc = kzalloc(sizeof(struct tc), GFP_KERNEL)) == NULL) 223 goto out; 224 225 INIT_LIST_HEAD(&tc->tc); 226 tc->index = index; 227 228 spin_lock(&vpecontrol.tc_list_lock); 229 list_add_tail(&tc->list, &vpecontrol.tc_list); 230 spin_unlock(&vpecontrol.tc_list_lock); 231 232 out: 233 return tc; 234 } 235 236 /* clean up and free everything */ 237 static void release_vpe(struct vpe *v) 238 { 239 list_del(&v->list); 240 if (v->load_addr) 241 release_progmem(v); 242 kfree(v); 243 } 244 245 static void __maybe_unused dump_mtregs(void) 246 { 247 unsigned long val; 248 249 val = read_c0_config3(); 250 printk("config3 0x%lx MT %ld\n", val, 251 (val & CONFIG3_MT) >> CONFIG3_MT_SHIFT); 252 253 val = read_c0_mvpcontrol(); 254 printk("MVPControl 0x%lx, STLB %ld VPC %ld EVP %ld\n", val, 255 (val & MVPCONTROL_STLB) >> MVPCONTROL_STLB_SHIFT, 256 (val & MVPCONTROL_VPC) >> MVPCONTROL_VPC_SHIFT, 257 (val & MVPCONTROL_EVP)); 258 259 val = read_c0_mvpconf0(); 260 printk("mvpconf0 0x%lx, PVPE %ld PTC %ld M %ld\n", val, 261 (val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT, 262 val & MVPCONF0_PTC, (val & MVPCONF0_M) >> MVPCONF0_M_SHIFT); 263 } 264 265 /* Find some VPE program space */ 266 static void *alloc_progmem(unsigned long len) 267 { 268 void *addr; 269 270 #ifdef CONFIG_MIPS_VPE_LOADER_TOM 271 /* 272 * This means you must tell Linux to use less memory than you 273 * physically have, for example by passing a mem= boot argument. 274 */ 275 addr = pfn_to_kaddr(max_low_pfn); 276 memset(addr, 0, len); 277 #else 278 /* simple grab some mem for now */ 279 addr = kzalloc(len, GFP_KERNEL); 280 #endif 281 282 return addr; 283 } 284 285 static void release_progmem(void *ptr) 286 { 287 #ifndef CONFIG_MIPS_VPE_LOADER_TOM 288 kfree(ptr); 289 #endif 290 } 291 292 /* Update size with this section: return offset. */ 293 static long get_offset(unsigned long *size, Elf_Shdr * sechdr) 294 { 295 long ret; 296 297 ret = ALIGN(*size, sechdr->sh_addralign ? : 1); 298 *size = ret + sechdr->sh_size; 299 return ret; 300 } 301 302 /* Lay out the SHF_ALLOC sections in a way not dissimilar to how ld 303 might -- code, read-only data, read-write data, small data. Tally 304 sizes, and place the offsets into sh_entsize fields: high bit means it 305 belongs in init. */ 306 static void layout_sections(struct module *mod, const Elf_Ehdr * hdr, 307 Elf_Shdr * sechdrs, const char *secstrings) 308 { 309 static unsigned long const masks[][2] = { 310 /* NOTE: all executable code must be the first section 311 * in this array; otherwise modify the text_size 312 * finder in the two loops below */ 313 {SHF_EXECINSTR | SHF_ALLOC, ARCH_SHF_SMALL}, 314 {SHF_ALLOC, SHF_WRITE | ARCH_SHF_SMALL}, 315 {SHF_WRITE | SHF_ALLOC, ARCH_SHF_SMALL}, 316 {ARCH_SHF_SMALL | SHF_ALLOC, 0} 317 }; 318 unsigned int m, i; 319 320 for (i = 0; i < hdr->e_shnum; i++) 321 sechdrs[i].sh_entsize = ~0UL; 322 323 for (m = 0; m < ARRAY_SIZE(masks); ++m) { 324 for (i = 0; i < hdr->e_shnum; ++i) { 325 Elf_Shdr *s = &sechdrs[i]; 326 327 // || strncmp(secstrings + s->sh_name, ".init", 5) == 0) 328 if ((s->sh_flags & masks[m][0]) != masks[m][0] 329 || (s->sh_flags & masks[m][1]) 330 || s->sh_entsize != ~0UL) 331 continue; 332 s->sh_entsize = 333 get_offset((unsigned long *)&mod->core_size, s); 334 } 335 336 if (m == 0) 337 mod->core_text_size = mod->core_size; 338 339 } 340 } 341 342 343 /* from module-elf32.c, but subverted a little */ 344 345 struct mips_hi16 { 346 struct mips_hi16 *next; 347 Elf32_Addr *addr; 348 Elf32_Addr value; 349 }; 350 351 static struct mips_hi16 *mips_hi16_list; 352 static unsigned int gp_offs, gp_addr; 353 354 static int apply_r_mips_none(struct module *me, uint32_t *location, 355 Elf32_Addr v) 356 { 357 return 0; 358 } 359 360 static int apply_r_mips_gprel16(struct module *me, uint32_t *location, 361 Elf32_Addr v) 362 { 363 int rel; 364 365 if( !(*location & 0xffff) ) { 366 rel = (int)v - gp_addr; 367 } 368 else { 369 /* .sbss + gp(relative) + offset */ 370 /* kludge! */ 371 rel = (int)(short)((int)v + gp_offs + 372 (int)(short)(*location & 0xffff) - gp_addr); 373 } 374 375 if( (rel > 32768) || (rel < -32768) ) { 376 printk(KERN_DEBUG "VPE loader: apply_r_mips_gprel16: " 377 "relative address 0x%x out of range of gp register\n", 378 rel); 379 return -ENOEXEC; 380 } 381 382 *location = (*location & 0xffff0000) | (rel & 0xffff); 383 384 return 0; 385 } 386 387 static int apply_r_mips_pc16(struct module *me, uint32_t *location, 388 Elf32_Addr v) 389 { 390 int rel; 391 rel = (((unsigned int)v - (unsigned int)location)); 392 rel >>= 2; // because the offset is in _instructions_ not bytes. 393 rel -= 1; // and one instruction less due to the branch delay slot. 394 395 if( (rel > 32768) || (rel < -32768) ) { 396 printk(KERN_DEBUG "VPE loader: " 397 "apply_r_mips_pc16: relative address out of range 0x%x\n", rel); 398 return -ENOEXEC; 399 } 400 401 *location = (*location & 0xffff0000) | (rel & 0xffff); 402 403 return 0; 404 } 405 406 static int apply_r_mips_32(struct module *me, uint32_t *location, 407 Elf32_Addr v) 408 { 409 *location += v; 410 411 return 0; 412 } 413 414 static int apply_r_mips_26(struct module *me, uint32_t *location, 415 Elf32_Addr v) 416 { 417 if (v % 4) { 418 printk(KERN_DEBUG "VPE loader: apply_r_mips_26 " 419 " unaligned relocation\n"); 420 return -ENOEXEC; 421 } 422 423 /* 424 * Not desperately convinced this is a good check of an overflow condition 425 * anyway. But it gets in the way of handling undefined weak symbols which 426 * we want to set to zero. 427 * if ((v & 0xf0000000) != (((unsigned long)location + 4) & 0xf0000000)) { 428 * printk(KERN_ERR 429 * "module %s: relocation overflow\n", 430 * me->name); 431 * return -ENOEXEC; 432 * } 433 */ 434 435 *location = (*location & ~0x03ffffff) | 436 ((*location + (v >> 2)) & 0x03ffffff); 437 return 0; 438 } 439 440 static int apply_r_mips_hi16(struct module *me, uint32_t *location, 441 Elf32_Addr v) 442 { 443 struct mips_hi16 *n; 444 445 /* 446 * We cannot relocate this one now because we don't know the value of 447 * the carry we need to add. Save the information, and let LO16 do the 448 * actual relocation. 449 */ 450 n = kmalloc(sizeof *n, GFP_KERNEL); 451 if (!n) 452 return -ENOMEM; 453 454 n->addr = location; 455 n->value = v; 456 n->next = mips_hi16_list; 457 mips_hi16_list = n; 458 459 return 0; 460 } 461 462 static int apply_r_mips_lo16(struct module *me, uint32_t *location, 463 Elf32_Addr v) 464 { 465 unsigned long insnlo = *location; 466 Elf32_Addr val, vallo; 467 struct mips_hi16 *l, *next; 468 469 /* Sign extend the addend we extract from the lo insn. */ 470 vallo = ((insnlo & 0xffff) ^ 0x8000) - 0x8000; 471 472 if (mips_hi16_list != NULL) { 473 474 l = mips_hi16_list; 475 while (l != NULL) { 476 unsigned long insn; 477 478 /* 479 * The value for the HI16 had best be the same. 480 */ 481 if (v != l->value) { 482 printk(KERN_DEBUG "VPE loader: " 483 "apply_r_mips_lo16/hi16: \t" 484 "inconsistent value information\n"); 485 goto out_free; 486 } 487 488 /* 489 * Do the HI16 relocation. Note that we actually don't 490 * need to know anything about the LO16 itself, except 491 * where to find the low 16 bits of the addend needed 492 * by the LO16. 493 */ 494 insn = *l->addr; 495 val = ((insn & 0xffff) << 16) + vallo; 496 val += v; 497 498 /* 499 * Account for the sign extension that will happen in 500 * the low bits. 501 */ 502 val = ((val >> 16) + ((val & 0x8000) != 0)) & 0xffff; 503 504 insn = (insn & ~0xffff) | val; 505 *l->addr = insn; 506 507 next = l->next; 508 kfree(l); 509 l = next; 510 } 511 512 mips_hi16_list = NULL; 513 } 514 515 /* 516 * Ok, we're done with the HI16 relocs. Now deal with the LO16. 517 */ 518 val = v + vallo; 519 insnlo = (insnlo & ~0xffff) | (val & 0xffff); 520 *location = insnlo; 521 522 return 0; 523 524 out_free: 525 while (l != NULL) { 526 next = l->next; 527 kfree(l); 528 l = next; 529 } 530 mips_hi16_list = NULL; 531 532 return -ENOEXEC; 533 } 534 535 static int (*reloc_handlers[]) (struct module *me, uint32_t *location, 536 Elf32_Addr v) = { 537 [R_MIPS_NONE] = apply_r_mips_none, 538 [R_MIPS_32] = apply_r_mips_32, 539 [R_MIPS_26] = apply_r_mips_26, 540 [R_MIPS_HI16] = apply_r_mips_hi16, 541 [R_MIPS_LO16] = apply_r_mips_lo16, 542 [R_MIPS_GPREL16] = apply_r_mips_gprel16, 543 [R_MIPS_PC16] = apply_r_mips_pc16 544 }; 545 546 static char *rstrs[] = { 547 [R_MIPS_NONE] = "MIPS_NONE", 548 [R_MIPS_32] = "MIPS_32", 549 [R_MIPS_26] = "MIPS_26", 550 [R_MIPS_HI16] = "MIPS_HI16", 551 [R_MIPS_LO16] = "MIPS_LO16", 552 [R_MIPS_GPREL16] = "MIPS_GPREL16", 553 [R_MIPS_PC16] = "MIPS_PC16" 554 }; 555 556 static int apply_relocations(Elf32_Shdr *sechdrs, 557 const char *strtab, 558 unsigned int symindex, 559 unsigned int relsec, 560 struct module *me) 561 { 562 Elf32_Rel *rel = (void *) sechdrs[relsec].sh_addr; 563 Elf32_Sym *sym; 564 uint32_t *location; 565 unsigned int i; 566 Elf32_Addr v; 567 int res; 568 569 for (i = 0; i < sechdrs[relsec].sh_size / sizeof(*rel); i++) { 570 Elf32_Word r_info = rel[i].r_info; 571 572 /* This is where to make the change */ 573 location = (void *)sechdrs[sechdrs[relsec].sh_info].sh_addr 574 + rel[i].r_offset; 575 /* This is the symbol it is referring to */ 576 sym = (Elf32_Sym *)sechdrs[symindex].sh_addr 577 + ELF32_R_SYM(r_info); 578 579 if (!sym->st_value) { 580 printk(KERN_DEBUG "%s: undefined weak symbol %s\n", 581 me->name, strtab + sym->st_name); 582 /* just print the warning, dont barf */ 583 } 584 585 v = sym->st_value; 586 587 res = reloc_handlers[ELF32_R_TYPE(r_info)](me, location, v); 588 if( res ) { 589 char *r = rstrs[ELF32_R_TYPE(r_info)]; 590 printk(KERN_WARNING "VPE loader: .text+0x%x " 591 "relocation type %s for symbol \"%s\" failed\n", 592 rel[i].r_offset, r ? r : "UNKNOWN", 593 strtab + sym->st_name); 594 return res; 595 } 596 } 597 598 return 0; 599 } 600 601 static inline void save_gp_address(unsigned int secbase, unsigned int rel) 602 { 603 gp_addr = secbase + rel; 604 gp_offs = gp_addr - (secbase & 0xffff0000); 605 } 606 /* end module-elf32.c */ 607 608 609 610 /* Change all symbols so that sh_value encodes the pointer directly. */ 611 static void simplify_symbols(Elf_Shdr * sechdrs, 612 unsigned int symindex, 613 const char *strtab, 614 const char *secstrings, 615 unsigned int nsecs, struct module *mod) 616 { 617 Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; 618 unsigned long secbase, bssbase = 0; 619 unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); 620 int size; 621 622 /* find the .bss section for COMMON symbols */ 623 for (i = 0; i < nsecs; i++) { 624 if (strncmp(secstrings + sechdrs[i].sh_name, ".bss", 4) == 0) { 625 bssbase = sechdrs[i].sh_addr; 626 break; 627 } 628 } 629 630 for (i = 1; i < n; i++) { 631 switch (sym[i].st_shndx) { 632 case SHN_COMMON: 633 /* Allocate space for the symbol in the .bss section. 634 st_value is currently size. 635 We want it to have the address of the symbol. */ 636 637 size = sym[i].st_value; 638 sym[i].st_value = bssbase; 639 640 bssbase += size; 641 break; 642 643 case SHN_ABS: 644 /* Don't need to do anything */ 645 break; 646 647 case SHN_UNDEF: 648 /* ret = -ENOENT; */ 649 break; 650 651 case SHN_MIPS_SCOMMON: 652 printk(KERN_DEBUG "simplify_symbols: ignoring SHN_MIPS_SCOMMON " 653 "symbol <%s> st_shndx %d\n", strtab + sym[i].st_name, 654 sym[i].st_shndx); 655 // .sbss section 656 break; 657 658 default: 659 secbase = sechdrs[sym[i].st_shndx].sh_addr; 660 661 if (strncmp(strtab + sym[i].st_name, "_gp", 3) == 0) { 662 save_gp_address(secbase, sym[i].st_value); 663 } 664 665 sym[i].st_value += secbase; 666 break; 667 } 668 } 669 } 670 671 #ifdef DEBUG_ELFLOADER 672 static void dump_elfsymbols(Elf_Shdr * sechdrs, unsigned int symindex, 673 const char *strtab, struct module *mod) 674 { 675 Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; 676 unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); 677 678 printk(KERN_DEBUG "dump_elfsymbols: n %d\n", n); 679 for (i = 1; i < n; i++) { 680 printk(KERN_DEBUG " i %d name <%s> 0x%x\n", i, 681 strtab + sym[i].st_name, sym[i].st_value); 682 } 683 } 684 #endif 685 686 /* We are prepared so configure and start the VPE... */ 687 static int vpe_run(struct vpe * v) 688 { 689 unsigned long flags, val, dmt_flag; 690 struct vpe_notifications *n; 691 unsigned int vpeflags; 692 struct tc *t; 693 694 /* check we are the Master VPE */ 695 local_irq_save(flags); 696 val = read_c0_vpeconf0(); 697 if (!(val & VPECONF0_MVP)) { 698 printk(KERN_WARNING 699 "VPE loader: only Master VPE's are allowed to configure MT\n"); 700 local_irq_restore(flags); 701 702 return -1; 703 } 704 705 dmt_flag = dmt(); 706 vpeflags = dvpe(); 707 708 if (!list_empty(&v->tc)) { 709 if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { 710 evpe(vpeflags); 711 emt(dmt_flag); 712 local_irq_restore(flags); 713 714 printk(KERN_WARNING 715 "VPE loader: TC %d is already in use.\n", 716 t->index); 717 return -ENOEXEC; 718 } 719 } else { 720 evpe(vpeflags); 721 emt(dmt_flag); 722 local_irq_restore(flags); 723 724 printk(KERN_WARNING 725 "VPE loader: No TC's associated with VPE %d\n", 726 v->minor); 727 728 return -ENOEXEC; 729 } 730 731 /* Put MVPE's into 'configuration state' */ 732 set_c0_mvpcontrol(MVPCONTROL_VPC); 733 734 settc(t->index); 735 736 /* should check it is halted, and not activated */ 737 if ((read_tc_c0_tcstatus() & TCSTATUS_A) || !(read_tc_c0_tchalt() & TCHALT_H)) { 738 evpe(vpeflags); 739 emt(dmt_flag); 740 local_irq_restore(flags); 741 742 printk(KERN_WARNING "VPE loader: TC %d is already active!\n", 743 t->index); 744 745 return -ENOEXEC; 746 } 747 748 /* Write the address we want it to start running from in the TCPC register. */ 749 write_tc_c0_tcrestart((unsigned long)v->__start); 750 write_tc_c0_tccontext((unsigned long)0); 751 752 /* 753 * Mark the TC as activated, not interrupt exempt and not dynamically 754 * allocatable 755 */ 756 val = read_tc_c0_tcstatus(); 757 val = (val & ~(TCSTATUS_DA | TCSTATUS_IXMT)) | TCSTATUS_A; 758 write_tc_c0_tcstatus(val); 759 760 write_tc_c0_tchalt(read_tc_c0_tchalt() & ~TCHALT_H); 761 762 /* 763 * The sde-kit passes 'memsize' to __start in $a3, so set something 764 * here... Or set $a3 to zero and define DFLT_STACK_SIZE and 765 * DFLT_HEAP_SIZE when you compile your program 766 */ 767 mttgpr(6, v->ntcs); 768 mttgpr(7, physical_memsize); 769 770 /* set up VPE1 */ 771 /* 772 * bind the TC to VPE 1 as late as possible so we only have the final 773 * VPE registers to set up, and so an EJTAG probe can trigger on it 774 */ 775 write_tc_c0_tcbind((read_tc_c0_tcbind() & ~TCBIND_CURVPE) | 1); 776 777 write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~(VPECONF0_VPA)); 778 779 back_to_back_c0_hazard(); 780 781 /* Set up the XTC bit in vpeconf0 to point at our tc */ 782 write_vpe_c0_vpeconf0( (read_vpe_c0_vpeconf0() & ~(VPECONF0_XTC)) 783 | (t->index << VPECONF0_XTC_SHIFT)); 784 785 back_to_back_c0_hazard(); 786 787 /* enable this VPE */ 788 write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() | VPECONF0_VPA); 789 790 /* clear out any left overs from a previous program */ 791 write_vpe_c0_status(0); 792 write_vpe_c0_cause(0); 793 794 /* take system out of configuration state */ 795 clear_c0_mvpcontrol(MVPCONTROL_VPC); 796 797 /* 798 * SMTC/SMVP kernels manage VPE enable independently, 799 * but uniprocessor kernels need to turn it on, even 800 * if that wasn't the pre-dvpe() state. 801 */ 802 #ifdef CONFIG_SMP 803 evpe(vpeflags); 804 #else 805 evpe(EVPE_ENABLE); 806 #endif 807 emt(dmt_flag); 808 local_irq_restore(flags); 809 810 list_for_each_entry(n, &v->notify, list) 811 n->start(minor); 812 813 return 0; 814 } 815 816 static int find_vpe_symbols(struct vpe * v, Elf_Shdr * sechdrs, 817 unsigned int symindex, const char *strtab, 818 struct module *mod) 819 { 820 Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; 821 unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); 822 823 for (i = 1; i < n; i++) { 824 if (strcmp(strtab + sym[i].st_name, "__start") == 0) { 825 v->__start = sym[i].st_value; 826 } 827 828 if (strcmp(strtab + sym[i].st_name, "vpe_shared") == 0) { 829 v->shared_ptr = (void *)sym[i].st_value; 830 } 831 } 832 833 if ( (v->__start == 0) || (v->shared_ptr == NULL)) 834 return -1; 835 836 return 0; 837 } 838 839 /* 840 * Allocates a VPE with some program code space(the load address), copies the 841 * contents of the program (p)buffer performing relocatations/etc, free's it 842 * when finished. 843 */ 844 static int vpe_elfload(struct vpe * v) 845 { 846 Elf_Ehdr *hdr; 847 Elf_Shdr *sechdrs; 848 long err = 0; 849 char *secstrings, *strtab = NULL; 850 unsigned int len, i, symindex = 0, strindex = 0, relocate = 0; 851 struct module mod; // so we can re-use the relocations code 852 853 memset(&mod, 0, sizeof(struct module)); 854 strcpy(mod.name, "VPE loader"); 855 856 hdr = (Elf_Ehdr *) v->pbuffer; 857 len = v->plen; 858 859 /* Sanity checks against insmoding binaries or wrong arch, 860 weird elf version */ 861 if (memcmp(hdr->e_ident, ELFMAG, SELFMAG) != 0 862 || (hdr->e_type != ET_REL && hdr->e_type != ET_EXEC) 863 || !elf_check_arch(hdr) 864 || hdr->e_shentsize != sizeof(*sechdrs)) { 865 printk(KERN_WARNING 866 "VPE loader: program wrong arch or weird elf version\n"); 867 868 return -ENOEXEC; 869 } 870 871 if (hdr->e_type == ET_REL) 872 relocate = 1; 873 874 if (len < hdr->e_shoff + hdr->e_shnum * sizeof(Elf_Shdr)) { 875 printk(KERN_ERR "VPE loader: program length %u truncated\n", 876 len); 877 878 return -ENOEXEC; 879 } 880 881 /* Convenience variables */ 882 sechdrs = (void *)hdr + hdr->e_shoff; 883 secstrings = (void *)hdr + sechdrs[hdr->e_shstrndx].sh_offset; 884 sechdrs[0].sh_addr = 0; 885 886 /* And these should exist, but gcc whinges if we don't init them */ 887 symindex = strindex = 0; 888 889 if (relocate) { 890 for (i = 1; i < hdr->e_shnum; i++) { 891 if (sechdrs[i].sh_type != SHT_NOBITS 892 && len < sechdrs[i].sh_offset + sechdrs[i].sh_size) { 893 printk(KERN_ERR "VPE program length %u truncated\n", 894 len); 895 return -ENOEXEC; 896 } 897 898 /* Mark all sections sh_addr with their address in the 899 temporary image. */ 900 sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; 901 902 /* Internal symbols and strings. */ 903 if (sechdrs[i].sh_type == SHT_SYMTAB) { 904 symindex = i; 905 strindex = sechdrs[i].sh_link; 906 strtab = (char *)hdr + sechdrs[strindex].sh_offset; 907 } 908 } 909 layout_sections(&mod, hdr, sechdrs, secstrings); 910 } 911 912 v->load_addr = alloc_progmem(mod.core_size); 913 if (!v->load_addr) 914 return -ENOMEM; 915 916 pr_info("VPE loader: loading to %p\n", v->load_addr); 917 918 if (relocate) { 919 for (i = 0; i < hdr->e_shnum; i++) { 920 void *dest; 921 922 if (!(sechdrs[i].sh_flags & SHF_ALLOC)) 923 continue; 924 925 dest = v->load_addr + sechdrs[i].sh_entsize; 926 927 if (sechdrs[i].sh_type != SHT_NOBITS) 928 memcpy(dest, (void *)sechdrs[i].sh_addr, 929 sechdrs[i].sh_size); 930 /* Update sh_addr to point to copy in image. */ 931 sechdrs[i].sh_addr = (unsigned long)dest; 932 933 printk(KERN_DEBUG " section sh_name %s sh_addr 0x%x\n", 934 secstrings + sechdrs[i].sh_name, sechdrs[i].sh_addr); 935 } 936 937 /* Fix up syms, so that st_value is a pointer to location. */ 938 simplify_symbols(sechdrs, symindex, strtab, secstrings, 939 hdr->e_shnum, &mod); 940 941 /* Now do relocations. */ 942 for (i = 1; i < hdr->e_shnum; i++) { 943 const char *strtab = (char *)sechdrs[strindex].sh_addr; 944 unsigned int info = sechdrs[i].sh_info; 945 946 /* Not a valid relocation section? */ 947 if (info >= hdr->e_shnum) 948 continue; 949 950 /* Don't bother with non-allocated sections */ 951 if (!(sechdrs[info].sh_flags & SHF_ALLOC)) 952 continue; 953 954 if (sechdrs[i].sh_type == SHT_REL) 955 err = apply_relocations(sechdrs, strtab, symindex, i, 956 &mod); 957 else if (sechdrs[i].sh_type == SHT_RELA) 958 err = apply_relocate_add(sechdrs, strtab, symindex, i, 959 &mod); 960 if (err < 0) 961 return err; 962 963 } 964 } else { 965 struct elf_phdr *phdr = (struct elf_phdr *) ((char *)hdr + hdr->e_phoff); 966 967 for (i = 0; i < hdr->e_phnum; i++) { 968 if (phdr->p_type == PT_LOAD) { 969 memcpy((void *)phdr->p_paddr, 970 (char *)hdr + phdr->p_offset, 971 phdr->p_filesz); 972 memset((void *)phdr->p_paddr + phdr->p_filesz, 973 0, phdr->p_memsz - phdr->p_filesz); 974 } 975 phdr++; 976 } 977 978 for (i = 0; i < hdr->e_shnum; i++) { 979 /* Internal symbols and strings. */ 980 if (sechdrs[i].sh_type == SHT_SYMTAB) { 981 symindex = i; 982 strindex = sechdrs[i].sh_link; 983 strtab = (char *)hdr + sechdrs[strindex].sh_offset; 984 985 /* mark the symtab's address for when we try to find the 986 magic symbols */ 987 sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; 988 } 989 } 990 } 991 992 /* make sure it's physically written out */ 993 flush_icache_range((unsigned long)v->load_addr, 994 (unsigned long)v->load_addr + v->len); 995 996 if ((find_vpe_symbols(v, sechdrs, symindex, strtab, &mod)) < 0) { 997 if (v->__start == 0) { 998 printk(KERN_WARNING "VPE loader: program does not contain " 999 "a __start symbol\n"); 1000 return -ENOEXEC; 1001 } 1002 1003 if (v->shared_ptr == NULL) 1004 printk(KERN_WARNING "VPE loader: " 1005 "program does not contain vpe_shared symbol.\n" 1006 " Unable to use AMVP (AP/SP) facilities.\n"); 1007 } 1008 1009 printk(" elf loaded\n"); 1010 return 0; 1011 } 1012 1013 static void cleanup_tc(struct tc *tc) 1014 { 1015 unsigned long flags; 1016 unsigned int mtflags, vpflags; 1017 int tmp; 1018 1019 local_irq_save(flags); 1020 mtflags = dmt(); 1021 vpflags = dvpe(); 1022 /* Put MVPE's into 'configuration state' */ 1023 set_c0_mvpcontrol(MVPCONTROL_VPC); 1024 1025 settc(tc->index); 1026 tmp = read_tc_c0_tcstatus(); 1027 1028 /* mark not allocated and not dynamically allocatable */ 1029 tmp &= ~(TCSTATUS_A | TCSTATUS_DA); 1030 tmp |= TCSTATUS_IXMT; /* interrupt exempt */ 1031 write_tc_c0_tcstatus(tmp); 1032 1033 write_tc_c0_tchalt(TCHALT_H); 1034 mips_ihb(); 1035 1036 /* bind it to anything other than VPE1 */ 1037 // write_tc_c0_tcbind(read_tc_c0_tcbind() & ~TCBIND_CURVPE); // | TCBIND_CURVPE 1038 1039 clear_c0_mvpcontrol(MVPCONTROL_VPC); 1040 evpe(vpflags); 1041 emt(mtflags); 1042 local_irq_restore(flags); 1043 } 1044 1045 static int getcwd(char *buff, int size) 1046 { 1047 mm_segment_t old_fs; 1048 int ret; 1049 1050 old_fs = get_fs(); 1051 set_fs(KERNEL_DS); 1052 1053 ret = sys_getcwd(buff, size); 1054 1055 set_fs(old_fs); 1056 1057 return ret; 1058 } 1059 1060 /* checks VPE is unused and gets ready to load program */ 1061 static int vpe_open(struct inode *inode, struct file *filp) 1062 { 1063 enum vpe_state state; 1064 struct vpe_notifications *not; 1065 struct vpe *v; 1066 int ret; 1067 1068 if (minor != iminor(inode)) { 1069 /* assume only 1 device at the moment. */ 1070 pr_warning("VPE loader: only vpe1 is supported\n"); 1071 1072 return -ENODEV; 1073 } 1074 1075 if ((v = get_vpe(tclimit)) == NULL) { 1076 pr_warning("VPE loader: unable to get vpe\n"); 1077 1078 return -ENODEV; 1079 } 1080 1081 state = xchg(&v->state, VPE_STATE_INUSE); 1082 if (state != VPE_STATE_UNUSED) { 1083 printk(KERN_DEBUG "VPE loader: tc in use dumping regs\n"); 1084 1085 list_for_each_entry(not, &v->notify, list) { 1086 not->stop(tclimit); 1087 } 1088 1089 release_progmem(v->load_addr); 1090 cleanup_tc(get_tc(tclimit)); 1091 } 1092 1093 /* this of-course trashes what was there before... */ 1094 v->pbuffer = vmalloc(P_SIZE); 1095 v->plen = P_SIZE; 1096 v->load_addr = NULL; 1097 v->len = 0; 1098 1099 v->uid = filp->f_cred->fsuid; 1100 v->gid = filp->f_cred->fsgid; 1101 1102 #ifdef CONFIG_MIPS_APSP_KSPD 1103 /* get kspd to tell us when a syscall_exit happens */ 1104 if (!kspd_events_reqd) { 1105 kspd_notify(&kspd_events); 1106 kspd_events_reqd++; 1107 } 1108 #endif 1109 1110 v->cwd[0] = 0; 1111 ret = getcwd(v->cwd, VPE_PATH_MAX); 1112 if (ret < 0) 1113 printk(KERN_WARNING "VPE loader: open, getcwd returned %d\n", ret); 1114 1115 v->shared_ptr = NULL; 1116 v->__start = 0; 1117 1118 return 0; 1119 } 1120 1121 static int vpe_release(struct inode *inode, struct file *filp) 1122 { 1123 struct vpe *v; 1124 Elf_Ehdr *hdr; 1125 int ret = 0; 1126 1127 v = get_vpe(tclimit); 1128 if (v == NULL) 1129 return -ENODEV; 1130 1131 hdr = (Elf_Ehdr *) v->pbuffer; 1132 if (memcmp(hdr->e_ident, ELFMAG, SELFMAG) == 0) { 1133 if (vpe_elfload(v) >= 0) { 1134 vpe_run(v); 1135 } else { 1136 printk(KERN_WARNING "VPE loader: ELF load failed.\n"); 1137 ret = -ENOEXEC; 1138 } 1139 } else { 1140 printk(KERN_WARNING "VPE loader: only elf files are supported\n"); 1141 ret = -ENOEXEC; 1142 } 1143 1144 /* It's good to be able to run the SP and if it chokes have a look at 1145 the /dev/rt?. But if we reset the pointer to the shared struct we 1146 lose what has happened. So perhaps if garbage is sent to the vpe 1147 device, use it as a trigger for the reset. Hopefully a nice 1148 executable will be along shortly. */ 1149 if (ret < 0) 1150 v->shared_ptr = NULL; 1151 1152 // cleanup any temp buffers 1153 if (v->pbuffer) 1154 vfree(v->pbuffer); 1155 v->plen = 0; 1156 return ret; 1157 } 1158 1159 static ssize_t vpe_write(struct file *file, const char __user * buffer, 1160 size_t count, loff_t * ppos) 1161 { 1162 size_t ret = count; 1163 struct vpe *v; 1164 1165 if (iminor(file->f_path.dentry->d_inode) != minor) 1166 return -ENODEV; 1167 1168 v = get_vpe(tclimit); 1169 if (v == NULL) 1170 return -ENODEV; 1171 1172 if (v->pbuffer == NULL) { 1173 printk(KERN_ERR "VPE loader: no buffer for program\n"); 1174 return -ENOMEM; 1175 } 1176 1177 if ((count + v->len) > v->plen) { 1178 printk(KERN_WARNING 1179 "VPE loader: elf size too big. Perhaps strip uneeded symbols\n"); 1180 return -ENOMEM; 1181 } 1182 1183 count -= copy_from_user(v->pbuffer + v->len, buffer, count); 1184 if (!count) 1185 return -EFAULT; 1186 1187 v->len += count; 1188 return ret; 1189 } 1190 1191 static const struct file_operations vpe_fops = { 1192 .owner = THIS_MODULE, 1193 .open = vpe_open, 1194 .release = vpe_release, 1195 .write = vpe_write 1196 }; 1197 1198 /* module wrapper entry points */ 1199 /* give me a vpe */ 1200 vpe_handle vpe_alloc(void) 1201 { 1202 int i; 1203 struct vpe *v; 1204 1205 /* find a vpe */ 1206 for (i = 1; i < MAX_VPES; i++) { 1207 if ((v = get_vpe(i)) != NULL) { 1208 v->state = VPE_STATE_INUSE; 1209 return v; 1210 } 1211 } 1212 return NULL; 1213 } 1214 1215 EXPORT_SYMBOL(vpe_alloc); 1216 1217 /* start running from here */ 1218 int vpe_start(vpe_handle vpe, unsigned long start) 1219 { 1220 struct vpe *v = vpe; 1221 1222 v->__start = start; 1223 return vpe_run(v); 1224 } 1225 1226 EXPORT_SYMBOL(vpe_start); 1227 1228 /* halt it for now */ 1229 int vpe_stop(vpe_handle vpe) 1230 { 1231 struct vpe *v = vpe; 1232 struct tc *t; 1233 unsigned int evpe_flags; 1234 1235 evpe_flags = dvpe(); 1236 1237 if ((t = list_entry(v->tc.next, struct tc, tc)) != NULL) { 1238 1239 settc(t->index); 1240 write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); 1241 } 1242 1243 evpe(evpe_flags); 1244 1245 return 0; 1246 } 1247 1248 EXPORT_SYMBOL(vpe_stop); 1249 1250 /* I've done with it thank you */ 1251 int vpe_free(vpe_handle vpe) 1252 { 1253 struct vpe *v = vpe; 1254 struct tc *t; 1255 unsigned int evpe_flags; 1256 1257 if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { 1258 return -ENOEXEC; 1259 } 1260 1261 evpe_flags = dvpe(); 1262 1263 /* Put MVPE's into 'configuration state' */ 1264 set_c0_mvpcontrol(MVPCONTROL_VPC); 1265 1266 settc(t->index); 1267 write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); 1268 1269 /* halt the TC */ 1270 write_tc_c0_tchalt(TCHALT_H); 1271 mips_ihb(); 1272 1273 /* mark the TC unallocated */ 1274 write_tc_c0_tcstatus(read_tc_c0_tcstatus() & ~TCSTATUS_A); 1275 1276 v->state = VPE_STATE_UNUSED; 1277 1278 clear_c0_mvpcontrol(MVPCONTROL_VPC); 1279 evpe(evpe_flags); 1280 1281 return 0; 1282 } 1283 1284 EXPORT_SYMBOL(vpe_free); 1285 1286 void *vpe_get_shared(int index) 1287 { 1288 struct vpe *v; 1289 1290 if ((v = get_vpe(index)) == NULL) 1291 return NULL; 1292 1293 return v->shared_ptr; 1294 } 1295 1296 EXPORT_SYMBOL(vpe_get_shared); 1297 1298 int vpe_getuid(int index) 1299 { 1300 struct vpe *v; 1301 1302 if ((v = get_vpe(index)) == NULL) 1303 return -1; 1304 1305 return v->uid; 1306 } 1307 1308 EXPORT_SYMBOL(vpe_getuid); 1309 1310 int vpe_getgid(int index) 1311 { 1312 struct vpe *v; 1313 1314 if ((v = get_vpe(index)) == NULL) 1315 return -1; 1316 1317 return v->gid; 1318 } 1319 1320 EXPORT_SYMBOL(vpe_getgid); 1321 1322 int vpe_notify(int index, struct vpe_notifications *notify) 1323 { 1324 struct vpe *v; 1325 1326 if ((v = get_vpe(index)) == NULL) 1327 return -1; 1328 1329 list_add(¬ify->list, &v->notify); 1330 return 0; 1331 } 1332 1333 EXPORT_SYMBOL(vpe_notify); 1334 1335 char *vpe_getcwd(int index) 1336 { 1337 struct vpe *v; 1338 1339 if ((v = get_vpe(index)) == NULL) 1340 return NULL; 1341 1342 return v->cwd; 1343 } 1344 1345 EXPORT_SYMBOL(vpe_getcwd); 1346 1347 #ifdef CONFIG_MIPS_APSP_KSPD 1348 static void kspd_sp_exit( int sp_id) 1349 { 1350 cleanup_tc(get_tc(sp_id)); 1351 } 1352 #endif 1353 1354 static ssize_t store_kill(struct device *dev, struct device_attribute *attr, 1355 const char *buf, size_t len) 1356 { 1357 struct vpe *vpe = get_vpe(tclimit); 1358 struct vpe_notifications *not; 1359 1360 list_for_each_entry(not, &vpe->notify, list) { 1361 not->stop(tclimit); 1362 } 1363 1364 release_progmem(vpe->load_addr); 1365 cleanup_tc(get_tc(tclimit)); 1366 vpe_stop(vpe); 1367 vpe_free(vpe); 1368 1369 return len; 1370 } 1371 1372 static ssize_t show_ntcs(struct device *cd, struct device_attribute *attr, 1373 char *buf) 1374 { 1375 struct vpe *vpe = get_vpe(tclimit); 1376 1377 return sprintf(buf, "%d\n", vpe->ntcs); 1378 } 1379 1380 static ssize_t store_ntcs(struct device *dev, struct device_attribute *attr, 1381 const char *buf, size_t len) 1382 { 1383 struct vpe *vpe = get_vpe(tclimit); 1384 unsigned long new; 1385 char *endp; 1386 1387 new = simple_strtoul(buf, &endp, 0); 1388 if (endp == buf) 1389 goto out_einval; 1390 1391 if (new == 0 || new > (hw_tcs - tclimit)) 1392 goto out_einval; 1393 1394 vpe->ntcs = new; 1395 1396 return len; 1397 1398 out_einval: 1399 return -EINVAL; 1400 } 1401 1402 static struct device_attribute vpe_class_attributes[] = { 1403 __ATTR(kill, S_IWUSR, NULL, store_kill), 1404 __ATTR(ntcs, S_IRUGO | S_IWUSR, show_ntcs, store_ntcs), 1405 {} 1406 }; 1407 1408 static void vpe_device_release(struct device *cd) 1409 { 1410 kfree(cd); 1411 } 1412 1413 struct class vpe_class = { 1414 .name = "vpe", 1415 .owner = THIS_MODULE, 1416 .dev_release = vpe_device_release, 1417 .dev_attrs = vpe_class_attributes, 1418 }; 1419 1420 struct device vpe_device; 1421 1422 static int __init vpe_module_init(void) 1423 { 1424 unsigned int mtflags, vpflags; 1425 unsigned long flags, val; 1426 struct vpe *v = NULL; 1427 struct tc *t; 1428 int tc, err; 1429 1430 if (!cpu_has_mipsmt) { 1431 printk("VPE loader: not a MIPS MT capable processor\n"); 1432 return -ENODEV; 1433 } 1434 1435 if (vpelimit == 0) { 1436 printk(KERN_WARNING "No VPEs reserved for AP/SP, not " 1437 "initializing VPE loader.\nPass maxvpes=<n> argument as " 1438 "kernel argument\n"); 1439 1440 return -ENODEV; 1441 } 1442 1443 if (tclimit == 0) { 1444 printk(KERN_WARNING "No TCs reserved for AP/SP, not " 1445 "initializing VPE loader.\nPass maxtcs=<n> argument as " 1446 "kernel argument\n"); 1447 1448 return -ENODEV; 1449 } 1450 1451 major = register_chrdev(0, module_name, &vpe_fops); 1452 if (major < 0) { 1453 printk("VPE loader: unable to register character device\n"); 1454 return major; 1455 } 1456 1457 err = class_register(&vpe_class); 1458 if (err) { 1459 printk(KERN_ERR "vpe_class registration failed\n"); 1460 goto out_chrdev; 1461 } 1462 1463 device_initialize(&vpe_device); 1464 vpe_device.class = &vpe_class, 1465 vpe_device.parent = NULL, 1466 dev_set_name(&vpe_device, "vpe1"); 1467 vpe_device.devt = MKDEV(major, minor); 1468 err = device_add(&vpe_device); 1469 if (err) { 1470 printk(KERN_ERR "Adding vpe_device failed\n"); 1471 goto out_class; 1472 } 1473 1474 local_irq_save(flags); 1475 mtflags = dmt(); 1476 vpflags = dvpe(); 1477 1478 /* Put MVPE's into 'configuration state' */ 1479 set_c0_mvpcontrol(MVPCONTROL_VPC); 1480 1481 /* dump_mtregs(); */ 1482 1483 val = read_c0_mvpconf0(); 1484 hw_tcs = (val & MVPCONF0_PTC) + 1; 1485 hw_vpes = ((val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT) + 1; 1486 1487 for (tc = tclimit; tc < hw_tcs; tc++) { 1488 /* 1489 * Must re-enable multithreading temporarily or in case we 1490 * reschedule send IPIs or similar we might hang. 1491 */ 1492 clear_c0_mvpcontrol(MVPCONTROL_VPC); 1493 evpe(vpflags); 1494 emt(mtflags); 1495 local_irq_restore(flags); 1496 t = alloc_tc(tc); 1497 if (!t) { 1498 err = -ENOMEM; 1499 goto out; 1500 } 1501 1502 local_irq_save(flags); 1503 mtflags = dmt(); 1504 vpflags = dvpe(); 1505 set_c0_mvpcontrol(MVPCONTROL_VPC); 1506 1507 /* VPE's */ 1508 if (tc < hw_tcs) { 1509 settc(tc); 1510 1511 if ((v = alloc_vpe(tc)) == NULL) { 1512 printk(KERN_WARNING "VPE: unable to allocate VPE\n"); 1513 1514 goto out_reenable; 1515 } 1516 1517 v->ntcs = hw_tcs - tclimit; 1518 1519 /* add the tc to the list of this vpe's tc's. */ 1520 list_add(&t->tc, &v->tc); 1521 1522 /* deactivate all but vpe0 */ 1523 if (tc >= tclimit) { 1524 unsigned long tmp = read_vpe_c0_vpeconf0(); 1525 1526 tmp &= ~VPECONF0_VPA; 1527 1528 /* master VPE */ 1529 tmp |= VPECONF0_MVP; 1530 write_vpe_c0_vpeconf0(tmp); 1531 } 1532 1533 /* disable multi-threading with TC's */ 1534 write_vpe_c0_vpecontrol(read_vpe_c0_vpecontrol() & ~VPECONTROL_TE); 1535 1536 if (tc >= vpelimit) { 1537 /* 1538 * Set config to be the same as vpe0, 1539 * particularly kseg0 coherency alg 1540 */ 1541 write_vpe_c0_config(read_c0_config()); 1542 } 1543 } 1544 1545 /* TC's */ 1546 t->pvpe = v; /* set the parent vpe */ 1547 1548 if (tc >= tclimit) { 1549 unsigned long tmp; 1550 1551 settc(tc); 1552 1553 /* Any TC that is bound to VPE0 gets left as is - in case 1554 we are running SMTC on VPE0. A TC that is bound to any 1555 other VPE gets bound to VPE0, ideally I'd like to make 1556 it homeless but it doesn't appear to let me bind a TC 1557 to a non-existent VPE. Which is perfectly reasonable. 1558 1559 The (un)bound state is visible to an EJTAG probe so may 1560 notify GDB... 1561 */ 1562 1563 if (((tmp = read_tc_c0_tcbind()) & TCBIND_CURVPE)) { 1564 /* tc is bound >vpe0 */ 1565 write_tc_c0_tcbind(tmp & ~TCBIND_CURVPE); 1566 1567 t->pvpe = get_vpe(0); /* set the parent vpe */ 1568 } 1569 1570 /* halt the TC */ 1571 write_tc_c0_tchalt(TCHALT_H); 1572 mips_ihb(); 1573 1574 tmp = read_tc_c0_tcstatus(); 1575 1576 /* mark not activated and not dynamically allocatable */ 1577 tmp &= ~(TCSTATUS_A | TCSTATUS_DA); 1578 tmp |= TCSTATUS_IXMT; /* interrupt exempt */ 1579 write_tc_c0_tcstatus(tmp); 1580 } 1581 } 1582 1583 out_reenable: 1584 /* release config state */ 1585 clear_c0_mvpcontrol(MVPCONTROL_VPC); 1586 1587 evpe(vpflags); 1588 emt(mtflags); 1589 local_irq_restore(flags); 1590 1591 #ifdef CONFIG_MIPS_APSP_KSPD 1592 kspd_events.kspd_sp_exit = kspd_sp_exit; 1593 #endif 1594 return 0; 1595 1596 out_class: 1597 class_unregister(&vpe_class); 1598 out_chrdev: 1599 unregister_chrdev(major, module_name); 1600 1601 out: 1602 return err; 1603 } 1604 1605 static void __exit vpe_module_exit(void) 1606 { 1607 struct vpe *v, *n; 1608 1609 device_del(&vpe_device); 1610 unregister_chrdev(major, module_name); 1611 1612 /* No locking needed here */ 1613 list_for_each_entry_safe(v, n, &vpecontrol.vpe_list, list) { 1614 if (v->state != VPE_STATE_UNUSED) 1615 release_vpe(v); 1616 } 1617 } 1618 1619 module_init(vpe_module_init); 1620 module_exit(vpe_module_exit); 1621 MODULE_DESCRIPTION("MIPS VPE Loader"); 1622 MODULE_AUTHOR("Elizabeth Oldham, MIPS Technologies, Inc."); 1623 MODULE_LICENSE("GPL"); 1624