xref: /freebsd/sys/powerpc/powerpc/machdep.c (revision 5bf5ca772c6de2d53344a78cf461447cc322ccea)
1 /*-
2  * Copyright (C) 1995, 1996 Wolfgang Solfrank.
3  * Copyright (C) 1995, 1996 TooLs GmbH.
4  * All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  * 3. All advertising materials mentioning features or use of this software
15  *    must display the following acknowledgement:
16  *      This product includes software developed by TooLs GmbH.
17  * 4. The name of TooLs GmbH may not be used to endorse or promote products
18  *    derived from this software without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY TOOLS GMBH ``AS IS'' AND ANY EXPRESS OR
21  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
22  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
23  * IN NO EVENT SHALL TOOLS GMBH BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
26  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
27  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
28  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
29  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30  */
31 /*-
32  * Copyright (C) 2001 Benno Rice
33  * All rights reserved.
34  *
35  * Redistribution and use in source and binary forms, with or without
36  * modification, are permitted provided that the following conditions
37  * are met:
38  * 1. Redistributions of source code must retain the above copyright
39  *    notice, this list of conditions and the following disclaimer.
40  * 2. Redistributions in binary form must reproduce the above copyright
41  *    notice, this list of conditions and the following disclaimer in the
42  *    documentation and/or other materials provided with the distribution.
43  *
44  * THIS SOFTWARE IS PROVIDED BY Benno Rice ``AS IS'' AND ANY EXPRESS OR
45  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
46  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
47  * IN NO EVENT SHALL TOOLS GMBH BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
48  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
49  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
50  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
51  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
52  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
53  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
54  *	$NetBSD: machdep.c,v 1.74.2.1 2000/11/01 16:13:48 tv Exp $
55  */
56 
57 #include <sys/cdefs.h>
58 __FBSDID("$FreeBSD$");
59 
60 #include "opt_compat.h"
61 #include "opt_ddb.h"
62 #include "opt_kstack_pages.h"
63 #include "opt_platform.h"
64 
65 #include <sys/param.h>
66 #include <sys/proc.h>
67 #include <sys/systm.h>
68 #include <sys/bio.h>
69 #include <sys/buf.h>
70 #include <sys/bus.h>
71 #include <sys/cons.h>
72 #include <sys/cpu.h>
73 #include <sys/eventhandler.h>
74 #include <sys/exec.h>
75 #include <sys/imgact.h>
76 #include <sys/kdb.h>
77 #include <sys/kernel.h>
78 #include <sys/ktr.h>
79 #include <sys/linker.h>
80 #include <sys/lock.h>
81 #include <sys/malloc.h>
82 #include <sys/mbuf.h>
83 #include <sys/msgbuf.h>
84 #include <sys/mutex.h>
85 #include <sys/ptrace.h>
86 #include <sys/reboot.h>
87 #include <sys/rwlock.h>
88 #include <sys/signalvar.h>
89 #include <sys/syscallsubr.h>
90 #include <sys/sysctl.h>
91 #include <sys/sysent.h>
92 #include <sys/sysproto.h>
93 #include <sys/ucontext.h>
94 #include <sys/uio.h>
95 #include <sys/vmmeter.h>
96 #include <sys/vnode.h>
97 
98 #include <net/netisr.h>
99 
100 #include <vm/vm.h>
101 #include <vm/vm_extern.h>
102 #include <vm/vm_kern.h>
103 #include <vm/vm_page.h>
104 #include <vm/vm_map.h>
105 #include <vm/vm_object.h>
106 #include <vm/vm_pager.h>
107 
108 #include <machine/altivec.h>
109 #ifndef __powerpc64__
110 #include <machine/bat.h>
111 #endif
112 #include <machine/cpu.h>
113 #include <machine/elf.h>
114 #include <machine/fpu.h>
115 #include <machine/hid.h>
116 #include <machine/kdb.h>
117 #include <machine/md_var.h>
118 #include <machine/metadata.h>
119 #include <machine/mmuvar.h>
120 #include <machine/pcb.h>
121 #include <machine/reg.h>
122 #include <machine/sigframe.h>
123 #include <machine/spr.h>
124 #include <machine/trap.h>
125 #include <machine/vmparam.h>
126 #include <machine/ofw_machdep.h>
127 
128 #include <ddb/ddb.h>
129 
130 #include <dev/ofw/openfirm.h>
131 #include <dev/ofw/ofw_subr.h>
132 
133 int cold = 1;
134 #ifdef __powerpc64__
135 int cacheline_size = 128;
136 #else
137 int cacheline_size = 32;
138 #endif
139 int hw_direct_map = 1;
140 
141 extern void *ap_pcpu;
142 
143 struct pcpu __pcpu[MAXCPU];
144 static char init_kenv[2048];
145 
146 static struct trapframe frame0;
147 
148 char		machine[] = "powerpc";
149 SYSCTL_STRING(_hw, HW_MACHINE, machine, CTLFLAG_RD, machine, 0, "");
150 
151 static void	cpu_startup(void *);
152 SYSINIT(cpu, SI_SUB_CPU, SI_ORDER_FIRST, cpu_startup, NULL);
153 
154 SYSCTL_INT(_machdep, CPU_CACHELINE, cacheline_size,
155 	   CTLFLAG_RD, &cacheline_size, 0, "");
156 
157 uintptr_t	powerpc_init(vm_offset_t, vm_offset_t, vm_offset_t, void *,
158 		    uint32_t);
159 
160 long		Maxmem = 0;
161 long		realmem = 0;
162 
163 /* Default MSR values set in the AIM/Book-E early startup code */
164 register_t	psl_kernset;
165 register_t	psl_userset;
166 register_t	psl_userstatic;
167 #ifdef __powerpc64__
168 register_t	psl_userset32;
169 #endif
170 
171 struct kva_md_info kmi;
172 
173 static void
174 cpu_startup(void *dummy)
175 {
176 
177 	/*
178 	 * Initialise the decrementer-based clock.
179 	 */
180 	decr_init();
181 
182 	/*
183 	 * Good {morning,afternoon,evening,night}.
184 	 */
185 	cpu_setup(PCPU_GET(cpuid));
186 
187 #ifdef PERFMON
188 	perfmon_init();
189 #endif
190 	printf("real memory  = %ju (%ju MB)\n", ptoa((uintmax_t)physmem),
191 	    ptoa((uintmax_t)physmem) / 1048576);
192 	realmem = physmem;
193 
194 	if (bootverbose)
195 		printf("available KVA = %zu (%zu MB)\n",
196 		    virtual_end - virtual_avail,
197 		    (virtual_end - virtual_avail) / 1048576);
198 
199 	/*
200 	 * Display any holes after the first chunk of extended memory.
201 	 */
202 	if (bootverbose) {
203 		int indx;
204 
205 		printf("Physical memory chunk(s):\n");
206 		for (indx = 0; phys_avail[indx + 1] != 0; indx += 2) {
207 			vm_paddr_t size1 =
208 			    phys_avail[indx + 1] - phys_avail[indx];
209 
210 			#ifdef __powerpc64__
211 			printf("0x%016jx - 0x%016jx, %ju bytes (%ju pages)\n",
212 			#else
213 			printf("0x%09jx - 0x%09jx, %ju bytes (%ju pages)\n",
214 			#endif
215 			    (uintmax_t)phys_avail[indx],
216 			    (uintmax_t)phys_avail[indx + 1] - 1,
217 			    (uintmax_t)size1, (uintmax_t)size1 / PAGE_SIZE);
218 		}
219 	}
220 
221 	vm_ksubmap_init(&kmi);
222 
223 	printf("avail memory = %ju (%ju MB)\n",
224 	    ptoa((uintmax_t)vm_free_count()),
225 	    ptoa((uintmax_t)vm_free_count()) / 1048576);
226 
227 	/*
228 	 * Set up buffers, so they can be used to read disk labels.
229 	 */
230 	bufinit();
231 	vm_pager_bufferinit();
232 }
233 
234 extern vm_offset_t	__startkernel, __endkernel;
235 extern unsigned char	__bss_start[];
236 extern unsigned char	__sbss_start[];
237 extern unsigned char	__sbss_end[];
238 extern unsigned char	_end[];
239 
240 void aim_cpu_init(vm_offset_t toc);
241 void booke_cpu_init(void);
242 
243 uintptr_t
244 powerpc_init(vm_offset_t fdt, vm_offset_t toc, vm_offset_t ofentry, void *mdp,
245     uint32_t mdp_cookie)
246 {
247 	struct		pcpu *pc;
248 	struct cpuref	bsp;
249 	vm_offset_t	startkernel, endkernel;
250 	void		*kmdp;
251 	char		*env;
252         bool		ofw_bootargs = false;
253 #ifdef DDB
254 	vm_offset_t ksym_start;
255 	vm_offset_t ksym_end;
256 #endif
257 
258 	kmdp = NULL;
259 
260 	/* First guess at start/end kernel positions */
261 	startkernel = __startkernel;
262 	endkernel = __endkernel;
263 
264 	/*
265 	 * If the metadata pointer cookie is not set to the magic value,
266 	 * the number in mdp should be treated as nonsense.
267 	 */
268 	if (mdp_cookie != 0xfb5d104d)
269 		mdp = NULL;
270 
271 #if !defined(BOOKE)
272 	/*
273 	 * On BOOKE the BSS is already cleared and some variables
274 	 * initialized.  Do not wipe them out.
275 	 */
276 	bzero(__sbss_start, __sbss_end - __sbss_start);
277 	bzero(__bss_start, _end - __bss_start);
278 #endif
279 
280 #ifdef AIM
281 	/*
282 	 * If running from an FDT, make sure we are in real mode to avoid
283 	 * tromping on firmware page tables. Everything in the kernel assumes
284 	 * 1:1 mappings out of firmware, so this won't break anything not
285 	 * already broken. This doesn't work if there is live OF, since OF
286 	 * may internally use non-1:1 mappings.
287 	 */
288 	if (ofentry == 0)
289 		mtmsr(mfmsr() & ~(PSL_IR | PSL_DR));
290 #endif
291 
292 	/*
293 	 * Parse metadata if present and fetch parameters.  Must be done
294 	 * before console is inited so cninit gets the right value of
295 	 * boothowto.
296 	 */
297 	if (mdp != NULL) {
298 		preload_metadata = mdp;
299 		kmdp = preload_search_by_type("elf kernel");
300 		if (kmdp != NULL) {
301 			boothowto = MD_FETCH(kmdp, MODINFOMD_HOWTO, int);
302 			init_static_kenv(MD_FETCH(kmdp, MODINFOMD_ENVP, char *),
303 			    0);
304 			endkernel = ulmax(endkernel, MD_FETCH(kmdp,
305 			    MODINFOMD_KERNEND, vm_offset_t));
306 #ifdef DDB
307 			ksym_start = MD_FETCH(kmdp, MODINFOMD_SSYM, uintptr_t);
308 			ksym_end = MD_FETCH(kmdp, MODINFOMD_ESYM, uintptr_t);
309 			db_fetch_ksymtab(ksym_start, ksym_end);
310 #endif
311 		}
312 	} else {
313 		init_static_kenv(init_kenv, sizeof(init_kenv));
314 		ofw_bootargs = true;
315 	}
316 	/* Store boot environment state */
317 	OF_initial_setup((void *)fdt, NULL, (int (*)(void *))ofentry);
318 
319 	/*
320 	 * Init params/tunables that can be overridden by the loader
321 	 */
322 	init_param1();
323 
324 	/*
325 	 * Start initializing proc0 and thread0.
326 	 */
327 	proc_linkup0(&proc0, &thread0);
328 	thread0.td_frame = &frame0;
329 #ifdef __powerpc64__
330 	__asm __volatile("mr 13,%0" :: "r"(&thread0));
331 #else
332 	__asm __volatile("mr 2,%0" :: "r"(&thread0));
333 #endif
334 
335 	/*
336 	 * Init mutexes, which we use heavily in PMAP
337 	 */
338 	mutex_init();
339 
340 	/*
341 	 * Install the OF client interface
342 	 */
343 	OF_bootstrap();
344 
345 	if (ofw_bootargs)
346 		ofw_parse_bootargs();
347 
348 	/*
349 	 * Initialize the console before printing anything.
350 	 */
351 	cninit();
352 
353 #ifdef AIM
354 	aim_cpu_init(toc);
355 #else /* BOOKE */
356 	booke_cpu_init();
357 
358 	/* Make sure the kernel icache is valid before we go too much further */
359 	__syncicache((caddr_t)startkernel, endkernel - startkernel);
360 #endif
361 
362 	/*
363 	 * Choose a platform module so we can get the physical memory map.
364 	 */
365 
366 	platform_probe_and_attach();
367 
368 	/*
369 	 * Set up per-cpu data for the BSP now that the platform can tell
370 	 * us which that is.
371 	 */
372 	if (platform_smp_get_bsp(&bsp) != 0)
373 		bsp.cr_cpuid = 0;
374 	pc = &__pcpu[bsp.cr_cpuid];
375 	pcpu_init(pc, bsp.cr_cpuid, sizeof(struct pcpu));
376 	pc->pc_curthread = &thread0;
377 	thread0.td_oncpu = bsp.cr_cpuid;
378 	pc->pc_cpuid = bsp.cr_cpuid;
379 	pc->pc_hwref = bsp.cr_hwref;
380 	__asm __volatile("mtsprg 0, %0" :: "r"(pc));
381 
382 	/*
383 	 * Init KDB
384 	 */
385 	kdb_init();
386 
387 	/*
388 	 * Bring up MMU
389 	 */
390 	pmap_bootstrap(startkernel, endkernel);
391 	mtmsr(psl_kernset & ~PSL_EE);
392 
393 	/*
394 	 * Initialize params/tunables that are derived from memsize
395 	 */
396 	init_param2(physmem);
397 
398 	/*
399 	 * Grab booted kernel's name
400 	 */
401         env = kern_getenv("kernelname");
402         if (env != NULL) {
403 		strlcpy(kernelname, env, sizeof(kernelname));
404 		freeenv(env);
405 	}
406 
407 	/*
408 	 * Finish setting up thread0.
409 	 */
410 	thread0.td_pcb = (struct pcb *)
411 	    ((thread0.td_kstack + thread0.td_kstack_pages * PAGE_SIZE -
412 	    sizeof(struct pcb)) & ~15UL);
413 	bzero((void *)thread0.td_pcb, sizeof(struct pcb));
414 	pc->pc_curpcb = thread0.td_pcb;
415 
416 	/* Initialise the message buffer. */
417 	msgbufinit(msgbufp, msgbufsize);
418 
419 #ifdef KDB
420 	if (boothowto & RB_KDB)
421 		kdb_enter(KDB_WHY_BOOTFLAGS,
422 		    "Boot flags requested debugger");
423 #endif
424 
425 	return (((uintptr_t)thread0.td_pcb -
426 	    (sizeof(struct callframe) - 3*sizeof(register_t))) & ~15UL);
427 }
428 
429 /*
430  * Flush the D-cache for non-DMA I/O so that the I-cache can
431  * be made coherent later.
432  */
433 void
434 cpu_flush_dcache(void *ptr, size_t len)
435 {
436 	register_t addr, off;
437 
438 	/*
439 	 * Align the address to a cacheline and adjust the length
440 	 * accordingly. Then round the length to a multiple of the
441 	 * cacheline for easy looping.
442 	 */
443 	addr = (uintptr_t)ptr;
444 	off = addr & (cacheline_size - 1);
445 	addr -= off;
446 	len = roundup2(len + off, cacheline_size);
447 
448 	while (len > 0) {
449 		__asm __volatile ("dcbf 0,%0" :: "r"(addr));
450 		__asm __volatile ("sync");
451 		addr += cacheline_size;
452 		len -= cacheline_size;
453 	}
454 }
455 
456 int
457 ptrace_set_pc(struct thread *td, unsigned long addr)
458 {
459 	struct trapframe *tf;
460 
461 	tf = td->td_frame;
462 	tf->srr0 = (register_t)addr;
463 
464 	return (0);
465 }
466 
467 void
468 spinlock_enter(void)
469 {
470 	struct thread *td;
471 	register_t msr;
472 
473 	td = curthread;
474 	if (td->td_md.md_spinlock_count == 0) {
475 		__asm __volatile("or 2,2,2"); /* Set high thread priority */
476 		msr = intr_disable();
477 		td->td_md.md_spinlock_count = 1;
478 		td->td_md.md_saved_msr = msr;
479 	} else
480 		td->td_md.md_spinlock_count++;
481 	critical_enter();
482 }
483 
484 void
485 spinlock_exit(void)
486 {
487 	struct thread *td;
488 	register_t msr;
489 
490 	td = curthread;
491 	critical_exit();
492 	msr = td->td_md.md_saved_msr;
493 	td->td_md.md_spinlock_count--;
494 	if (td->td_md.md_spinlock_count == 0) {
495 		intr_restore(msr);
496 		__asm __volatile("or 6,6,6"); /* Set normal thread priority */
497 	}
498 }
499 
500 /*
501  * Simple ddb(4) command/hack to view any SPR on the running CPU.
502  * Uses a trivial asm function to perform the mfspr, and rewrites the mfspr
503  * instruction each time.
504  * XXX: Since it uses code modification, it won't work if the kernel code pages
505  * are marked RO.
506  */
507 extern register_t get_spr(int);
508 
509 #ifdef DDB
510 DB_SHOW_COMMAND(spr, db_show_spr)
511 {
512 	register_t spr;
513 	volatile uint32_t *p;
514 	int sprno, saved_sprno;
515 
516 	if (!have_addr)
517 		return;
518 
519 	saved_sprno = sprno = (intptr_t) addr;
520 	sprno = ((sprno & 0x3e0) >> 5) | ((sprno & 0x1f) << 5);
521 	p = (uint32_t *)(void *)&get_spr;
522 	*p = (*p & ~0x001ff800) | (sprno << 11);
523 	__syncicache(get_spr, cacheline_size);
524 	spr = get_spr(sprno);
525 
526 	db_printf("SPR %d(%x): %lx\n", saved_sprno, saved_sprno,
527 	    (unsigned long)spr);
528 }
529 #endif
530 
#undef bzero
/*
 * Zero len bytes starting at buf.
 *
 * Works in four phases: single bytes until the pointer is aligned to
 * sizeof(unsigned long), blocks of eight words, single words, and
 * finally any trailing bytes.
 */
void
bzero(void *buf, size_t len)
{
	char *cur;
	unsigned long *words;

	cur = buf;

	/* Byte stores until word aligned (or until len is used up). */
	for (; ((uintptr_t)cur & (sizeof(unsigned long) - 1)) != 0 &&
	    len != 0; len--)
		*cur++ = 0;

	/* Unrolled: eight words per iteration. */
	for (; len >= 8 * sizeof(unsigned long);
	    len -= 8 * sizeof(unsigned long)) {
		words = (unsigned long *)cur;
		words[0] = 0;
		words[1] = 0;
		words[2] = 0;
		words[3] = 0;
		words[4] = 0;
		words[5] = 0;
		words[6] = 0;
		words[7] = 0;
		cur += 8 * sizeof(unsigned long);
	}

	/* Remaining whole words. */
	for (; len >= sizeof(unsigned long); len -= sizeof(unsigned long)) {
		*(unsigned long *)cur = 0;
		cur += sizeof(unsigned long);
	}

	/* Trailing bytes. */
	for (; len != 0; len--)
		*cur++ = 0;
}
568