xref: /freebsd/sys/powerpc/powernv/platform_powernv.c (revision 4b50c451720d8b427757a6da1dd2bb4c52cd9e35)
1 /*-
2  * Copyright (c) 2015 Nathan Whitehorn
3  * Copyright (c) 2017-2018 Semihalf
4  * All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  *
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
21  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
22  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
23  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
25  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 
28 #include <sys/cdefs.h>
29 __FBSDID("$FreeBSD$");
30 
31 #include <sys/param.h>
32 #include <sys/systm.h>
33 #include <sys/kernel.h>
34 #include <sys/bus.h>
35 #include <sys/pcpu.h>
36 #include <sys/proc.h>
37 #include <sys/smp.h>
38 #include <vm/vm.h>
39 #include <vm/pmap.h>
40 
41 #include <machine/bus.h>
42 #include <machine/cpu.h>
43 #include <machine/hid.h>
44 #include <machine/platformvar.h>
45 #include <machine/pmap.h>
46 #include <machine/rtas.h>
47 #include <machine/smp.h>
48 #include <machine/spr.h>
49 #include <machine/trap.h>
50 
51 #include <dev/ofw/openfirm.h>
52 #include <machine/ofw_machdep.h>
53 #include <powerpc/aim/mmu_oea64.h>
54 
55 #include "platform_if.h"
56 #include "opal.h"
57 
58 #ifdef SMP
59 extern void *ap_pcpu;
60 #endif
61 
62 void (*powernv_smp_ap_extra_init)(void);
63 
64 static int powernv_probe(platform_t);
65 static int powernv_attach(platform_t);
66 void powernv_mem_regions(platform_t, struct mem_region *phys, int *physsz,
67     struct mem_region *avail, int *availsz);
68 static void powernv_numa_mem_regions(platform_t plat, struct numa_mem_region *phys, int *physsz);
69 static u_long powernv_timebase_freq(platform_t, struct cpuref *cpuref);
70 static int powernv_smp_first_cpu(platform_t, struct cpuref *cpuref);
71 static int powernv_smp_next_cpu(platform_t, struct cpuref *cpuref);
72 static int powernv_smp_get_bsp(platform_t, struct cpuref *cpuref);
73 static void powernv_smp_ap_init(platform_t);
74 #ifdef SMP
75 static int powernv_smp_start_cpu(platform_t, struct pcpu *cpu);
76 static void powernv_smp_probe_threads(platform_t);
77 static struct cpu_group *powernv_smp_topo(platform_t plat);
78 #endif
79 static void powernv_reset(platform_t);
80 static void powernv_cpu_idle(sbintime_t sbt);
81 static int powernv_cpuref_init(void);
82 
83 static platform_method_t powernv_methods[] = {
84 	PLATFORMMETHOD(platform_probe, 		powernv_probe),
85 	PLATFORMMETHOD(platform_attach,		powernv_attach),
86 	PLATFORMMETHOD(platform_mem_regions,	powernv_mem_regions),
87 	PLATFORMMETHOD(platform_numa_mem_regions,	powernv_numa_mem_regions),
88 	PLATFORMMETHOD(platform_timebase_freq,	powernv_timebase_freq),
89 
90 	PLATFORMMETHOD(platform_smp_ap_init,	powernv_smp_ap_init),
91 	PLATFORMMETHOD(platform_smp_first_cpu,	powernv_smp_first_cpu),
92 	PLATFORMMETHOD(platform_smp_next_cpu,	powernv_smp_next_cpu),
93 	PLATFORMMETHOD(platform_smp_get_bsp,	powernv_smp_get_bsp),
94 #ifdef SMP
95 	PLATFORMMETHOD(platform_smp_start_cpu,	powernv_smp_start_cpu),
96 	PLATFORMMETHOD(platform_smp_probe_threads,	powernv_smp_probe_threads),
97 	PLATFORMMETHOD(platform_smp_topo,	powernv_smp_topo),
98 #endif
99 
100 	PLATFORMMETHOD(platform_reset,		powernv_reset),
101 
102 	{ 0, 0 }
103 };
104 
105 static platform_def_t powernv_platform = {
106 	"powernv",
107 	powernv_methods,
108 	0
109 };
110 
111 static struct cpuref platform_cpuref[MAXCPU];
112 static int platform_cpuref_cnt;
113 static int platform_cpuref_valid;
114 
115 PLATFORM_DEF(powernv_platform);
116 
117 static uint64_t powernv_boot_pir;
118 
119 static int
120 powernv_probe(platform_t plat)
121 {
122 	if (opal_check() == 0)
123 		return (BUS_PROBE_SPECIFIC);
124 
125 	return (ENXIO);
126 }
127 
128 static int
129 powernv_attach(platform_t plat)
130 {
131 	uint32_t nptlp, shift = 0, slb_encoding = 0;
132 	int32_t lp_size, lp_encoding;
133 	char buf[255];
134 	pcell_t prop;
135 	phandle_t cpu;
136 	int res, len, idx;
137 	register_t msr;
138 
139 	/* Ping OPAL again just to make sure */
140 	opal_check();
141 
142 #if BYTE_ORDER == LITTLE_ENDIAN
143 	opal_call(OPAL_REINIT_CPUS, 2 /* Little endian */);
144 #else
145 	opal_call(OPAL_REINIT_CPUS, 1 /* Big endian */);
146 #endif
147 
148        if (cpu_idle_hook == NULL)
149                 cpu_idle_hook = powernv_cpu_idle;
150 
151 	powernv_boot_pir = mfspr(SPR_PIR);
152 
153 	/* LPID must not be altered when PSL_DR or PSL_IR is set */
154 	msr = mfmsr();
155 	mtmsr(msr & ~(PSL_DR | PSL_IR));
156 
157 	/* Direct interrupts to SRR instead of HSRR and reset LPCR otherwise */
158 	mtspr(SPR_LPID, 0);
159 	isync();
160 
161 	if (cpu_features2 & PPC_FEATURE2_ARCH_3_00)
162 		lpcr |= LPCR_HVICE;
163 
164 	mtspr(SPR_LPCR, lpcr);
165 	isync();
166 
167 	mtmsr(msr);
168 
169 	powernv_cpuref_init();
170 
171 	/* Set SLB count from device tree */
172 	cpu = OF_peer(0);
173 	cpu = OF_child(cpu);
174 	while (cpu != 0) {
175 		res = OF_getprop(cpu, "name", buf, sizeof(buf));
176 		if (res > 0 && strcmp(buf, "cpus") == 0)
177 			break;
178 		cpu = OF_peer(cpu);
179 	}
180 	if (cpu == 0)
181 		goto out;
182 
183 	cpu = OF_child(cpu);
184 	while (cpu != 0) {
185 		res = OF_getprop(cpu, "device_type", buf, sizeof(buf));
186 		if (res > 0 && strcmp(buf, "cpu") == 0)
187 			break;
188 		cpu = OF_peer(cpu);
189 	}
190 	if (cpu == 0)
191 		goto out;
192 
193 	res = OF_getencprop(cpu, "ibm,slb-size", &prop, sizeof(prop));
194 	if (res > 0)
195 		n_slbs = prop;
196 
197 	/*
198 	 * Scan the large page size property for PAPR compatible machines.
199 	 * See PAPR D.5 Changes to Section 5.1.4, 'CPU Node Properties'
200 	 * for the encoding of the property.
201 	 */
202 
203 	len = OF_getproplen(cpu, "ibm,segment-page-sizes");
204 	if (len > 0) {
205 		/*
206 		 * We have to use a variable length array on the stack
207 		 * since we have very limited stack space.
208 		 */
209 		pcell_t arr[len/sizeof(cell_t)];
210 		res = OF_getencprop(cpu, "ibm,segment-page-sizes", arr,
211 		    sizeof(arr));
212 		len /= 4;
213 		idx = 0;
214 		while (len > 0) {
215 			shift = arr[idx];
216 			slb_encoding = arr[idx + 1];
217 			nptlp = arr[idx + 2];
218 			idx += 3;
219 			len -= 3;
220 			while (len > 0 && nptlp) {
221 				lp_size = arr[idx];
222 				lp_encoding = arr[idx+1];
223 				if (slb_encoding == SLBV_L && lp_encoding == 0)
224 					break;
225 
226 				idx += 2;
227 				len -= 2;
228 				nptlp--;
229 			}
230 			if (nptlp && slb_encoding == SLBV_L && lp_encoding == 0)
231 				break;
232 		}
233 
234 		if (len == 0)
235 			panic("Standard large pages (SLB[L] = 1, PTE[LP] = 0) "
236 			    "not supported by this system.");
237 
238 		moea64_large_page_shift = shift;
239 		moea64_large_page_size = 1ULL << lp_size;
240 	}
241 
242 out:
243 	return (0);
244 }
245 
246 
247 void
248 powernv_mem_regions(platform_t plat, struct mem_region *phys, int *physsz,
249     struct mem_region *avail, int *availsz)
250 {
251 
252 	ofw_mem_regions(phys, physsz, avail, availsz);
253 }
254 
255 static void
256 powernv_numa_mem_regions(platform_t plat, struct numa_mem_region *phys, int *physsz)
257 {
258 
259 	ofw_numa_mem_regions(phys, physsz);
260 }
261 
262 static u_long
263 powernv_timebase_freq(platform_t plat, struct cpuref *cpuref)
264 {
265 	char buf[8];
266 	phandle_t cpu, dev, root;
267 	int res;
268 	int32_t ticks = -1;
269 
270 	root = OF_peer(0);
271 	dev = OF_child(root);
272 	while (dev != 0) {
273 		res = OF_getprop(dev, "name", buf, sizeof(buf));
274 		if (res > 0 && strcmp(buf, "cpus") == 0)
275 			break;
276 		dev = OF_peer(dev);
277 	}
278 
279 	for (cpu = OF_child(dev); cpu != 0; cpu = OF_peer(cpu)) {
280 		res = OF_getprop(cpu, "device_type", buf, sizeof(buf));
281 		if (res > 0 && strcmp(buf, "cpu") == 0)
282 			break;
283 	}
284 	if (cpu == 0)
285 		return (512000000);
286 
287 	OF_getencprop(cpu, "timebase-frequency", &ticks, sizeof(ticks));
288 
289 	if (ticks <= 0)
290 		panic("Unable to determine timebase frequency!");
291 
292 	return (ticks);
293 
294 }
295 
296 static int
297 powernv_cpuref_init(void)
298 {
299 	phandle_t cpu, dev;
300 	char buf[32];
301 	int a, res, tmp_cpuref_cnt;
302 	static struct cpuref tmp_cpuref[MAXCPU];
303 	cell_t interrupt_servers[32];
304 	uint64_t bsp;
305 
306 	if (platform_cpuref_valid)
307 		return (0);
308 
309 	dev = OF_peer(0);
310 	dev = OF_child(dev);
311 	while (dev != 0) {
312 		res = OF_getprop(dev, "name", buf, sizeof(buf));
313 		if (res > 0 && strcmp(buf, "cpus") == 0)
314 			break;
315 		dev = OF_peer(dev);
316 	}
317 
318 	bsp = 0;
319 	tmp_cpuref_cnt = 0;
320 	for (cpu = OF_child(dev); cpu != 0; cpu = OF_peer(cpu)) {
321 		res = OF_getprop(cpu, "device_type", buf, sizeof(buf));
322 		if (res > 0 && strcmp(buf, "cpu") == 0) {
323 			res = OF_getproplen(cpu, "ibm,ppc-interrupt-server#s");
324 			if (res > 0) {
325 				OF_getencprop(cpu, "ibm,ppc-interrupt-server#s",
326 				    interrupt_servers, res);
327 
328 				for (a = 0; a < res/sizeof(cell_t); a++) {
329 					tmp_cpuref[tmp_cpuref_cnt].cr_hwref = interrupt_servers[a];
330 					tmp_cpuref[tmp_cpuref_cnt].cr_cpuid = tmp_cpuref_cnt;
331 					tmp_cpuref[tmp_cpuref_cnt].cr_domain = interrupt_servers[a] >> 11;
332 					if (interrupt_servers[a] == (uint32_t)powernv_boot_pir)
333 						bsp = tmp_cpuref_cnt;
334 
335 					tmp_cpuref_cnt++;
336 				}
337 			}
338 		}
339 	}
340 
341 	/* Map IDs, so BSP has CPUID 0 regardless of hwref */
342 	for (a = bsp; a < tmp_cpuref_cnt; a++) {
343 		platform_cpuref[platform_cpuref_cnt].cr_hwref = tmp_cpuref[a].cr_hwref;
344 		platform_cpuref[platform_cpuref_cnt].cr_cpuid = platform_cpuref_cnt;
345 		platform_cpuref[platform_cpuref_cnt].cr_domain = tmp_cpuref[a].cr_domain;
346 		platform_cpuref_cnt++;
347 	}
348 	for (a = 0; a < bsp; a++) {
349 		platform_cpuref[platform_cpuref_cnt].cr_hwref = tmp_cpuref[a].cr_hwref;
350 		platform_cpuref[platform_cpuref_cnt].cr_cpuid = platform_cpuref_cnt;
351 		platform_cpuref[platform_cpuref_cnt].cr_domain = tmp_cpuref[a].cr_domain;
352 		platform_cpuref_cnt++;
353 	}
354 
355 	platform_cpuref_valid = 1;
356 
357 	return (0);
358 }
359 
360 static int
361 powernv_smp_first_cpu(platform_t plat, struct cpuref *cpuref)
362 {
363 	if (platform_cpuref_valid == 0)
364 		return (EINVAL);
365 
366 	cpuref->cr_cpuid = 0;
367 	cpuref->cr_hwref = platform_cpuref[0].cr_hwref;
368 	cpuref->cr_domain = platform_cpuref[0].cr_domain;
369 
370 	return (0);
371 }
372 
373 static int
374 powernv_smp_next_cpu(platform_t plat, struct cpuref *cpuref)
375 {
376 	int id;
377 
378 	if (platform_cpuref_valid == 0)
379 		return (EINVAL);
380 
381 	id = cpuref->cr_cpuid + 1;
382 	if (id >= platform_cpuref_cnt)
383 		return (ENOENT);
384 
385 	cpuref->cr_cpuid = platform_cpuref[id].cr_cpuid;
386 	cpuref->cr_hwref = platform_cpuref[id].cr_hwref;
387 	cpuref->cr_domain = platform_cpuref[id].cr_domain;
388 
389 	return (0);
390 }
391 
392 static int
393 powernv_smp_get_bsp(platform_t plat, struct cpuref *cpuref)
394 {
395 
396 	cpuref->cr_cpuid = platform_cpuref[0].cr_cpuid;
397 	cpuref->cr_hwref = platform_cpuref[0].cr_hwref;
398 	cpuref->cr_domain = platform_cpuref[0].cr_domain;
399 	return (0);
400 }
401 
402 #ifdef SMP
403 static int
404 powernv_smp_start_cpu(platform_t plat, struct pcpu *pc)
405 {
406 	int result;
407 
408 	ap_pcpu = pc;
409 	powerpc_sync();
410 
411 	result = opal_call(OPAL_START_CPU, pc->pc_hwref, EXC_RST);
412 	if (result != OPAL_SUCCESS) {
413 		printf("OPAL error (%d): unable to start AP %d\n",
414 		    result, (int)pc->pc_hwref);
415 		return (ENXIO);
416 	}
417 
418 	return (0);
419 }
420 
421 static void
422 powernv_smp_probe_threads(platform_t plat)
423 {
424 	char buf[8];
425 	phandle_t cpu, dev, root;
426 	int res, nthreads;
427 
428 	root = OF_peer(0);
429 
430 	dev = OF_child(root);
431 	while (dev != 0) {
432 		res = OF_getprop(dev, "name", buf, sizeof(buf));
433 		if (res > 0 && strcmp(buf, "cpus") == 0)
434 			break;
435 		dev = OF_peer(dev);
436 	}
437 
438 	nthreads = 1;
439 	for (cpu = OF_child(dev); cpu != 0; cpu = OF_peer(cpu)) {
440 		res = OF_getprop(cpu, "device_type", buf, sizeof(buf));
441 		if (res <= 0 || strcmp(buf, "cpu") != 0)
442 			continue;
443 
444 		res = OF_getproplen(cpu, "ibm,ppc-interrupt-server#s");
445 
446 		if (res >= 0)
447 			nthreads = res / sizeof(cell_t);
448 		else
449 			nthreads = 1;
450 		break;
451 	}
452 
453 	smp_threads_per_core = nthreads;
454 	if (mp_ncpus % nthreads == 0)
455 		mp_ncores = mp_ncpus / nthreads;
456 }
457 
458 static struct cpu_group *
459 powernv_smp_topo(platform_t plat)
460 {
461 	if (mp_ncpus % smp_threads_per_core != 0) {
462 		printf("WARNING: Irregular SMP topology. Performance may be "
463 		     "suboptimal (%d threads, %d on first core)\n",
464 		     mp_ncpus, smp_threads_per_core);
465 		return (smp_topo_none());
466 	}
467 
468 	/* Don't do anything fancier for non-threaded SMP */
469 	if (smp_threads_per_core == 1)
470 		return (smp_topo_none());
471 
472 	return (smp_topo_1level(CG_SHARE_L1, smp_threads_per_core,
473 	    CG_FLAG_SMT));
474 }
475 
476 #endif
477 
478 static void
479 powernv_reset(platform_t platform)
480 {
481 
482 	opal_call(OPAL_CEC_REBOOT);
483 }
484 
485 static void
486 powernv_smp_ap_init(platform_t platform)
487 {
488 
489 	if (powernv_smp_ap_extra_init != NULL)
490 		powernv_smp_ap_extra_init();
491 }
492 
493 static void
494 powernv_cpu_idle(sbintime_t sbt)
495 {
496 }
497 
498 /* Set up the Nest MMU on POWER9 relatively early, but after pmap is setup. */
499 static void
500 powernv_setup_nmmu(void *unused)
501 {
502 	if (opal_check() != 0)
503 		return;
504 	opal_call(OPAL_NMMU_SET_PTCR, -1, mfspr(SPR_PTCR));
505 }
506 
507 SYSINIT(powernv_setup_nmmu, SI_SUB_CPU, SI_ORDER_ANY, powernv_setup_nmmu, NULL);
508