xref: /freebsd/sys/powerpc/powerpc/mp_machdep.c (revision b4af4f93c682e445bf159f0d1ec90b636296c946)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2008 Marcel Moolenaar
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  *
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  *
17  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27  */
28 
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
31 
32 #include <sys/param.h>
33 #include <sys/systm.h>
34 #include <sys/kernel.h>
35 #include <sys/ktr.h>
36 #include <sys/bus.h>
37 #include <sys/cpuset.h>
38 #include <sys/domainset.h>
39 #include <sys/lock.h>
40 #include <sys/malloc.h>
41 #include <sys/mutex.h>
42 #include <sys/pcpu.h>
43 #include <sys/proc.h>
44 #include <sys/sched.h>
45 #include <sys/smp.h>
46 
47 #include <vm/vm.h>
48 #include <vm/vm_param.h>
49 #include <vm/pmap.h>
50 #include <vm/vm_map.h>
51 #include <vm/vm_extern.h>
52 #include <vm/vm_kern.h>
53 
54 #include <machine/bus.h>
55 #include <machine/cpu.h>
56 #include <machine/intr_machdep.h>
57 #include <machine/pcb.h>
58 #include <machine/platform.h>
59 #include <machine/md_var.h>
60 #include <machine/setjmp.h>
61 #include <machine/smp.h>
62 
63 #include "pic_if.h"
64 
65 volatile static int ap_awake;
66 volatile static u_int ap_letgo;
67 volatile static u_quad_t ap_timebase;
68 static u_int ipi_msg_cnt[32];
69 static struct mtx ap_boot_mtx;
70 struct pcb stoppcbs[MAXCPU];
71 
72 void
73 machdep_ap_bootstrap(void)
74 {
75 
76 	PCPU_SET(awake, 1);
77 	__asm __volatile("msync; isync");
78 
79 	while (ap_letgo == 0)
80 		nop_prio_vlow();
81 	nop_prio_medium();
82 
83 	/*
84 	 * Set timebase as soon as possible to meet an implicit rendezvous
85 	 * from cpu_mp_unleash(), which sets ap_letgo and then immediately
86 	 * sets timebase.
87 	 *
88 	 * Note that this is instrinsically racy and is only relevant on
89 	 * platforms that do not support better mechanisms.
90 	 */
91 	platform_smp_timebase_sync(ap_timebase, 1);
92 
93 	/* Give platform code a chance to do anything else necessary */
94 	platform_smp_ap_init();
95 
96 	/* Initialize decrementer */
97 	decr_ap_init();
98 
99 	/* Serialize console output and AP count increment */
100 	mtx_lock_spin(&ap_boot_mtx);
101 	ap_awake++;
102 	if (bootverbose)
103 		printf("SMP: AP CPU #%d launched\n", PCPU_GET(cpuid));
104 	else
105 		printf("%s%d%s", ap_awake == 2 ? "Launching APs: " : "",
106 		    PCPU_GET(cpuid), ap_awake == mp_ncpus ? "\n" : " ");
107 	mtx_unlock_spin(&ap_boot_mtx);
108 
109 	while(smp_started == 0)
110 		;
111 
112 	/* Start per-CPU event timers. */
113 	cpu_initclocks_ap();
114 
115 	/* Announce ourselves awake, and enter the scheduler */
116 	sched_throw(NULL);
117 }
118 
119 void
120 cpu_mp_setmaxid(void)
121 {
122 	struct cpuref cpuref;
123 	int error;
124 
125 	mp_ncpus = 0;
126 	mp_maxid = 0;
127 	error = platform_smp_first_cpu(&cpuref);
128 	while (!error) {
129 		mp_ncpus++;
130 		mp_maxid = max(cpuref.cr_cpuid, mp_maxid);
131 		error = platform_smp_next_cpu(&cpuref);
132 	}
133 	/* Sanity. */
134 	if (mp_ncpus == 0)
135 		mp_ncpus = 1;
136 }
137 
138 int
139 cpu_mp_probe(void)
140 {
141 
142 	/*
143 	 * We're not going to enable SMP if there's only 1 processor.
144 	 */
145 	return (mp_ncpus > 1);
146 }
147 
148 void
149 cpu_mp_start(void)
150 {
151 	struct cpuref bsp, cpu;
152 	struct pcpu *pc;
153 	int domain, error;
154 
155 	error = platform_smp_get_bsp(&bsp);
156 	KASSERT(error == 0, ("Don't know BSP"));
157 
158 	error = platform_smp_first_cpu(&cpu);
159 	while (!error) {
160 		if (cpu.cr_cpuid >= MAXCPU) {
161 			printf("SMP: cpu%d: skipped -- ID out of range\n",
162 			    cpu.cr_cpuid);
163 			goto next;
164 		}
165 		if (CPU_ISSET(cpu.cr_cpuid, &all_cpus)) {
166 			printf("SMP: cpu%d: skipped - duplicate ID\n",
167 			    cpu.cr_cpuid);
168 			goto next;
169 		}
170 
171 		if (vm_ndomains > 1)
172 			domain = cpu.cr_domain;
173 		else
174 			domain = 0;
175 
176 		if (cpu.cr_cpuid != bsp.cr_cpuid) {
177 			void *dpcpu;
178 
179 			pc = &__pcpu[cpu.cr_cpuid];
180 			dpcpu = (void *)kmem_malloc_domainset(DOMAINSET_PREF(domain),
181 			    DPCPU_SIZE, M_WAITOK | M_ZERO);
182 			pcpu_init(pc, cpu.cr_cpuid, sizeof(*pc));
183 			dpcpu_init(dpcpu, cpu.cr_cpuid);
184 		} else {
185 			pc = pcpup;
186 			pc->pc_cpuid = bsp.cr_cpuid;
187 			pc->pc_bsp = 1;
188 		}
189 		pc->pc_domain = domain;
190 		pc->pc_hwref = cpu.cr_hwref;
191 
192 		CPU_SET(pc->pc_cpuid, &cpuset_domain[pc->pc_domain]);
193 		KASSERT(pc->pc_domain < MAXMEMDOM, ("bad domain value %d\n",
194 		    pc->pc_domain));
195 		CPU_SET(pc->pc_cpuid, &all_cpus);
196 next:
197 		error = platform_smp_next_cpu(&cpu);
198 	}
199 
200 #ifdef SMP
201 	platform_smp_probe_threads();
202 #endif
203 }
204 
205 void
206 cpu_mp_announce(void)
207 {
208 	struct pcpu *pc;
209 	int i;
210 
211 	if (!bootverbose)
212 		return;
213 
214 	CPU_FOREACH(i) {
215 		pc = pcpu_find(i);
216 		if (pc == NULL)
217 			continue;
218 		printf("cpu%d: dev=%x domain=%d ", i, (int)pc->pc_hwref, pc->pc_domain);
219 		if (pc->pc_bsp)
220 			printf(" (BSP)");
221 		printf("\n");
222 	}
223 }
224 
225 static void
226 cpu_mp_unleash(void *dummy)
227 {
228 	struct pcpu *pc;
229 	int cpus, timeout;
230 	int ret;
231 
232 	if (mp_ncpus <= 1)
233 		return;
234 
235 	mtx_init(&ap_boot_mtx, "ap boot", NULL, MTX_SPIN);
236 
237 	cpus = 0;
238 	smp_cpus = 0;
239 #ifdef BOOKE
240 	tlb1_ap_prep();
241 #endif
242 	STAILQ_FOREACH(pc, &cpuhead, pc_allcpu) {
243 		cpus++;
244 		if (!pc->pc_bsp) {
245 			if (bootverbose)
246 				printf("Waking up CPU %d (dev=%x)\n",
247 				    pc->pc_cpuid, (int)pc->pc_hwref);
248 
249 			pc->pc_flags = PCPU_GET(flags); /* Copy cached CPU flags */
250 			ret = platform_smp_start_cpu(pc);
251 			if (ret == 0) {
252 				timeout = 2000;	/* wait 2sec for the AP */
253 				while (!pc->pc_awake && --timeout > 0)
254 					DELAY(1000);
255 			}
256 		} else {
257 			pc->pc_awake = 1;
258 		}
259 		if (pc->pc_awake) {
260 			if (bootverbose)
261 				printf("Adding CPU %d, hwref=%jx, awake=%x\n",
262 				    pc->pc_cpuid, (uintmax_t)pc->pc_hwref,
263 				    pc->pc_awake);
264 			smp_cpus++;
265 		} else
266 			CPU_SET(pc->pc_cpuid, &stopped_cpus);
267 	}
268 
269 	ap_awake = 1;
270 
271 	/* Provide our current DEC and TB values for APs */
272 	ap_timebase = mftb() + 10;
273 	__asm __volatile("msync; isync");
274 
275 	/* Let APs continue */
276 	atomic_store_rel_int(&ap_letgo, 1);
277 
278 	platform_smp_timebase_sync(ap_timebase, 0);
279 
280 	while (ap_awake < smp_cpus)
281 		;
282 
283 	if (smp_cpus != cpus || cpus != mp_ncpus) {
284 		printf("SMP: %d CPUs found; %d CPUs usable; %d CPUs woken\n",
285 		    mp_ncpus, cpus, smp_cpus);
286 	}
287 
288 	if (smp_cpus > 1)
289 		atomic_store_rel_int(&smp_started, 1);
290 
291 	/* Let the APs get into the scheduler */
292 	DELAY(10000);
293 
294 }
295 
296 SYSINIT(start_aps, SI_SUB_SMP, SI_ORDER_FIRST, cpu_mp_unleash, NULL);
297 
298 int
299 powerpc_ipi_handler(void *arg)
300 {
301 	u_int cpuid;
302 	uint32_t ipimask;
303 	int msg;
304 
305 	CTR2(KTR_SMP, "%s: MSR 0x%08x", __func__, mfmsr());
306 
307 	ipimask = atomic_readandclear_32(&(pcpup->pc_ipimask));
308 	if (ipimask == 0)
309 		return (FILTER_STRAY);
310 	while ((msg = ffs(ipimask) - 1) != -1) {
311 		ipimask &= ~(1u << msg);
312 		ipi_msg_cnt[msg]++;
313 		switch (msg) {
314 		case IPI_AST:
315 			CTR1(KTR_SMP, "%s: IPI_AST", __func__);
316 			break;
317 		case IPI_PREEMPT:
318 			CTR1(KTR_SMP, "%s: IPI_PREEMPT", __func__);
319 			sched_preempt(curthread);
320 			break;
321 		case IPI_RENDEZVOUS:
322 			CTR1(KTR_SMP, "%s: IPI_RENDEZVOUS", __func__);
323 			smp_rendezvous_action();
324 			break;
325 		case IPI_STOP:
326 
327 			/*
328 			 * IPI_STOP_HARD is mapped to IPI_STOP so it is not
329 			 * necessary to add such case in the switch.
330 			 */
331 			CTR1(KTR_SMP, "%s: IPI_STOP or IPI_STOP_HARD (stop)",
332 			    __func__);
333 			cpuid = PCPU_GET(cpuid);
334 			savectx(&stoppcbs[cpuid]);
335 			CPU_SET_ATOMIC(cpuid, &stopped_cpus);
336 			while (!CPU_ISSET(cpuid, &started_cpus))
337 				cpu_spinwait();
338 			CPU_CLR_ATOMIC(cpuid, &stopped_cpus);
339 			CPU_CLR_ATOMIC(cpuid, &started_cpus);
340 			CTR1(KTR_SMP, "%s: IPI_STOP (restart)", __func__);
341 			break;
342 		case IPI_HARDCLOCK:
343 			CTR1(KTR_SMP, "%s: IPI_HARDCLOCK", __func__);
344 			hardclockintr();
345 			break;
346 		}
347 	}
348 
349 	return (FILTER_HANDLED);
350 }
351 
352 static void
353 ipi_send(struct pcpu *pc, int ipi)
354 {
355 
356 	CTR4(KTR_SMP, "%s: pc=%p, targetcpu=%d, IPI=%d", __func__,
357 	    pc, pc->pc_cpuid, ipi);
358 
359 	atomic_set_32(&pc->pc_ipimask, (1 << ipi));
360 	powerpc_sync();
361 	PIC_IPI(root_pic, pc->pc_cpuid);
362 
363 	CTR1(KTR_SMP, "%s: sent", __func__);
364 }
365 
366 /* Send an IPI to a set of cpus. */
367 void
368 ipi_selected(cpuset_t cpus, int ipi)
369 {
370 	struct pcpu *pc;
371 
372 	STAILQ_FOREACH(pc, &cpuhead, pc_allcpu) {
373 		if (CPU_ISSET(pc->pc_cpuid, &cpus))
374 			ipi_send(pc, ipi);
375 	}
376 }
377 
378 /* Send an IPI to a specific CPU. */
379 void
380 ipi_cpu(int cpu, u_int ipi)
381 {
382 
383 	ipi_send(cpuid_to_pcpu[cpu], ipi);
384 }
385 
386 /* Send an IPI to all CPUs EXCEPT myself. */
387 void
388 ipi_all_but_self(int ipi)
389 {
390 	struct pcpu *pc;
391 
392 	STAILQ_FOREACH(pc, &cpuhead, pc_allcpu) {
393 		if (pc != pcpup)
394 			ipi_send(pc, ipi);
395 	}
396 }
397