xref: /freebsd/sys/kern/kern_pmc.c (revision cbd30a72ca196976c1c700400ecd424baa1b9c16)
1 /*-
2  * Copyright (c) 2003-2008 Joseph Koshy
3  * Copyright (c) 2007 The FreeBSD Foundation
4  * All rights reserved.
5  *
6  * Portions of this software were developed by A. Joseph Koshy under
7  * sponsorship from the FreeBSD Foundation and Google, Inc.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
19  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
22  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28  * SUCH DAMAGE.
29  */
30 
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
33 
34 #include "opt_hwpmc_hooks.h"
35 
36 #include <sys/types.h>
37 #include <sys/ctype.h>
38 #include <sys/param.h>
39 #include <sys/malloc.h>
40 #include <sys/kernel.h>
41 #include <sys/lock.h>
42 #include <sys/mutex.h>
43 #include <sys/pmc.h>
44 #include <sys/pmckern.h>
45 #include <sys/smp.h>
46 #include <sys/sysctl.h>
47 #include <sys/systm.h>
48 
/*
 * PMC_KERNEL_VERSION is PMC_VERSION when the kernel is built with
 * HWPMC_HOOKS and 0 otherwise.
 */
#ifdef	HWPMC_HOOKS
FEATURE(hwpmc_hooks, "Kernel support for HW PMC");
#define	PMC_KERNEL_VERSION	PMC_VERSION
#else
#define	PMC_KERNEL_VERSION	0
#endif

/* Malloc type; used below for the soft events table allocation. */
MALLOC_DECLARE(M_PMCHOOKS);
MALLOC_DEFINE(M_PMCHOOKS, "pmchooks", "Memory space for PMC hooks");

/* Global copy of PMC_KERNEL_VERSION. */
const int pmc_kernel_version = PMC_KERNEL_VERSION;
60 
/* Hook variable; NULL by default (see the note on 'pmc_sx' below). */
int __read_mostly (*pmc_hook)(struct thread *td, int function, void *arg) = NULL;

/* Interrupt handler; NULL by default. */
int __read_mostly (*pmc_intr)(int cpu, struct trapframe *tf) = NULL;

/* Bitmask of CPUs requiring servicing at hardclock time */
volatile cpuset_t pmc_cpumask;

/*
 * A global count of SS mode PMCs.  When non-zero, this means that
 * we have processes that are sampling the system as a whole.
 */
volatile int pmc_ss_count;

/*
 * Since PMC(4) may not be loaded in the current kernel, the
 * convention followed is that a non-NULL value of 'pmc_hook' implies
 * the presence of this kernel module.
 *
 * This requires us to protect 'pmc_hook' with a
 * shared (sx) lock -- thus making the process of calling into PMC(4)
 * somewhat more expensive than a simple 'if' check and indirect call.
 */
struct sx pmc_sx;

/*
 * PMC Soft per-CPU trapframes; the array has MAXCPU entries.
 */
struct trapframe pmc_tf[MAXCPU];
91 
/*
 * PMC Soft uses a global table to store registered events.
 */

SYSCTL_NODE(_kern, OID_AUTO, hwpmc, CTLFLAG_RW, 0, "HWPMC parameters");

/*
 * Number of slots in the soft events table.  Exported read-only as the
 * kern.hwpmc.softevents tunable (CTLFLAG_RDTUN).
 */
static int pmc_softevents = 16;
SYSCTL_INT(_kern_hwpmc, OID_AUTO, softevents, CTLFLAG_RDTUN,
    &pmc_softevents, 0, "maximum number of soft events");

/*
 * The table itself ('pmc_softs'), the count of slots handed out in
 * sequence so far ('pmc_softs_count'), and the spin mutex that the
 * register/deregister/acquire routines below take around table accesses.
 */
struct mtx pmc_softs_mtx;
int pmc_softs_count;
struct pmc_soft **pmc_softs;

MTX_SYSINIT(pmc_soft_mtx, &pmc_softs_mtx, "pmc-softs", MTX_SPIN);
107 
/*
 * Initialise the 'pmc_sx' lock with the SX_NOWITNESS flag.  Registered
 * below as a SYSINIT at SI_SUB_LOCK / SI_ORDER_MIDDLE.
 */
static void
pmc_init_sx(void)
{
	sx_init_flags(&pmc_sx, "pmc-sx", SX_NOWITNESS);
}

SYSINIT(pmcsx, SI_SUB_LOCK, SI_ORDER_MIDDLE, pmc_init_sx, NULL);
115 
116 /*
117  * Helper functions.
118  */
119 
120 /*
121  * A note on the CPU numbering scheme used by the hwpmc(4) driver.
122  *
123  * CPUs are denoted using numbers in the range 0..[pmc_cpu_max()-1].
124  * CPUs could be numbered "sparsely" in this range; the predicate
125  * `pmc_cpu_is_present()' is used to test whether a given CPU is
126  * physically present.
127  *
128  * Further, a CPU that is physically present may be administratively
129  * disabled or otherwise unavailable for use by hwpmc(4).  The
130  * `pmc_cpu_is_active()' predicate tests for CPU usability.  An
131  * "active" CPU participates in thread scheduling and can field
132  * interrupts raised by PMC hardware.
133  *
134  * On systems with hyperthreaded CPUs, multiple logical CPUs may share
135  * PMC hardware resources.  For such processors one logical CPU is
136  * denoted as the primary owner of the in-CPU PMC resources. The
137  * pmc_cpu_is_primary() predicate is used to distinguish this primary
138  * CPU from the others.
139  */
140 
/*
 * Return non-zero when 'cpu' is usable by hwpmc(4): on SMP kernels the
 * CPU must be present and must not be in 'hlt_cpus_mask'.  Uniprocessor
 * kernels always report the CPU as active.
 */
int
pmc_cpu_is_active(int cpu)
{
#ifdef	SMP
	/* An absent CPU can never be active. */
	if (!pmc_cpu_is_present(cpu))
		return (0);
	if (CPU_ISSET(cpu, &hlt_cpus_mask))
		return (0);
#endif
	return (1);
}
151 
/*
 * Deprecated.  Logical negation of pmc_cpu_is_active().
 */
int
pmc_cpu_is_disabled(int cpu)
{
	return (pmc_cpu_is_active(cpu) == 0);
}
158 
/*
 * Return non-zero when 'cpu' is present.  On SMP kernels this is the
 * negation of CPU_ABSENT(); uniprocessor kernels always answer 1.
 */
int
pmc_cpu_is_present(int cpu)
{
#ifdef	SMP
	if (CPU_ABSENT(cpu))
		return (0);
#endif
	return (1);
}
168 
/*
 * Return non-zero when 'cpu' is a primary CPU, i.e. on SMP kernels when
 * it is not a member of 'logical_cpus_mask'.  Uniprocessor kernels
 * always answer 1.
 */
int
pmc_cpu_is_primary(int cpu)
{
#ifdef	SMP
	if (CPU_ISSET(cpu, &logical_cpus_mask))
		return (0);
#endif
	return (1);
}
178 
179 
/*
 * Return one more than the highest CPU id the system supports
 * (mp_maxid + 1 on SMP kernels, 1 otherwise).  The value is used for
 * scaling internal data structures and for runtime checks.
 */
unsigned int
pmc_cpu_max(void)
{
	unsigned int limit;

#ifdef	SMP
	limit = mp_maxid + 1;
#else
	limit = 1;
#endif
	return (limit);
}
194 
195 #ifdef	INVARIANTS
196 
/*
 * Return the number of CPUs in the `active' state: mp_ncpus on SMP
 * kernels, 1 otherwise.
 */
int
pmc_cpu_max_active(void)
{
	int nactive;

#ifdef	SMP
	/*
	 * Once the kernel supports CPU hot-plugging this should report
	 * the current number of "active" CPUs instead.
	 */
	nactive = mp_ncpus;
#else
	nactive = 1;
#endif
	return (nactive);
}
214 
215 #endif
216 
/*
 * Normalise an event name in place:
 * - drop all leading '_' characters
 * - collapse each run of '_' to a single '_'
 * - drop a trailing '_'
 * - convert everything that is kept to uppercase
 */
static void
pmc_soft_namecleanup(char *name)
{
	char *src, *dst;

	/* Skip past any leading underscores. */
	src = name;
	while (*src == '_')
		src++;

	dst = name;
	while (*src != '\0') {
		/*
		 * An underscore survives only when the next character is
		 * neither another underscore nor the terminator.
		 */
		if (*src != '_' || (src[1] != '_' && src[1] != '\0'))
			*dst++ = toupper(*src);
		src++;
	}
	*dst = '\0';
}
239 
240 void
241 pmc_soft_ev_register(struct pmc_soft *ps)
242 {
243 	static int warned = 0;
244 	int n;
245 
246 	ps->ps_running  = 0;
247 	ps->ps_ev.pm_ev_code = 0; /* invalid */
248 	pmc_soft_namecleanup(ps->ps_ev.pm_ev_name);
249 
250 	mtx_lock_spin(&pmc_softs_mtx);
251 
252 	if (pmc_softs_count >= pmc_softevents) {
253 		/*
254 		 * XXX Reusing events can enter a race condition where
255 		 * new allocated event will be used as an old one.
256 		 */
257 		for (n = 0; n < pmc_softevents; n++)
258 			if (pmc_softs[n] == NULL)
259 				break;
260 		if (n == pmc_softevents) {
261 			mtx_unlock_spin(&pmc_softs_mtx);
262 			if (!warned) {
263 				printf("hwpmc: too many soft events, "
264 				    "increase kern.hwpmc.softevents tunable\n");
265 				warned = 1;
266 			}
267 			return;
268 		}
269 
270 		ps->ps_ev.pm_ev_code = PMC_EV_SOFT_FIRST + n;
271 		pmc_softs[n] = ps;
272 	} else {
273 		ps->ps_ev.pm_ev_code = PMC_EV_SOFT_FIRST + pmc_softs_count;
274 		pmc_softs[pmc_softs_count++] = ps;
275 	}
276 
277 	mtx_unlock_spin(&pmc_softs_mtx);
278 }
279 
280 void
281 pmc_soft_ev_deregister(struct pmc_soft *ps)
282 {
283 
284 	KASSERT(ps != NULL, ("pmc_soft_deregister: called with NULL"));
285 
286 	mtx_lock_spin(&pmc_softs_mtx);
287 
288 	if (ps->ps_ev.pm_ev_code != 0 &&
289 	    (ps->ps_ev.pm_ev_code - PMC_EV_SOFT_FIRST) < pmc_softevents) {
290 		KASSERT((int)ps->ps_ev.pm_ev_code >= PMC_EV_SOFT_FIRST &&
291 		    (int)ps->ps_ev.pm_ev_code <= PMC_EV_SOFT_LAST,
292 		    ("pmc_soft_deregister: invalid event value"));
293 		pmc_softs[ps->ps_ev.pm_ev_code - PMC_EV_SOFT_FIRST] = NULL;
294 	}
295 
296 	mtx_unlock_spin(&pmc_softs_mtx);
297 }
298 
299 struct pmc_soft *
300 pmc_soft_ev_acquire(enum pmc_event ev)
301 {
302 	struct pmc_soft *ps;
303 
304 	if (ev == 0 || (ev - PMC_EV_SOFT_FIRST) >= pmc_softevents)
305 		return NULL;
306 
307 	KASSERT((int)ev >= PMC_EV_SOFT_FIRST &&
308 	    (int)ev <= PMC_EV_SOFT_LAST,
309 	    ("event out of range"));
310 
311 	mtx_lock_spin(&pmc_softs_mtx);
312 
313 	ps = pmc_softs[ev - PMC_EV_SOFT_FIRST];
314 	if (ps == NULL)
315 		mtx_unlock_spin(&pmc_softs_mtx);
316 
317 	return ps;
318 }
319 
/*
 * Release a soft event: unlocks 'pmc_softs_mtx', which
 * pmc_soft_ev_acquire() leaves held when it returns a non-NULL entry.
 * The 'ps' argument itself is not examined.
 */
void
pmc_soft_ev_release(struct pmc_soft *ps)
{

	mtx_unlock_spin(&pmc_softs_mtx);
}
326 
327 /*
328  *  Initialise hwpmc.
329  */
330 static void
331 init_hwpmc(void *dummy __unused)
332 {
333 	if (pmc_softevents <= 0 ||
334 	    pmc_softevents > PMC_EV_DYN_COUNT) {
335 		(void) printf("hwpmc: tunable \"softevents\"=%d out of "
336 		    "range.\n", pmc_softevents);
337 		pmc_softevents = PMC_EV_DYN_COUNT;
338 	}
339 	pmc_softs = malloc(pmc_softevents * sizeof(struct pmc_soft *), M_PMCHOOKS, M_NOWAIT|M_ZERO);
340 	KASSERT(pmc_softs != NULL, ("cannot allocate soft events table"));
341 }
342 
343 SYSINIT(hwpmc, SI_SUB_KDTRACE, SI_ORDER_FIRST, init_hwpmc, NULL);
344 
345