// SPDX-License-Identifier: GPL-2.0
/* tools/lib/perf/evlist.c (revision f4f346c3465949ebba80c6cc52cd8d2eeaa545fd) */
#include <perf/evlist.h>
#include <perf/evsel.h>
#include <linux/bitops.h>
#include <linux/list.h>
#include <linux/hash.h>
#include <sys/ioctl.h>
#include <internal/evlist.h>
#include <internal/evsel.h>
#include <internal/xyarray.h>
#include <internal/mmap.h>
#include <internal/cpumap.h>
#include <internal/threadmap.h>
#include <internal/lib.h>
#include <linux/zalloc.h>
#include <stdlib.h>
#include <errno.h>
#include <unistd.h>
#include <fcntl.h>
#include <signal.h>
#include <poll.h>
#include <sys/mman.h>
#include <perf/cpumap.h>
#include <perf/threadmap.h>
#include <api/fd/array.h>
#include "internal.h"

void perf_evlist__init(struct perf_evlist *evlist)
{
	INIT_LIST_HEAD(&evlist->entries);
	evlist->nr_entries = 0;
	fdarray__init(&evlist->pollfd, 64);
	perf_evlist__reset_id_hash(evlist);
}

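/*
 * Propagate the evlist's CPU and thread maps into @evsel: the evsel's own
 * cpus/pmu_cpus/threads are reconciled with the user-requested maps on the
 * evlist, and the result is merged into evlist->all_cpus. An evsel whose
 * resulting CPU map is genuinely empty is removed from the evlist entirely.
 */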
static void __perf_evlist__propagate_maps(struct perf_evlist *evlist,
					  struct perf_evsel *evsel)
{
	if (perf_cpu_map__is_empty(evsel->cpus)) {
		if (perf_cpu_map__is_empty(evsel->pmu_cpus)) {
			/*
			 * Assume the unset PMU cpus were for a system-wide
			 * event, like a software or tracepoint.
			 */
			evsel->pmu_cpus = perf_cpu_map__new_online_cpus();
		}
		if (evlist->has_user_cpus && !evsel->system_wide) {
			/*
			 * Use the user CPUs unless the evsel is set to be
			 * system wide, such as the dummy event.
			 */
			evsel->cpus = perf_cpu_map__get(evlist->user_requested_cpus);
		} else {
			/*
			 * System wide and other modes, assume the cpu map
			 * should be set to all PMU CPUs.
			 */
			evsel->cpus = perf_cpu_map__get(evsel->pmu_cpus);
		}
	}
	/*
	 * Avoid "any CPU" (-1) for uncore and PMUs that require a CPU, even if
	 * requested.
	 */
	if (evsel->requires_cpu && perf_cpu_map__has_any_cpu(evsel->cpus)) {
		perf_cpu_map__put(evsel->cpus);
		evsel->cpus = perf_cpu_map__get(evsel->pmu_cpus);
	}

	/*
	 * Globally requested CPUs replace user requested unless the evsel is
	 * set to be system wide.
	 */
	if (evlist->has_user_cpus && !evsel->system_wide) {
		assert(!perf_cpu_map__has_any_cpu(evlist->user_requested_cpus));
		if (!perf_cpu_map__equal(evsel->cpus, evlist->user_requested_cpus)) {
			perf_cpu_map__put(evsel->cpus);
			evsel->cpus = perf_cpu_map__get(evlist->user_requested_cpus);
		}
	}

	/* Ensure cpus only references valid PMU CPUs. */
	if (!perf_cpu_map__has_any_cpu(evsel->cpus) &&
	    !perf_cpu_map__is_subset(evsel->pmu_cpus, evsel->cpus)) {
		struct perf_cpu_map *tmp = perf_cpu_map__intersect(evsel->pmu_cpus, evsel->cpus);

		perf_cpu_map__put(evsel->cpus);
		evsel->cpus = tmp;
	}

	/*
	 * Was the event requested on all the PMU's CPUs while the user
	 * requested "any CPU" (-1)? If so, switch to using "any CPU" (-1) to
	 * reduce the number of events.
	 */
	if (!evsel->system_wide &&
	    !evsel->requires_cpu &&
	    perf_cpu_map__equal(evsel->cpus, evsel->pmu_cpus) &&
	    perf_cpu_map__has_any_cpu(evlist->user_requested_cpus)) {
		perf_cpu_map__put(evsel->cpus);
		evsel->cpus = perf_cpu_map__get(evlist->user_requested_cpus);
	}

	/* Sanity check assert before the evsel is potentially removed. */
	assert(!evsel->requires_cpu || !perf_cpu_map__has_any_cpu(evsel->cpus));

	/*
	 * Empty cpu lists would eventually get opened as "any" so remove
	 * genuinely empty ones before they're opened in the wrong place.
	 */
	if (perf_cpu_map__is_empty(evsel->cpus)) {
		struct perf_evsel *next = perf_evlist__next(evlist, evsel);

		perf_evlist__remove(evlist, evsel);
		/* Keep idx contiguous */
		if (next)
			list_for_each_entry_from(next, &evlist->entries, node)
				next->idx--;

		return;
	}

	if (evsel->system_wide) {
		perf_thread_map__put(evsel->threads);
		evsel->threads = perf_thread_map__new_dummy();
	} else {
		perf_thread_map__put(evsel->threads);
		evsel->threads = perf_thread_map__get(evlist->threads);
	}

	perf_cpu_map__merge(&evlist->all_cpus, evsel->cpus);
}

static void perf_evlist__propagate_maps(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel, *n;

	evlist->needs_map_propagation = true;

	/* Clear the all_cpus set, which the propagation below merges into. */
	perf_cpu_map__put(evlist->all_cpus);
	evlist->all_cpus = NULL;

	list_for_each_entry_safe(evsel, n, &evlist->entries, node)
		__perf_evlist__propagate_maps(evlist, evsel);
}

void perf_evlist__add(struct perf_evlist *evlist,
		      struct perf_evsel *evsel)
{
	evsel->idx = evlist->nr_entries;
	list_add_tail(&evsel->node, &evlist->entries);
	evlist->nr_entries += 1;

	if (evlist->needs_map_propagation)
		__perf_evlist__propagate_maps(evlist, evsel);
}

void perf_evlist__remove(struct perf_evlist *evlist,
			 struct perf_evsel *evsel)
{
	list_del_init(&evsel->node);
	evlist->nr_entries -= 1;
}

struct perf_evlist *perf_evlist__new(void)
{
	struct perf_evlist *evlist = zalloc(sizeof(*evlist));

	if (evlist != NULL)
		perf_evlist__init(evlist);

	return evlist;
}

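/*
 * Typical lifecycle of an evlist, as an illustrative sketch only. It assumes
 * perf_evsel__new() from libperf's evsel.c and a populated perf_event_attr;
 * error handling is elided. Per the perf_evlist__set_maps() comment below,
 * the evlist takes ownership of the brand-new maps passed to it:
 *
 *	struct perf_evlist *evlist = perf_evlist__new();
 *	struct perf_evsel *evsel = perf_evsel__new(&attr);
 *
 *	perf_evlist__add(evlist, evsel);
 *	perf_evlist__set_maps(evlist, perf_cpu_map__new_online_cpus(),
 *			      perf_thread_map__new_dummy());
 *	if (perf_evlist__open(evlist) == 0) {
 *		perf_evlist__enable(evlist);
 *		... read counters, or mmap and poll for samples ...
 *		perf_evlist__disable(evlist);
 *		perf_evlist__close(evlist);
 *	}
 *	perf_evlist__delete(evlist);
 */
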
struct perf_evsel *
perf_evlist__next(struct perf_evlist *evlist, struct perf_evsel *prev)
{
	struct perf_evsel *next;

	if (!prev) {
		next = list_first_entry(&evlist->entries,
					struct perf_evsel,
					node);
	} else {
		next = list_next_entry(prev, node);
	}

	/* An empty list is noticed here, so it doesn't need checking on entry. */
	if (&next->node == &evlist->entries)
		return NULL;

	return next;
}

static void perf_evlist__purge(struct perf_evlist *evlist)
{
	struct perf_evsel *pos, *n;

	perf_evlist__for_each_entry_safe(evlist, n, pos) {
		list_del_init(&pos->node);
		perf_evsel__delete(pos);
	}

	evlist->nr_entries = 0;
}

void perf_evlist__exit(struct perf_evlist *evlist)
{
	perf_cpu_map__put(evlist->user_requested_cpus);
	perf_cpu_map__put(evlist->all_cpus);
	perf_thread_map__put(evlist->threads);
	evlist->user_requested_cpus = NULL;
	evlist->all_cpus = NULL;
	evlist->threads = NULL;
	fdarray__exit(&evlist->pollfd);
}

void perf_evlist__delete(struct perf_evlist *evlist)
{
	if (evlist == NULL)
		return;

	perf_evlist__munmap(evlist);
	perf_evlist__close(evlist);
	perf_evlist__purge(evlist);
	perf_evlist__exit(evlist);
	free(evlist);
}

void perf_evlist__set_maps(struct perf_evlist *evlist,
			   struct perf_cpu_map *cpus,
			   struct perf_thread_map *threads)
{
	/*
	 * Allow for the possibility that one or another of the maps isn't
	 * being changed, i.e. don't put it.  Note we are assuming the maps
	 * that are being applied are brand new and evlist is taking ownership
	 * of the original reference count of 1.  If that is not the case it
	 * is up to the caller to increase the reference count.
	 */
	if (cpus != evlist->user_requested_cpus) {
		perf_cpu_map__put(evlist->user_requested_cpus);
		evlist->user_requested_cpus = perf_cpu_map__get(cpus);
	}

	if (threads != evlist->threads) {
		perf_thread_map__put(evlist->threads);
		evlist->threads = perf_thread_map__get(threads);
	}

	perf_evlist__propagate_maps(evlist);
}

int perf_evlist__open(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;
	int err;

	perf_evlist__for_each_entry(evlist, evsel) {
		err = perf_evsel__open(evsel, evsel->cpus, evsel->threads);
		if (err < 0)
			goto out_err;
	}

	return 0;

out_err:
	perf_evlist__close(evlist);
	return err;
}

void perf_evlist__close(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	perf_evlist__for_each_entry_reverse(evlist, evsel)
		perf_evsel__close(evsel);
}

void perf_evlist__enable(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	perf_evlist__for_each_entry(evlist, evsel)
		perf_evsel__enable(evsel);
}

void perf_evlist__disable(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	perf_evlist__for_each_entry(evlist, evsel)
		perf_evsel__disable(evsel);
}

u64 perf_evlist__read_format(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist);

	return first->attr.read_format;
}

#define SID(e, x, y) xyarray__entry(e->sample_id, x, y)

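/*
 * The sample_id hash: each opened event's u64 ID is hashed into
 * evlist->heads[], a fixed-size table of hlists, so that a sample's ID can
 * be mapped back to its perf_sample_id (and thus its evsel) in O(1) on
 * average.
 */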
static void perf_evlist__id_hash(struct perf_evlist *evlist,
				 struct perf_evsel *evsel,
				 int cpu_map_idx, int thread, u64 id)
{
	int hash;
	struct perf_sample_id *sid = SID(evsel, cpu_map_idx, thread);

	sid->id = id;
	sid->evsel = evsel;
	hash = hash_64(sid->id, PERF_EVLIST__HLIST_BITS);
	hlist_add_head(&sid->node, &evlist->heads[hash]);
}

void perf_evlist__reset_id_hash(struct perf_evlist *evlist)
{
	int i;

	for (i = 0; i < PERF_EVLIST__HLIST_SIZE; ++i)
		INIT_HLIST_HEAD(&evlist->heads[i]);
}

void perf_evlist__id_add(struct perf_evlist *evlist,
			 struct perf_evsel *evsel,
			 int cpu_map_idx, int thread, u64 id)
{
	if (!SID(evsel, cpu_map_idx, thread))
		return;

	perf_evlist__id_hash(evlist, evsel, cpu_map_idx, thread, id);
	evsel->id[evsel->ids++] = id;
}

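/*
 * Obtain the event ID for an already-open fd and register it. The fast path
 * is the PERF_EVENT_IOC_ID ioctl; on kernels predating it (ENOTTY), the ID
 * is recovered from a read() of the counter, whose buffer is laid out as:
 *
 *	{ value, [time_enabled], [time_running], id }
 *
 * with the optional fields present when the corresponding
 * PERF_FORMAT_TOTAL_TIME_* bits are set in attr.read_format.
 */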
int perf_evlist__id_add_fd(struct perf_evlist *evlist,
			   struct perf_evsel *evsel,
			   int cpu_map_idx, int thread, int fd)
{
	u64 read_data[4] = { 0, };
	int id_idx = 1; /* The first entry is the counter value */
	u64 id;
	int ret;

	if (!SID(evsel, cpu_map_idx, thread))
		return -1;

	ret = ioctl(fd, PERF_EVENT_IOC_ID, &id);
	if (!ret)
		goto add;

	if (errno != ENOTTY)
		return -1;

	/* Legacy way to get the event id. All hail to old kernels! */

	/*
	 * This way does not work with group format read, so bail
	 * out in that case.
	 */
	if (perf_evlist__read_format(evlist) & PERF_FORMAT_GROUP)
		return -1;

	if (!(evsel->attr.read_format & PERF_FORMAT_ID) ||
	    read(fd, &read_data, sizeof(read_data)) == -1)
		return -1;

	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
		++id_idx;
	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
		++id_idx;

	id = read_data[id_idx];

add:
	perf_evlist__id_add(evlist, evsel, cpu_map_idx, thread, id);
	return 0;
}

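/*
 * Size the pollfd array for every fd the evlist can open: for example, with
 * 4 CPUs and 3 threads, a regular evsel contributes 4 * 3 = 12 entries while
 * a system-wide evsel contributes only 4 (one per CPU).
 */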
int perf_evlist__alloc_pollfd(struct perf_evlist *evlist)
{
	int nr_cpus = perf_cpu_map__nr(evlist->all_cpus);
	int nr_threads = perf_thread_map__nr(evlist->threads);
	int nfds = 0;
	struct perf_evsel *evsel;

	perf_evlist__for_each_entry(evlist, evsel) {
		if (evsel->system_wide)
			nfds += nr_cpus;
		else
			nfds += nr_cpus * nr_threads;
	}

	if (fdarray__available_entries(&evlist->pollfd) < nfds &&
	    fdarray__grow(&evlist->pollfd, nfds) < 0)
		return -ENOMEM;

	return 0;
}

int perf_evlist__add_pollfd(struct perf_evlist *evlist, int fd,
			    void *ptr, short revent, enum fdarray_flags flags)
{
	int pos = fdarray__add(&evlist->pollfd, fd, revent | POLLERR | POLLHUP, flags);

	if (pos >= 0) {
		evlist->pollfd.priv[pos].ptr = ptr;
		fcntl(fd, F_SETFL, O_NONBLOCK);
	}

	return pos;
}

static void perf_evlist__munmap_filtered(struct fdarray *fda, int fd,
					 void *arg __maybe_unused)
{
	struct perf_mmap *map = fda->priv[fd].ptr;

	if (map)
		perf_mmap__put(map);
}

int perf_evlist__filter_pollfd(struct perf_evlist *evlist, short revents_and_mask)
{
	return fdarray__filter(&evlist->pollfd, revents_and_mask,
			       perf_evlist__munmap_filtered, NULL);
}

int perf_evlist__poll(struct perf_evlist *evlist, int timeout)
{
	return fdarray__poll(&evlist->pollfd, timeout);
}

static struct perf_mmap* perf_evlist__alloc_mmap(struct perf_evlist *evlist, bool overwrite)
{
	int i;
	struct perf_mmap *map;

	map = zalloc(evlist->nr_mmaps * sizeof(struct perf_mmap));
	if (!map)
		return NULL;

	for (i = 0; i < evlist->nr_mmaps; i++) {
		struct perf_mmap *prev = i ? &map[i - 1] : NULL;

		/*
		 * When the perf_mmap() call is made we grab one refcount, plus
		 * one extra to let perf_mmap__consume() get the last
		 * events after all real references (perf_mmap__get()) are
		 * dropped.
		 *
		 * Each PERF_EVENT_IOC_SET_OUTPUT points to this mmap and
		 * thus does perf_mmap__get() on it.
		 */
		perf_mmap__init(&map[i], prev, overwrite, NULL);
	}

	return map;
}

static void perf_evsel__set_sid_idx(struct perf_evsel *evsel, int idx, int cpu, int thread)
{
	struct perf_sample_id *sid = SID(evsel, cpu, thread);

	sid->idx = idx;
	sid->cpu = perf_cpu_map__cpu(evsel->cpus, cpu);
	sid->tid = perf_thread_map__pid(evsel->threads, thread);
}

static struct perf_mmap*
perf_evlist__mmap_cb_get(struct perf_evlist *evlist, bool overwrite, int idx)
{
	struct perf_mmap *maps;

	maps = overwrite ? evlist->mmap_ovw : evlist->mmap;

	if (!maps) {
		maps = perf_evlist__alloc_mmap(evlist, overwrite);
		if (!maps)
			return NULL;

		if (overwrite)
			evlist->mmap_ovw = maps;
		else
			evlist->mmap = maps;
	}

	return &maps[idx];
}

#define FD(e, x, y) (*(int *) xyarray__entry(e->fd, x, y))

static int
perf_evlist__mmap_cb_mmap(struct perf_mmap *map, struct perf_mmap_param *mp,
			  int output, struct perf_cpu cpu)
{
	return perf_mmap__mmap(map, mp, output, cpu);
}

static void perf_evlist__set_mmap_first(struct perf_evlist *evlist, struct perf_mmap *map,
					bool overwrite)
{
	if (overwrite)
		evlist->mmap_ovw_first = map;
	else
		evlist->mmap_first = map;
}

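/*
 * mmap (or redirect) every evsel's fd for one (ring-buffer index, thread)
 * slot. Only the first matching fd per ring buffer is actually mmapped; the
 * rest are redirected into that buffer with PERF_EVENT_IOC_SET_OUTPUT, so
 * all events sharing the slot share one ring buffer.
 */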
static int
mmap_per_evsel(struct perf_evlist *evlist, struct perf_evlist_mmap_ops *ops,
	       int idx, struct perf_mmap_param *mp, int cpu_idx,
	       int thread, int *_output, int *_output_overwrite, int *nr_mmaps)
{
	struct perf_cpu evlist_cpu = perf_cpu_map__cpu(evlist->all_cpus, cpu_idx);
	struct perf_evsel *evsel;
	int revent;

	perf_evlist__for_each_entry(evlist, evsel) {
		bool overwrite = evsel->attr.write_backward;
		enum fdarray_flags flgs;
		struct perf_mmap *map;
		int *output, fd, cpu;

		if (evsel->system_wide && thread)
			continue;

		cpu = perf_cpu_map__idx(evsel->cpus, evlist_cpu);
		if (cpu == -1)
			continue;

		map = ops->get(evlist, overwrite, idx);
		if (map == NULL)
			return -ENOMEM;

		if (overwrite) {
			mp->prot = PROT_READ;
			output   = _output_overwrite;
		} else {
			mp->prot = PROT_READ | PROT_WRITE;
			output   = _output;
		}

		fd = FD(evsel, cpu, thread);

		if (*output == -1) {
			*output = fd;

			/*
			 * The last one will be done at perf_mmap__consume(), so that we
			 * make sure we don't prevent tools from consuming every last event in
			 * the ring buffer.
			 *
			 * I.e. we can get the POLLHUP meaning that the fd doesn't exist
			 * anymore, but the last events for it are still in the ring buffer,
			 * waiting to be consumed.
			 *
			 * Tools can choose to ignore this at their own discretion, but the
			 * evlist layer can't just drop it when filtering events in
			 * perf_evlist__filter_pollfd().
			 */
			refcount_set(&map->refcnt, 2);

			if (ops->idx)
				ops->idx(evlist, evsel, mp, idx);

			/* Debug message used by test scripts */
			pr_debug("idx %d: mmapping fd %d\n", idx, *output);
			if (ops->mmap(map, mp, *output, evlist_cpu) < 0)
				return -1;

			*nr_mmaps += 1;

			if (!idx)
				perf_evlist__set_mmap_first(evlist, map, overwrite);
		} else {
			/* Debug message used by test scripts */
			pr_debug("idx %d: set output fd %d -> %d\n", idx, fd, *output);
			if (ioctl(fd, PERF_EVENT_IOC_SET_OUTPUT, *output) != 0)
				return -1;

			perf_mmap__get(map);
		}

		revent = !overwrite ? POLLIN : 0;

		flgs = evsel->system_wide ? fdarray_flag__nonfilterable : fdarray_flag__default;
		if (perf_evlist__add_pollfd(evlist, fd, map, revent, flgs) < 0) {
			perf_mmap__put(map);
			return -1;
		}

		if (evsel->attr.read_format & PERF_FORMAT_ID) {
			if (perf_evlist__id_add_fd(evlist, evsel, cpu, thread,
						   fd) < 0)
				return -1;
			perf_evsel__set_sid_idx(evsel, idx, cpu, thread);
		}
	}

	return 0;
}

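/*
 * Ring-buffer index layout when the evlist includes the "any CPU" (-1)
 * value: indexes 0 .. nr_threads-1 are the per-thread mmaps, done against
 * CPU map index 0, and the remaining real CPUs follow from index nr_threads
 * onwards.
 */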
static int
mmap_per_thread(struct perf_evlist *evlist, struct perf_evlist_mmap_ops *ops,
		struct perf_mmap_param *mp)
{
	int nr_threads = perf_thread_map__nr(evlist->threads);
	int nr_cpus    = perf_cpu_map__nr(evlist->all_cpus);
	int cpu, thread, idx = 0;
	int nr_mmaps = 0;

	pr_debug("%s: nr cpu values (may include -1) %d nr threads %d\n",
		 __func__, nr_cpus, nr_threads);

	/* per-thread mmaps */
	for (thread = 0; thread < nr_threads; thread++, idx++) {
		int output = -1;
		int output_overwrite = -1;

		if (mmap_per_evsel(evlist, ops, idx, mp, 0, thread, &output,
				   &output_overwrite, &nr_mmaps))
			goto out_unmap;
	}

	/* system-wide mmaps i.e. per-cpu */
	for (cpu = 1; cpu < nr_cpus; cpu++, idx++) {
		int output = -1;
		int output_overwrite = -1;

		if (mmap_per_evsel(evlist, ops, idx, mp, cpu, 0, &output,
				   &output_overwrite, &nr_mmaps))
			goto out_unmap;
	}

	if (nr_mmaps != evlist->nr_mmaps)
		pr_err("Miscounted nr_mmaps %d vs %d\n", nr_mmaps, evlist->nr_mmaps);

	return 0;

out_unmap:
	perf_evlist__munmap(evlist);
	return -1;
}

static int
mmap_per_cpu(struct perf_evlist *evlist, struct perf_evlist_mmap_ops *ops,
	     struct perf_mmap_param *mp)
{
	int nr_threads = perf_thread_map__nr(evlist->threads);
	int nr_cpus    = perf_cpu_map__nr(evlist->all_cpus);
	int nr_mmaps = 0;
	int cpu, thread;

	pr_debug("%s: nr cpu values %d nr threads %d\n", __func__, nr_cpus, nr_threads);

	for (cpu = 0; cpu < nr_cpus; cpu++) {
		int output = -1;
		int output_overwrite = -1;

		for (thread = 0; thread < nr_threads; thread++) {
			if (mmap_per_evsel(evlist, ops, cpu, mp, cpu,
					   thread, &output, &output_overwrite, &nr_mmaps))
				goto out_unmap;
		}
	}

	if (nr_mmaps != evlist->nr_mmaps)
		pr_err("Miscounted nr_mmaps %d vs %d\n", nr_mmaps, evlist->nr_mmaps);

	return 0;

out_unmap:
	perf_evlist__munmap(evlist);
	return -1;
}

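/*
 * Worked example: with a CPU map of { -1, 0, 1, 2, 3 } (the "any CPU" value
 * plus four real CPUs) and 3 threads, this yields 5 + 3 - 1 = 7 ring
 * buffers: one per thread plus one per real CPU. Without the "any CPU"
 * value it is simply one ring buffer per CPU.
 */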
static int perf_evlist__nr_mmaps(struct perf_evlist *evlist)
{
	int nr_mmaps;

	/* One for each CPU */
	nr_mmaps = perf_cpu_map__nr(evlist->all_cpus);
	if (perf_cpu_map__has_any_cpu_or_is_empty(evlist->all_cpus)) {
		/* Plus one for each thread */
		nr_mmaps += perf_thread_map__nr(evlist->threads);
		/* Minus the per-thread CPU (-1) */
		nr_mmaps -= 1;
	}

	return nr_mmaps;
}

int perf_evlist__mmap_ops(struct perf_evlist *evlist,
			  struct perf_evlist_mmap_ops *ops,
			  struct perf_mmap_param *mp)
{
	const struct perf_cpu_map *cpus = evlist->all_cpus;
	struct perf_evsel *evsel;

	if (!ops || !ops->get || !ops->mmap)
		return -EINVAL;

	mp->mask = evlist->mmap_len - page_size - 1;

	evlist->nr_mmaps = perf_evlist__nr_mmaps(evlist);

	perf_evlist__for_each_entry(evlist, evsel) {
		if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
		    evsel->sample_id == NULL &&
		    perf_evsel__alloc_id(evsel, evsel->fd->max_x, evsel->fd->max_y) < 0)
			return -ENOMEM;
	}

	if (evlist->pollfd.entries == NULL && perf_evlist__alloc_pollfd(evlist) < 0)
		return -ENOMEM;

	if (perf_cpu_map__has_any_cpu_or_is_empty(cpus))
		return mmap_per_thread(evlist, ops, mp);

	return mmap_per_cpu(evlist, ops, mp);
}

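/*
 * @pages is the number of data pages; one extra page is added for the
 * kernel's ring-buffer header, so mmap_len = (pages + 1) * page_size.
 * For the mask computed in perf_evlist__mmap_ops() above to be a valid
 * power-of-two size mask, @pages must itself be a power of two: e.g.
 * pages = 128 with 4 KiB pages gives a 512 KiB data area and mask 0x7ffff.
 */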
int perf_evlist__mmap(struct perf_evlist *evlist, int pages)
{
	struct perf_mmap_param mp;
	struct perf_evlist_mmap_ops ops = {
		.get  = perf_evlist__mmap_cb_get,
		.mmap = perf_evlist__mmap_cb_mmap,
	};

	evlist->mmap_len = (pages + 1) * page_size;

	return perf_evlist__mmap_ops(evlist, &ops, &mp);
}

void perf_evlist__munmap(struct perf_evlist *evlist)
{
	int i;

	if (evlist->mmap) {
		for (i = 0; i < evlist->nr_mmaps; i++)
			perf_mmap__munmap(&evlist->mmap[i]);
	}

	if (evlist->mmap_ovw) {
		for (i = 0; i < evlist->nr_mmaps; i++)
			perf_mmap__munmap(&evlist->mmap_ovw[i]);
	}

	zfree(&evlist->mmap);
	zfree(&evlist->mmap_ovw);
}

struct perf_mmap*
perf_evlist__next_mmap(struct perf_evlist *evlist, struct perf_mmap *map,
		       bool overwrite)
{
	if (map)
		return map->next;

	return overwrite ? evlist->mmap_ovw_first : evlist->mmap_first;
}

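/*
 * Grouping: the leader is the first evsel in the group and its nr_members
 * counts every member including itself; a lone evsel is its own leader with
 * nr_members == 1. An illustrative iteration over the group leaders,
 * assuming a @list whose leaders have already been set:
 *
 *	__perf_evlist__for_each_entry(list, evsel) {
 *		if (evsel->leader == evsel)
 *			pr_debug("group of %d starting at idx %d\n",
 *				 evsel->nr_members, evsel->idx);
 *	}
 */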
void __perf_evlist__set_leader(struct list_head *list, struct perf_evsel *leader)
{
	struct perf_evsel *evsel;
	int n = 0;

	__perf_evlist__for_each_entry(list, evsel) {
		evsel->leader = leader;
		n++;
	}
	leader->nr_members = n;
}

void perf_evlist__set_leader(struct perf_evlist *evlist)
{
	if (evlist->nr_entries) {
		struct perf_evsel *first = list_entry(evlist->entries.next,
						struct perf_evsel, node);

		__perf_evlist__set_leader(&evlist->entries, first);
	}
}

int perf_evlist__nr_groups(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;
	int nr_groups = 0;

	perf_evlist__for_each_evsel(evlist, evsel) {
		/*
		 * evsels by default have a nr_members of 1 and are their own
		 * leader. A nr_members greater than 1 indicates a group.
		 */
		if (evsel->leader == evsel && evsel->nr_members > 1)
			nr_groups++;
	}
	return nr_groups;
}

void perf_evlist__go_system_wide(struct perf_evlist *evlist, struct perf_evsel *evsel)
{
	if (!evsel->system_wide) {
		evsel->system_wide = true;
		if (evlist->needs_map_propagation)
			__perf_evlist__propagate_maps(evlist, evsel);
	}
}
813