xref: /linux/tools/perf/util/record.c (revision 5643b1a59e581ac3f66d36caba8124313cc446c0)
1 // SPDX-License-Identifier: GPL-2.0
2 #include "evlist.h"
3 #include "evsel.h"
4 #include "cpumap.h"
5 #include "parse-events.h"
6 #include <errno.h>
7 #include <api/fs/fs.h>
8 #include <subcmd/parse-options.h>
9 #include <perf/cpumap.h>
10 #include "util.h"
11 #include "cloexec.h"
12 
13 typedef void (*setup_probe_fn_t)(struct evsel *evsel);
14 
15 static int perf_do_probe_api(setup_probe_fn_t fn, int cpu, const char *str)
16 {
17 	struct evlist *evlist;
18 	struct evsel *evsel;
19 	unsigned long flags = perf_event_open_cloexec_flag();
20 	int err = -EAGAIN, fd;
21 	static pid_t pid = -1;
22 
23 	evlist = evlist__new();
24 	if (!evlist)
25 		return -ENOMEM;
26 
27 	if (parse_events(evlist, str, NULL))
28 		goto out_delete;
29 
30 	evsel = perf_evlist__first(evlist);
31 
32 	while (1) {
33 		fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1, flags);
34 		if (fd < 0) {
35 			if (pid == -1 && errno == EACCES) {
36 				pid = 0;
37 				continue;
38 			}
39 			goto out_delete;
40 		}
41 		break;
42 	}
43 	close(fd);
44 
45 	fn(evsel);
46 
47 	fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1, flags);
48 	if (fd < 0) {
49 		if (errno == EINVAL)
50 			err = -EINVAL;
51 		goto out_delete;
52 	}
53 	close(fd);
54 	err = 0;
55 
56 out_delete:
57 	evlist__delete(evlist);
58 	return err;
59 }
60 
61 static bool perf_probe_api(setup_probe_fn_t fn)
62 {
63 	const char *try[] = {"cycles:u", "instructions:u", "cpu-clock:u", NULL};
64 	struct perf_cpu_map *cpus;
65 	int cpu, ret, i = 0;
66 
67 	cpus = perf_cpu_map__new(NULL);
68 	if (!cpus)
69 		return false;
70 	cpu = cpus->map[0];
71 	perf_cpu_map__put(cpus);
72 
73 	do {
74 		ret = perf_do_probe_api(fn, cpu, try[i++]);
75 		if (!ret)
76 			return true;
77 	} while (ret == -EAGAIN && try[i]);
78 
79 	return false;
80 }
81 
82 static void perf_probe_sample_identifier(struct evsel *evsel)
83 {
84 	evsel->core.attr.sample_type |= PERF_SAMPLE_IDENTIFIER;
85 }
86 
87 static void perf_probe_comm_exec(struct evsel *evsel)
88 {
89 	evsel->core.attr.comm_exec = 1;
90 }
91 
92 static void perf_probe_context_switch(struct evsel *evsel)
93 {
94 	evsel->core.attr.context_switch = 1;
95 }
96 
97 bool perf_can_sample_identifier(void)
98 {
99 	return perf_probe_api(perf_probe_sample_identifier);
100 }
101 
102 static bool perf_can_comm_exec(void)
103 {
104 	return perf_probe_api(perf_probe_comm_exec);
105 }
106 
107 bool perf_can_record_switch_events(void)
108 {
109 	return perf_probe_api(perf_probe_context_switch);
110 }
111 
112 bool perf_can_record_cpu_wide(void)
113 {
114 	struct perf_event_attr attr = {
115 		.type = PERF_TYPE_SOFTWARE,
116 		.config = PERF_COUNT_SW_CPU_CLOCK,
117 		.exclude_kernel = 1,
118 	};
119 	struct perf_cpu_map *cpus;
120 	int cpu, fd;
121 
122 	cpus = perf_cpu_map__new(NULL);
123 	if (!cpus)
124 		return false;
125 	cpu = cpus->map[0];
126 	perf_cpu_map__put(cpus);
127 
128 	fd = sys_perf_event_open(&attr, -1, cpu, -1, 0);
129 	if (fd < 0)
130 		return false;
131 	close(fd);
132 
133 	return true;
134 }
135 
136 void perf_evlist__config(struct evlist *evlist, struct record_opts *opts,
137 			 struct callchain_param *callchain)
138 {
139 	struct evsel *evsel;
140 	bool use_sample_identifier = false;
141 	bool use_comm_exec;
142 	bool sample_id = opts->sample_id;
143 
144 	/*
145 	 * Set the evsel leader links before we configure attributes,
146 	 * since some might depend on this info.
147 	 */
148 	if (opts->group)
149 		perf_evlist__set_leader(evlist);
150 
151 	if (evlist->core.cpus->map[0] < 0)
152 		opts->no_inherit = true;
153 
154 	use_comm_exec = perf_can_comm_exec();
155 
156 	evlist__for_each_entry(evlist, evsel) {
157 		perf_evsel__config(evsel, opts, callchain);
158 		if (evsel->tracking && use_comm_exec)
159 			evsel->core.attr.comm_exec = 1;
160 	}
161 
162 	if (opts->full_auxtrace) {
163 		/*
164 		 * Need to be able to synthesize and parse selected events with
165 		 * arbitrary sample types, which requires always being able to
166 		 * match the id.
167 		 */
168 		use_sample_identifier = perf_can_sample_identifier();
169 		sample_id = true;
170 	} else if (evlist->core.nr_entries > 1) {
171 		struct evsel *first = perf_evlist__first(evlist);
172 
173 		evlist__for_each_entry(evlist, evsel) {
174 			if (evsel->core.attr.sample_type == first->core.attr.sample_type)
175 				continue;
176 			use_sample_identifier = perf_can_sample_identifier();
177 			break;
178 		}
179 		sample_id = true;
180 	}
181 
182 	if (sample_id) {
183 		evlist__for_each_entry(evlist, evsel)
184 			perf_evsel__set_sample_id(evsel, use_sample_identifier);
185 	}
186 
187 	perf_evlist__set_id_pos(evlist);
188 }
189 
190 static int get_max_rate(unsigned int *rate)
191 {
192 	return sysctl__read_int("kernel/perf_event_max_sample_rate", (int *)rate);
193 }
194 
195 static int record_opts__config_freq(struct record_opts *opts)
196 {
197 	bool user_freq = opts->user_freq != UINT_MAX;
198 	unsigned int max_rate;
199 
200 	if (opts->user_interval != ULLONG_MAX)
201 		opts->default_interval = opts->user_interval;
202 	if (user_freq)
203 		opts->freq = opts->user_freq;
204 
205 	/*
206 	 * User specified count overrides default frequency.
207 	 */
208 	if (opts->default_interval)
209 		opts->freq = 0;
210 	else if (opts->freq) {
211 		opts->default_interval = opts->freq;
212 	} else {
213 		pr_err("frequency and count are zero, aborting\n");
214 		return -1;
215 	}
216 
217 	if (get_max_rate(&max_rate))
218 		return 0;
219 
220 	/*
221 	 * User specified frequency is over current maximum.
222 	 */
223 	if (user_freq && (max_rate < opts->freq)) {
224 		if (opts->strict_freq) {
225 			pr_err("error: Maximum frequency rate (%'u Hz) exceeded.\n"
226 			       "       Please use -F freq option with a lower value or consider\n"
227 			       "       tweaking /proc/sys/kernel/perf_event_max_sample_rate.\n",
228 			       max_rate);
229 			return -1;
230 		} else {
231 			pr_warning("warning: Maximum frequency rate (%'u Hz) exceeded, throttling from %'u Hz to %'u Hz.\n"
232 				   "         The limit can be raised via /proc/sys/kernel/perf_event_max_sample_rate.\n"
233 				   "         The kernel will lower it when perf's interrupts take too long.\n"
234 				   "         Use --strict-freq to disable this throttling, refusing to record.\n",
235 				   max_rate, opts->freq, max_rate);
236 
237 			opts->freq = max_rate;
238 		}
239 	}
240 
241 	/*
242 	 * Default frequency is over current maximum.
243 	 */
244 	if (max_rate < opts->freq) {
245 		pr_warning("Lowering default frequency rate to %u.\n"
246 			   "Please consider tweaking "
247 			   "/proc/sys/kernel/perf_event_max_sample_rate.\n",
248 			   max_rate);
249 		opts->freq = max_rate;
250 	}
251 
252 	return 0;
253 }
254 
255 int record_opts__config(struct record_opts *opts)
256 {
257 	return record_opts__config_freq(opts);
258 }
259 
260 bool perf_evlist__can_select_event(struct evlist *evlist, const char *str)
261 {
262 	struct evlist *temp_evlist;
263 	struct evsel *evsel;
264 	int err, fd, cpu;
265 	bool ret = false;
266 	pid_t pid = -1;
267 
268 	temp_evlist = evlist__new();
269 	if (!temp_evlist)
270 		return false;
271 
272 	err = parse_events(temp_evlist, str, NULL);
273 	if (err)
274 		goto out_delete;
275 
276 	evsel = perf_evlist__last(temp_evlist);
277 
278 	if (!evlist || cpu_map__empty(evlist->core.cpus)) {
279 		struct perf_cpu_map *cpus = perf_cpu_map__new(NULL);
280 
281 		cpu =  cpus ? cpus->map[0] : 0;
282 		perf_cpu_map__put(cpus);
283 	} else {
284 		cpu = evlist->core.cpus->map[0];
285 	}
286 
287 	while (1) {
288 		fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1,
289 					 perf_event_open_cloexec_flag());
290 		if (fd < 0) {
291 			if (pid == -1 && errno == EACCES) {
292 				pid = 0;
293 				continue;
294 			}
295 			goto out_delete;
296 		}
297 		break;
298 	}
299 	close(fd);
300 	ret = true;
301 
302 out_delete:
303 	evlist__delete(temp_evlist);
304 	return ret;
305 }
306 
307 int record__parse_freq(const struct option *opt, const char *str, int unset __maybe_unused)
308 {
309 	unsigned int freq;
310 	struct record_opts *opts = opt->value;
311 
312 	if (!str)
313 		return -EINVAL;
314 
315 	if (strcasecmp(str, "max") == 0) {
316 		if (get_max_rate(&freq)) {
317 			pr_err("couldn't read /proc/sys/kernel/perf_event_max_sample_rate\n");
318 			return -1;
319 		}
320 		pr_info("info: Using a maximum frequency rate of %'d Hz\n", freq);
321 	} else {
322 		freq = atoi(str);
323 	}
324 
325 	opts->user_freq = freq;
326 	return 0;
327 }
328