1 // SPDX-License-Identifier: GPL-2.0 2 #include "evlist.h" 3 #include "evsel.h" 4 #include "cpumap.h" 5 #include "parse-events.h" 6 #include <errno.h> 7 #include <api/fs/fs.h> 8 #include <subcmd/parse-options.h> 9 #include <perf/cpumap.h> 10 #include "util.h" 11 #include "cloexec.h" 12 13 typedef void (*setup_probe_fn_t)(struct evsel *evsel); 14 15 static int perf_do_probe_api(setup_probe_fn_t fn, int cpu, const char *str) 16 { 17 struct evlist *evlist; 18 struct evsel *evsel; 19 unsigned long flags = perf_event_open_cloexec_flag(); 20 int err = -EAGAIN, fd; 21 static pid_t pid = -1; 22 23 evlist = evlist__new(); 24 if (!evlist) 25 return -ENOMEM; 26 27 if (parse_events(evlist, str, NULL)) 28 goto out_delete; 29 30 evsel = perf_evlist__first(evlist); 31 32 while (1) { 33 fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1, flags); 34 if (fd < 0) { 35 if (pid == -1 && errno == EACCES) { 36 pid = 0; 37 continue; 38 } 39 goto out_delete; 40 } 41 break; 42 } 43 close(fd); 44 45 fn(evsel); 46 47 fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1, flags); 48 if (fd < 0) { 49 if (errno == EINVAL) 50 err = -EINVAL; 51 goto out_delete; 52 } 53 close(fd); 54 err = 0; 55 56 out_delete: 57 evlist__delete(evlist); 58 return err; 59 } 60 61 static bool perf_probe_api(setup_probe_fn_t fn) 62 { 63 const char *try[] = {"cycles:u", "instructions:u", "cpu-clock:u", NULL}; 64 struct perf_cpu_map *cpus; 65 int cpu, ret, i = 0; 66 67 cpus = perf_cpu_map__new(NULL); 68 if (!cpus) 69 return false; 70 cpu = cpus->map[0]; 71 perf_cpu_map__put(cpus); 72 73 do { 74 ret = perf_do_probe_api(fn, cpu, try[i++]); 75 if (!ret) 76 return true; 77 } while (ret == -EAGAIN && try[i]); 78 79 return false; 80 } 81 82 static void perf_probe_sample_identifier(struct evsel *evsel) 83 { 84 evsel->core.attr.sample_type |= PERF_SAMPLE_IDENTIFIER; 85 } 86 87 static void perf_probe_comm_exec(struct evsel *evsel) 88 { 89 evsel->core.attr.comm_exec = 1; 90 } 91 92 static void perf_probe_context_switch(struct evsel *evsel) 93 { 94 evsel->core.attr.context_switch = 1; 95 } 96 97 bool perf_can_sample_identifier(void) 98 { 99 return perf_probe_api(perf_probe_sample_identifier); 100 } 101 102 static bool perf_can_comm_exec(void) 103 { 104 return perf_probe_api(perf_probe_comm_exec); 105 } 106 107 bool perf_can_record_switch_events(void) 108 { 109 return perf_probe_api(perf_probe_context_switch); 110 } 111 112 bool perf_can_record_cpu_wide(void) 113 { 114 struct perf_event_attr attr = { 115 .type = PERF_TYPE_SOFTWARE, 116 .config = PERF_COUNT_SW_CPU_CLOCK, 117 .exclude_kernel = 1, 118 }; 119 struct perf_cpu_map *cpus; 120 int cpu, fd; 121 122 cpus = perf_cpu_map__new(NULL); 123 if (!cpus) 124 return false; 125 cpu = cpus->map[0]; 126 perf_cpu_map__put(cpus); 127 128 fd = sys_perf_event_open(&attr, -1, cpu, -1, 0); 129 if (fd < 0) 130 return false; 131 close(fd); 132 133 return true; 134 } 135 136 void perf_evlist__config(struct evlist *evlist, struct record_opts *opts, 137 struct callchain_param *callchain) 138 { 139 struct evsel *evsel; 140 bool use_sample_identifier = false; 141 bool use_comm_exec; 142 bool sample_id = opts->sample_id; 143 144 /* 145 * Set the evsel leader links before we configure attributes, 146 * since some might depend on this info. 147 */ 148 if (opts->group) 149 perf_evlist__set_leader(evlist); 150 151 if (evlist->core.cpus->map[0] < 0) 152 opts->no_inherit = true; 153 154 use_comm_exec = perf_can_comm_exec(); 155 156 evlist__for_each_entry(evlist, evsel) { 157 perf_evsel__config(evsel, opts, callchain); 158 if (evsel->tracking && use_comm_exec) 159 evsel->core.attr.comm_exec = 1; 160 } 161 162 if (opts->full_auxtrace) { 163 /* 164 * Need to be able to synthesize and parse selected events with 165 * arbitrary sample types, which requires always being able to 166 * match the id. 167 */ 168 use_sample_identifier = perf_can_sample_identifier(); 169 sample_id = true; 170 } else if (evlist->core.nr_entries > 1) { 171 struct evsel *first = perf_evlist__first(evlist); 172 173 evlist__for_each_entry(evlist, evsel) { 174 if (evsel->core.attr.sample_type == first->core.attr.sample_type) 175 continue; 176 use_sample_identifier = perf_can_sample_identifier(); 177 break; 178 } 179 sample_id = true; 180 } 181 182 if (sample_id) { 183 evlist__for_each_entry(evlist, evsel) 184 perf_evsel__set_sample_id(evsel, use_sample_identifier); 185 } 186 187 perf_evlist__set_id_pos(evlist); 188 } 189 190 static int get_max_rate(unsigned int *rate) 191 { 192 return sysctl__read_int("kernel/perf_event_max_sample_rate", (int *)rate); 193 } 194 195 static int record_opts__config_freq(struct record_opts *opts) 196 { 197 bool user_freq = opts->user_freq != UINT_MAX; 198 unsigned int max_rate; 199 200 if (opts->user_interval != ULLONG_MAX) 201 opts->default_interval = opts->user_interval; 202 if (user_freq) 203 opts->freq = opts->user_freq; 204 205 /* 206 * User specified count overrides default frequency. 207 */ 208 if (opts->default_interval) 209 opts->freq = 0; 210 else if (opts->freq) { 211 opts->default_interval = opts->freq; 212 } else { 213 pr_err("frequency and count are zero, aborting\n"); 214 return -1; 215 } 216 217 if (get_max_rate(&max_rate)) 218 return 0; 219 220 /* 221 * User specified frequency is over current maximum. 222 */ 223 if (user_freq && (max_rate < opts->freq)) { 224 if (opts->strict_freq) { 225 pr_err("error: Maximum frequency rate (%'u Hz) exceeded.\n" 226 " Please use -F freq option with a lower value or consider\n" 227 " tweaking /proc/sys/kernel/perf_event_max_sample_rate.\n", 228 max_rate); 229 return -1; 230 } else { 231 pr_warning("warning: Maximum frequency rate (%'u Hz) exceeded, throttling from %'u Hz to %'u Hz.\n" 232 " The limit can be raised via /proc/sys/kernel/perf_event_max_sample_rate.\n" 233 " The kernel will lower it when perf's interrupts take too long.\n" 234 " Use --strict-freq to disable this throttling, refusing to record.\n", 235 max_rate, opts->freq, max_rate); 236 237 opts->freq = max_rate; 238 } 239 } 240 241 /* 242 * Default frequency is over current maximum. 243 */ 244 if (max_rate < opts->freq) { 245 pr_warning("Lowering default frequency rate to %u.\n" 246 "Please consider tweaking " 247 "/proc/sys/kernel/perf_event_max_sample_rate.\n", 248 max_rate); 249 opts->freq = max_rate; 250 } 251 252 return 0; 253 } 254 255 int record_opts__config(struct record_opts *opts) 256 { 257 return record_opts__config_freq(opts); 258 } 259 260 bool perf_evlist__can_select_event(struct evlist *evlist, const char *str) 261 { 262 struct evlist *temp_evlist; 263 struct evsel *evsel; 264 int err, fd, cpu; 265 bool ret = false; 266 pid_t pid = -1; 267 268 temp_evlist = evlist__new(); 269 if (!temp_evlist) 270 return false; 271 272 err = parse_events(temp_evlist, str, NULL); 273 if (err) 274 goto out_delete; 275 276 evsel = perf_evlist__last(temp_evlist); 277 278 if (!evlist || cpu_map__empty(evlist->core.cpus)) { 279 struct perf_cpu_map *cpus = perf_cpu_map__new(NULL); 280 281 cpu = cpus ? cpus->map[0] : 0; 282 perf_cpu_map__put(cpus); 283 } else { 284 cpu = evlist->core.cpus->map[0]; 285 } 286 287 while (1) { 288 fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1, 289 perf_event_open_cloexec_flag()); 290 if (fd < 0) { 291 if (pid == -1 && errno == EACCES) { 292 pid = 0; 293 continue; 294 } 295 goto out_delete; 296 } 297 break; 298 } 299 close(fd); 300 ret = true; 301 302 out_delete: 303 evlist__delete(temp_evlist); 304 return ret; 305 } 306 307 int record__parse_freq(const struct option *opt, const char *str, int unset __maybe_unused) 308 { 309 unsigned int freq; 310 struct record_opts *opts = opt->value; 311 312 if (!str) 313 return -EINVAL; 314 315 if (strcasecmp(str, "max") == 0) { 316 if (get_max_rate(&freq)) { 317 pr_err("couldn't read /proc/sys/kernel/perf_event_max_sample_rate\n"); 318 return -1; 319 } 320 pr_info("info: Using a maximum frequency rate of %'d Hz\n", freq); 321 } else { 322 freq = atoi(str); 323 } 324 325 opts->user_freq = freq; 326 return 0; 327 } 328