xref: /linux/tools/lib/bpf/libbpf_probes.c (revision c83b49383b595be50647f0c764a48c78b5f3c4f8)
1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2 /* Copyright (c) 2019 Netronome Systems, Inc. */
3 
4 #include <errno.h>
5 #include <fcntl.h>
6 #include <string.h>
7 #include <stdlib.h>
8 #include <unistd.h>
9 #include <net/if.h>
10 #include <sys/utsname.h>
11 
12 #include <linux/btf.h>
13 #include <linux/filter.h>
14 #include <linux/kernel.h>
15 #include <linux/version.h>
16 
17 #include "bpf.h"
18 #include "libbpf.h"
19 #include "libbpf_internal.h"
20 
21 /* On Ubuntu LINUX_VERSION_CODE doesn't correspond to info.release,
22  * but Ubuntu provides /proc/version_signature file, as described at
23  * https://ubuntu.com/kernel, with an example contents below, which we
24  * can use to get a proper LINUX_VERSION_CODE.
25  *
26  *   Ubuntu 5.4.0-12.15-generic 5.4.8
27  *
28  * In the above, 5.4.8 is what kernel is actually expecting, while
29  * uname() call will return 5.4.0 in info.release.
30  */
31 static __u32 get_ubuntu_kernel_version(void)
32 {
33 	const char *ubuntu_kver_file = "/proc/version_signature";
34 	__u32 major, minor, patch;
35 	int ret;
36 	FILE *f;
37 
38 	if (faccessat(AT_FDCWD, ubuntu_kver_file, R_OK, AT_EACCESS) != 0)
39 		return 0;
40 
41 	f = fopen(ubuntu_kver_file, "r");
42 	if (!f)
43 		return 0;
44 
45 	ret = fscanf(f, "%*s %*s %u.%u.%u\n", &major, &minor, &patch);
46 	fclose(f);
47 	if (ret != 3)
48 		return 0;
49 
50 	return KERNEL_VERSION(major, minor, patch);
51 }
52 
/* On Debian LINUX_VERSION_CODE doesn't correspond to info.release.
 * Instead, it is provided in info.version. On Debian 10, for example,
 * the two fields look like this:
 *
 *   utsname::release   4.19.0-22-amd64
 *   utsname::version   #1 SMP Debian 4.19.260-1 (2022-09-29)
 *
 * In the above, 4.19.260 is what the kernel is actually expecting, while
 * the uname() call will return 4.19.0 in info.release.
 *
 * Returns the KERNEL_VERSION()-encoded version that follows the "Debian "
 * marker in info->version, or 0 if the marker is absent or is not followed
 * by a "major.minor.patch" triple.
 */
static __u32 get_debian_kernel_version(struct utsname *info)
{
	const char *marker = strstr(info->version, "Debian ");
	__u32 ver_major, ver_minor, ver_patch;

	/* No marker means this is not a Debian kernel; a marker without a
	 * complete version triple is treated the same way.
	 */
	if (marker == NULL ||
	    sscanf(marker, "Debian %u.%u.%u",
		   &ver_major, &ver_minor, &ver_patch) != 3)
		return 0;

	return KERNEL_VERSION(ver_major, ver_minor, ver_patch);
}
79 
/* Determine the version of the running kernel, encoded with
 * KERNEL_VERSION().
 *
 * Distribution-specific sources are consulted first (Ubuntu's
 * /proc/version_signature, then the Debian marker in utsname::version);
 * otherwise the version is parsed from utsname::release.
 *
 * Returns 0 if no version could be determined.
 */
__u32 get_kernel_version(void)
{
	__u32 major, minor, patch, version;
	struct utsname info;

	/* Check if this is an Ubuntu kernel. */
	version = get_ubuntu_kernel_version();
	if (version != 0)
		return version;

	/* If uname() fails, the contents of info are indeterminate and
	 * must not be parsed.
	 */
	if (uname(&info) != 0)
		return 0;

	/* Check if this is a Debian kernel. */
	version = get_debian_kernel_version(&info);
	if (version != 0)
		return version;

	if (sscanf(info.release, "%u.%u.%u", &major, &minor, &patch) != 3)
		return 0;

	return KERNEL_VERSION(major, minor, patch);
}
102 
103 static int probe_prog_load(enum bpf_prog_type prog_type,
104 			   const struct bpf_insn *insns, size_t insns_cnt,
105 			   char *log_buf, size_t log_buf_sz)
106 {
107 	LIBBPF_OPTS(bpf_prog_load_opts, opts,
108 		.log_buf = log_buf,
109 		.log_size = log_buf_sz,
110 		.log_level = log_buf ? 1 : 0,
111 	);
112 	int fd, err, exp_err = 0;
113 	const char *exp_msg = NULL;
114 	char buf[4096];
115 
116 	switch (prog_type) {
117 	case BPF_PROG_TYPE_CGROUP_SOCK_ADDR:
118 		opts.expected_attach_type = BPF_CGROUP_INET4_CONNECT;
119 		break;
120 	case BPF_PROG_TYPE_CGROUP_SOCKOPT:
121 		opts.expected_attach_type = BPF_CGROUP_GETSOCKOPT;
122 		break;
123 	case BPF_PROG_TYPE_SK_LOOKUP:
124 		opts.expected_attach_type = BPF_SK_LOOKUP;
125 		break;
126 	case BPF_PROG_TYPE_KPROBE:
127 		opts.kern_version = get_kernel_version();
128 		break;
129 	case BPF_PROG_TYPE_LIRC_MODE2:
130 		opts.expected_attach_type = BPF_LIRC_MODE2;
131 		break;
132 	case BPF_PROG_TYPE_TRACING:
133 	case BPF_PROG_TYPE_LSM:
134 		opts.log_buf = buf;
135 		opts.log_size = sizeof(buf);
136 		opts.log_level = 1;
137 		if (prog_type == BPF_PROG_TYPE_TRACING)
138 			opts.expected_attach_type = BPF_TRACE_FENTRY;
139 		else
140 			opts.expected_attach_type = BPF_MODIFY_RETURN;
141 		opts.attach_btf_id = 1;
142 
143 		exp_err = -EINVAL;
144 		exp_msg = "attach_btf_id 1 is not a function";
145 		break;
146 	case BPF_PROG_TYPE_EXT:
147 		opts.log_buf = buf;
148 		opts.log_size = sizeof(buf);
149 		opts.log_level = 1;
150 		opts.attach_btf_id = 1;
151 
152 		exp_err = -EINVAL;
153 		exp_msg = "Cannot replace kernel functions";
154 		break;
155 	case BPF_PROG_TYPE_SYSCALL:
156 		opts.prog_flags = BPF_F_SLEEPABLE;
157 		break;
158 	case BPF_PROG_TYPE_STRUCT_OPS:
159 		exp_err = -524; /* -ENOTSUPP */
160 		break;
161 	case BPF_PROG_TYPE_UNSPEC:
162 	case BPF_PROG_TYPE_SOCKET_FILTER:
163 	case BPF_PROG_TYPE_SCHED_CLS:
164 	case BPF_PROG_TYPE_SCHED_ACT:
165 	case BPF_PROG_TYPE_TRACEPOINT:
166 	case BPF_PROG_TYPE_XDP:
167 	case BPF_PROG_TYPE_PERF_EVENT:
168 	case BPF_PROG_TYPE_CGROUP_SKB:
169 	case BPF_PROG_TYPE_CGROUP_SOCK:
170 	case BPF_PROG_TYPE_LWT_IN:
171 	case BPF_PROG_TYPE_LWT_OUT:
172 	case BPF_PROG_TYPE_LWT_XMIT:
173 	case BPF_PROG_TYPE_SOCK_OPS:
174 	case BPF_PROG_TYPE_SK_SKB:
175 	case BPF_PROG_TYPE_CGROUP_DEVICE:
176 	case BPF_PROG_TYPE_SK_MSG:
177 	case BPF_PROG_TYPE_RAW_TRACEPOINT:
178 	case BPF_PROG_TYPE_RAW_TRACEPOINT_WRITABLE:
179 	case BPF_PROG_TYPE_LWT_SEG6LOCAL:
180 	case BPF_PROG_TYPE_SK_REUSEPORT:
181 	case BPF_PROG_TYPE_FLOW_DISSECTOR:
182 	case BPF_PROG_TYPE_CGROUP_SYSCTL:
183 	case BPF_PROG_TYPE_NETFILTER:
184 		break;
185 	default:
186 		return -EOPNOTSUPP;
187 	}
188 
189 	fd = bpf_prog_load(prog_type, NULL, "GPL", insns, insns_cnt, &opts);
190 	err = -errno;
191 	if (fd >= 0)
192 		close(fd);
193 	if (exp_err) {
194 		if (fd >= 0 || err != exp_err)
195 			return 0;
196 		if (exp_msg && !strstr(buf, exp_msg))
197 			return 0;
198 		return 1;
199 	}
200 	return fd >= 0 ? 1 : 0;
201 }
202 
/* Probe whether the running kernel supports BPF programs of @prog_type.
 *
 * @opts must be NULL; anything else is rejected with -EINVAL.
 *
 * The result of probe_prog_load() is passed through libbpf_err() and
 * returned.
 */
int libbpf_probe_bpf_prog_type(enum bpf_prog_type prog_type, const void *opts)
{
	/* Smallest useful program: "r0 = 0; exit". */
	struct bpf_insn prog[] = {
		BPF_MOV64_IMM(BPF_REG_0, 0),
		BPF_EXIT_INSN()
	};

	if (opts != NULL)
		return libbpf_err(-EINVAL);

	return libbpf_err(probe_prog_load(prog_type, prog, ARRAY_SIZE(prog),
					  NULL, 0));
}
218 
/* Build a raw BTF blob (header, then type section, then string section)
 * from the given sections and load it into the kernel.
 *
 * @raw_types, @types_len: type section data and its size in bytes
 * @str_sec, @str_len: string section data and its size in bytes
 *
 * Returns the value returned by bpf_btf_load() for the assembled blob,
 * -EINVAL if the section sizes cannot be represented, or -ENOMEM if the
 * temporary buffer cannot be allocated.
 */
int libbpf__load_raw_btf(const char *raw_types, size_t types_len,
			 const char *str_sec, size_t str_len)
{
	struct btf_header hdr = {
		.magic = BTF_MAGIC,
		.version = BTF_VERSION,
		.hdr_len = sizeof(struct btf_header),
		.type_len = types_len,
		.str_off = types_len,
		.str_len = str_len,
	};
	size_t btf_len;
	__u8 *raw_btf;
	int btf_fd;

	/* Reject lengths that did not survive being stored in the header
	 * fields; otherwise the header would describe less data than the
	 * caller handed in.
	 */
	if (hdr.type_len != types_len || hdr.str_len != str_len)
		return -EINVAL;

	/* Make sure the total size does not wrap around size_t, which
	 * would lead to an undersized allocation.
	 */
	if (types_len > (size_t)-1 - sizeof(hdr) ||
	    str_len > (size_t)-1 - sizeof(hdr) - types_len)
		return -EINVAL;

	btf_len = sizeof(hdr) + types_len + str_len;
	raw_btf = malloc(btf_len);
	if (!raw_btf)
		return -ENOMEM;

	memcpy(raw_btf, &hdr, sizeof(hdr));
	memcpy(raw_btf + hdr.hdr_len, raw_types, hdr.type_len);
	memcpy(raw_btf + hdr.hdr_len + hdr.type_len, str_sec, hdr.str_len);

	btf_fd = bpf_btf_load(raw_btf, btf_len, NULL);

	free(raw_btf);
	return btf_fd;
}
247 
/* Load a small BTF object describing a value type that embeds a
 * struct bpf_spin_lock. Returns whatever libbpf__load_raw_btf() returns.
 */
static int load_local_storage_btf(void)
{
	/* String section. Name offsets used in the type section below:
	 *   1 "bpf_spin_lock", 15 "val", 19 "cnt", 23 "l"
	 */
	const char str_sec[] = "\0bpf_spin_lock\0val\0cnt\0l";
	/* Type section encoding:
	 *
	 *   struct bpf_spin_lock {
	 *     int val;
	 *   };
	 *   struct val {
	 *     int cnt;
	 *     struct bpf_spin_lock l;
	 *   };
	 */
	__u32 raw_types[] = {
		/* [1] int */
		BTF_TYPE_INT_ENC(0, BTF_INT_SIGNED, 0, 32, 4),
		/* [2] struct bpf_spin_lock */
		BTF_TYPE_ENC(1, BTF_INFO_ENC(BTF_KIND_STRUCT, 0, 1), 4),
		BTF_MEMBER_ENC(15, 1, 0),	/* int val; */
		/* [3] struct val */
		BTF_TYPE_ENC(15, BTF_INFO_ENC(BTF_KIND_STRUCT, 0, 2), 8),
		BTF_MEMBER_ENC(19, 1, 0),	/* int cnt; */
		BTF_MEMBER_ENC(23, 2, 32),	/* struct bpf_spin_lock l; */
	};

	return libbpf__load_raw_btf((char *)raw_types, sizeof(raw_types),
				     str_sec, sizeof(str_sec));
}
274 
275 static int probe_map_create(enum bpf_map_type map_type)
276 {
277 	LIBBPF_OPTS(bpf_map_create_opts, opts);
278 	int key_size, value_size, max_entries;
279 	__u32 btf_key_type_id = 0, btf_value_type_id = 0;
280 	int fd = -1, btf_fd = -1, fd_inner = -1, exp_err = 0, err = 0;
281 
282 	key_size	= sizeof(__u32);
283 	value_size	= sizeof(__u32);
284 	max_entries	= 1;
285 
286 	switch (map_type) {
287 	case BPF_MAP_TYPE_STACK_TRACE:
288 		value_size	= sizeof(__u64);
289 		break;
290 	case BPF_MAP_TYPE_LPM_TRIE:
291 		key_size	= sizeof(__u64);
292 		value_size	= sizeof(__u64);
293 		opts.map_flags	= BPF_F_NO_PREALLOC;
294 		break;
295 	case BPF_MAP_TYPE_CGROUP_STORAGE:
296 	case BPF_MAP_TYPE_PERCPU_CGROUP_STORAGE:
297 		key_size	= sizeof(struct bpf_cgroup_storage_key);
298 		value_size	= sizeof(__u64);
299 		max_entries	= 0;
300 		break;
301 	case BPF_MAP_TYPE_QUEUE:
302 	case BPF_MAP_TYPE_STACK:
303 		key_size	= 0;
304 		break;
305 	case BPF_MAP_TYPE_SK_STORAGE:
306 	case BPF_MAP_TYPE_INODE_STORAGE:
307 	case BPF_MAP_TYPE_TASK_STORAGE:
308 	case BPF_MAP_TYPE_CGRP_STORAGE:
309 		btf_key_type_id = 1;
310 		btf_value_type_id = 3;
311 		value_size = 8;
312 		max_entries = 0;
313 		opts.map_flags = BPF_F_NO_PREALLOC;
314 		btf_fd = load_local_storage_btf();
315 		if (btf_fd < 0)
316 			return btf_fd;
317 		break;
318 	case BPF_MAP_TYPE_RINGBUF:
319 	case BPF_MAP_TYPE_USER_RINGBUF:
320 		key_size = 0;
321 		value_size = 0;
322 		max_entries = sysconf(_SC_PAGE_SIZE);
323 		break;
324 	case BPF_MAP_TYPE_STRUCT_OPS:
325 		/* we'll get -ENOTSUPP for invalid BTF type ID for struct_ops */
326 		opts.btf_vmlinux_value_type_id = 1;
327 		exp_err = -524; /* -ENOTSUPP */
328 		break;
329 	case BPF_MAP_TYPE_BLOOM_FILTER:
330 		key_size = 0;
331 		max_entries = 1;
332 		break;
333 	case BPF_MAP_TYPE_HASH:
334 	case BPF_MAP_TYPE_ARRAY:
335 	case BPF_MAP_TYPE_PROG_ARRAY:
336 	case BPF_MAP_TYPE_PERF_EVENT_ARRAY:
337 	case BPF_MAP_TYPE_PERCPU_HASH:
338 	case BPF_MAP_TYPE_PERCPU_ARRAY:
339 	case BPF_MAP_TYPE_CGROUP_ARRAY:
340 	case BPF_MAP_TYPE_LRU_HASH:
341 	case BPF_MAP_TYPE_LRU_PERCPU_HASH:
342 	case BPF_MAP_TYPE_ARRAY_OF_MAPS:
343 	case BPF_MAP_TYPE_HASH_OF_MAPS:
344 	case BPF_MAP_TYPE_DEVMAP:
345 	case BPF_MAP_TYPE_DEVMAP_HASH:
346 	case BPF_MAP_TYPE_SOCKMAP:
347 	case BPF_MAP_TYPE_CPUMAP:
348 	case BPF_MAP_TYPE_XSKMAP:
349 	case BPF_MAP_TYPE_SOCKHASH:
350 	case BPF_MAP_TYPE_REUSEPORT_SOCKARRAY:
351 		break;
352 	case BPF_MAP_TYPE_UNSPEC:
353 	default:
354 		return -EOPNOTSUPP;
355 	}
356 
357 	if (map_type == BPF_MAP_TYPE_ARRAY_OF_MAPS ||
358 	    map_type == BPF_MAP_TYPE_HASH_OF_MAPS) {
359 		fd_inner = bpf_map_create(BPF_MAP_TYPE_HASH, NULL,
360 					  sizeof(__u32), sizeof(__u32), 1, NULL);
361 		if (fd_inner < 0)
362 			goto cleanup;
363 
364 		opts.inner_map_fd = fd_inner;
365 	}
366 
367 	if (btf_fd >= 0) {
368 		opts.btf_fd = btf_fd;
369 		opts.btf_key_type_id = btf_key_type_id;
370 		opts.btf_value_type_id = btf_value_type_id;
371 	}
372 
373 	fd = bpf_map_create(map_type, NULL, key_size, value_size, max_entries, &opts);
374 	err = -errno;
375 
376 cleanup:
377 	if (fd >= 0)
378 		close(fd);
379 	if (fd_inner >= 0)
380 		close(fd_inner);
381 	if (btf_fd >= 0)
382 		close(btf_fd);
383 
384 	if (exp_err)
385 		return fd < 0 && err == exp_err ? 1 : 0;
386 	else
387 		return fd >= 0 ? 1 : 0;
388 }
389 
/* Probe whether the running kernel supports BPF maps of @map_type.
 *
 * @opts must be NULL; anything else is rejected with -EINVAL.
 *
 * The result of probe_map_create() is passed through libbpf_err() and
 * returned.
 */
int libbpf_probe_bpf_map_type(enum bpf_map_type map_type, const void *opts)
{
	if (opts != NULL)
		return libbpf_err(-EINVAL);

	return libbpf_err(probe_map_create(map_type));
}
400 
/* Probe whether the running kernel supports calling BPF helper @helper_id
 * from programs of @prog_type.
 *
 * @opts must be NULL; anything else is rejected with -EINVAL.
 *
 * Returns 1 if the combination is (assumed to be) supported, 0 if it is
 * not, and a negative error code otherwise; -EOPNOTSUPP is returned for
 * program types that cannot be used for helper probing. Every error return
 * goes through libbpf_err().
 */
int libbpf_probe_bpf_helper(enum bpf_prog_type prog_type, enum bpf_func_id helper_id,
			    const void *opts)
{
	struct bpf_insn insns[] = {
		BPF_EMIT_CALL((__u32)helper_id),
		BPF_EXIT_INSN(),
	};
	const size_t insn_cnt = ARRAY_SIZE(insns);
	char buf[4096];
	int ret;

	if (opts)
		return libbpf_err(-EINVAL);

	/* we can't successfully load all prog types to check for BPF helper
	 * support, so bail out with -EOPNOTSUPP error
	 */
	switch (prog_type) {
	case BPF_PROG_TYPE_TRACING:
	case BPF_PROG_TYPE_EXT:
	case BPF_PROG_TYPE_LSM:
	case BPF_PROG_TYPE_STRUCT_OPS:
		/* Use libbpf_err() here as well, so that this error path
		 * behaves like every other error return of this function.
		 */
		return libbpf_err(-EOPNOTSUPP);
	default:
		break;
	}

	/* Start with an empty log so the searches below are well-defined
	 * even if nothing gets written into it.
	 */
	buf[0] = '\0';
	ret = probe_prog_load(prog_type, insns, insn_cnt, buf, sizeof(buf));
	if (ret < 0)
		return libbpf_err(ret);

	/* If BPF verifier doesn't recognize BPF helper ID (enum bpf_func_id)
	 * at all, it will emit something like "invalid func unknown#181".
	 * If BPF verifier recognizes BPF helper but it's not supported for
	 * given BPF program type, it will emit "unknown func bpf_sys_bpf#166".
	 * In both cases, provided combination of BPF program type and BPF
	 * helper is not supported by the kernel.
	 * In all other cases, probe_prog_load() above will either succeed (e.g.,
	 * because BPF helper happens to accept no input arguments or it
	 * accepts one input argument and initial PTR_TO_CTX is fine for
	 * that), or we'll get some more specific BPF verifier error about
	 * some unsatisfied conditions.
	 */
	if (ret == 0 && (strstr(buf, "invalid func ") || strstr(buf, "unknown func ")))
		return 0;
	return 1; /* assume supported */
}
449