1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2
3 /*
4 * common eBPF ELF operations.
5 *
6 * Copyright (C) 2013-2015 Alexei Starovoitov <ast@kernel.org>
7 * Copyright (C) 2015 Wang Nan <wangnan0@huawei.com>
8 * Copyright (C) 2015 Huawei Inc.
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU Lesser General Public
12 * License as published by the Free Software Foundation;
13 * version 2.1 of the License (not later!)
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU Lesser General Public License for more details.
19 *
20 * You should have received a copy of the GNU Lesser General Public
21 * License along with this program; if not, see <http://www.gnu.org/licenses>
22 */
23
24 #include <stdlib.h>
25 #include <string.h>
26 #include <memory.h>
27 #include <unistd.h>
28 #include <asm/unistd.h>
29 #include <errno.h>
30 #include <linux/bpf.h>
31 #include <linux/filter.h>
32 #include <linux/kernel.h>
33 #include <limits.h>
34 #include <sys/resource.h>
35 #include "bpf.h"
36 #include "libbpf.h"
37 #include "libbpf_internal.h"
38
/*
 * When building perf, unistd.h is overridden. __NR_bpf is
 * required to be defined explicitly.
 *
 * The fallback below only kicks in when no header has defined __NR_bpf yet.
 * It hard-codes the bpf() syscall number for each listed architecture/ABI
 * and stops the build with #error on anything that is not listed.
 */
#ifndef __NR_bpf
# if defined(__i386__)
# define __NR_bpf 357
# elif defined(__x86_64__)
# define __NR_bpf 321
# elif defined(__aarch64__)
# define __NR_bpf 280
# elif defined(__sparc__)
# define __NR_bpf 349
# elif defined(__s390__)
# define __NR_bpf 351
# elif defined(__arc__)
# define __NR_bpf 280
/* MIPS has a distinct syscall number per ABI */
# elif defined(__mips__) && defined(_ABIO32)
# define __NR_bpf 4355
# elif defined(__mips__) && defined(_ABIN32)
# define __NR_bpf 6319
# elif defined(__mips__) && defined(_ABI64)
# define __NR_bpf 5315
# else
# error __NR_bpf not defined. libbpf does not support your arch.
# endif
#endif
66
/* Convert a user-space pointer into the 64-bit integer form stored in
 * union bpf_attr pointer fields. The pointer is first converted to
 * unsigned long and then widened to __u64.
 */
static inline __u64 ptr_to_u64(const void *ptr)
{
	unsigned long addr = (unsigned long)ptr;

	return (__u64)addr;
}
71
/* Issue the raw bpf() system call.
 *
 * @cmd:  BPF command to execute
 * @attr: command attributes handed to the kernel
 * @size: number of bytes of @attr the kernel should look at
 *
 * Returns the value of syscall() converted to int.
 */
static inline int sys_bpf(enum bpf_cmd cmd, union bpf_attr *attr,
			  unsigned int size)
{
	long ret = syscall(__NR_bpf, cmd, attr, size);

	return (int)ret;
}
77
/* Variant of sys_bpf() for commands whose result is a file descriptor:
 * the syscall result is passed through ensure_good_fd() before it is
 * handed back to the caller.
 */
static inline int sys_bpf_fd(enum bpf_cmd cmd, union bpf_attr *attr,
			     unsigned int size)
{
	int raw_fd = sys_bpf(cmd, attr, size);

	return ensure_good_fd(raw_fd);
}
86
sys_bpf_prog_load(union bpf_attr * attr,unsigned int size,int attempts)87 int sys_bpf_prog_load(union bpf_attr *attr, unsigned int size, int attempts)
88 {
89 int fd;
90
91 do {
92 fd = sys_bpf_fd(BPF_PROG_LOAD, attr, size);
93 } while (fd < 0 && errno == EAGAIN && --attempts > 0);
94
95 return fd;
96 }
97
98 /* Probe whether kernel switched from memlock-based (RLIMIT_MEMLOCK) to
99 * memcg-based memory accounting for BPF maps and progs. This was done in [0].
100 * We use the support for bpf_ktime_get_coarse_ns() helper, which was added in
101 * the same 5.11 Linux release ([1]), to detect memcg-based accounting for BPF.
102 *
103 * [0] https://lore.kernel.org/bpf/20201201215900.3569844-1-guro@fb.com/
104 * [1] d05512618056 ("bpf: Add bpf_ktime_get_coarse_ns helper")
105 */
probe_memcg_account(int token_fd)106 int probe_memcg_account(int token_fd)
107 {
108 const size_t attr_sz = offsetofend(union bpf_attr, prog_token_fd);
109 struct bpf_insn insns[] = {
110 BPF_EMIT_CALL(BPF_FUNC_ktime_get_coarse_ns),
111 BPF_EXIT_INSN(),
112 };
113 size_t insn_cnt = ARRAY_SIZE(insns);
114 union bpf_attr attr;
115 int prog_fd;
116
117 /* attempt loading freplace trying to use custom BTF */
118 memset(&attr, 0, attr_sz);
119 attr.prog_type = BPF_PROG_TYPE_SOCKET_FILTER;
120 attr.insns = ptr_to_u64(insns);
121 attr.insn_cnt = insn_cnt;
122 attr.license = ptr_to_u64("GPL");
123 attr.prog_token_fd = token_fd;
124 if (token_fd)
125 attr.prog_flags |= BPF_F_TOKEN_FD;
126
127 prog_fd = sys_bpf_fd(BPF_PROG_LOAD, &attr, attr_sz);
128 if (prog_fd >= 0) {
129 close(prog_fd);
130 return 1;
131 }
132 return 0;
133 }
134
/* Set by bump_rlimit_memlock() once it gets past its early-exit check;
 * while set, libbpf_set_memlock_rlim() refuses changes with -EBUSY.
 */
static bool memlock_bumped;
/* Value bump_rlimit_memlock() installs as both soft and hard RLIMIT_MEMLOCK;
 * a value of 0 makes it skip the setrlimit() call.
 */
static rlim_t memlock_rlim = RLIM_INFINITY;
137
libbpf_set_memlock_rlim(size_t memlock_bytes)138 int libbpf_set_memlock_rlim(size_t memlock_bytes)
139 {
140 if (memlock_bumped)
141 return libbpf_err(-EBUSY);
142
143 memlock_rlim = memlock_bytes;
144 return 0;
145 }
146
bump_rlimit_memlock(void)147 int bump_rlimit_memlock(void)
148 {
149 struct rlimit rlim;
150
151 /* if kernel supports memcg-based accounting, skip bumping RLIMIT_MEMLOCK */
152 if (memlock_bumped || feat_supported(NULL, FEAT_MEMCG_ACCOUNT))
153 return 0;
154
155 memlock_bumped = true;
156
157 /* zero memlock_rlim_max disables auto-bumping RLIMIT_MEMLOCK */
158 if (memlock_rlim == 0)
159 return 0;
160
161 rlim.rlim_cur = rlim.rlim_max = memlock_rlim;
162 if (setrlimit(RLIMIT_MEMLOCK, &rlim))
163 return -errno;
164
165 return 0;
166 }
167
/* Create a BPF map through the BPF_MAP_CREATE command.
 *
 * @map_type:    kind of map to create
 * @map_name:    optional name; copied into the attributes only when non-NULL
 *               and feat_supported() reports FEAT_PROG_NAME
 * @key_size:    key size stored in the attributes
 * @value_size:  value size stored in the attributes
 * @max_entries: capacity stored in the attributes
 * @opts:        optional extra settings (BTF ids, flags, NUMA node, ifindex,
 *               token fd, ...); missing fields default to 0
 *
 * bump_rlimit_memlock() is invoked before anything else, its result is
 * ignored. Returns libbpf_err(-EINVAL) for invalid @opts, otherwise the
 * result of libbpf_err_errno() applied to the descriptor from sys_bpf_fd().
 */
int bpf_map_create(enum bpf_map_type map_type,
		   const char *map_name,
		   __u32 key_size,
		   __u32 value_size,
		   __u32 max_entries,
		   const struct bpf_map_create_opts *opts)
{
	const size_t attr_sz = offsetofend(union bpf_attr, map_token_fd);
	union bpf_attr attr;
	int map_fd;

	bump_rlimit_memlock();

	if (!OPTS_VALID(opts, bpf_map_create_opts))
		return libbpf_err(-EINVAL);

	memset(&attr, 0, attr_sz);

	/* basic map geometry */
	attr.map_type = map_type;
	attr.key_size = key_size;
	attr.value_size = value_size;
	attr.max_entries = max_entries;
	if (map_name && feat_supported(NULL, FEAT_PROG_NAME))
		libbpf_strlcpy(attr.map_name, map_name, sizeof(attr.map_name));

	/* BTF description of key/value */
	attr.btf_fd = OPTS_GET(opts, btf_fd, 0);
	attr.btf_key_type_id = OPTS_GET(opts, btf_key_type_id, 0);
	attr.btf_value_type_id = OPTS_GET(opts, btf_value_type_id, 0);
	attr.btf_vmlinux_value_type_id = OPTS_GET(opts, btf_vmlinux_value_type_id, 0);
	attr.value_type_btf_obj_fd = OPTS_GET(opts, value_type_btf_obj_fd, 0);

	/* remaining optional knobs */
	attr.map_flags = OPTS_GET(opts, map_flags, 0);
	attr.map_extra = OPTS_GET(opts, map_extra, 0);
	attr.inner_map_fd = OPTS_GET(opts, inner_map_fd, 0);
	attr.numa_node = OPTS_GET(opts, numa_node, 0);
	attr.map_ifindex = OPTS_GET(opts, map_ifindex, 0);
	attr.map_token_fd = OPTS_GET(opts, token_fd, 0);

	map_fd = sys_bpf_fd(BPF_MAP_CREATE, &attr, attr_sz);
	return libbpf_err_errno(map_fd);
}
210
/* Build a heap copy of an array of fixed-size records in which the tail of
 * every record is zeroed.
 *
 * @orecord:           first of @cnt source records, each @actual_rec_size
 *                     bytes long
 * @cnt:               number of records
 * @actual_rec_size:   size of one record as laid out by the caller
 * @expected_rec_size: leading part of each record that is copied verbatim;
 *                     the remaining bytes of the record are set to zero
 *
 * Returns a malloc()-ed buffer of @cnt * @actual_rec_size bytes that the
 * caller must free(), or NULL if
 *   - @expected_rec_size is larger than @actual_rec_size (the tail length
 *     would underflow),
 *   - the total size does not fit into size_t (it would otherwise be
 *     truncated when handed to malloc() on 32-bit targets and the copy loop
 *     would overrun the allocation), or
 *   - malloc() fails.
 */
static void *
alloc_zero_tailing_info(const void *orecord, __u32 cnt,
			__u32 actual_rec_size, __u32 expected_rec_size)
{
	__u64 info_len = (__u64)actual_rec_size * cnt;
	const char *src = orecord;
	char *info, *dst;
	__u32 tail_len;
	__u32 i;

	if (expected_rec_size > actual_rec_size)
		return NULL;
	/* reject lengths that would be truncated by the size_t conversion */
	if ((__u64)(size_t)info_len != info_len)
		return NULL;

	info = malloc((size_t)info_len);
	if (!info)
		return NULL;

	tail_len = actual_rec_size - expected_rec_size;

	/* zero out bytes kernel does not understand */
	dst = info;
	for (i = 0; i < cnt; i++) {
		memcpy(dst, src, expected_rec_size);
		memset(dst + expected_rec_size, 0, tail_len);
		src += actual_rec_size;
		dst += actual_rec_size;
	}

	return info;
}
235
bpf_prog_load(enum bpf_prog_type prog_type,const char * prog_name,const char * license,const struct bpf_insn * insns,size_t insn_cnt,struct bpf_prog_load_opts * opts)236 int bpf_prog_load(enum bpf_prog_type prog_type,
237 const char *prog_name, const char *license,
238 const struct bpf_insn *insns, size_t insn_cnt,
239 struct bpf_prog_load_opts *opts)
240 {
241 const size_t attr_sz = offsetofend(union bpf_attr, fd_array_cnt);
242 void *finfo = NULL, *linfo = NULL;
243 const char *func_info, *line_info;
244 __u32 log_size, log_level, attach_prog_fd, attach_btf_obj_fd;
245 __u32 func_info_rec_size, line_info_rec_size;
246 int fd, attempts;
247 union bpf_attr attr;
248 char *log_buf;
249
250 bump_rlimit_memlock();
251
252 if (!OPTS_VALID(opts, bpf_prog_load_opts))
253 return libbpf_err(-EINVAL);
254
255 attempts = OPTS_GET(opts, attempts, 0);
256 if (attempts < 0)
257 return libbpf_err(-EINVAL);
258 if (attempts == 0)
259 attempts = PROG_LOAD_ATTEMPTS;
260
261 memset(&attr, 0, attr_sz);
262
263 attr.prog_type = prog_type;
264 attr.expected_attach_type = OPTS_GET(opts, expected_attach_type, 0);
265
266 attr.prog_btf_fd = OPTS_GET(opts, prog_btf_fd, 0);
267 attr.prog_flags = OPTS_GET(opts, prog_flags, 0);
268 attr.prog_ifindex = OPTS_GET(opts, prog_ifindex, 0);
269 attr.kern_version = OPTS_GET(opts, kern_version, 0);
270 attr.prog_token_fd = OPTS_GET(opts, token_fd, 0);
271
272 if (prog_name && feat_supported(NULL, FEAT_PROG_NAME))
273 libbpf_strlcpy(attr.prog_name, prog_name, sizeof(attr.prog_name));
274 attr.license = ptr_to_u64(license);
275
276 if (insn_cnt > UINT_MAX)
277 return libbpf_err(-E2BIG);
278
279 attr.insns = ptr_to_u64(insns);
280 attr.insn_cnt = (__u32)insn_cnt;
281
282 attach_prog_fd = OPTS_GET(opts, attach_prog_fd, 0);
283 attach_btf_obj_fd = OPTS_GET(opts, attach_btf_obj_fd, 0);
284
285 if (attach_prog_fd && attach_btf_obj_fd)
286 return libbpf_err(-EINVAL);
287
288 attr.attach_btf_id = OPTS_GET(opts, attach_btf_id, 0);
289 if (attach_prog_fd)
290 attr.attach_prog_fd = attach_prog_fd;
291 else
292 attr.attach_btf_obj_fd = attach_btf_obj_fd;
293
294 log_buf = OPTS_GET(opts, log_buf, NULL);
295 log_size = OPTS_GET(opts, log_size, 0);
296 log_level = OPTS_GET(opts, log_level, 0);
297
298 if (!!log_buf != !!log_size)
299 return libbpf_err(-EINVAL);
300
301 func_info_rec_size = OPTS_GET(opts, func_info_rec_size, 0);
302 func_info = OPTS_GET(opts, func_info, NULL);
303 attr.func_info_rec_size = func_info_rec_size;
304 attr.func_info = ptr_to_u64(func_info);
305 attr.func_info_cnt = OPTS_GET(opts, func_info_cnt, 0);
306
307 line_info_rec_size = OPTS_GET(opts, line_info_rec_size, 0);
308 line_info = OPTS_GET(opts, line_info, NULL);
309 attr.line_info_rec_size = line_info_rec_size;
310 attr.line_info = ptr_to_u64(line_info);
311 attr.line_info_cnt = OPTS_GET(opts, line_info_cnt, 0);
312
313 attr.fd_array = ptr_to_u64(OPTS_GET(opts, fd_array, NULL));
314 attr.fd_array_cnt = OPTS_GET(opts, fd_array_cnt, 0);
315
316 if (log_level) {
317 attr.log_buf = ptr_to_u64(log_buf);
318 attr.log_size = log_size;
319 attr.log_level = log_level;
320 }
321
322 fd = sys_bpf_prog_load(&attr, attr_sz, attempts);
323 OPTS_SET(opts, log_true_size, attr.log_true_size);
324 if (fd >= 0)
325 return fd;
326
327 /* After bpf_prog_load, the kernel may modify certain attributes
328 * to give user space a hint how to deal with loading failure.
329 * Check to see whether we can make some changes and load again.
330 */
331 while (errno == E2BIG && (!finfo || !linfo)) {
332 if (!finfo && attr.func_info_cnt &&
333 attr.func_info_rec_size < func_info_rec_size) {
334 /* try with corrected func info records */
335 finfo = alloc_zero_tailing_info(func_info,
336 attr.func_info_cnt,
337 func_info_rec_size,
338 attr.func_info_rec_size);
339 if (!finfo) {
340 errno = E2BIG;
341 goto done;
342 }
343
344 attr.func_info = ptr_to_u64(finfo);
345 attr.func_info_rec_size = func_info_rec_size;
346 } else if (!linfo && attr.line_info_cnt &&
347 attr.line_info_rec_size < line_info_rec_size) {
348 linfo = alloc_zero_tailing_info(line_info,
349 attr.line_info_cnt,
350 line_info_rec_size,
351 attr.line_info_rec_size);
352 if (!linfo) {
353 errno = E2BIG;
354 goto done;
355 }
356
357 attr.line_info = ptr_to_u64(linfo);
358 attr.line_info_rec_size = line_info_rec_size;
359 } else {
360 break;
361 }
362
363 fd = sys_bpf_prog_load(&attr, attr_sz, attempts);
364 OPTS_SET(opts, log_true_size, attr.log_true_size);
365 if (fd >= 0)
366 goto done;
367 }
368
369 if (log_level == 0 && log_buf) {
370 /* log_level == 0 with non-NULL log_buf requires retrying on error
371 * with log_level == 1 and log_buf/log_buf_size set, to get details of
372 * failure
373 */
374 attr.log_buf = ptr_to_u64(log_buf);
375 attr.log_size = log_size;
376 attr.log_level = 1;
377
378 fd = sys_bpf_prog_load(&attr, attr_sz, attempts);
379 OPTS_SET(opts, log_true_size, attr.log_true_size);
380 }
381 done:
382 /* free() doesn't affect errno, so we don't need to restore it */
383 free(finfo);
384 free(linfo);
385 return libbpf_err_errno(fd);
386 }
387
/* Issue BPF_MAP_UPDATE_ELEM for the map referred to by @fd.
 *
 * @key, @value: user buffers passed to the kernel by address
 * @flags:       stored in attr.flags unchanged
 *
 * Returns the syscall result processed by libbpf_err_errno().
 */
int bpf_map_update_elem(int fd, const void *key, const void *value,
			__u64 flags)
{
	const size_t attr_sz = offsetofend(union bpf_attr, flags);
	union bpf_attr attr;
	int err;

	memset(&attr, 0, attr_sz);
	attr.flags = flags;
	attr.value = ptr_to_u64(value);
	attr.key = ptr_to_u64(key);
	attr.map_fd = fd;

	err = sys_bpf(BPF_MAP_UPDATE_ELEM, &attr, attr_sz);
	return libbpf_err_errno(err);
}
404
bpf_map_lookup_elem(int fd,const void * key,void * value)405 int bpf_map_lookup_elem(int fd, const void *key, void *value)
406 {
407 const size_t attr_sz = offsetofend(union bpf_attr, flags);
408 union bpf_attr attr;
409 int ret;
410
411 memset(&attr, 0, attr_sz);
412 attr.map_fd = fd;
413 attr.key = ptr_to_u64(key);
414 attr.value = ptr_to_u64(value);
415
416 ret = sys_bpf(BPF_MAP_LOOKUP_ELEM, &attr, attr_sz);
417 return libbpf_err_errno(ret);
418 }
419
/* Same command as bpf_map_lookup_elem() (BPF_MAP_LOOKUP_ELEM), but with
 * caller-provided @flags stored in attr.flags.
 *
 * Returns the syscall result processed by libbpf_err_errno().
 */
int bpf_map_lookup_elem_flags(int fd, const void *key, void *value, __u64 flags)
{
	const size_t attr_sz = offsetofend(union bpf_attr, flags);
	union bpf_attr attr;
	int err;

	memset(&attr, 0, attr_sz);
	attr.flags = flags;
	attr.value = ptr_to_u64(value);
	attr.key = ptr_to_u64(key);
	attr.map_fd = fd;

	err = sys_bpf(BPF_MAP_LOOKUP_ELEM, &attr, attr_sz);
	return libbpf_err_errno(err);
}
435
bpf_map_lookup_and_delete_elem(int fd,const void * key,void * value)436 int bpf_map_lookup_and_delete_elem(int fd, const void *key, void *value)
437 {
438 const size_t attr_sz = offsetofend(union bpf_attr, flags);
439 union bpf_attr attr;
440 int ret;
441
442 memset(&attr, 0, attr_sz);
443 attr.map_fd = fd;
444 attr.key = ptr_to_u64(key);
445 attr.value = ptr_to_u64(value);
446
447 ret = sys_bpf(BPF_MAP_LOOKUP_AND_DELETE_ELEM, &attr, attr_sz);
448 return libbpf_err_errno(ret);
449 }
450
/* Same command as bpf_map_lookup_and_delete_elem()
 * (BPF_MAP_LOOKUP_AND_DELETE_ELEM), but with caller-provided @flags stored
 * in attr.flags.
 *
 * Returns the syscall result processed by libbpf_err_errno().
 */
int bpf_map_lookup_and_delete_elem_flags(int fd, const void *key, void *value, __u64 flags)
{
	const size_t attr_sz = offsetofend(union bpf_attr, flags);
	union bpf_attr attr;
	int err;

	memset(&attr, 0, attr_sz);
	attr.flags = flags;
	attr.value = ptr_to_u64(value);
	attr.key = ptr_to_u64(key);
	attr.map_fd = fd;

	err = sys_bpf(BPF_MAP_LOOKUP_AND_DELETE_ELEM, &attr, attr_sz);
	return libbpf_err_errno(err);
}
466
bpf_map_delete_elem(int fd,const void * key)467 int bpf_map_delete_elem(int fd, const void *key)
468 {
469 const size_t attr_sz = offsetofend(union bpf_attr, flags);
470 union bpf_attr attr;
471 int ret;
472
473 memset(&attr, 0, attr_sz);
474 attr.map_fd = fd;
475 attr.key = ptr_to_u64(key);
476
477 ret = sys_bpf(BPF_MAP_DELETE_ELEM, &attr, attr_sz);
478 return libbpf_err_errno(ret);
479 }
480
/* Same command as bpf_map_delete_elem() (BPF_MAP_DELETE_ELEM), but with
 * caller-provided @flags stored in attr.flags.
 *
 * Returns the syscall result processed by libbpf_err_errno().
 */
int bpf_map_delete_elem_flags(int fd, const void *key, __u64 flags)
{
	const size_t attr_sz = offsetofend(union bpf_attr, flags);
	union bpf_attr attr;
	int err;

	memset(&attr, 0, attr_sz);
	attr.flags = flags;
	attr.key = ptr_to_u64(key);
	attr.map_fd = fd;

	err = sys_bpf(BPF_MAP_DELETE_ELEM, &attr, attr_sz);
	return libbpf_err_errno(err);
}
495
bpf_map_get_next_key(int fd,const void * key,void * next_key)496 int bpf_map_get_next_key(int fd, const void *key, void *next_key)
497 {
498 const size_t attr_sz = offsetofend(union bpf_attr, next_key);
499 union bpf_attr attr;
500 int ret;
501
502 memset(&attr, 0, attr_sz);
503 attr.map_fd = fd;
504 attr.key = ptr_to_u64(key);
505 attr.next_key = ptr_to_u64(next_key);
506
507 ret = sys_bpf(BPF_MAP_GET_NEXT_KEY, &attr, attr_sz);
508 return libbpf_err_errno(ret);
509 }
510
bpf_map_freeze(int fd)511 int bpf_map_freeze(int fd)
512 {
513 const size_t attr_sz = offsetofend(union bpf_attr, map_fd);
514 union bpf_attr attr;
515 int ret;
516
517 memset(&attr, 0, attr_sz);
518 attr.map_fd = fd;
519
520 ret = sys_bpf(BPF_MAP_FREEZE, &attr, attr_sz);
521 return libbpf_err_errno(ret);
522 }
523
/* Shared implementation of the batched map commands.
 *
 * @cmd:       batch command to issue
 * @fd:        map file descriptor
 * @in_batch:  passed by address as attr.batch.in_batch
 * @out_batch: passed by address as attr.batch.out_batch
 * @keys:      passed by address as attr.batch.keys
 * @values:    passed by address as attr.batch.values
 * @count:     in/out; *count is sent to the kernel and overwritten with
 *             attr.batch.count after the syscall, whether or not the
 *             syscall succeeded. Must not be NULL.
 * @opts:      optional elem_flags/flags, defaulting to 0
 *
 * Returns libbpf_err(-EINVAL) for invalid @opts, otherwise the syscall
 * result processed by libbpf_err_errno().
 */
static int bpf_map_batch_common(int cmd, int fd, void  *in_batch,
				void *out_batch, void *keys, void *values,
				__u32 *count,
				const struct bpf_map_batch_opts *opts)
{
	const size_t attr_sz = offsetofend(union bpf_attr, batch);
	union bpf_attr attr;
	int err;

	if (!OPTS_VALID(opts, bpf_map_batch_opts))
		return libbpf_err(-EINVAL);

	memset(&attr, 0, attr_sz);
	attr.batch.map_fd = fd;
	attr.batch.count = *count;
	attr.batch.keys = ptr_to_u64(keys);
	attr.batch.values = ptr_to_u64(values);
	attr.batch.in_batch = ptr_to_u64(in_batch);
	attr.batch.out_batch = ptr_to_u64(out_batch);
	attr.batch.flags = OPTS_GET(opts, flags, 0);
	attr.batch.elem_flags = OPTS_GET(opts, elem_flags, 0);

	err = sys_bpf(cmd, &attr, attr_sz);
	/* report the count the kernel left in the attributes */
	*count = attr.batch.count;

	return libbpf_err_errno(err);
}
551
/* Batched delete: runs BPF_MAP_DELETE_BATCH through bpf_map_batch_common()
 * with only @keys supplied (no batch cursors, no values).
 */
int bpf_map_delete_batch(int fd, const void *keys, __u32 *count,
			 const struct bpf_map_batch_opts *opts)
{
	/* the common helper takes non-const pointers */
	void *key_buf = (void *)keys;

	return bpf_map_batch_common(BPF_MAP_DELETE_BATCH, fd, NULL, NULL,
				    key_buf, NULL, count, opts);
}
558
/* Batched lookup: forwards all arguments unchanged to
 * bpf_map_batch_common() with the BPF_MAP_LOOKUP_BATCH command.
 */
int bpf_map_lookup_batch(int fd, void *in_batch, void *out_batch, void *keys,
			 void *values, __u32 *count,
			 const struct bpf_map_batch_opts *opts)
{
	const int cmd = BPF_MAP_LOOKUP_BATCH;

	return bpf_map_batch_common(cmd, fd, in_batch, out_batch,
				    keys, values, count, opts);
}
566
/* Batched lookup-and-delete: forwards all arguments unchanged to
 * bpf_map_batch_common() with the BPF_MAP_LOOKUP_AND_DELETE_BATCH command.
 */
int bpf_map_lookup_and_delete_batch(int fd, void *in_batch, void *out_batch,
				    void *keys, void *values, __u32 *count,
				    const struct bpf_map_batch_opts *opts)
{
	const int cmd = BPF_MAP_LOOKUP_AND_DELETE_BATCH;

	return bpf_map_batch_common(cmd, fd, in_batch, out_batch,
				    keys, values, count, opts);
}
575
/* Batched update: runs BPF_MAP_UPDATE_BATCH through bpf_map_batch_common()
 * with @keys and @values supplied and no batch cursors.
 */
int bpf_map_update_batch(int fd, const void *keys, const void *values, __u32 *count,
			 const struct bpf_map_batch_opts *opts)
{
	/* the common helper takes non-const pointers */
	void *key_buf = (void *)keys;
	void *value_buf = (void *)values;

	return bpf_map_batch_common(BPF_MAP_UPDATE_BATCH, fd, NULL, NULL,
				    key_buf, value_buf, count, opts);
}
582
bpf_obj_pin_opts(int fd,const char * pathname,const struct bpf_obj_pin_opts * opts)583 int bpf_obj_pin_opts(int fd, const char *pathname, const struct bpf_obj_pin_opts *opts)
584 {
585 const size_t attr_sz = offsetofend(union bpf_attr, path_fd);
586 union bpf_attr attr;
587 int ret;
588
589 if (!OPTS_VALID(opts, bpf_obj_pin_opts))
590 return libbpf_err(-EINVAL);
591
592 memset(&attr, 0, attr_sz);
593 attr.path_fd = OPTS_GET(opts, path_fd, 0);
594 attr.pathname = ptr_to_u64((void *)pathname);
595 attr.file_flags = OPTS_GET(opts, file_flags, 0);
596 attr.bpf_fd = fd;
597
598 ret = sys_bpf(BPF_OBJ_PIN, &attr, attr_sz);
599 return libbpf_err_errno(ret);
600 }
601
/* Convenience form of bpf_obj_pin_opts() with no options. */
int bpf_obj_pin(int fd, const char *pathname)
{
	const struct bpf_obj_pin_opts *no_opts = NULL;

	return bpf_obj_pin_opts(fd, pathname, no_opts);
}
606
/* Convenience form of bpf_obj_get_opts() with no options. */
int bpf_obj_get(const char *pathname)
{
	const struct bpf_obj_get_opts *no_opts = NULL;

	return bpf_obj_get_opts(pathname, no_opts);
}
611
bpf_obj_get_opts(const char * pathname,const struct bpf_obj_get_opts * opts)612 int bpf_obj_get_opts(const char *pathname, const struct bpf_obj_get_opts *opts)
613 {
614 const size_t attr_sz = offsetofend(union bpf_attr, path_fd);
615 union bpf_attr attr;
616 int fd;
617
618 if (!OPTS_VALID(opts, bpf_obj_get_opts))
619 return libbpf_err(-EINVAL);
620
621 memset(&attr, 0, attr_sz);
622 attr.path_fd = OPTS_GET(opts, path_fd, 0);
623 attr.pathname = ptr_to_u64((void *)pathname);
624 attr.file_flags = OPTS_GET(opts, file_flags, 0);
625
626 fd = sys_bpf_fd(BPF_OBJ_GET, &attr, attr_sz);
627 return libbpf_err_errno(fd);
628 }
629
bpf_prog_attach(int prog_fd,int target_fd,enum bpf_attach_type type,unsigned int flags)630 int bpf_prog_attach(int prog_fd, int target_fd, enum bpf_attach_type type,
631 unsigned int flags)
632 {
633 DECLARE_LIBBPF_OPTS(bpf_prog_attach_opts, opts,
634 .flags = flags,
635 );
636
637 return bpf_prog_attach_opts(prog_fd, target_fd, type, &opts);
638 }
639
bpf_prog_attach_opts(int prog_fd,int target,enum bpf_attach_type type,const struct bpf_prog_attach_opts * opts)640 int bpf_prog_attach_opts(int prog_fd, int target, enum bpf_attach_type type,
641 const struct bpf_prog_attach_opts *opts)
642 {
643 const size_t attr_sz = offsetofend(union bpf_attr, expected_revision);
644 __u32 relative_id, flags;
645 int ret, relative_fd;
646 union bpf_attr attr;
647
648 if (!OPTS_VALID(opts, bpf_prog_attach_opts))
649 return libbpf_err(-EINVAL);
650
651 relative_id = OPTS_GET(opts, relative_id, 0);
652 relative_fd = OPTS_GET(opts, relative_fd, 0);
653 flags = OPTS_GET(opts, flags, 0);
654
655 /* validate we don't have unexpected combinations of non-zero fields */
656 if (relative_fd && relative_id)
657 return libbpf_err(-EINVAL);
658
659 memset(&attr, 0, attr_sz);
660 attr.target_fd = target;
661 attr.attach_bpf_fd = prog_fd;
662 attr.attach_type = type;
663 attr.replace_bpf_fd = OPTS_GET(opts, replace_fd, 0);
664 attr.expected_revision = OPTS_GET(opts, expected_revision, 0);
665
666 if (relative_id) {
667 attr.attach_flags = flags | BPF_F_ID;
668 attr.relative_id = relative_id;
669 } else {
670 attr.attach_flags = flags;
671 attr.relative_fd = relative_fd;
672 }
673
674 ret = sys_bpf(BPF_PROG_ATTACH, &attr, attr_sz);
675 return libbpf_err_errno(ret);
676 }
677
bpf_prog_detach_opts(int prog_fd,int target,enum bpf_attach_type type,const struct bpf_prog_detach_opts * opts)678 int bpf_prog_detach_opts(int prog_fd, int target, enum bpf_attach_type type,
679 const struct bpf_prog_detach_opts *opts)
680 {
681 const size_t attr_sz = offsetofend(union bpf_attr, expected_revision);
682 __u32 relative_id, flags;
683 int ret, relative_fd;
684 union bpf_attr attr;
685
686 if (!OPTS_VALID(opts, bpf_prog_detach_opts))
687 return libbpf_err(-EINVAL);
688
689 relative_id = OPTS_GET(opts, relative_id, 0);
690 relative_fd = OPTS_GET(opts, relative_fd, 0);
691 flags = OPTS_GET(opts, flags, 0);
692
693 /* validate we don't have unexpected combinations of non-zero fields */
694 if (relative_fd && relative_id)
695 return libbpf_err(-EINVAL);
696
697 memset(&attr, 0, attr_sz);
698 attr.target_fd = target;
699 attr.attach_bpf_fd = prog_fd;
700 attr.attach_type = type;
701 attr.expected_revision = OPTS_GET(opts, expected_revision, 0);
702
703 if (relative_id) {
704 attr.attach_flags = flags | BPF_F_ID;
705 attr.relative_id = relative_id;
706 } else {
707 attr.attach_flags = flags;
708 attr.relative_fd = relative_fd;
709 }
710
711 ret = sys_bpf(BPF_PROG_DETACH, &attr, attr_sz);
712 return libbpf_err_errno(ret);
713 }
714
/* Detach from @target_fd without naming a program: calls
 * bpf_prog_detach_opts() with a program fd of 0 and no options.
 */
int bpf_prog_detach(int target_fd, enum bpf_attach_type type)
{
	const int no_prog_fd = 0;

	return bpf_prog_detach_opts(no_prog_fd, target_fd, type, NULL);
}
719
/* Detach @prog_fd from @target_fd: calls bpf_prog_detach_opts() with no
 * options.
 */
int bpf_prog_detach2(int prog_fd, int target_fd, enum bpf_attach_type type)
{
	const struct bpf_prog_detach_opts *no_opts = NULL;

	return bpf_prog_detach_opts(prog_fd, target_fd, type, no_opts);
}
724
bpf_link_create(int prog_fd,int target_fd,enum bpf_attach_type attach_type,const struct bpf_link_create_opts * opts)725 int bpf_link_create(int prog_fd, int target_fd,
726 enum bpf_attach_type attach_type,
727 const struct bpf_link_create_opts *opts)
728 {
729 const size_t attr_sz = offsetofend(union bpf_attr, link_create);
730 __u32 target_btf_id, iter_info_len, relative_id;
731 int fd, err, relative_fd;
732 union bpf_attr attr;
733
734 if (!OPTS_VALID(opts, bpf_link_create_opts))
735 return libbpf_err(-EINVAL);
736
737 iter_info_len = OPTS_GET(opts, iter_info_len, 0);
738 target_btf_id = OPTS_GET(opts, target_btf_id, 0);
739
740 /* validate we don't have unexpected combinations of non-zero fields */
741 if (iter_info_len || target_btf_id) {
742 if (iter_info_len && target_btf_id)
743 return libbpf_err(-EINVAL);
744 if (!OPTS_ZEROED(opts, target_btf_id))
745 return libbpf_err(-EINVAL);
746 }
747
748 memset(&attr, 0, attr_sz);
749 attr.link_create.prog_fd = prog_fd;
750 attr.link_create.target_fd = target_fd;
751 attr.link_create.attach_type = attach_type;
752 attr.link_create.flags = OPTS_GET(opts, flags, 0);
753
754 if (target_btf_id) {
755 attr.link_create.target_btf_id = target_btf_id;
756 goto proceed;
757 }
758
759 switch (attach_type) {
760 case BPF_TRACE_ITER:
761 attr.link_create.iter_info = ptr_to_u64(OPTS_GET(opts, iter_info, (void *)0));
762 attr.link_create.iter_info_len = iter_info_len;
763 break;
764 case BPF_PERF_EVENT:
765 attr.link_create.perf_event.bpf_cookie = OPTS_GET(opts, perf_event.bpf_cookie, 0);
766 if (!OPTS_ZEROED(opts, perf_event))
767 return libbpf_err(-EINVAL);
768 break;
769 case BPF_TRACE_KPROBE_MULTI:
770 case BPF_TRACE_KPROBE_SESSION:
771 attr.link_create.kprobe_multi.flags = OPTS_GET(opts, kprobe_multi.flags, 0);
772 attr.link_create.kprobe_multi.cnt = OPTS_GET(opts, kprobe_multi.cnt, 0);
773 attr.link_create.kprobe_multi.syms = ptr_to_u64(OPTS_GET(opts, kprobe_multi.syms, 0));
774 attr.link_create.kprobe_multi.addrs = ptr_to_u64(OPTS_GET(opts, kprobe_multi.addrs, 0));
775 attr.link_create.kprobe_multi.cookies = ptr_to_u64(OPTS_GET(opts, kprobe_multi.cookies, 0));
776 if (!OPTS_ZEROED(opts, kprobe_multi))
777 return libbpf_err(-EINVAL);
778 break;
779 case BPF_TRACE_UPROBE_MULTI:
780 case BPF_TRACE_UPROBE_SESSION:
781 attr.link_create.uprobe_multi.flags = OPTS_GET(opts, uprobe_multi.flags, 0);
782 attr.link_create.uprobe_multi.cnt = OPTS_GET(opts, uprobe_multi.cnt, 0);
783 attr.link_create.uprobe_multi.path = ptr_to_u64(OPTS_GET(opts, uprobe_multi.path, 0));
784 attr.link_create.uprobe_multi.offsets = ptr_to_u64(OPTS_GET(opts, uprobe_multi.offsets, 0));
785 attr.link_create.uprobe_multi.ref_ctr_offsets = ptr_to_u64(OPTS_GET(opts, uprobe_multi.ref_ctr_offsets, 0));
786 attr.link_create.uprobe_multi.cookies = ptr_to_u64(OPTS_GET(opts, uprobe_multi.cookies, 0));
787 attr.link_create.uprobe_multi.pid = OPTS_GET(opts, uprobe_multi.pid, 0);
788 if (!OPTS_ZEROED(opts, uprobe_multi))
789 return libbpf_err(-EINVAL);
790 break;
791 case BPF_TRACE_RAW_TP:
792 case BPF_TRACE_FENTRY:
793 case BPF_TRACE_FEXIT:
794 case BPF_MODIFY_RETURN:
795 case BPF_LSM_MAC:
796 attr.link_create.tracing.cookie = OPTS_GET(opts, tracing.cookie, 0);
797 if (!OPTS_ZEROED(opts, tracing))
798 return libbpf_err(-EINVAL);
799 break;
800 case BPF_NETFILTER:
801 attr.link_create.netfilter.pf = OPTS_GET(opts, netfilter.pf, 0);
802 attr.link_create.netfilter.hooknum = OPTS_GET(opts, netfilter.hooknum, 0);
803 attr.link_create.netfilter.priority = OPTS_GET(opts, netfilter.priority, 0);
804 attr.link_create.netfilter.flags = OPTS_GET(opts, netfilter.flags, 0);
805 if (!OPTS_ZEROED(opts, netfilter))
806 return libbpf_err(-EINVAL);
807 break;
808 case BPF_TCX_INGRESS:
809 case BPF_TCX_EGRESS:
810 relative_fd = OPTS_GET(opts, tcx.relative_fd, 0);
811 relative_id = OPTS_GET(opts, tcx.relative_id, 0);
812 if (relative_fd && relative_id)
813 return libbpf_err(-EINVAL);
814 if (relative_id) {
815 attr.link_create.tcx.relative_id = relative_id;
816 attr.link_create.flags |= BPF_F_ID;
817 } else {
818 attr.link_create.tcx.relative_fd = relative_fd;
819 }
820 attr.link_create.tcx.expected_revision = OPTS_GET(opts, tcx.expected_revision, 0);
821 if (!OPTS_ZEROED(opts, tcx))
822 return libbpf_err(-EINVAL);
823 break;
824 case BPF_NETKIT_PRIMARY:
825 case BPF_NETKIT_PEER:
826 relative_fd = OPTS_GET(opts, netkit.relative_fd, 0);
827 relative_id = OPTS_GET(opts, netkit.relative_id, 0);
828 if (relative_fd && relative_id)
829 return libbpf_err(-EINVAL);
830 if (relative_id) {
831 attr.link_create.netkit.relative_id = relative_id;
832 attr.link_create.flags |= BPF_F_ID;
833 } else {
834 attr.link_create.netkit.relative_fd = relative_fd;
835 }
836 attr.link_create.netkit.expected_revision = OPTS_GET(opts, netkit.expected_revision, 0);
837 if (!OPTS_ZEROED(opts, netkit))
838 return libbpf_err(-EINVAL);
839 break;
840 case BPF_CGROUP_INET_INGRESS:
841 case BPF_CGROUP_INET_EGRESS:
842 case BPF_CGROUP_INET_SOCK_CREATE:
843 case BPF_CGROUP_INET_SOCK_RELEASE:
844 case BPF_CGROUP_INET4_BIND:
845 case BPF_CGROUP_INET6_BIND:
846 case BPF_CGROUP_INET4_POST_BIND:
847 case BPF_CGROUP_INET6_POST_BIND:
848 case BPF_CGROUP_INET4_CONNECT:
849 case BPF_CGROUP_INET6_CONNECT:
850 case BPF_CGROUP_UNIX_CONNECT:
851 case BPF_CGROUP_INET4_GETPEERNAME:
852 case BPF_CGROUP_INET6_GETPEERNAME:
853 case BPF_CGROUP_UNIX_GETPEERNAME:
854 case BPF_CGROUP_INET4_GETSOCKNAME:
855 case BPF_CGROUP_INET6_GETSOCKNAME:
856 case BPF_CGROUP_UNIX_GETSOCKNAME:
857 case BPF_CGROUP_UDP4_SENDMSG:
858 case BPF_CGROUP_UDP6_SENDMSG:
859 case BPF_CGROUP_UNIX_SENDMSG:
860 case BPF_CGROUP_UDP4_RECVMSG:
861 case BPF_CGROUP_UDP6_RECVMSG:
862 case BPF_CGROUP_UNIX_RECVMSG:
863 case BPF_CGROUP_SOCK_OPS:
864 case BPF_CGROUP_DEVICE:
865 case BPF_CGROUP_SYSCTL:
866 case BPF_CGROUP_GETSOCKOPT:
867 case BPF_CGROUP_SETSOCKOPT:
868 case BPF_LSM_CGROUP:
869 relative_fd = OPTS_GET(opts, cgroup.relative_fd, 0);
870 relative_id = OPTS_GET(opts, cgroup.relative_id, 0);
871 if (relative_fd && relative_id)
872 return libbpf_err(-EINVAL);
873 if (relative_id) {
874 attr.link_create.cgroup.relative_id = relative_id;
875 attr.link_create.flags |= BPF_F_ID;
876 } else {
877 attr.link_create.cgroup.relative_fd = relative_fd;
878 }
879 attr.link_create.cgroup.expected_revision =
880 OPTS_GET(opts, cgroup.expected_revision, 0);
881 if (!OPTS_ZEROED(opts, cgroup))
882 return libbpf_err(-EINVAL);
883 break;
884 default:
885 if (!OPTS_ZEROED(opts, flags))
886 return libbpf_err(-EINVAL);
887 break;
888 }
889 proceed:
890 fd = sys_bpf_fd(BPF_LINK_CREATE, &attr, attr_sz);
891 if (fd >= 0)
892 return fd;
893 /* we'll get EINVAL if LINK_CREATE doesn't support attaching fentry
894 * and other similar programs
895 */
896 err = -errno;
897 if (err != -EINVAL)
898 return libbpf_err(err);
899
900 /* if user used features not supported by
901 * BPF_RAW_TRACEPOINT_OPEN command, then just give up immediately
902 */
903 if (attr.link_create.target_fd || attr.link_create.target_btf_id)
904 return libbpf_err(err);
905 if (!OPTS_ZEROED(opts, sz))
906 return libbpf_err(err);
907
908 /* otherwise, for few select kinds of programs that can be
909 * attached using BPF_RAW_TRACEPOINT_OPEN command, try that as
910 * a fallback for older kernels
911 */
912 switch (attach_type) {
913 case BPF_TRACE_RAW_TP:
914 case BPF_LSM_MAC:
915 case BPF_TRACE_FENTRY:
916 case BPF_TRACE_FEXIT:
917 case BPF_MODIFY_RETURN:
918 return bpf_raw_tracepoint_open(NULL, prog_fd);
919 default:
920 return libbpf_err(err);
921 }
922 }
923
bpf_link_detach(int link_fd)924 int bpf_link_detach(int link_fd)
925 {
926 const size_t attr_sz = offsetofend(union bpf_attr, link_detach);
927 union bpf_attr attr;
928 int ret;
929
930 memset(&attr, 0, attr_sz);
931 attr.link_detach.link_fd = link_fd;
932
933 ret = sys_bpf(BPF_LINK_DETACH, &attr, attr_sz);
934 return libbpf_err_errno(ret);
935 }
936
bpf_link_update(int link_fd,int new_prog_fd,const struct bpf_link_update_opts * opts)937 int bpf_link_update(int link_fd, int new_prog_fd,
938 const struct bpf_link_update_opts *opts)
939 {
940 const size_t attr_sz = offsetofend(union bpf_attr, link_update);
941 union bpf_attr attr;
942 int ret;
943
944 if (!OPTS_VALID(opts, bpf_link_update_opts))
945 return libbpf_err(-EINVAL);
946
947 if (OPTS_GET(opts, old_prog_fd, 0) && OPTS_GET(opts, old_map_fd, 0))
948 return libbpf_err(-EINVAL);
949
950 memset(&attr, 0, attr_sz);
951 attr.link_update.link_fd = link_fd;
952 attr.link_update.new_prog_fd = new_prog_fd;
953 attr.link_update.flags = OPTS_GET(opts, flags, 0);
954 if (OPTS_GET(opts, old_prog_fd, 0))
955 attr.link_update.old_prog_fd = OPTS_GET(opts, old_prog_fd, 0);
956 else if (OPTS_GET(opts, old_map_fd, 0))
957 attr.link_update.old_map_fd = OPTS_GET(opts, old_map_fd, 0);
958
959 ret = sys_bpf(BPF_LINK_UPDATE, &attr, attr_sz);
960 return libbpf_err_errno(ret);
961 }
962
bpf_iter_create(int link_fd)963 int bpf_iter_create(int link_fd)
964 {
965 const size_t attr_sz = offsetofend(union bpf_attr, iter_create);
966 union bpf_attr attr;
967 int fd;
968
969 memset(&attr, 0, attr_sz);
970 attr.iter_create.link_fd = link_fd;
971
972 fd = sys_bpf_fd(BPF_ITER_CREATE, &attr, attr_sz);
973 return libbpf_err_errno(fd);
974 }
975
bpf_prog_query_opts(int target,enum bpf_attach_type type,struct bpf_prog_query_opts * opts)976 int bpf_prog_query_opts(int target, enum bpf_attach_type type,
977 struct bpf_prog_query_opts *opts)
978 {
979 const size_t attr_sz = offsetofend(union bpf_attr, query);
980 union bpf_attr attr;
981 int ret;
982
983 if (!OPTS_VALID(opts, bpf_prog_query_opts))
984 return libbpf_err(-EINVAL);
985
986 memset(&attr, 0, attr_sz);
987 attr.query.target_fd = target;
988 attr.query.attach_type = type;
989 attr.query.query_flags = OPTS_GET(opts, query_flags, 0);
990 attr.query.count = OPTS_GET(opts, count, 0);
991 attr.query.prog_ids = ptr_to_u64(OPTS_GET(opts, prog_ids, NULL));
992 attr.query.link_ids = ptr_to_u64(OPTS_GET(opts, link_ids, NULL));
993 attr.query.prog_attach_flags = ptr_to_u64(OPTS_GET(opts, prog_attach_flags, NULL));
994 attr.query.link_attach_flags = ptr_to_u64(OPTS_GET(opts, link_attach_flags, NULL));
995
996 ret = sys_bpf(BPF_PROG_QUERY, &attr, attr_sz);
997
998 OPTS_SET(opts, attach_flags, attr.query.attach_flags);
999 OPTS_SET(opts, revision, attr.query.revision);
1000 OPTS_SET(opts, count, attr.query.count);
1001
1002 return libbpf_err_errno(ret);
1003 }
1004
/*
 * Positional-argument front end for bpf_prog_query_opts().
 *
 * @query_flags, @prog_ids and the value pointed to by @prog_cnt are packed
 * into a bpf_prog_query_opts. After the call, *@prog_cnt is always updated
 * from the opts, and *@attach_flags is updated only when @attach_flags is
 * non-NULL. @prog_cnt is dereferenced unconditionally.
 *
 * Return: the bpf_prog_query_opts() result passed through
 * libbpf_err_errno().
 */
int bpf_prog_query(int target_fd, enum bpf_attach_type type, __u32 query_flags,
		   __u32 *attach_flags, __u32 *prog_ids, __u32 *prog_cnt)
{
	LIBBPF_OPTS(bpf_prog_query_opts, qopts,
		.query_flags = query_flags,
		.prog_ids = prog_ids);
	int rc;

	qopts.prog_cnt = *prog_cnt;

	rc = bpf_prog_query_opts(target_fd, type, &qopts);

	*prog_cnt = qopts.prog_cnt;
	if (attach_flags)
		*attach_flags = qopts.attach_flags;

	return libbpf_err_errno(rc);
}
1023
bpf_prog_test_run_opts(int prog_fd,struct bpf_test_run_opts * opts)1024 int bpf_prog_test_run_opts(int prog_fd, struct bpf_test_run_opts *opts)
1025 {
1026 const size_t attr_sz = offsetofend(union bpf_attr, test);
1027 union bpf_attr attr;
1028 int ret;
1029
1030 if (!OPTS_VALID(opts, bpf_test_run_opts))
1031 return libbpf_err(-EINVAL);
1032
1033 memset(&attr, 0, attr_sz);
1034 attr.test.prog_fd = prog_fd;
1035 attr.test.batch_size = OPTS_GET(opts, batch_size, 0);
1036 attr.test.cpu = OPTS_GET(opts, cpu, 0);
1037 attr.test.flags = OPTS_GET(opts, flags, 0);
1038 attr.test.repeat = OPTS_GET(opts, repeat, 0);
1039 attr.test.duration = OPTS_GET(opts, duration, 0);
1040 attr.test.ctx_size_in = OPTS_GET(opts, ctx_size_in, 0);
1041 attr.test.ctx_size_out = OPTS_GET(opts, ctx_size_out, 0);
1042 attr.test.data_size_in = OPTS_GET(opts, data_size_in, 0);
1043 attr.test.data_size_out = OPTS_GET(opts, data_size_out, 0);
1044 attr.test.ctx_in = ptr_to_u64(OPTS_GET(opts, ctx_in, NULL));
1045 attr.test.ctx_out = ptr_to_u64(OPTS_GET(opts, ctx_out, NULL));
1046 attr.test.data_in = ptr_to_u64(OPTS_GET(opts, data_in, NULL));
1047 attr.test.data_out = ptr_to_u64(OPTS_GET(opts, data_out, NULL));
1048
1049 ret = sys_bpf(BPF_PROG_TEST_RUN, &attr, attr_sz);
1050
1051 OPTS_SET(opts, data_size_out, attr.test.data_size_out);
1052 OPTS_SET(opts, ctx_size_out, attr.test.ctx_size_out);
1053 OPTS_SET(opts, duration, attr.test.duration);
1054 OPTS_SET(opts, retval, attr.test.retval);
1055
1056 return libbpf_err_errno(ret);
1057 }
1058
/*
 * Shared implementation of the *_get_next_id() wrappers: issue @cmd with
 * @start_id as input and, when sys_bpf() returns 0, store the resulting
 * next_id into *@next_id. *@next_id is left untouched otherwise.
 *
 * Return: the sys_bpf() result passed through libbpf_err_errno().
 */
static int bpf_obj_get_next_id(__u32 start_id, __u32 *next_id, int cmd)
{
	/* the request spans the union up to and including open_flags */
	const size_t req_sz = offsetofend(union bpf_attr, open_flags);
	union bpf_attr req;
	int rc;

	memset(&req, 0, req_sz);
	req.start_id = start_id;

	rc = sys_bpf(cmd, &req, req_sz);
	if (rc == 0)
		*next_id = req.next_id;

	return libbpf_err_errno(rc);
}
1074
/*
 * Forward to bpf_obj_get_next_id() with the BPF_PROG_GET_NEXT_ID command.
 *
 * Return: whatever bpf_obj_get_next_id() returns.
 */
int bpf_prog_get_next_id(__u32 start_id, __u32 *next_id)
{
	const int cmd = BPF_PROG_GET_NEXT_ID;

	return bpf_obj_get_next_id(start_id, next_id, cmd);
}
1079
/*
 * Forward to bpf_obj_get_next_id() with the BPF_MAP_GET_NEXT_ID command.
 *
 * Return: whatever bpf_obj_get_next_id() returns.
 */
int bpf_map_get_next_id(__u32 start_id, __u32 *next_id)
{
	const int cmd = BPF_MAP_GET_NEXT_ID;

	return bpf_obj_get_next_id(start_id, next_id, cmd);
}
1084
/*
 * Forward to bpf_obj_get_next_id() with the BPF_BTF_GET_NEXT_ID command.
 *
 * Return: whatever bpf_obj_get_next_id() returns.
 */
int bpf_btf_get_next_id(__u32 start_id, __u32 *next_id)
{
	const int cmd = BPF_BTF_GET_NEXT_ID;

	return bpf_obj_get_next_id(start_id, next_id, cmd);
}
1089
/*
 * Forward to bpf_obj_get_next_id() with the BPF_LINK_GET_NEXT_ID command.
 *
 * Return: whatever bpf_obj_get_next_id() returns.
 */
int bpf_link_get_next_id(__u32 start_id, __u32 *next_id)
{
	const int cmd = BPF_LINK_GET_NEXT_ID;

	return bpf_obj_get_next_id(start_id, next_id, cmd);
}
1094
/*
 * Issue the BPF_PROG_GET_FD_BY_ID command for program @id, with open_flags
 * taken from @opts (0 is the OPTS_GET() fallback).
 *
 * Return: libbpf_err(-EINVAL) if @opts fails OPTS_VALID(); otherwise the
 * sys_bpf_fd() result passed through libbpf_err_errno().
 */
int bpf_prog_get_fd_by_id_opts(__u32 id,
			       const struct bpf_get_fd_by_id_opts *opts)
{
	const size_t req_sz = offsetofend(union bpf_attr, open_flags);
	union bpf_attr req;
	int prog_fd;

	if (!OPTS_VALID(opts, bpf_get_fd_by_id_opts))
		return libbpf_err(-EINVAL);

	memset(&req, 0, req_sz);
	req.open_flags = OPTS_GET(opts, open_flags, 0);
	req.prog_id = id;

	prog_fd = sys_bpf_fd(BPF_PROG_GET_FD_BY_ID, &req, req_sz);

	return libbpf_err_errno(prog_fd);
}
1112
/*
 * Call bpf_prog_get_fd_by_id_opts() for @id with a NULL opts pointer.
 *
 * Return: whatever bpf_prog_get_fd_by_id_opts() returns.
 */
int bpf_prog_get_fd_by_id(__u32 id)
{
	const struct bpf_get_fd_by_id_opts *no_opts = NULL;

	return bpf_prog_get_fd_by_id_opts(id, no_opts);
}
1117
/*
 * Issue the BPF_MAP_GET_FD_BY_ID command for map @id, with open_flags taken
 * from @opts (0 is the OPTS_GET() fallback).
 *
 * Return: libbpf_err(-EINVAL) if @opts fails OPTS_VALID(); otherwise the
 * sys_bpf_fd() result passed through libbpf_err_errno().
 */
int bpf_map_get_fd_by_id_opts(__u32 id,
			      const struct bpf_get_fd_by_id_opts *opts)
{
	const size_t req_sz = offsetofend(union bpf_attr, open_flags);
	union bpf_attr req;
	int map_fd;

	if (!OPTS_VALID(opts, bpf_get_fd_by_id_opts))
		return libbpf_err(-EINVAL);

	memset(&req, 0, req_sz);
	req.open_flags = OPTS_GET(opts, open_flags, 0);
	req.map_id = id;

	map_fd = sys_bpf_fd(BPF_MAP_GET_FD_BY_ID, &req, req_sz);

	return libbpf_err_errno(map_fd);
}
1135
/*
 * Call bpf_map_get_fd_by_id_opts() for @id with a NULL opts pointer.
 *
 * Return: whatever bpf_map_get_fd_by_id_opts() returns.
 */
int bpf_map_get_fd_by_id(__u32 id)
{
	const struct bpf_get_fd_by_id_opts *no_opts = NULL;

	return bpf_map_get_fd_by_id_opts(id, no_opts);
}
1140
/*
 * Issue the BPF_BTF_GET_FD_BY_ID command for BTF object @id. open_flags and
 * token_fd are taken from @opts (0 is the OPTS_GET() fallback for both);
 * the request size extends through fd_by_id_token_fd so the token fd is
 * included.
 *
 * Return: libbpf_err(-EINVAL) if @opts fails OPTS_VALID(); otherwise the
 * sys_bpf_fd() result passed through libbpf_err_errno().
 */
int bpf_btf_get_fd_by_id_opts(__u32 id,
			      const struct bpf_get_fd_by_id_opts *opts)
{
	const size_t req_sz = offsetofend(union bpf_attr, fd_by_id_token_fd);
	union bpf_attr req;
	int btf_fd;

	if (!OPTS_VALID(opts, bpf_get_fd_by_id_opts))
		return libbpf_err(-EINVAL);

	memset(&req, 0, req_sz);
	req.fd_by_id_token_fd = OPTS_GET(opts, token_fd, 0);
	req.open_flags = OPTS_GET(opts, open_flags, 0);
	req.btf_id = id;

	btf_fd = sys_bpf_fd(BPF_BTF_GET_FD_BY_ID, &req, req_sz);

	return libbpf_err_errno(btf_fd);
}
1159
/*
 * Call bpf_btf_get_fd_by_id_opts() for @id with a NULL opts pointer.
 *
 * Return: whatever bpf_btf_get_fd_by_id_opts() returns.
 */
int bpf_btf_get_fd_by_id(__u32 id)
{
	const struct bpf_get_fd_by_id_opts *no_opts = NULL;

	return bpf_btf_get_fd_by_id_opts(id, no_opts);
}
1164
/*
 * Issue the BPF_LINK_GET_FD_BY_ID command for link @id, with open_flags
 * taken from @opts (0 is the OPTS_GET() fallback).
 *
 * Return: libbpf_err(-EINVAL) if @opts fails OPTS_VALID(); otherwise the
 * sys_bpf_fd() result passed through libbpf_err_errno().
 */
int bpf_link_get_fd_by_id_opts(__u32 id,
			       const struct bpf_get_fd_by_id_opts *opts)
{
	const size_t req_sz = offsetofend(union bpf_attr, open_flags);
	union bpf_attr req;
	int link_fd;

	if (!OPTS_VALID(opts, bpf_get_fd_by_id_opts))
		return libbpf_err(-EINVAL);

	memset(&req, 0, req_sz);
	req.open_flags = OPTS_GET(opts, open_flags, 0);
	req.link_id = id;

	link_fd = sys_bpf_fd(BPF_LINK_GET_FD_BY_ID, &req, req_sz);

	return libbpf_err_errno(link_fd);
}
1182
/*
 * Call bpf_link_get_fd_by_id_opts() for @id with a NULL opts pointer.
 *
 * Return: whatever bpf_link_get_fd_by_id_opts() returns.
 */
int bpf_link_get_fd_by_id(__u32 id)
{
	const struct bpf_get_fd_by_id_opts *no_opts = NULL;

	return bpf_link_get_fd_by_id_opts(id, no_opts);
}
1187
/*
 * Issue the BPF_OBJ_GET_INFO_BY_FD command for @bpf_fd, passing @info as the
 * destination buffer and *@info_len as its length. When sys_bpf() returns 0,
 * *@info_len is replaced with the info_len value left in the request;
 * otherwise it is not modified. @info_len is dereferenced unconditionally.
 *
 * Return: the sys_bpf() result passed through libbpf_err_errno().
 */
int bpf_obj_get_info_by_fd(int bpf_fd, void *info, __u32 *info_len)
{
	const size_t req_sz = offsetofend(union bpf_attr, info);
	union bpf_attr req;
	int rc;

	memset(&req, 0, req_sz);
	req.info.info = ptr_to_u64(info);
	req.info.info_len = *info_len;
	req.info.bpf_fd = bpf_fd;

	rc = sys_bpf(BPF_OBJ_GET_INFO_BY_FD, &req, req_sz);
	if (rc == 0)
		*info_len = req.info.info_len;

	return libbpf_err_errno(rc);
}
1204
/*
 * Typed front end for bpf_obj_get_info_by_fd() taking a struct bpf_prog_info
 * buffer; all arguments are forwarded unchanged.
 *
 * Return: whatever bpf_obj_get_info_by_fd() returns.
 */
int bpf_prog_get_info_by_fd(int prog_fd, struct bpf_prog_info *info, __u32 *info_len)
{
	void *raw_info = info;

	return bpf_obj_get_info_by_fd(prog_fd, raw_info, info_len);
}
1209
/*
 * Typed front end for bpf_obj_get_info_by_fd() taking a struct bpf_map_info
 * buffer; all arguments are forwarded unchanged.
 *
 * Return: whatever bpf_obj_get_info_by_fd() returns.
 */
int bpf_map_get_info_by_fd(int map_fd, struct bpf_map_info *info, __u32 *info_len)
{
	void *raw_info = info;

	return bpf_obj_get_info_by_fd(map_fd, raw_info, info_len);
}
1214
/*
 * Typed front end for bpf_obj_get_info_by_fd() taking a struct bpf_btf_info
 * buffer; all arguments are forwarded unchanged.
 *
 * Return: whatever bpf_obj_get_info_by_fd() returns.
 */
int bpf_btf_get_info_by_fd(int btf_fd, struct bpf_btf_info *info, __u32 *info_len)
{
	void *raw_info = info;

	return bpf_obj_get_info_by_fd(btf_fd, raw_info, info_len);
}
1219
/*
 * Typed front end for bpf_obj_get_info_by_fd() taking a struct bpf_link_info
 * buffer; all arguments are forwarded unchanged.
 *
 * Return: whatever bpf_obj_get_info_by_fd() returns.
 */
int bpf_link_get_info_by_fd(int link_fd, struct bpf_link_info *info, __u32 *info_len)
{
	void *raw_info = info;

	return bpf_obj_get_info_by_fd(link_fd, raw_info, info_len);
}
1224
bpf_raw_tracepoint_open_opts(int prog_fd,struct bpf_raw_tp_opts * opts)1225 int bpf_raw_tracepoint_open_opts(int prog_fd, struct bpf_raw_tp_opts *opts)
1226 {
1227 const size_t attr_sz = offsetofend(union bpf_attr, raw_tracepoint);
1228 union bpf_attr attr;
1229 int fd;
1230
1231 if (!OPTS_VALID(opts, bpf_raw_tp_opts))
1232 return libbpf_err(-EINVAL);
1233
1234 memset(&attr, 0, attr_sz);
1235 attr.raw_tracepoint.prog_fd = prog_fd;
1236 attr.raw_tracepoint.name = ptr_to_u64(OPTS_GET(opts, tp_name, NULL));
1237 attr.raw_tracepoint.cookie = OPTS_GET(opts, cookie, 0);
1238
1239 fd = sys_bpf_fd(BPF_RAW_TRACEPOINT_OPEN, &attr, attr_sz);
1240 return libbpf_err_errno(fd);
1241 }
1242
bpf_raw_tracepoint_open(const char * name,int prog_fd)1243 int bpf_raw_tracepoint_open(const char *name, int prog_fd)
1244 {
1245 LIBBPF_OPTS(bpf_raw_tp_opts, opts, .tp_name = name);
1246
1247 return bpf_raw_tracepoint_open_opts(prog_fd, &opts);
1248 }
1249
bpf_btf_load(const void * btf_data,size_t btf_size,struct bpf_btf_load_opts * opts)1250 int bpf_btf_load(const void *btf_data, size_t btf_size, struct bpf_btf_load_opts *opts)
1251 {
1252 const size_t attr_sz = offsetofend(union bpf_attr, btf_token_fd);
1253 union bpf_attr attr;
1254 char *log_buf;
1255 size_t log_size;
1256 __u32 log_level;
1257 int fd;
1258
1259 bump_rlimit_memlock();
1260
1261 memset(&attr, 0, attr_sz);
1262
1263 if (!OPTS_VALID(opts, bpf_btf_load_opts))
1264 return libbpf_err(-EINVAL);
1265
1266 log_buf = OPTS_GET(opts, log_buf, NULL);
1267 log_size = OPTS_GET(opts, log_size, 0);
1268 log_level = OPTS_GET(opts, log_level, 0);
1269
1270 if (log_size > UINT_MAX)
1271 return libbpf_err(-EINVAL);
1272 if (log_size && !log_buf)
1273 return libbpf_err(-EINVAL);
1274
1275 attr.btf = ptr_to_u64(btf_data);
1276 attr.btf_size = btf_size;
1277
1278 attr.btf_flags = OPTS_GET(opts, btf_flags, 0);
1279 attr.btf_token_fd = OPTS_GET(opts, token_fd, 0);
1280
1281 /* log_level == 0 and log_buf != NULL means "try loading without
1282 * log_buf, but retry with log_buf and log_level=1 on error", which is
1283 * consistent across low-level and high-level BTF and program loading
1284 * APIs within libbpf and provides a sensible behavior in practice
1285 */
1286 if (log_level) {
1287 attr.btf_log_buf = ptr_to_u64(log_buf);
1288 attr.btf_log_size = (__u32)log_size;
1289 attr.btf_log_level = log_level;
1290 }
1291
1292 fd = sys_bpf_fd(BPF_BTF_LOAD, &attr, attr_sz);
1293 if (fd < 0 && log_buf && log_level == 0) {
1294 attr.btf_log_buf = ptr_to_u64(log_buf);
1295 attr.btf_log_size = (__u32)log_size;
1296 attr.btf_log_level = 1;
1297 fd = sys_bpf_fd(BPF_BTF_LOAD, &attr, attr_sz);
1298 }
1299
1300 OPTS_SET(opts, log_true_size, attr.btf_log_true_size);
1301 return libbpf_err_errno(fd);
1302 }
1303
/*
 * Issue the BPF_TASK_FD_QUERY command for file descriptor @fd of task @pid.
 *
 * @buf and *@buf_len describe the caller's buffer and are passed in the
 * request together with @flags. After the syscall returns, *@buf_len,
 * *@prog_id, *@fd_type, *@probe_offset and *@probe_addr are all overwritten
 * from the request without looking at the syscall result. Every output
 * pointer is dereferenced unconditionally.
 *
 * Return: the sys_bpf() result passed through libbpf_err_errno().
 */
int bpf_task_fd_query(int pid, int fd, __u32 flags, char *buf, __u32 *buf_len,
		      __u32 *prog_id, __u32 *fd_type, __u64 *probe_offset,
		      __u64 *probe_addr)
{
	const size_t req_sz = offsetofend(union bpf_attr, task_fd_query);
	union bpf_attr req;
	int rc;

	memset(&req, 0, req_sz);
	req.task_fd_query.pid = pid;
	req.task_fd_query.fd = fd;
	req.task_fd_query.flags = flags;
	req.task_fd_query.buf_len = *buf_len;
	req.task_fd_query.buf = ptr_to_u64(buf);

	rc = sys_bpf(BPF_TASK_FD_QUERY, &req, req_sz);

	/* outputs are copied back whatever the syscall returned */
	*prog_id = req.task_fd_query.prog_id;
	*fd_type = req.task_fd_query.fd_type;
	*buf_len = req.task_fd_query.buf_len;
	*probe_addr = req.task_fd_query.probe_addr;
	*probe_offset = req.task_fd_query.probe_offset;

	return libbpf_err_errno(rc);
}
1329
bpf_enable_stats(enum bpf_stats_type type)1330 int bpf_enable_stats(enum bpf_stats_type type)
1331 {
1332 const size_t attr_sz = offsetofend(union bpf_attr, enable_stats);
1333 union bpf_attr attr;
1334 int fd;
1335
1336 memset(&attr, 0, attr_sz);
1337 attr.enable_stats.type = type;
1338
1339 fd = sys_bpf_fd(BPF_ENABLE_STATS, &attr, attr_sz);
1340 return libbpf_err_errno(fd);
1341 }
1342
bpf_prog_bind_map(int prog_fd,int map_fd,const struct bpf_prog_bind_opts * opts)1343 int bpf_prog_bind_map(int prog_fd, int map_fd,
1344 const struct bpf_prog_bind_opts *opts)
1345 {
1346 const size_t attr_sz = offsetofend(union bpf_attr, prog_bind_map);
1347 union bpf_attr attr;
1348 int ret;
1349
1350 if (!OPTS_VALID(opts, bpf_prog_bind_opts))
1351 return libbpf_err(-EINVAL);
1352
1353 memset(&attr, 0, attr_sz);
1354 attr.prog_bind_map.prog_fd = prog_fd;
1355 attr.prog_bind_map.map_fd = map_fd;
1356 attr.prog_bind_map.flags = OPTS_GET(opts, flags, 0);
1357
1358 ret = sys_bpf(BPF_PROG_BIND_MAP, &attr, attr_sz);
1359 return libbpf_err_errno(ret);
1360 }
1361
bpf_token_create(int bpffs_fd,struct bpf_token_create_opts * opts)1362 int bpf_token_create(int bpffs_fd, struct bpf_token_create_opts *opts)
1363 {
1364 const size_t attr_sz = offsetofend(union bpf_attr, token_create);
1365 union bpf_attr attr;
1366 int fd;
1367
1368 if (!OPTS_VALID(opts, bpf_token_create_opts))
1369 return libbpf_err(-EINVAL);
1370
1371 memset(&attr, 0, attr_sz);
1372 attr.token_create.bpffs_fd = bpffs_fd;
1373 attr.token_create.flags = OPTS_GET(opts, flags, 0);
1374
1375 fd = sys_bpf_fd(BPF_TOKEN_CREATE, &attr, attr_sz);
1376 return libbpf_err_errno(fd);
1377 }
1378
/*
 * Issue the BPF_PROG_STREAM_READ_BY_FD command for stream @stream_id of
 * @prog_fd, passing @buf / @buf_len as the destination buffer.
 *
 * @opts is only validated with OPTS_VALID(); no field of it is read here.
 *
 * Return: libbpf_err(-EINVAL) if @opts fails OPTS_VALID(); otherwise the
 * sys_bpf() result passed through libbpf_err_errno().
 */
int bpf_prog_stream_read(int prog_fd, __u32 stream_id, void *buf, __u32 buf_len,
			 struct bpf_prog_stream_read_opts *opts)
{
	const size_t req_sz = offsetofend(union bpf_attr, prog_stream_read);
	union bpf_attr req;
	int rc;

	if (!OPTS_VALID(opts, bpf_prog_stream_read_opts))
		return libbpf_err(-EINVAL);

	memset(&req, 0, req_sz);
	req.prog_stream_read.prog_fd = prog_fd;
	req.prog_stream_read.stream_id = stream_id;
	req.prog_stream_read.stream_buf_len = buf_len;
	req.prog_stream_read.stream_buf = ptr_to_u64(buf);

	rc = sys_bpf(BPF_PROG_STREAM_READ_BY_FD, &req, req_sz);

	return libbpf_err_errno(rc);
}
1398