1 #ifndef __BPF_EXPERIMENTAL__ 2 #define __BPF_EXPERIMENTAL__ 3 4 #include <vmlinux.h> 5 #include <bpf/bpf_tracing.h> 6 #include <bpf/bpf_helpers.h> 7 #include <bpf/bpf_core_read.h> 8 9 #define __contains(name, node) __attribute__((btf_decl_tag("contains:" #name ":" #node))) 10 11 /* Description 12 * Allocates an object of the type represented by 'local_type_id' in 13 * program BTF. User may use the bpf_core_type_id_local macro to pass the 14 * type ID of a struct in program BTF. 15 * 16 * The 'local_type_id' parameter must be a known constant. 17 * The 'meta' parameter is rewritten by the verifier, no need for BPF 18 * program to set it. 19 * Returns 20 * A pointer to an object of the type corresponding to the passed in 21 * 'local_type_id', or NULL on failure. 22 */ 23 extern void *bpf_obj_new_impl(__u64 local_type_id, void *meta) __ksym; 24 25 /* Convenience macro to wrap over bpf_obj_new_impl */ 26 #define bpf_obj_new(type) ((type *)bpf_obj_new_impl(bpf_core_type_id_local(type), NULL)) 27 28 /* Description 29 * Free an allocated object. All fields of the object that require 30 * destruction will be destructed before the storage is freed. 31 * 32 * The 'meta' parameter is rewritten by the verifier, no need for BPF 33 * program to set it. 34 * Returns 35 * Void. 36 */ 37 extern void bpf_obj_drop_impl(void *kptr, void *meta) __ksym; 38 39 /* Convenience macro to wrap over bpf_obj_drop_impl */ 40 #define bpf_obj_drop(kptr) bpf_obj_drop_impl(kptr, NULL) 41 42 /* Description 43 * Increment the refcount on a refcounted local kptr, turning the 44 * non-owning reference input into an owning reference in the process. 45 * 46 * The 'meta' parameter is rewritten by the verifier, no need for BPF 47 * program to set it. 48 * Returns 49 * An owning reference to the object pointed to by 'kptr' 50 */ 51 extern void *bpf_refcount_acquire_impl(void *kptr, void *meta) __ksym; 52 53 /* Convenience macro to wrap over bpf_refcount_acquire_impl */ 54 #define bpf_refcount_acquire(kptr) bpf_refcount_acquire_impl(kptr, NULL) 55 56 /* Description 57 * Add a new entry to the beginning of the BPF linked list. 58 * 59 * The 'meta' and 'off' parameters are rewritten by the verifier, no need 60 * for BPF programs to set them 61 * Returns 62 * 0 if the node was successfully added 63 * -EINVAL if the node wasn't added because it's already in a list 64 */ 65 extern int bpf_list_push_front_impl(struct bpf_list_head *head, 66 struct bpf_list_node *node, 67 void *meta, __u64 off) __ksym; 68 69 /* Convenience macro to wrap over bpf_list_push_front_impl */ 70 #define bpf_list_push_front(head, node) bpf_list_push_front_impl(head, node, NULL, 0) 71 72 /* Description 73 * Add a new entry to the end of the BPF linked list. 74 * 75 * The 'meta' and 'off' parameters are rewritten by the verifier, no need 76 * for BPF programs to set them 77 * Returns 78 * 0 if the node was successfully added 79 * -EINVAL if the node wasn't added because it's already in a list 80 */ 81 extern int bpf_list_push_back_impl(struct bpf_list_head *head, 82 struct bpf_list_node *node, 83 void *meta, __u64 off) __ksym; 84 85 /* Convenience macro to wrap over bpf_list_push_back_impl */ 86 #define bpf_list_push_back(head, node) bpf_list_push_back_impl(head, node, NULL, 0) 87 88 /* Description 89 * Remove the entry at the beginning of the BPF linked list. 90 * Returns 91 * Pointer to bpf_list_node of deleted entry, or NULL if list is empty. 92 */ 93 extern struct bpf_list_node *bpf_list_pop_front(struct bpf_list_head *head) __ksym; 94 95 /* Description 96 * Remove the entry at the end of the BPF linked list. 97 * Returns 98 * Pointer to bpf_list_node of deleted entry, or NULL if list is empty. 99 */ 100 extern struct bpf_list_node *bpf_list_pop_back(struct bpf_list_head *head) __ksym; 101 102 /* Description 103 * Remove 'node' from rbtree with root 'root' 104 * Returns 105 * Pointer to the removed node, or NULL if 'root' didn't contain 'node' 106 */ 107 extern struct bpf_rb_node *bpf_rbtree_remove(struct bpf_rb_root *root, 108 struct bpf_rb_node *node) __ksym; 109 110 /* Description 111 * Add 'node' to rbtree with root 'root' using comparator 'less' 112 * 113 * The 'meta' and 'off' parameters are rewritten by the verifier, no need 114 * for BPF programs to set them 115 * Returns 116 * 0 if the node was successfully added 117 * -EINVAL if the node wasn't added because it's already in a tree 118 */ 119 extern int bpf_rbtree_add_impl(struct bpf_rb_root *root, struct bpf_rb_node *node, 120 bool (less)(struct bpf_rb_node *a, const struct bpf_rb_node *b), 121 void *meta, __u64 off) __ksym; 122 123 /* Convenience macro to wrap over bpf_rbtree_add_impl */ 124 #define bpf_rbtree_add(head, node, less) bpf_rbtree_add_impl(head, node, less, NULL, 0) 125 126 /* Description 127 * Return the first (leftmost) node in input tree 128 * Returns 129 * Pointer to the node, which is _not_ removed from the tree. If the tree 130 * contains no nodes, returns NULL. 131 */ 132 extern struct bpf_rb_node *bpf_rbtree_first(struct bpf_rb_root *root) __ksym; 133 134 /* Description 135 * Allocates a percpu object of the type represented by 'local_type_id' in 136 * program BTF. User may use the bpf_core_type_id_local macro to pass the 137 * type ID of a struct in program BTF. 138 * 139 * The 'local_type_id' parameter must be a known constant. 140 * The 'meta' parameter is rewritten by the verifier, no need for BPF 141 * program to set it. 142 * Returns 143 * A pointer to a percpu object of the type corresponding to the passed in 144 * 'local_type_id', or NULL on failure. 145 */ 146 extern void *bpf_percpu_obj_new_impl(__u64 local_type_id, void *meta) __ksym; 147 148 /* Convenience macro to wrap over bpf_percpu_obj_new_impl */ 149 #define bpf_percpu_obj_new(type) ((type __percpu_kptr *)bpf_percpu_obj_new_impl(bpf_core_type_id_local(type), NULL)) 150 151 /* Description 152 * Free an allocated percpu object. All fields of the object that require 153 * destruction will be destructed before the storage is freed. 154 * 155 * The 'meta' parameter is rewritten by the verifier, no need for BPF 156 * program to set it. 157 * Returns 158 * Void. 159 */ 160 extern void bpf_percpu_obj_drop_impl(void *kptr, void *meta) __ksym; 161 162 struct bpf_iter_task_vma; 163 164 extern int bpf_iter_task_vma_new(struct bpf_iter_task_vma *it, 165 struct task_struct *task, 166 unsigned long addr) __ksym; 167 extern struct vm_area_struct *bpf_iter_task_vma_next(struct bpf_iter_task_vma *it) __ksym; 168 extern void bpf_iter_task_vma_destroy(struct bpf_iter_task_vma *it) __ksym; 169 170 /* Convenience macro to wrap over bpf_obj_drop_impl */ 171 #define bpf_percpu_obj_drop(kptr) bpf_percpu_obj_drop_impl(kptr, NULL) 172 173 /* Description 174 * Throw a BPF exception from the program, immediately terminating its 175 * execution and unwinding the stack. The supplied 'cookie' parameter 176 * will be the return value of the program when an exception is thrown, 177 * and the default exception callback is used. Otherwise, if an exception 178 * callback is set using the '__exception_cb(callback)' declaration tag 179 * on the main program, the 'cookie' parameter will be the callback's only 180 * input argument. 181 * 182 * Thus, in case of default exception callback, 'cookie' is subjected to 183 * constraints on the program's return value (as with R0 on exit). 184 * Otherwise, the return value of the marked exception callback will be 185 * subjected to the same checks. 186 * 187 * Note that throwing an exception with lingering resources (locks, 188 * references, etc.) will lead to a verification error. 189 * 190 * Note that callbacks *cannot* call this helper. 191 * Returns 192 * Never. 193 * Throws 194 * An exception with the specified 'cookie' value. 195 */ 196 extern void bpf_throw(u64 cookie) __ksym; 197 198 /* This macro must be used to mark the exception callback corresponding to the 199 * main program. For example: 200 * 201 * int exception_cb(u64 cookie) { 202 * return cookie; 203 * } 204 * 205 * SEC("tc") 206 * __exception_cb(exception_cb) 207 * int main_prog(struct __sk_buff *ctx) { 208 * ... 209 * return TC_ACT_OK; 210 * } 211 * 212 * Here, exception callback for the main program will be 'exception_cb'. Note 213 * that this attribute can only be used once, and multiple exception callbacks 214 * specified for the main program will lead to verification error. 215 */ 216 #define __exception_cb(name) __attribute__((btf_decl_tag("exception_callback:" #name))) 217 218 #define __bpf_assert_signed(x) _Generic((x), \ 219 unsigned long: 0, \ 220 unsigned long long: 0, \ 221 signed long: 1, \ 222 signed long long: 1 \ 223 ) 224 225 #define __bpf_assert_check(LHS, op, RHS) \ 226 _Static_assert(sizeof(&(LHS)), "1st argument must be an lvalue expression"); \ 227 _Static_assert(sizeof(LHS) == 8, "Only 8-byte integers are supported\n"); \ 228 _Static_assert(__builtin_constant_p(__bpf_assert_signed(LHS)), "internal static assert"); \ 229 _Static_assert(__builtin_constant_p((RHS)), "2nd argument must be a constant expression") 230 231 #define __bpf_assert(LHS, op, cons, RHS, VAL) \ 232 ({ \ 233 (void)bpf_throw; \ 234 asm volatile ("if %[lhs] " op " %[rhs] goto +2; r1 = %[value]; call bpf_throw" \ 235 : : [lhs] "r"(LHS), [rhs] cons(RHS), [value] "ri"(VAL) : ); \ 236 }) 237 238 #define __bpf_assert_op_sign(LHS, op, cons, RHS, VAL, supp_sign) \ 239 ({ \ 240 __bpf_assert_check(LHS, op, RHS); \ 241 if (__bpf_assert_signed(LHS) && !(supp_sign)) \ 242 __bpf_assert(LHS, "s" #op, cons, RHS, VAL); \ 243 else \ 244 __bpf_assert(LHS, #op, cons, RHS, VAL); \ 245 }) 246 247 #define __bpf_assert_op(LHS, op, RHS, VAL, supp_sign) \ 248 ({ \ 249 if (sizeof(typeof(RHS)) == 8) { \ 250 const typeof(RHS) rhs_var = (RHS); \ 251 __bpf_assert_op_sign(LHS, op, "r", rhs_var, VAL, supp_sign); \ 252 } else { \ 253 __bpf_assert_op_sign(LHS, op, "i", RHS, VAL, supp_sign); \ 254 } \ 255 }) 256 257 #define __cmp_cannot_be_signed(x) \ 258 __builtin_strcmp(#x, "==") == 0 || __builtin_strcmp(#x, "!=") == 0 || \ 259 __builtin_strcmp(#x, "&") == 0 260 261 #define __is_signed_type(type) (((type)(-1)) < (type)1) 262 263 #define __bpf_cmp(LHS, OP, PRED, RHS, DEFAULT) \ 264 ({ \ 265 __label__ l_true; \ 266 bool ret = DEFAULT; \ 267 asm volatile goto("if %[lhs] " OP " %[rhs] goto %l[l_true]" \ 268 :: [lhs] "r"((short)LHS), [rhs] PRED (RHS) :: l_true); \ 269 ret = !DEFAULT; \ 270 l_true: \ 271 ret; \ 272 }) 273 274 /* C type conversions coupled with comparison operator are tricky. 275 * Make sure BPF program is compiled with -Wsign-compare then 276 * __lhs OP __rhs below will catch the mistake. 277 * Be aware that we check only __lhs to figure out the sign of compare. 278 */ 279 #define _bpf_cmp(LHS, OP, RHS, UNLIKELY) \ 280 ({ \ 281 typeof(LHS) __lhs = (LHS); \ 282 typeof(RHS) __rhs = (RHS); \ 283 bool ret; \ 284 _Static_assert(sizeof(&(LHS)), "1st argument must be an lvalue expression"); \ 285 (void)(__lhs OP __rhs); \ 286 if (__cmp_cannot_be_signed(OP) || !__is_signed_type(typeof(__lhs))) { \ 287 if (sizeof(__rhs) == 8) \ 288 /* "i" will truncate 64-bit constant into s32, \ 289 * so we have to use extra register via "r". \ 290 */ \ 291 ret = __bpf_cmp(__lhs, #OP, "r", __rhs, UNLIKELY); \ 292 else \ 293 ret = __bpf_cmp(__lhs, #OP, "ri", __rhs, UNLIKELY); \ 294 } else { \ 295 if (sizeof(__rhs) == 8) \ 296 ret = __bpf_cmp(__lhs, "s"#OP, "r", __rhs, UNLIKELY); \ 297 else \ 298 ret = __bpf_cmp(__lhs, "s"#OP, "ri", __rhs, UNLIKELY); \ 299 } \ 300 ret; \ 301 }) 302 303 #ifndef bpf_cmp_unlikely 304 #define bpf_cmp_unlikely(LHS, OP, RHS) _bpf_cmp(LHS, OP, RHS, true) 305 #endif 306 307 #ifndef bpf_cmp_likely 308 #define bpf_cmp_likely(LHS, OP, RHS) \ 309 ({ \ 310 bool ret = 0; \ 311 if (__builtin_strcmp(#OP, "==") == 0) \ 312 ret = _bpf_cmp(LHS, !=, RHS, false); \ 313 else if (__builtin_strcmp(#OP, "!=") == 0) \ 314 ret = _bpf_cmp(LHS, ==, RHS, false); \ 315 else if (__builtin_strcmp(#OP, "<=") == 0) \ 316 ret = _bpf_cmp(LHS, >, RHS, false); \ 317 else if (__builtin_strcmp(#OP, "<") == 0) \ 318 ret = _bpf_cmp(LHS, >=, RHS, false); \ 319 else if (__builtin_strcmp(#OP, ">") == 0) \ 320 ret = _bpf_cmp(LHS, <=, RHS, false); \ 321 else if (__builtin_strcmp(#OP, ">=") == 0) \ 322 ret = _bpf_cmp(LHS, <, RHS, false); \ 323 else \ 324 asm volatile("r0 " #OP " invalid compare"); \ 325 ret; \ 326 }) 327 #endif 328 329 /* 330 * Note that cond_break can only be portably used in the body of a breakable 331 * construct, whereas can_loop can be used anywhere. 332 */ 333 #ifdef __BPF_FEATURE_MAY_GOTO 334 #define can_loop \ 335 ({ __label__ l_break, l_continue; \ 336 bool ret = true; \ 337 asm volatile goto("may_goto %l[l_break]" \ 338 :::: l_break); \ 339 goto l_continue; \ 340 l_break: ret = false; \ 341 l_continue:; \ 342 ret; \ 343 }) 344 345 #define cond_break \ 346 ({ __label__ l_break, l_continue; \ 347 asm volatile goto("may_goto %l[l_break]" \ 348 :::: l_break); \ 349 goto l_continue; \ 350 l_break: break; \ 351 l_continue:; \ 352 }) 353 #else 354 #define can_loop \ 355 ({ __label__ l_break, l_continue; \ 356 bool ret = true; \ 357 asm volatile goto("1:.byte 0xe5; \ 358 .byte 0; \ 359 .long ((%l[l_break] - 1b - 8) / 8) & 0xffff; \ 360 .short 0" \ 361 :::: l_break); \ 362 goto l_continue; \ 363 l_break: ret = false; \ 364 l_continue:; \ 365 ret; \ 366 }) 367 368 #define cond_break \ 369 ({ __label__ l_break, l_continue; \ 370 asm volatile goto("1:.byte 0xe5; \ 371 .byte 0; \ 372 .long ((%l[l_break] - 1b - 8) / 8) & 0xffff; \ 373 .short 0" \ 374 :::: l_break); \ 375 goto l_continue; \ 376 l_break: break; \ 377 l_continue:; \ 378 }) 379 #endif 380 381 #ifndef bpf_nop_mov 382 #define bpf_nop_mov(var) \ 383 asm volatile("%[reg]=%[reg]"::[reg]"r"((short)var)) 384 #endif 385 386 /* emit instruction: 387 * rX = rX .off = BPF_ADDR_SPACE_CAST .imm32 = (dst_as << 16) | src_as 388 */ 389 #ifndef bpf_addr_space_cast 390 #define bpf_addr_space_cast(var, dst_as, src_as)\ 391 asm volatile(".byte 0xBF; \ 392 .ifc %[reg], r0; \ 393 .byte 0x00; \ 394 .endif; \ 395 .ifc %[reg], r1; \ 396 .byte 0x11; \ 397 .endif; \ 398 .ifc %[reg], r2; \ 399 .byte 0x22; \ 400 .endif; \ 401 .ifc %[reg], r3; \ 402 .byte 0x33; \ 403 .endif; \ 404 .ifc %[reg], r4; \ 405 .byte 0x44; \ 406 .endif; \ 407 .ifc %[reg], r5; \ 408 .byte 0x55; \ 409 .endif; \ 410 .ifc %[reg], r6; \ 411 .byte 0x66; \ 412 .endif; \ 413 .ifc %[reg], r7; \ 414 .byte 0x77; \ 415 .endif; \ 416 .ifc %[reg], r8; \ 417 .byte 0x88; \ 418 .endif; \ 419 .ifc %[reg], r9; \ 420 .byte 0x99; \ 421 .endif; \ 422 .short %[off]; \ 423 .long %[as]" \ 424 : [reg]"+r"(var) \ 425 : [off]"i"(BPF_ADDR_SPACE_CAST) \ 426 , [as]"i"((dst_as << 16) | src_as)); 427 #endif 428 429 void bpf_preempt_disable(void) __weak __ksym; 430 void bpf_preempt_enable(void) __weak __ksym; 431 432 typedef struct { 433 } __bpf_preempt_t; 434 435 static inline __bpf_preempt_t __bpf_preempt_constructor(void) 436 { 437 __bpf_preempt_t ret = {}; 438 439 bpf_preempt_disable(); 440 return ret; 441 } 442 static inline void __bpf_preempt_destructor(__bpf_preempt_t *t) 443 { 444 bpf_preempt_enable(); 445 } 446 #define bpf_guard_preempt() \ 447 __bpf_preempt_t ___bpf_apply(preempt, __COUNTER__) \ 448 __attribute__((__unused__, __cleanup__(__bpf_preempt_destructor))) = \ 449 __bpf_preempt_constructor() 450 451 /* Description 452 * Assert that a conditional expression is true. 453 * Returns 454 * Void. 455 * Throws 456 * An exception with the value zero when the assertion fails. 457 */ 458 #define bpf_assert(cond) if (!(cond)) bpf_throw(0); 459 460 /* Description 461 * Assert that a conditional expression is true. 462 * Returns 463 * Void. 464 * Throws 465 * An exception with the specified value when the assertion fails. 466 */ 467 #define bpf_assert_with(cond, value) if (!(cond)) bpf_throw(value); 468 469 /* Description 470 * Assert that LHS is in the range [BEG, END] (inclusive of both). This 471 * statement updates the known bounds of LHS during verification. Note 472 * that both BEG and END must be constant values, and must fit within the 473 * data type of LHS. 474 * Returns 475 * Void. 476 * Throws 477 * An exception with the value zero when the assertion fails. 478 */ 479 #define bpf_assert_range(LHS, BEG, END) \ 480 ({ \ 481 _Static_assert(BEG <= END, "BEG must be <= END"); \ 482 barrier_var(LHS); \ 483 __bpf_assert_op(LHS, >=, BEG, 0, false); \ 484 __bpf_assert_op(LHS, <=, END, 0, false); \ 485 }) 486 487 /* Description 488 * Assert that LHS is in the range [BEG, END] (inclusive of both). This 489 * statement updates the known bounds of LHS during verification. Note 490 * that both BEG and END must be constant values, and must fit within the 491 * data type of LHS. 492 * Returns 493 * Void. 494 * Throws 495 * An exception with the specified value when the assertion fails. 496 */ 497 #define bpf_assert_range_with(LHS, BEG, END, value) \ 498 ({ \ 499 _Static_assert(BEG <= END, "BEG must be <= END"); \ 500 barrier_var(LHS); \ 501 __bpf_assert_op(LHS, >=, BEG, value, false); \ 502 __bpf_assert_op(LHS, <=, END, value, false); \ 503 }) 504 505 struct bpf_iter_css_task; 506 struct cgroup_subsys_state; 507 extern int bpf_iter_css_task_new(struct bpf_iter_css_task *it, 508 struct cgroup_subsys_state *css, unsigned int flags) __weak __ksym; 509 extern struct task_struct *bpf_iter_css_task_next(struct bpf_iter_css_task *it) __weak __ksym; 510 extern void bpf_iter_css_task_destroy(struct bpf_iter_css_task *it) __weak __ksym; 511 512 struct bpf_iter_task; 513 extern int bpf_iter_task_new(struct bpf_iter_task *it, 514 struct task_struct *task, unsigned int flags) __weak __ksym; 515 extern struct task_struct *bpf_iter_task_next(struct bpf_iter_task *it) __weak __ksym; 516 extern void bpf_iter_task_destroy(struct bpf_iter_task *it) __weak __ksym; 517 518 struct bpf_iter_css; 519 extern int bpf_iter_css_new(struct bpf_iter_css *it, 520 struct cgroup_subsys_state *start, unsigned int flags) __weak __ksym; 521 extern struct cgroup_subsys_state *bpf_iter_css_next(struct bpf_iter_css *it) __weak __ksym; 522 extern void bpf_iter_css_destroy(struct bpf_iter_css *it) __weak __ksym; 523 524 extern int bpf_wq_init(struct bpf_wq *wq, void *p__map, unsigned int flags) __weak __ksym; 525 extern int bpf_wq_start(struct bpf_wq *wq, unsigned int flags) __weak __ksym; 526 extern int bpf_wq_set_callback_impl(struct bpf_wq *wq, 527 int (callback_fn)(void *map, int *key, struct bpf_wq *wq), 528 unsigned int flags__k, void *aux__ign) __ksym; 529 #define bpf_wq_set_callback(timer, cb, flags) \ 530 bpf_wq_set_callback_impl(timer, cb, flags, NULL) 531 #endif 532