1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause) 2 /* Copyright (c) 2021 Facebook */ 3 #include <stdio.h> 4 #include <stdlib.h> 5 #include <string.h> 6 #include <errno.h> 7 #include <asm/byteorder.h> 8 #include <linux/filter.h> 9 #include <sys/param.h> 10 #include "btf.h" 11 #include "bpf.h" 12 #include "libbpf.h" 13 #include "libbpf_internal.h" 14 #include "hashmap.h" 15 #include "bpf_gen_internal.h" 16 #include "skel_internal.h" 17 18 #define MAX_USED_MAPS 64 19 #define MAX_USED_PROGS 32 20 #define MAX_KFUNC_DESCS 256 21 #define MAX_FD_ARRAY_SZ (MAX_USED_MAPS + MAX_KFUNC_DESCS) 22 23 /* The following structure describes the stack layout of the loader program. 24 * In addition R6 contains the pointer to context. 25 * R7 contains the result of the last sys_bpf command (typically error or FD). 26 * R9 contains the result of the last sys_close command. 27 * 28 * Naming convention: 29 * ctx - bpf program context 30 * stack - bpf program stack 31 * blob - bpf_attr-s, strings, insns, map data. 32 * All the bytes that loader prog will use for read/write. 33 */ 34 struct loader_stack { 35 __u32 btf_fd; 36 __u32 inner_map_fd; 37 __u32 prog_fd[MAX_USED_PROGS]; 38 }; 39 40 #define stack_off(field) \ 41 (__s16)(-sizeof(struct loader_stack) + offsetof(struct loader_stack, field)) 42 43 #define attr_field(attr, field) (attr + offsetof(union bpf_attr, field)) 44 45 static int blob_fd_array_off(struct bpf_gen *gen, int index) 46 { 47 return gen->fd_array + index * sizeof(int); 48 } 49 50 static int realloc_insn_buf(struct bpf_gen *gen, __u32 size) 51 { 52 size_t off = gen->insn_cur - gen->insn_start; 53 void *insn_start; 54 55 if (gen->error) 56 return gen->error; 57 if (size > INT32_MAX || off + size > INT32_MAX) { 58 gen->error = -ERANGE; 59 return -ERANGE; 60 } 61 insn_start = realloc(gen->insn_start, off + size); 62 if (!insn_start) { 63 gen->error = -ENOMEM; 64 free(gen->insn_start); 65 gen->insn_start = NULL; 66 return -ENOMEM; 67 } 68 gen->insn_start = insn_start; 69 gen->insn_cur = insn_start + off; 70 return 0; 71 } 72 73 static int realloc_data_buf(struct bpf_gen *gen, __u32 size) 74 { 75 size_t off = gen->data_cur - gen->data_start; 76 void *data_start; 77 78 if (gen->error) 79 return gen->error; 80 if (size > INT32_MAX || off + size > INT32_MAX) { 81 gen->error = -ERANGE; 82 return -ERANGE; 83 } 84 data_start = realloc(gen->data_start, off + size); 85 if (!data_start) { 86 gen->error = -ENOMEM; 87 free(gen->data_start); 88 gen->data_start = NULL; 89 return -ENOMEM; 90 } 91 gen->data_start = data_start; 92 gen->data_cur = data_start + off; 93 return 0; 94 } 95 96 static void emit(struct bpf_gen *gen, struct bpf_insn insn) 97 { 98 if (realloc_insn_buf(gen, sizeof(insn))) 99 return; 100 memcpy(gen->insn_cur, &insn, sizeof(insn)); 101 gen->insn_cur += sizeof(insn); 102 } 103 104 static void emit2(struct bpf_gen *gen, struct bpf_insn insn1, struct bpf_insn insn2) 105 { 106 emit(gen, insn1); 107 emit(gen, insn2); 108 } 109 110 static int add_data(struct bpf_gen *gen, const void *data, __u32 size); 111 static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off); 112 static void emit_signature_match(struct bpf_gen *gen); 113 114 void bpf_gen__init(struct bpf_gen *gen, int log_level, int nr_progs, int nr_maps) 115 { 116 size_t stack_sz = sizeof(struct loader_stack), nr_progs_sz; 117 int i; 118 119 gen->fd_array = add_data(gen, NULL, MAX_FD_ARRAY_SZ * sizeof(int)); 120 gen->log_level = log_level; 121 /* save ctx pointer into R6 */ 122 emit(gen, BPF_MOV64_REG(BPF_REG_6, BPF_REG_1)); 123 124 /* bzero stack */ 125 emit(gen, BPF_MOV64_REG(BPF_REG_1, BPF_REG_10)); 126 emit(gen, BPF_ALU64_IMM(BPF_ADD, BPF_REG_1, -stack_sz)); 127 emit(gen, BPF_MOV64_IMM(BPF_REG_2, stack_sz)); 128 emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0)); 129 emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel)); 130 131 /* amount of stack actually used, only used to calculate iterations, not stack offset */ 132 nr_progs_sz = offsetof(struct loader_stack, prog_fd[nr_progs]); 133 /* jump over cleanup code */ 134 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 135 /* size of cleanup code below (including map fd cleanup) */ 136 (nr_progs_sz / 4) * 3 + 2 + 137 /* 6 insns for emit_sys_close_blob, 138 * 6 insns for debug_regs in emit_sys_close_blob 139 */ 140 nr_maps * (6 + (gen->log_level ? 6 : 0)))); 141 142 /* remember the label where all error branches will jump to */ 143 gen->cleanup_label = gen->insn_cur - gen->insn_start; 144 /* emit cleanup code: close all temp FDs */ 145 for (i = 0; i < nr_progs_sz; i += 4) { 146 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, -stack_sz + i)); 147 emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0, 1)); 148 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close)); 149 } 150 for (i = 0; i < nr_maps; i++) 151 emit_sys_close_blob(gen, blob_fd_array_off(gen, i)); 152 /* R7 contains the error code from sys_bpf. Copy it into R0 and exit. */ 153 emit(gen, BPF_MOV64_REG(BPF_REG_0, BPF_REG_7)); 154 emit(gen, BPF_EXIT_INSN()); 155 if (OPTS_GET(gen->opts, gen_hash, false)) 156 emit_signature_match(gen); 157 } 158 159 static int add_data(struct bpf_gen *gen, const void *data, __u32 size) 160 { 161 __u32 size8 = roundup(size, 8); 162 __u64 zero = 0; 163 void *prev; 164 165 if (realloc_data_buf(gen, size8)) 166 return 0; 167 prev = gen->data_cur; 168 if (data) { 169 memcpy(gen->data_cur, data, size); 170 memcpy(gen->data_cur + size, &zero, size8 - size); 171 } else { 172 memset(gen->data_cur, 0, size8); 173 } 174 gen->data_cur += size8; 175 return prev - gen->data_start; 176 } 177 178 /* Get index for map_fd/btf_fd slot in reserved fd_array, or in data relative 179 * to start of fd_array. Caller can decide if it is usable or not. 180 */ 181 static int add_map_fd(struct bpf_gen *gen) 182 { 183 if (gen->nr_maps == MAX_USED_MAPS) { 184 pr_warn("Total maps exceeds %d\n", MAX_USED_MAPS); 185 gen->error = -E2BIG; 186 return 0; 187 } 188 return gen->nr_maps++; 189 } 190 191 static int add_kfunc_btf_fd(struct bpf_gen *gen) 192 { 193 int cur; 194 195 if (gen->nr_fd_array == MAX_KFUNC_DESCS) { 196 cur = add_data(gen, NULL, sizeof(int)); 197 return (cur - gen->fd_array) / sizeof(int); 198 } 199 return MAX_USED_MAPS + gen->nr_fd_array++; 200 } 201 202 static int insn_bytes_to_bpf_size(__u32 sz) 203 { 204 switch (sz) { 205 case 8: return BPF_DW; 206 case 4: return BPF_W; 207 case 2: return BPF_H; 208 case 1: return BPF_B; 209 default: return -1; 210 } 211 } 212 213 /* *(u64 *)(blob + off) = (u64)(void *)(blob + data) */ 214 static void emit_rel_store(struct bpf_gen *gen, int off, int data) 215 { 216 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE, 217 0, 0, 0, data)); 218 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 219 0, 0, 0, off)); 220 emit(gen, BPF_STX_MEM(BPF_DW, BPF_REG_1, BPF_REG_0, 0)); 221 } 222 223 static void move_blob2blob(struct bpf_gen *gen, int off, int size, int blob_off) 224 { 225 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE, 226 0, 0, 0, blob_off)); 227 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_2, 0)); 228 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 229 0, 0, 0, off)); 230 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0)); 231 } 232 233 static void move_blob2ctx(struct bpf_gen *gen, int ctx_off, int size, int blob_off) 234 { 235 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 236 0, 0, 0, blob_off)); 237 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_1, 0)); 238 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off)); 239 } 240 241 static void move_ctx2blob(struct bpf_gen *gen, int off, int size, int ctx_off, 242 bool check_non_zero) 243 { 244 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_6, ctx_off)); 245 if (check_non_zero) 246 /* If value in ctx is zero don't update the blob. 247 * For example: when ctx->map.max_entries == 0, keep default max_entries from bpf.c 248 */ 249 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_0, 0, 3)); 250 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 251 0, 0, 0, off)); 252 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0)); 253 } 254 255 static void move_stack2blob(struct bpf_gen *gen, int off, int size, int stack_off) 256 { 257 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off)); 258 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 259 0, 0, 0, off)); 260 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0)); 261 } 262 263 static void move_stack2ctx(struct bpf_gen *gen, int ctx_off, int size, int stack_off) 264 { 265 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off)); 266 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off)); 267 } 268 269 static void emit_sys_bpf(struct bpf_gen *gen, int cmd, int attr, int attr_size) 270 { 271 emit(gen, BPF_MOV64_IMM(BPF_REG_1, cmd)); 272 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE, 273 0, 0, 0, attr)); 274 emit(gen, BPF_MOV64_IMM(BPF_REG_3, attr_size)); 275 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_bpf)); 276 /* remember the result in R7 */ 277 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0)); 278 } 279 280 static bool is_simm16(__s64 value) 281 { 282 return value == (__s64)(__s16)value; 283 } 284 285 static void emit_check_err(struct bpf_gen *gen) 286 { 287 __s64 off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 1; 288 289 /* R7 contains result of last sys_bpf command. 290 * if (R7 < 0) goto cleanup; 291 */ 292 if (is_simm16(off)) { 293 emit(gen, BPF_JMP_IMM(BPF_JSLT, BPF_REG_7, 0, off)); 294 } else { 295 gen->error = -ERANGE; 296 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, -1)); 297 } 298 } 299 300 /* reg1 and reg2 should not be R1 - R5. They can be R0, R6 - R10 */ 301 static void emit_debug(struct bpf_gen *gen, int reg1, int reg2, 302 const char *fmt, va_list args) 303 { 304 char buf[1024]; 305 int addr, len, ret; 306 307 if (!gen->log_level) 308 return; 309 ret = vsnprintf(buf, sizeof(buf), fmt, args); 310 if (ret < 1024 - 7 && reg1 >= 0 && reg2 < 0) 311 /* The special case to accommodate common debug_ret(): 312 * to avoid specifying BPF_REG_7 and adding " r=%%d" to 313 * prints explicitly. 314 */ 315 strcat(buf, " r=%d"); 316 len = strlen(buf) + 1; 317 addr = add_data(gen, buf, len); 318 319 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 320 0, 0, 0, addr)); 321 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len)); 322 if (reg1 >= 0) 323 emit(gen, BPF_MOV64_REG(BPF_REG_3, reg1)); 324 if (reg2 >= 0) 325 emit(gen, BPF_MOV64_REG(BPF_REG_4, reg2)); 326 emit(gen, BPF_EMIT_CALL(BPF_FUNC_trace_printk)); 327 } 328 329 static void debug_regs(struct bpf_gen *gen, int reg1, int reg2, const char *fmt, ...) 330 { 331 va_list args; 332 333 va_start(args, fmt); 334 emit_debug(gen, reg1, reg2, fmt, args); 335 va_end(args); 336 } 337 338 static void debug_ret(struct bpf_gen *gen, const char *fmt, ...) 339 { 340 va_list args; 341 342 va_start(args, fmt); 343 emit_debug(gen, BPF_REG_7, -1, fmt, args); 344 va_end(args); 345 } 346 347 static void __emit_sys_close(struct bpf_gen *gen) 348 { 349 emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0, 350 /* 2 is the number of the following insns 351 * * 6 is additional insns in debug_regs 352 */ 353 2 + (gen->log_level ? 6 : 0))); 354 emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_1)); 355 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close)); 356 debug_regs(gen, BPF_REG_9, BPF_REG_0, "close(%%d) = %%d"); 357 } 358 359 static void emit_sys_close_stack(struct bpf_gen *gen, int stack_off) 360 { 361 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, stack_off)); 362 __emit_sys_close(gen); 363 } 364 365 static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off) 366 { 367 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE, 368 0, 0, 0, blob_off)); 369 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_0, 0)); 370 __emit_sys_close(gen); 371 } 372 373 static void compute_sha_update_offsets(struct bpf_gen *gen); 374 375 int bpf_gen__finish(struct bpf_gen *gen, int nr_progs, int nr_maps) 376 { 377 int i; 378 379 if (nr_progs < gen->nr_progs || nr_maps != gen->nr_maps) { 380 pr_warn("nr_progs %d/%d nr_maps %d/%d mismatch\n", 381 nr_progs, gen->nr_progs, nr_maps, gen->nr_maps); 382 gen->error = -EFAULT; 383 return gen->error; 384 } 385 emit_sys_close_stack(gen, stack_off(btf_fd)); 386 for (i = 0; i < gen->nr_progs; i++) 387 move_stack2ctx(gen, 388 sizeof(struct bpf_loader_ctx) + 389 sizeof(struct bpf_map_desc) * gen->nr_maps + 390 sizeof(struct bpf_prog_desc) * i + 391 offsetof(struct bpf_prog_desc, prog_fd), 4, 392 stack_off(prog_fd[i])); 393 for (i = 0; i < gen->nr_maps; i++) 394 move_blob2ctx(gen, 395 sizeof(struct bpf_loader_ctx) + 396 sizeof(struct bpf_map_desc) * i + 397 offsetof(struct bpf_map_desc, map_fd), 4, 398 blob_fd_array_off(gen, i)); 399 emit(gen, BPF_MOV64_IMM(BPF_REG_0, 0)); 400 emit(gen, BPF_EXIT_INSN()); 401 if (OPTS_GET(gen->opts, gen_hash, false)) 402 compute_sha_update_offsets(gen); 403 404 pr_debug("gen: finish %s\n", errstr(gen->error)); 405 if (!gen->error) { 406 struct gen_loader_opts *opts = gen->opts; 407 408 opts->insns = gen->insn_start; 409 opts->insns_sz = gen->insn_cur - gen->insn_start; 410 opts->data = gen->data_start; 411 opts->data_sz = gen->data_cur - gen->data_start; 412 413 /* use target endianness for embedded loader */ 414 if (gen->swapped_endian) { 415 struct bpf_insn *insn = (struct bpf_insn *)opts->insns; 416 int insn_cnt = opts->insns_sz / sizeof(struct bpf_insn); 417 418 for (i = 0; i < insn_cnt; i++) 419 bpf_insn_bswap(insn++); 420 } 421 } 422 return gen->error; 423 } 424 425 void bpf_gen__free(struct bpf_gen *gen) 426 { 427 if (!gen) 428 return; 429 free(gen->data_start); 430 free(gen->insn_start); 431 free(gen); 432 } 433 434 /* 435 * Fields of bpf_attr are set to values in native byte-order before being 436 * written to the target-bound data blob, and may need endian conversion. 437 * This macro allows providing the correct value in situ more simply than 438 * writing a separate converter for *all fields* of *all records* included 439 * in union bpf_attr. Note that sizeof(rval) should match the assignment 440 * target to avoid runtime problems. 441 */ 442 #define tgt_endian(rval) ({ \ 443 typeof(rval) _val = (rval); \ 444 if (gen->swapped_endian) { \ 445 switch (sizeof(_val)) { \ 446 case 1: break; \ 447 case 2: _val = bswap_16(_val); break; \ 448 case 4: _val = bswap_32(_val); break; \ 449 case 8: _val = bswap_64(_val); break; \ 450 default: pr_warn("unsupported bswap size!\n"); \ 451 } \ 452 } \ 453 _val; \ 454 }) 455 456 static void compute_sha_update_offsets(struct bpf_gen *gen) 457 { 458 __u64 sha[SHA256_DWORD_SIZE]; 459 __u64 sha_dw; 460 int i; 461 462 libbpf_sha256(gen->data_start, gen->data_cur - gen->data_start, (__u8 *)sha); 463 for (i = 0; i < SHA256_DWORD_SIZE; i++) { 464 struct bpf_insn *insn = 465 (struct bpf_insn *)(gen->insn_start + gen->hash_insn_offset[i]); 466 sha_dw = tgt_endian(sha[i]); 467 insn[0].imm = (__u32)sha_dw; 468 insn[1].imm = sha_dw >> 32; 469 } 470 } 471 472 void bpf_gen__load_btf(struct bpf_gen *gen, const void *btf_raw_data, 473 __u32 btf_raw_size) 474 { 475 int attr_size = offsetofend(union bpf_attr, btf_log_level); 476 int btf_data, btf_load_attr; 477 union bpf_attr attr; 478 479 memset(&attr, 0, attr_size); 480 btf_data = add_data(gen, btf_raw_data, btf_raw_size); 481 482 attr.btf_size = tgt_endian(btf_raw_size); 483 btf_load_attr = add_data(gen, &attr, attr_size); 484 pr_debug("gen: load_btf: off %d size %d, attr: off %d size %d\n", 485 btf_data, btf_raw_size, btf_load_attr, attr_size); 486 487 /* populate union bpf_attr with user provided log details */ 488 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_level), 4, 489 offsetof(struct bpf_loader_ctx, log_level), false); 490 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_size), 4, 491 offsetof(struct bpf_loader_ctx, log_size), false); 492 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_buf), 8, 493 offsetof(struct bpf_loader_ctx, log_buf), false); 494 /* populate union bpf_attr with a pointer to the BTF data */ 495 emit_rel_store(gen, attr_field(btf_load_attr, btf), btf_data); 496 /* emit BTF_LOAD command */ 497 emit_sys_bpf(gen, BPF_BTF_LOAD, btf_load_attr, attr_size); 498 debug_ret(gen, "btf_load size %d", btf_raw_size); 499 emit_check_err(gen); 500 /* remember btf_fd in the stack, if successful */ 501 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7, stack_off(btf_fd))); 502 } 503 504 void bpf_gen__map_create(struct bpf_gen *gen, 505 enum bpf_map_type map_type, 506 const char *map_name, 507 __u32 key_size, __u32 value_size, __u32 max_entries, 508 struct bpf_map_create_opts *map_attr, int map_idx) 509 { 510 int attr_size = offsetofend(union bpf_attr, map_extra); 511 bool close_inner_map_fd = false; 512 int map_create_attr, idx; 513 union bpf_attr attr; 514 515 memset(&attr, 0, attr_size); 516 attr.map_type = tgt_endian(map_type); 517 attr.key_size = tgt_endian(key_size); 518 attr.value_size = tgt_endian(value_size); 519 attr.map_flags = tgt_endian(map_attr->map_flags); 520 attr.map_extra = tgt_endian(map_attr->map_extra); 521 if (map_name) 522 libbpf_strlcpy(attr.map_name, map_name, sizeof(attr.map_name)); 523 attr.numa_node = tgt_endian(map_attr->numa_node); 524 attr.map_ifindex = tgt_endian(map_attr->map_ifindex); 525 attr.max_entries = tgt_endian(max_entries); 526 attr.btf_key_type_id = tgt_endian(map_attr->btf_key_type_id); 527 attr.btf_value_type_id = tgt_endian(map_attr->btf_value_type_id); 528 529 map_create_attr = add_data(gen, &attr, attr_size); 530 pr_debug("gen: map_create: %s idx %d type %d value_type_id %d, attr: off %d size %d\n", 531 map_name, map_idx, map_type, map_attr->btf_value_type_id, 532 map_create_attr, attr_size); 533 534 if (map_attr->btf_value_type_id) 535 /* populate union bpf_attr with btf_fd saved in the stack earlier */ 536 move_stack2blob(gen, attr_field(map_create_attr, btf_fd), 4, 537 stack_off(btf_fd)); 538 switch (map_type) { 539 case BPF_MAP_TYPE_ARRAY_OF_MAPS: 540 case BPF_MAP_TYPE_HASH_OF_MAPS: 541 move_stack2blob(gen, attr_field(map_create_attr, inner_map_fd), 4, 542 stack_off(inner_map_fd)); 543 close_inner_map_fd = true; 544 break; 545 default: 546 break; 547 } 548 /* conditionally update max_entries */ 549 if (map_idx >= 0) 550 move_ctx2blob(gen, attr_field(map_create_attr, max_entries), 4, 551 sizeof(struct bpf_loader_ctx) + 552 sizeof(struct bpf_map_desc) * map_idx + 553 offsetof(struct bpf_map_desc, max_entries), 554 true /* check that max_entries != 0 */); 555 /* emit MAP_CREATE command */ 556 emit_sys_bpf(gen, BPF_MAP_CREATE, map_create_attr, attr_size); 557 debug_ret(gen, "map_create %s idx %d type %d value_size %d value_btf_id %d", 558 map_name, map_idx, map_type, value_size, 559 map_attr->btf_value_type_id); 560 emit_check_err(gen); 561 /* remember map_fd in the stack, if successful */ 562 if (map_idx < 0) { 563 /* This bpf_gen__map_create() function is called with map_idx >= 0 564 * for all maps that libbpf loading logic tracks. 565 * It's called with -1 to create an inner map. 566 */ 567 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7, 568 stack_off(inner_map_fd))); 569 } else if (map_idx != gen->nr_maps) { 570 gen->error = -EDOM; /* internal bug */ 571 return; 572 } else { 573 /* add_map_fd does gen->nr_maps++ */ 574 idx = add_map_fd(gen); 575 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 576 0, 0, 0, blob_fd_array_off(gen, idx))); 577 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_1, BPF_REG_7, 0)); 578 } 579 if (close_inner_map_fd) 580 emit_sys_close_stack(gen, stack_off(inner_map_fd)); 581 } 582 583 static void emit_signature_match(struct bpf_gen *gen) 584 { 585 __s64 off; 586 int i; 587 588 for (i = 0; i < SHA256_DWORD_SIZE; i++) { 589 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX, 590 0, 0, 0, 0)); 591 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_2, BPF_REG_1, i * sizeof(__u64))); 592 gen->hash_insn_offset[i] = gen->insn_cur - gen->insn_start; 593 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_3, 0, 0, 0, 0, 0)); 594 595 off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 2; 596 if (is_simm16(off)) { 597 emit(gen, BPF_MOV64_IMM(BPF_REG_7, -EINVAL)); 598 emit(gen, BPF_JMP_REG(BPF_JNE, BPF_REG_2, BPF_REG_3, off)); 599 } else { 600 gen->error = -ERANGE; 601 } 602 } 603 } 604 605 void bpf_gen__record_attach_target(struct bpf_gen *gen, const char *attach_name, 606 enum bpf_attach_type type) 607 { 608 const char *prefix; 609 int kind, ret; 610 611 btf_get_kernel_prefix_kind(type, &prefix, &kind); 612 gen->attach_kind = kind; 613 ret = snprintf(gen->attach_target, sizeof(gen->attach_target), "%s%s", 614 prefix, attach_name); 615 if (ret >= sizeof(gen->attach_target)) 616 gen->error = -ENOSPC; 617 } 618 619 static void emit_find_attach_target(struct bpf_gen *gen) 620 { 621 int name, len = strlen(gen->attach_target) + 1; 622 623 pr_debug("gen: find_attach_tgt %s %d\n", gen->attach_target, gen->attach_kind); 624 name = add_data(gen, gen->attach_target, len); 625 626 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 627 0, 0, 0, name)); 628 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len)); 629 emit(gen, BPF_MOV64_IMM(BPF_REG_3, gen->attach_kind)); 630 emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0)); 631 emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind)); 632 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0)); 633 debug_ret(gen, "find_by_name_kind(%s,%d)", 634 gen->attach_target, gen->attach_kind); 635 emit_check_err(gen); 636 /* if successful, btf_id is in lower 32-bit of R7 and 637 * btf_obj_fd is in upper 32-bit 638 */ 639 } 640 641 void bpf_gen__record_extern(struct bpf_gen *gen, const char *name, bool is_weak, 642 bool is_typeless, bool is_ld64, int kind, int insn_idx) 643 { 644 struct ksym_relo_desc *relo; 645 646 relo = libbpf_reallocarray(gen->relos, gen->relo_cnt + 1, sizeof(*relo)); 647 if (!relo) { 648 gen->error = -ENOMEM; 649 return; 650 } 651 gen->relos = relo; 652 relo += gen->relo_cnt; 653 relo->name = name; 654 relo->is_weak = is_weak; 655 relo->is_typeless = is_typeless; 656 relo->is_ld64 = is_ld64; 657 relo->kind = kind; 658 relo->insn_idx = insn_idx; 659 gen->relo_cnt++; 660 } 661 662 /* returns existing ksym_desc with ref incremented, or inserts a new one */ 663 static struct ksym_desc *get_ksym_desc(struct bpf_gen *gen, struct ksym_relo_desc *relo) 664 { 665 struct ksym_desc *kdesc; 666 int i; 667 668 for (i = 0; i < gen->nr_ksyms; i++) { 669 kdesc = &gen->ksyms[i]; 670 if (kdesc->kind == relo->kind && kdesc->is_ld64 == relo->is_ld64 && 671 !strcmp(kdesc->name, relo->name)) { 672 kdesc->ref++; 673 return kdesc; 674 } 675 } 676 kdesc = libbpf_reallocarray(gen->ksyms, gen->nr_ksyms + 1, sizeof(*kdesc)); 677 if (!kdesc) { 678 gen->error = -ENOMEM; 679 return NULL; 680 } 681 gen->ksyms = kdesc; 682 kdesc = &gen->ksyms[gen->nr_ksyms++]; 683 kdesc->name = relo->name; 684 kdesc->kind = relo->kind; 685 kdesc->ref = 1; 686 kdesc->off = 0; 687 kdesc->insn = 0; 688 kdesc->is_ld64 = relo->is_ld64; 689 return kdesc; 690 } 691 692 /* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7} 693 * Returns result in BPF_REG_7 694 */ 695 static void emit_bpf_find_by_name_kind(struct bpf_gen *gen, struct ksym_relo_desc *relo) 696 { 697 int name_off, len = strlen(relo->name) + 1; 698 699 name_off = add_data(gen, relo->name, len); 700 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 701 0, 0, 0, name_off)); 702 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len)); 703 emit(gen, BPF_MOV64_IMM(BPF_REG_3, relo->kind)); 704 emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0)); 705 emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind)); 706 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0)); 707 debug_ret(gen, "find_by_name_kind(%s,%d)", relo->name, relo->kind); 708 } 709 710 /* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7} 711 * Returns result in BPF_REG_7 712 * Returns u64 symbol addr in BPF_REG_9 713 */ 714 static void emit_bpf_kallsyms_lookup_name(struct bpf_gen *gen, struct ksym_relo_desc *relo) 715 { 716 int name_off, len = strlen(relo->name) + 1, res_off; 717 718 name_off = add_data(gen, relo->name, len); 719 res_off = add_data(gen, NULL, 8); /* res is u64 */ 720 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 721 0, 0, 0, name_off)); 722 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len)); 723 emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0)); 724 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_4, BPF_PSEUDO_MAP_IDX_VALUE, 725 0, 0, 0, res_off)); 726 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_4)); 727 emit(gen, BPF_EMIT_CALL(BPF_FUNC_kallsyms_lookup_name)); 728 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_9, BPF_REG_7, 0)); 729 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0)); 730 debug_ret(gen, "kallsyms_lookup_name(%s,%d)", relo->name, relo->kind); 731 } 732 733 /* Expects: 734 * BPF_REG_8 - pointer to instruction 735 * 736 * We need to reuse BTF fd for same symbol otherwise each relocation takes a new 737 * index, while kernel limits total kfunc BTFs to 256. For duplicate symbols, 738 * this would mean a new BTF fd index for each entry. By pairing symbol name 739 * with index, we get the insn->imm, insn->off pairing that kernel uses for 740 * kfunc_tab, which becomes the effective limit even though all of them may 741 * share same index in fd_array (such that kfunc_btf_tab has 1 element). 742 */ 743 static void emit_relo_kfunc_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn) 744 { 745 struct ksym_desc *kdesc; 746 int btf_fd_idx; 747 748 kdesc = get_ksym_desc(gen, relo); 749 if (!kdesc) 750 return; 751 /* try to copy from existing bpf_insn */ 752 if (kdesc->ref > 1) { 753 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4, 754 kdesc->insn + offsetof(struct bpf_insn, imm)); 755 move_blob2blob(gen, insn + offsetof(struct bpf_insn, off), 2, 756 kdesc->insn + offsetof(struct bpf_insn, off)); 757 goto log; 758 } 759 /* remember insn offset, so we can copy BTF ID and FD later */ 760 kdesc->insn = insn; 761 emit_bpf_find_by_name_kind(gen, relo); 762 if (!relo->is_weak) 763 emit_check_err(gen); 764 /* get index in fd_array to store BTF FD at */ 765 btf_fd_idx = add_kfunc_btf_fd(gen); 766 if (btf_fd_idx > INT16_MAX) { 767 pr_warn("BTF fd off %d for kfunc %s exceeds INT16_MAX, cannot process relocation\n", 768 btf_fd_idx, relo->name); 769 gen->error = -E2BIG; 770 return; 771 } 772 kdesc->off = btf_fd_idx; 773 /* jump to success case */ 774 emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3)); 775 /* set value for imm, off as 0 */ 776 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0)); 777 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0)); 778 /* skip success case for ret < 0 */ 779 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 10)); 780 /* store btf_id into insn[insn_idx].imm */ 781 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm))); 782 /* obtain fd in BPF_REG_9 */ 783 emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_7)); 784 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32)); 785 /* load fd_array slot pointer */ 786 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE, 787 0, 0, 0, blob_fd_array_off(gen, btf_fd_idx))); 788 /* store BTF fd in slot, 0 for vmlinux */ 789 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_9, 0)); 790 /* jump to insn[insn_idx].off store if fd denotes module BTF */ 791 emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_9, 0, 2)); 792 /* set the default value for off */ 793 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0)); 794 /* skip BTF fd store for vmlinux BTF */ 795 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1)); 796 /* store index into insn[insn_idx].off */ 797 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), btf_fd_idx)); 798 log: 799 if (!gen->log_level) 800 return; 801 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8, 802 offsetof(struct bpf_insn, imm))); 803 emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8, 804 offsetof(struct bpf_insn, off))); 805 debug_regs(gen, BPF_REG_7, BPF_REG_9, " func (%s:count=%d): imm: %%d, off: %%d", 806 relo->name, kdesc->ref); 807 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE, 808 0, 0, 0, blob_fd_array_off(gen, kdesc->off))); 809 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_9, BPF_REG_0, 0)); 810 debug_regs(gen, BPF_REG_9, -1, " func (%s:count=%d): btf_fd", 811 relo->name, kdesc->ref); 812 } 813 814 static void emit_ksym_relo_log(struct bpf_gen *gen, struct ksym_relo_desc *relo, 815 int ref) 816 { 817 if (!gen->log_level) 818 return; 819 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8, 820 offsetof(struct bpf_insn, imm))); 821 emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8, sizeof(struct bpf_insn) + 822 offsetof(struct bpf_insn, imm))); 823 debug_regs(gen, BPF_REG_7, BPF_REG_9, " var t=%d w=%d (%s:count=%d): imm[0]: %%d, imm[1]: %%d", 824 relo->is_typeless, relo->is_weak, relo->name, ref); 825 emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code))); 826 debug_regs(gen, BPF_REG_9, -1, " var t=%d w=%d (%s:count=%d): insn.reg", 827 relo->is_typeless, relo->is_weak, relo->name, ref); 828 } 829 830 /* Expects: 831 * BPF_REG_8 - pointer to instruction 832 */ 833 static void emit_relo_ksym_typeless(struct bpf_gen *gen, 834 struct ksym_relo_desc *relo, int insn) 835 { 836 struct ksym_desc *kdesc; 837 838 kdesc = get_ksym_desc(gen, relo); 839 if (!kdesc) 840 return; 841 /* try to copy from existing ldimm64 insn */ 842 if (kdesc->ref > 1) { 843 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4, 844 kdesc->insn + offsetof(struct bpf_insn, imm)); 845 move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4, 846 kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)); 847 goto log; 848 } 849 /* remember insn offset, so we can copy ksym addr later */ 850 kdesc->insn = insn; 851 /* skip typeless ksym_desc in fd closing loop in cleanup_relos */ 852 kdesc->typeless = true; 853 emit_bpf_kallsyms_lookup_name(gen, relo); 854 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_7, -ENOENT, 1)); 855 emit_check_err(gen); 856 /* store lower half of addr into insn[insn_idx].imm */ 857 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9, offsetof(struct bpf_insn, imm))); 858 /* store upper half of addr into insn[insn_idx + 1].imm */ 859 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32)); 860 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9, 861 sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm))); 862 log: 863 emit_ksym_relo_log(gen, relo, kdesc->ref); 864 } 865 866 static __u32 src_reg_mask(struct bpf_gen *gen) 867 { 868 #if defined(__LITTLE_ENDIAN_BITFIELD) /* src_reg,dst_reg,... */ 869 return gen->swapped_endian ? 0xf0 : 0x0f; 870 #elif defined(__BIG_ENDIAN_BITFIELD) /* dst_reg,src_reg,... */ 871 return gen->swapped_endian ? 0x0f : 0xf0; 872 #else 873 #error "Unsupported bit endianness, cannot proceed" 874 #endif 875 } 876 877 /* Expects: 878 * BPF_REG_8 - pointer to instruction 879 */ 880 static void emit_relo_ksym_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn) 881 { 882 struct ksym_desc *kdesc; 883 __u32 reg_mask; 884 885 kdesc = get_ksym_desc(gen, relo); 886 if (!kdesc) 887 return; 888 /* try to copy from existing ldimm64 insn */ 889 if (kdesc->ref > 1) { 890 move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4, 891 kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)); 892 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4, 893 kdesc->insn + offsetof(struct bpf_insn, imm)); 894 /* jump over src_reg adjustment if imm (btf_id) is not 0, reuse BPF_REG_0 from move_blob2blob 895 * If btf_id is zero, clear BPF_PSEUDO_BTF_ID flag in src_reg of ld_imm64 insn 896 */ 897 emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, 3)); 898 goto clear_src_reg; 899 } 900 /* remember insn offset, so we can copy BTF ID and FD later */ 901 kdesc->insn = insn; 902 emit_bpf_find_by_name_kind(gen, relo); 903 if (!relo->is_weak) 904 emit_check_err(gen); 905 /* jump to success case */ 906 emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3)); 907 /* set values for insn[insn_idx].imm, insn[insn_idx + 1].imm as 0 */ 908 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0)); 909 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 0)); 910 /* skip success case for ret < 0 */ 911 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 4)); 912 /* store btf_id into insn[insn_idx].imm */ 913 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm))); 914 /* store btf_obj_fd into insn[insn_idx + 1].imm */ 915 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32)); 916 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, 917 sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm))); 918 /* skip src_reg adjustment */ 919 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 3)); 920 clear_src_reg: 921 /* clear bpf_object__relocate_data's src_reg assignment, otherwise we get a verifier failure */ 922 reg_mask = src_reg_mask(gen); 923 emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code))); 924 emit(gen, BPF_ALU32_IMM(BPF_AND, BPF_REG_9, reg_mask)); 925 emit(gen, BPF_STX_MEM(BPF_B, BPF_REG_8, BPF_REG_9, offsetofend(struct bpf_insn, code))); 926 927 emit_ksym_relo_log(gen, relo, kdesc->ref); 928 } 929 930 void bpf_gen__record_relo_core(struct bpf_gen *gen, 931 const struct bpf_core_relo *core_relo) 932 { 933 struct bpf_core_relo *relos; 934 935 relos = libbpf_reallocarray(gen->core_relos, gen->core_relo_cnt + 1, sizeof(*relos)); 936 if (!relos) { 937 gen->error = -ENOMEM; 938 return; 939 } 940 gen->core_relos = relos; 941 relos += gen->core_relo_cnt; 942 memcpy(relos, core_relo, sizeof(*relos)); 943 gen->core_relo_cnt++; 944 } 945 946 static void emit_relo(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insns) 947 { 948 int insn; 949 950 pr_debug("gen: emit_relo (%d): %s at %d %s\n", 951 relo->kind, relo->name, relo->insn_idx, relo->is_ld64 ? "ld64" : "call"); 952 insn = insns + sizeof(struct bpf_insn) * relo->insn_idx; 953 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_8, BPF_PSEUDO_MAP_IDX_VALUE, 0, 0, 0, insn)); 954 if (relo->is_ld64) { 955 if (relo->is_typeless) 956 emit_relo_ksym_typeless(gen, relo, insn); 957 else 958 emit_relo_ksym_btf(gen, relo, insn); 959 } else { 960 emit_relo_kfunc_btf(gen, relo, insn); 961 } 962 } 963 964 static void emit_relos(struct bpf_gen *gen, int insns) 965 { 966 int i; 967 968 for (i = 0; i < gen->relo_cnt; i++) 969 emit_relo(gen, gen->relos + i, insns); 970 } 971 972 static void cleanup_core_relo(struct bpf_gen *gen) 973 { 974 if (!gen->core_relo_cnt) 975 return; 976 free(gen->core_relos); 977 gen->core_relo_cnt = 0; 978 gen->core_relos = NULL; 979 } 980 981 static void cleanup_relos(struct bpf_gen *gen, int insns) 982 { 983 struct ksym_desc *kdesc; 984 int i, insn; 985 986 for (i = 0; i < gen->nr_ksyms; i++) { 987 kdesc = &gen->ksyms[i]; 988 /* only close fds for typed ksyms and kfuncs */ 989 if (kdesc->is_ld64 && !kdesc->typeless) { 990 /* close fd recorded in insn[insn_idx + 1].imm */ 991 insn = kdesc->insn; 992 insn += sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm); 993 emit_sys_close_blob(gen, insn); 994 } else if (!kdesc->is_ld64) { 995 emit_sys_close_blob(gen, blob_fd_array_off(gen, kdesc->off)); 996 if (kdesc->off < MAX_FD_ARRAY_SZ) 997 gen->nr_fd_array--; 998 } 999 } 1000 if (gen->nr_ksyms) { 1001 free(gen->ksyms); 1002 gen->nr_ksyms = 0; 1003 gen->ksyms = NULL; 1004 } 1005 if (gen->relo_cnt) { 1006 free(gen->relos); 1007 gen->relo_cnt = 0; 1008 gen->relos = NULL; 1009 } 1010 cleanup_core_relo(gen); 1011 } 1012 1013 /* Convert func, line, and core relo info blobs to target endianness */ 1014 static void info_blob_bswap(struct bpf_gen *gen, int func_info, int line_info, 1015 int core_relos, struct bpf_prog_load_opts *load_attr) 1016 { 1017 struct bpf_func_info *fi = gen->data_start + func_info; 1018 struct bpf_line_info *li = gen->data_start + line_info; 1019 struct bpf_core_relo *cr = gen->data_start + core_relos; 1020 int i; 1021 1022 for (i = 0; i < load_attr->func_info_cnt; i++) 1023 bpf_func_info_bswap(fi++); 1024 1025 for (i = 0; i < load_attr->line_info_cnt; i++) 1026 bpf_line_info_bswap(li++); 1027 1028 for (i = 0; i < gen->core_relo_cnt; i++) 1029 bpf_core_relo_bswap(cr++); 1030 } 1031 1032 void bpf_gen__prog_load(struct bpf_gen *gen, 1033 enum bpf_prog_type prog_type, const char *prog_name, 1034 const char *license, struct bpf_insn *insns, size_t insn_cnt, 1035 struct bpf_prog_load_opts *load_attr, int prog_idx) 1036 { 1037 int func_info_tot_sz = load_attr->func_info_cnt * 1038 load_attr->func_info_rec_size; 1039 int line_info_tot_sz = load_attr->line_info_cnt * 1040 load_attr->line_info_rec_size; 1041 int core_relo_tot_sz = gen->core_relo_cnt * 1042 sizeof(struct bpf_core_relo); 1043 int prog_load_attr, license_off, insns_off, func_info, line_info, core_relos; 1044 int attr_size = offsetofend(union bpf_attr, core_relo_rec_size); 1045 union bpf_attr attr; 1046 1047 memset(&attr, 0, attr_size); 1048 /* add license string to blob of bytes */ 1049 license_off = add_data(gen, license, strlen(license) + 1); 1050 /* add insns to blob of bytes */ 1051 insns_off = add_data(gen, insns, insn_cnt * sizeof(struct bpf_insn)); 1052 pr_debug("gen: prog_load: prog_idx %d type %d insn off %d insns_cnt %zd license off %d\n", 1053 prog_idx, prog_type, insns_off, insn_cnt, license_off); 1054 1055 /* convert blob insns to target endianness */ 1056 if (gen->swapped_endian) { 1057 struct bpf_insn *insn = gen->data_start + insns_off; 1058 int i; 1059 1060 for (i = 0; i < insn_cnt; i++, insn++) 1061 bpf_insn_bswap(insn); 1062 } 1063 1064 attr.prog_type = tgt_endian(prog_type); 1065 attr.expected_attach_type = tgt_endian(load_attr->expected_attach_type); 1066 attr.attach_btf_id = tgt_endian(load_attr->attach_btf_id); 1067 attr.prog_ifindex = tgt_endian(load_attr->prog_ifindex); 1068 attr.kern_version = 0; 1069 attr.insn_cnt = tgt_endian((__u32)insn_cnt); 1070 attr.prog_flags = tgt_endian(load_attr->prog_flags); 1071 1072 attr.func_info_rec_size = tgt_endian(load_attr->func_info_rec_size); 1073 attr.func_info_cnt = tgt_endian(load_attr->func_info_cnt); 1074 func_info = add_data(gen, load_attr->func_info, func_info_tot_sz); 1075 pr_debug("gen: prog_load: func_info: off %d cnt %d rec size %d\n", 1076 func_info, load_attr->func_info_cnt, 1077 load_attr->func_info_rec_size); 1078 1079 attr.line_info_rec_size = tgt_endian(load_attr->line_info_rec_size); 1080 attr.line_info_cnt = tgt_endian(load_attr->line_info_cnt); 1081 line_info = add_data(gen, load_attr->line_info, line_info_tot_sz); 1082 pr_debug("gen: prog_load: line_info: off %d cnt %d rec size %d\n", 1083 line_info, load_attr->line_info_cnt, 1084 load_attr->line_info_rec_size); 1085 1086 attr.core_relo_rec_size = tgt_endian((__u32)sizeof(struct bpf_core_relo)); 1087 attr.core_relo_cnt = tgt_endian(gen->core_relo_cnt); 1088 core_relos = add_data(gen, gen->core_relos, core_relo_tot_sz); 1089 pr_debug("gen: prog_load: core_relos: off %d cnt %d rec size %zd\n", 1090 core_relos, gen->core_relo_cnt, 1091 sizeof(struct bpf_core_relo)); 1092 1093 /* convert all info blobs to target endianness */ 1094 if (gen->swapped_endian) 1095 info_blob_bswap(gen, func_info, line_info, core_relos, load_attr); 1096 1097 libbpf_strlcpy(attr.prog_name, prog_name, sizeof(attr.prog_name)); 1098 prog_load_attr = add_data(gen, &attr, attr_size); 1099 pr_debug("gen: prog_load: attr: off %d size %d\n", 1100 prog_load_attr, attr_size); 1101 1102 /* populate union bpf_attr with a pointer to license */ 1103 emit_rel_store(gen, attr_field(prog_load_attr, license), license_off); 1104 1105 /* populate union bpf_attr with a pointer to instructions */ 1106 emit_rel_store(gen, attr_field(prog_load_attr, insns), insns_off); 1107 1108 /* populate union bpf_attr with a pointer to func_info */ 1109 emit_rel_store(gen, attr_field(prog_load_attr, func_info), func_info); 1110 1111 /* populate union bpf_attr with a pointer to line_info */ 1112 emit_rel_store(gen, attr_field(prog_load_attr, line_info), line_info); 1113 1114 /* populate union bpf_attr with a pointer to core_relos */ 1115 emit_rel_store(gen, attr_field(prog_load_attr, core_relos), core_relos); 1116 1117 /* populate union bpf_attr fd_array with a pointer to data where map_fds are saved */ 1118 emit_rel_store(gen, attr_field(prog_load_attr, fd_array), gen->fd_array); 1119 1120 /* populate union bpf_attr with user provided log details */ 1121 move_ctx2blob(gen, attr_field(prog_load_attr, log_level), 4, 1122 offsetof(struct bpf_loader_ctx, log_level), false); 1123 move_ctx2blob(gen, attr_field(prog_load_attr, log_size), 4, 1124 offsetof(struct bpf_loader_ctx, log_size), false); 1125 move_ctx2blob(gen, attr_field(prog_load_attr, log_buf), 8, 1126 offsetof(struct bpf_loader_ctx, log_buf), false); 1127 /* populate union bpf_attr with btf_fd saved in the stack earlier */ 1128 move_stack2blob(gen, attr_field(prog_load_attr, prog_btf_fd), 4, 1129 stack_off(btf_fd)); 1130 if (gen->attach_kind) { 1131 emit_find_attach_target(gen); 1132 /* populate union bpf_attr with btf_id and btf_obj_fd found by helper */ 1133 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE, 1134 0, 0, 0, prog_load_attr)); 1135 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7, 1136 offsetof(union bpf_attr, attach_btf_id))); 1137 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32)); 1138 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7, 1139 offsetof(union bpf_attr, attach_btf_obj_fd))); 1140 } 1141 emit_relos(gen, insns_off); 1142 /* emit PROG_LOAD command */ 1143 emit_sys_bpf(gen, BPF_PROG_LOAD, prog_load_attr, attr_size); 1144 debug_ret(gen, "prog_load %s insn_cnt %d", attr.prog_name, attr.insn_cnt); 1145 /* successful or not, close btf module FDs used in extern ksyms and attach_btf_obj_fd */ 1146 cleanup_relos(gen, insns_off); 1147 if (gen->attach_kind) { 1148 emit_sys_close_blob(gen, 1149 attr_field(prog_load_attr, attach_btf_obj_fd)); 1150 gen->attach_kind = 0; 1151 } 1152 emit_check_err(gen); 1153 /* remember prog_fd in the stack, if successful */ 1154 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7, 1155 stack_off(prog_fd[gen->nr_progs]))); 1156 gen->nr_progs++; 1157 } 1158 1159 void bpf_gen__map_update_elem(struct bpf_gen *gen, int map_idx, void *pvalue, 1160 __u32 value_size) 1161 { 1162 int attr_size = offsetofend(union bpf_attr, flags); 1163 int map_update_attr, value, key; 1164 union bpf_attr attr; 1165 int zero = 0; 1166 1167 memset(&attr, 0, attr_size); 1168 1169 value = add_data(gen, pvalue, value_size); 1170 key = add_data(gen, &zero, sizeof(zero)); 1171 1172 /* if (map_desc[map_idx].initial_value) { 1173 * if (ctx->flags & BPF_SKEL_KERNEL) 1174 * bpf_probe_read_kernel(value, value_size, initial_value); 1175 * else 1176 * bpf_copy_from_user(value, value_size, initial_value); 1177 * } 1178 */ 1179 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_3, BPF_REG_6, 1180 sizeof(struct bpf_loader_ctx) + 1181 sizeof(struct bpf_map_desc) * map_idx + 1182 offsetof(struct bpf_map_desc, initial_value))); 1183 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_3, 0, 8)); 1184 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE, 1185 0, 0, 0, value)); 1186 emit(gen, BPF_MOV64_IMM(BPF_REG_2, value_size)); 1187 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_0, BPF_REG_6, 1188 offsetof(struct bpf_loader_ctx, flags))); 1189 emit(gen, BPF_JMP_IMM(BPF_JSET, BPF_REG_0, BPF_SKEL_KERNEL, 2)); 1190 emit(gen, BPF_EMIT_CALL(BPF_FUNC_copy_from_user)); 1191 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1)); 1192 emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel)); 1193 1194 map_update_attr = add_data(gen, &attr, attr_size); 1195 pr_debug("gen: map_update_elem: idx %d, value: off %d size %d, attr: off %d size %d\n", 1196 map_idx, value, value_size, map_update_attr, attr_size); 1197 move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4, 1198 blob_fd_array_off(gen, map_idx)); 1199 emit_rel_store(gen, attr_field(map_update_attr, key), key); 1200 emit_rel_store(gen, attr_field(map_update_attr, value), value); 1201 /* emit MAP_UPDATE_ELEM command */ 1202 emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size); 1203 debug_ret(gen, "update_elem idx %d value_size %d", map_idx, value_size); 1204 emit_check_err(gen); 1205 } 1206 1207 void bpf_gen__populate_outer_map(struct bpf_gen *gen, int outer_map_idx, int slot, 1208 int inner_map_idx) 1209 { 1210 int attr_size = offsetofend(union bpf_attr, flags); 1211 int map_update_attr, key; 1212 union bpf_attr attr; 1213 int tgt_slot; 1214 1215 memset(&attr, 0, attr_size); 1216 1217 tgt_slot = tgt_endian(slot); 1218 key = add_data(gen, &tgt_slot, sizeof(tgt_slot)); 1219 1220 map_update_attr = add_data(gen, &attr, attr_size); 1221 pr_debug("gen: populate_outer_map: outer %d key %d inner %d, attr: off %d size %d\n", 1222 outer_map_idx, slot, inner_map_idx, map_update_attr, attr_size); 1223 move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4, 1224 blob_fd_array_off(gen, outer_map_idx)); 1225 emit_rel_store(gen, attr_field(map_update_attr, key), key); 1226 emit_rel_store(gen, attr_field(map_update_attr, value), 1227 blob_fd_array_off(gen, inner_map_idx)); 1228 1229 /* emit MAP_UPDATE_ELEM command */ 1230 emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size); 1231 debug_ret(gen, "populate_outer_map outer %d key %d inner %d", 1232 outer_map_idx, slot, inner_map_idx); 1233 emit_check_err(gen); 1234 } 1235 1236 void bpf_gen__map_freeze(struct bpf_gen *gen, int map_idx) 1237 { 1238 int attr_size = offsetofend(union bpf_attr, map_fd); 1239 int map_freeze_attr; 1240 union bpf_attr attr; 1241 1242 memset(&attr, 0, attr_size); 1243 map_freeze_attr = add_data(gen, &attr, attr_size); 1244 pr_debug("gen: map_freeze: idx %d, attr: off %d size %d\n", 1245 map_idx, map_freeze_attr, attr_size); 1246 move_blob2blob(gen, attr_field(map_freeze_attr, map_fd), 4, 1247 blob_fd_array_off(gen, map_idx)); 1248 /* emit MAP_FREEZE command */ 1249 emit_sys_bpf(gen, BPF_MAP_FREEZE, map_freeze_attr, attr_size); 1250 debug_ret(gen, "map_freeze"); 1251 emit_check_err(gen); 1252 } 1253