1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2 /* Copyright (c) 2021 Facebook */
3 #include <stdio.h>
4 #include <stdlib.h>
5 #include <string.h>
6 #include <errno.h>
7 #include <asm/byteorder.h>
8 #include <linux/filter.h>
9 #include <sys/param.h>
10 #include "btf.h"
11 #include "bpf.h"
12 #include "libbpf.h"
13 #include "libbpf_internal.h"
14 #include "hashmap.h"
15 #include "bpf_gen_internal.h"
16 #include "skel_internal.h"
17
18 #define MAX_USED_MAPS 64
19 #define MAX_USED_PROGS 32
20 #define MAX_KFUNC_DESCS 256
21 #define MAX_FD_ARRAY_SZ (MAX_USED_MAPS + MAX_KFUNC_DESCS)
22
23 /* The following structure describes the stack layout of the loader program.
24 * In addition R6 contains the pointer to context.
25 * R7 contains the result of the last sys_bpf command (typically error or FD).
26 * R9 contains the result of the last sys_close command.
27 *
28 * Naming convention:
29 * ctx - bpf program context
30 * stack - bpf program stack
31 * blob - bpf_attr-s, strings, insns, map data.
32 * All the bytes that loader prog will use for read/write.
33 */
34 struct loader_stack {
35 __u32 btf_fd;
36 __u32 inner_map_fd;
37 __u32 prog_fd[MAX_USED_PROGS];
38 };
39
40 #define stack_off(field) \
41 (__s16)(-sizeof(struct loader_stack) + offsetof(struct loader_stack, field))
42
43 #define attr_field(attr, field) (attr + offsetof(union bpf_attr, field))
44
blob_fd_array_off(struct bpf_gen * gen,int index)45 static int blob_fd_array_off(struct bpf_gen *gen, int index)
46 {
47 return gen->fd_array + index * sizeof(int);
48 }
49
realloc_insn_buf(struct bpf_gen * gen,__u32 size)50 static int realloc_insn_buf(struct bpf_gen *gen, __u32 size)
51 {
52 size_t off = gen->insn_cur - gen->insn_start;
53 void *insn_start;
54
55 if (gen->error)
56 return gen->error;
57 if (size > INT32_MAX || off + size > INT32_MAX) {
58 gen->error = -ERANGE;
59 return -ERANGE;
60 }
61 insn_start = realloc(gen->insn_start, off + size);
62 if (!insn_start) {
63 gen->error = -ENOMEM;
64 free(gen->insn_start);
65 gen->insn_start = NULL;
66 return -ENOMEM;
67 }
68 gen->insn_start = insn_start;
69 gen->insn_cur = insn_start + off;
70 return 0;
71 }
72
realloc_data_buf(struct bpf_gen * gen,__u32 size)73 static int realloc_data_buf(struct bpf_gen *gen, __u32 size)
74 {
75 size_t off = gen->data_cur - gen->data_start;
76 void *data_start;
77
78 if (gen->error)
79 return gen->error;
80 if (size > INT32_MAX || off + size > INT32_MAX) {
81 gen->error = -ERANGE;
82 return -ERANGE;
83 }
84 data_start = realloc(gen->data_start, off + size);
85 if (!data_start) {
86 gen->error = -ENOMEM;
87 free(gen->data_start);
88 gen->data_start = NULL;
89 return -ENOMEM;
90 }
91 gen->data_start = data_start;
92 gen->data_cur = data_start + off;
93 return 0;
94 }
95
emit(struct bpf_gen * gen,struct bpf_insn insn)96 static void emit(struct bpf_gen *gen, struct bpf_insn insn)
97 {
98 if (realloc_insn_buf(gen, sizeof(insn)))
99 return;
100 memcpy(gen->insn_cur, &insn, sizeof(insn));
101 gen->insn_cur += sizeof(insn);
102 }
103
emit2(struct bpf_gen * gen,struct bpf_insn insn1,struct bpf_insn insn2)104 static void emit2(struct bpf_gen *gen, struct bpf_insn insn1, struct bpf_insn insn2)
105 {
106 emit(gen, insn1);
107 emit(gen, insn2);
108 }
109
110 static int add_data(struct bpf_gen *gen, const void *data, __u32 size);
111 static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off);
112 static void emit_signature_match(struct bpf_gen *gen);
113
bpf_gen__init(struct bpf_gen * gen,int log_level,int nr_progs,int nr_maps)114 void bpf_gen__init(struct bpf_gen *gen, int log_level, int nr_progs, int nr_maps)
115 {
116 size_t stack_sz = sizeof(struct loader_stack), nr_progs_sz;
117 int i;
118
119 gen->fd_array = add_data(gen, NULL, MAX_FD_ARRAY_SZ * sizeof(int));
120 gen->log_level = log_level;
121 /* save ctx pointer into R6 */
122 emit(gen, BPF_MOV64_REG(BPF_REG_6, BPF_REG_1));
123
124 /* bzero stack */
125 emit(gen, BPF_MOV64_REG(BPF_REG_1, BPF_REG_10));
126 emit(gen, BPF_ALU64_IMM(BPF_ADD, BPF_REG_1, -stack_sz));
127 emit(gen, BPF_MOV64_IMM(BPF_REG_2, stack_sz));
128 emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0));
129 emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel));
130
131 /* amount of stack actually used, only used to calculate iterations, not stack offset */
132 nr_progs_sz = offsetof(struct loader_stack, prog_fd[nr_progs]);
133 /* jump over cleanup code */
134 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0,
135 /* size of cleanup code below (including map fd cleanup) */
136 (nr_progs_sz / 4) * 3 + 2 +
137 /* 6 insns for emit_sys_close_blob,
138 * 6 insns for debug_regs in emit_sys_close_blob
139 */
140 nr_maps * (6 + (gen->log_level ? 6 : 0))));
141
142 /* remember the label where all error branches will jump to */
143 gen->cleanup_label = gen->insn_cur - gen->insn_start;
144 /* emit cleanup code: close all temp FDs */
145 for (i = 0; i < nr_progs_sz; i += 4) {
146 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, -stack_sz + i));
147 emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0, 1));
148 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close));
149 }
150 for (i = 0; i < nr_maps; i++)
151 emit_sys_close_blob(gen, blob_fd_array_off(gen, i));
152 /* R7 contains the error code from sys_bpf. Copy it into R0 and exit. */
153 emit(gen, BPF_MOV64_REG(BPF_REG_0, BPF_REG_7));
154 emit(gen, BPF_EXIT_INSN());
155 if (OPTS_GET(gen->opts, gen_hash, false))
156 emit_signature_match(gen);
157 }
158
add_data(struct bpf_gen * gen,const void * data,__u32 size)159 static int add_data(struct bpf_gen *gen, const void *data, __u32 size)
160 {
161 __u32 size8 = roundup(size, 8);
162 __u64 zero = 0;
163 void *prev;
164
165 if (realloc_data_buf(gen, size8))
166 return 0;
167 prev = gen->data_cur;
168 if (data) {
169 memcpy(gen->data_cur, data, size);
170 memcpy(gen->data_cur + size, &zero, size8 - size);
171 } else {
172 memset(gen->data_cur, 0, size8);
173 }
174 gen->data_cur += size8;
175 return prev - gen->data_start;
176 }
177
178 /* Get index for map_fd/btf_fd slot in reserved fd_array, or in data relative
179 * to start of fd_array. Caller can decide if it is usable or not.
180 */
add_map_fd(struct bpf_gen * gen)181 static int add_map_fd(struct bpf_gen *gen)
182 {
183 if (gen->nr_maps == MAX_USED_MAPS) {
184 pr_warn("Total maps exceeds %d\n", MAX_USED_MAPS);
185 gen->error = -E2BIG;
186 return 0;
187 }
188 return gen->nr_maps++;
189 }
190
add_kfunc_btf_fd(struct bpf_gen * gen)191 static int add_kfunc_btf_fd(struct bpf_gen *gen)
192 {
193 int cur;
194
195 if (gen->nr_fd_array == MAX_KFUNC_DESCS) {
196 cur = add_data(gen, NULL, sizeof(int));
197 return (cur - gen->fd_array) / sizeof(int);
198 }
199 return MAX_USED_MAPS + gen->nr_fd_array++;
200 }
201
insn_bytes_to_bpf_size(__u32 sz)202 static int insn_bytes_to_bpf_size(__u32 sz)
203 {
204 switch (sz) {
205 case 8: return BPF_DW;
206 case 4: return BPF_W;
207 case 2: return BPF_H;
208 case 1: return BPF_B;
209 default: return -1;
210 }
211 }
212
213 /* *(u64 *)(blob + off) = (u64)(void *)(blob + data) */
emit_rel_store(struct bpf_gen * gen,int off,int data)214 static void emit_rel_store(struct bpf_gen *gen, int off, int data)
215 {
216 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
217 0, 0, 0, data));
218 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
219 0, 0, 0, off));
220 emit(gen, BPF_STX_MEM(BPF_DW, BPF_REG_1, BPF_REG_0, 0));
221 }
222
move_blob2blob(struct bpf_gen * gen,int off,int size,int blob_off)223 static void move_blob2blob(struct bpf_gen *gen, int off, int size, int blob_off)
224 {
225 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE,
226 0, 0, 0, blob_off));
227 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_2, 0));
228 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
229 0, 0, 0, off));
230 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
231 }
232
move_blob2ctx(struct bpf_gen * gen,int ctx_off,int size,int blob_off)233 static void move_blob2ctx(struct bpf_gen *gen, int ctx_off, int size, int blob_off)
234 {
235 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
236 0, 0, 0, blob_off));
237 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_1, 0));
238 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off));
239 }
240
move_ctx2blob(struct bpf_gen * gen,int off,int size,int ctx_off,bool check_non_zero)241 static void move_ctx2blob(struct bpf_gen *gen, int off, int size, int ctx_off,
242 bool check_non_zero)
243 {
244 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_6, ctx_off));
245 if (check_non_zero)
246 /* If value in ctx is zero don't update the blob.
247 * For example: when ctx->map.max_entries == 0, keep default max_entries from bpf.c
248 */
249 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_0, 0, 3));
250 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
251 0, 0, 0, off));
252 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
253 }
254
move_stack2blob(struct bpf_gen * gen,int off,int size,int stack_off)255 static void move_stack2blob(struct bpf_gen *gen, int off, int size, int stack_off)
256 {
257 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off));
258 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
259 0, 0, 0, off));
260 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
261 }
262
move_stack2ctx(struct bpf_gen * gen,int ctx_off,int size,int stack_off)263 static void move_stack2ctx(struct bpf_gen *gen, int ctx_off, int size, int stack_off)
264 {
265 emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off));
266 emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off));
267 }
268
emit_sys_bpf(struct bpf_gen * gen,int cmd,int attr,int attr_size)269 static void emit_sys_bpf(struct bpf_gen *gen, int cmd, int attr, int attr_size)
270 {
271 emit(gen, BPF_MOV64_IMM(BPF_REG_1, cmd));
272 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE,
273 0, 0, 0, attr));
274 emit(gen, BPF_MOV64_IMM(BPF_REG_3, attr_size));
275 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_bpf));
276 /* remember the result in R7 */
277 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
278 }
279
is_simm16(__s64 value)280 static bool is_simm16(__s64 value)
281 {
282 return value == (__s64)(__s16)value;
283 }
284
emit_check_err(struct bpf_gen * gen)285 static void emit_check_err(struct bpf_gen *gen)
286 {
287 __s64 off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 1;
288
289 /* R7 contains result of last sys_bpf command.
290 * if (R7 < 0) goto cleanup;
291 */
292 if (is_simm16(off)) {
293 emit(gen, BPF_JMP_IMM(BPF_JSLT, BPF_REG_7, 0, off));
294 } else {
295 gen->error = -ERANGE;
296 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, -1));
297 }
298 }
299
300 /* reg1 and reg2 should not be R1 - R5. They can be R0, R6 - R10 */
emit_debug(struct bpf_gen * gen,int reg1,int reg2,const char * fmt,va_list args)301 static void emit_debug(struct bpf_gen *gen, int reg1, int reg2,
302 const char *fmt, va_list args)
303 {
304 char buf[1024];
305 int addr, len, ret;
306
307 if (!gen->log_level)
308 return;
309 ret = vsnprintf(buf, sizeof(buf), fmt, args);
310 if (ret < 1024 - 7 && reg1 >= 0 && reg2 < 0)
311 /* The special case to accommodate common debug_ret():
312 * to avoid specifying BPF_REG_7 and adding " r=%%d" to
313 * prints explicitly.
314 */
315 strcat(buf, " r=%d");
316 len = strlen(buf) + 1;
317 addr = add_data(gen, buf, len);
318
319 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
320 0, 0, 0, addr));
321 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
322 if (reg1 >= 0)
323 emit(gen, BPF_MOV64_REG(BPF_REG_3, reg1));
324 if (reg2 >= 0)
325 emit(gen, BPF_MOV64_REG(BPF_REG_4, reg2));
326 emit(gen, BPF_EMIT_CALL(BPF_FUNC_trace_printk));
327 }
328
debug_regs(struct bpf_gen * gen,int reg1,int reg2,const char * fmt,...)329 static void debug_regs(struct bpf_gen *gen, int reg1, int reg2, const char *fmt, ...)
330 {
331 va_list args;
332
333 va_start(args, fmt);
334 emit_debug(gen, reg1, reg2, fmt, args);
335 va_end(args);
336 }
337
debug_ret(struct bpf_gen * gen,const char * fmt,...)338 static void debug_ret(struct bpf_gen *gen, const char *fmt, ...)
339 {
340 va_list args;
341
342 va_start(args, fmt);
343 emit_debug(gen, BPF_REG_7, -1, fmt, args);
344 va_end(args);
345 }
346
__emit_sys_close(struct bpf_gen * gen)347 static void __emit_sys_close(struct bpf_gen *gen)
348 {
349 emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0,
350 /* 2 is the number of the following insns
351 * * 6 is additional insns in debug_regs
352 */
353 2 + (gen->log_level ? 6 : 0)));
354 emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_1));
355 emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close));
356 debug_regs(gen, BPF_REG_9, BPF_REG_0, "close(%%d) = %%d");
357 }
358
emit_sys_close_stack(struct bpf_gen * gen,int stack_off)359 static void emit_sys_close_stack(struct bpf_gen *gen, int stack_off)
360 {
361 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, stack_off));
362 __emit_sys_close(gen);
363 }
364
emit_sys_close_blob(struct bpf_gen * gen,int blob_off)365 static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off)
366 {
367 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
368 0, 0, 0, blob_off));
369 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_0, 0));
370 __emit_sys_close(gen);
371 }
372
373 static void compute_sha_update_offsets(struct bpf_gen *gen);
374
bpf_gen__finish(struct bpf_gen * gen,int nr_progs,int nr_maps)375 int bpf_gen__finish(struct bpf_gen *gen, int nr_progs, int nr_maps)
376 {
377 int i;
378
379 if (nr_progs < gen->nr_progs || nr_maps != gen->nr_maps) {
380 pr_warn("nr_progs %d/%d nr_maps %d/%d mismatch\n",
381 nr_progs, gen->nr_progs, nr_maps, gen->nr_maps);
382 gen->error = -EFAULT;
383 return gen->error;
384 }
385 emit_sys_close_stack(gen, stack_off(btf_fd));
386 for (i = 0; i < gen->nr_progs; i++)
387 move_stack2ctx(gen,
388 sizeof(struct bpf_loader_ctx) +
389 sizeof(struct bpf_map_desc) * gen->nr_maps +
390 sizeof(struct bpf_prog_desc) * i +
391 offsetof(struct bpf_prog_desc, prog_fd), 4,
392 stack_off(prog_fd[i]));
393 for (i = 0; i < gen->nr_maps; i++)
394 move_blob2ctx(gen,
395 sizeof(struct bpf_loader_ctx) +
396 sizeof(struct bpf_map_desc) * i +
397 offsetof(struct bpf_map_desc, map_fd), 4,
398 blob_fd_array_off(gen, i));
399 emit(gen, BPF_MOV64_IMM(BPF_REG_0, 0));
400 emit(gen, BPF_EXIT_INSN());
401 if (OPTS_GET(gen->opts, gen_hash, false))
402 compute_sha_update_offsets(gen);
403
404 pr_debug("gen: finish %s\n", errstr(gen->error));
405 if (!gen->error) {
406 struct gen_loader_opts *opts = gen->opts;
407
408 opts->insns = gen->insn_start;
409 opts->insns_sz = gen->insn_cur - gen->insn_start;
410 opts->data = gen->data_start;
411 opts->data_sz = gen->data_cur - gen->data_start;
412
413 /* use target endianness for embedded loader */
414 if (gen->swapped_endian) {
415 struct bpf_insn *insn = (struct bpf_insn *)opts->insns;
416 int insn_cnt = opts->insns_sz / sizeof(struct bpf_insn);
417
418 for (i = 0; i < insn_cnt; i++)
419 bpf_insn_bswap(insn++);
420 }
421 }
422 return gen->error;
423 }
424
bpf_gen__free(struct bpf_gen * gen)425 void bpf_gen__free(struct bpf_gen *gen)
426 {
427 if (!gen)
428 return;
429 free(gen->data_start);
430 free(gen->insn_start);
431 free(gen);
432 }
433
434 /*
435 * Fields of bpf_attr are set to values in native byte-order before being
436 * written to the target-bound data blob, and may need endian conversion.
437 * This macro allows providing the correct value in situ more simply than
438 * writing a separate converter for *all fields* of *all records* included
439 * in union bpf_attr. Note that sizeof(rval) should match the assignment
440 * target to avoid runtime problems.
441 */
442 #define tgt_endian(rval) ({ \
443 typeof(rval) _val = (rval); \
444 if (gen->swapped_endian) { \
445 switch (sizeof(_val)) { \
446 case 1: break; \
447 case 2: _val = bswap_16(_val); break; \
448 case 4: _val = bswap_32(_val); break; \
449 case 8: _val = bswap_64(_val); break; \
450 default: pr_warn("unsupported bswap size!\n"); \
451 } \
452 } \
453 _val; \
454 })
455
compute_sha_update_offsets(struct bpf_gen * gen)456 static void compute_sha_update_offsets(struct bpf_gen *gen)
457 {
458 __u64 sha[SHA256_DWORD_SIZE];
459 __u64 sha_dw;
460 int i;
461
462 libbpf_sha256(gen->data_start, gen->data_cur - gen->data_start, (__u8 *)sha);
463 for (i = 0; i < SHA256_DWORD_SIZE; i++) {
464 struct bpf_insn *insn =
465 (struct bpf_insn *)(gen->insn_start + gen->hash_insn_offset[i]);
466 sha_dw = tgt_endian(sha[i]);
467 insn[0].imm = (__u32)sha_dw;
468 insn[1].imm = sha_dw >> 32;
469 }
470 }
471
bpf_gen__load_btf(struct bpf_gen * gen,const void * btf_raw_data,__u32 btf_raw_size)472 void bpf_gen__load_btf(struct bpf_gen *gen, const void *btf_raw_data,
473 __u32 btf_raw_size)
474 {
475 int attr_size = offsetofend(union bpf_attr, btf_log_level);
476 int btf_data, btf_load_attr;
477 union bpf_attr attr;
478
479 memset(&attr, 0, attr_size);
480 btf_data = add_data(gen, btf_raw_data, btf_raw_size);
481
482 attr.btf_size = tgt_endian(btf_raw_size);
483 btf_load_attr = add_data(gen, &attr, attr_size);
484 pr_debug("gen: load_btf: off %d size %d, attr: off %d size %d\n",
485 btf_data, btf_raw_size, btf_load_attr, attr_size);
486
487 /* populate union bpf_attr with user provided log details */
488 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_level), 4,
489 offsetof(struct bpf_loader_ctx, log_level), false);
490 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_size), 4,
491 offsetof(struct bpf_loader_ctx, log_size), false);
492 move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_buf), 8,
493 offsetof(struct bpf_loader_ctx, log_buf), false);
494 /* populate union bpf_attr with a pointer to the BTF data */
495 emit_rel_store(gen, attr_field(btf_load_attr, btf), btf_data);
496 /* emit BTF_LOAD command */
497 emit_sys_bpf(gen, BPF_BTF_LOAD, btf_load_attr, attr_size);
498 debug_ret(gen, "btf_load size %d", btf_raw_size);
499 emit_check_err(gen);
500 /* remember btf_fd in the stack, if successful */
501 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7, stack_off(btf_fd)));
502 }
503
bpf_gen__map_create(struct bpf_gen * gen,enum bpf_map_type map_type,const char * map_name,__u32 key_size,__u32 value_size,__u32 max_entries,struct bpf_map_create_opts * map_attr,int map_idx)504 void bpf_gen__map_create(struct bpf_gen *gen,
505 enum bpf_map_type map_type,
506 const char *map_name,
507 __u32 key_size, __u32 value_size, __u32 max_entries,
508 struct bpf_map_create_opts *map_attr, int map_idx)
509 {
510 int attr_size = offsetofend(union bpf_attr, map_extra);
511 bool close_inner_map_fd = false;
512 int map_create_attr, idx;
513 union bpf_attr attr;
514
515 memset(&attr, 0, attr_size);
516 attr.map_type = tgt_endian(map_type);
517 attr.key_size = tgt_endian(key_size);
518 attr.value_size = tgt_endian(value_size);
519 attr.map_flags = tgt_endian(map_attr->map_flags);
520 attr.map_extra = tgt_endian(map_attr->map_extra);
521 if (map_name)
522 libbpf_strlcpy(attr.map_name, map_name, sizeof(attr.map_name));
523 attr.numa_node = tgt_endian(map_attr->numa_node);
524 attr.map_ifindex = tgt_endian(map_attr->map_ifindex);
525 attr.max_entries = tgt_endian(max_entries);
526 attr.btf_key_type_id = tgt_endian(map_attr->btf_key_type_id);
527 attr.btf_value_type_id = tgt_endian(map_attr->btf_value_type_id);
528
529 map_create_attr = add_data(gen, &attr, attr_size);
530 pr_debug("gen: map_create: %s idx %d type %d value_type_id %d, attr: off %d size %d\n",
531 map_name, map_idx, map_type, map_attr->btf_value_type_id,
532 map_create_attr, attr_size);
533
534 if (map_attr->btf_value_type_id)
535 /* populate union bpf_attr with btf_fd saved in the stack earlier */
536 move_stack2blob(gen, attr_field(map_create_attr, btf_fd), 4,
537 stack_off(btf_fd));
538 switch (map_type) {
539 case BPF_MAP_TYPE_ARRAY_OF_MAPS:
540 case BPF_MAP_TYPE_HASH_OF_MAPS:
541 move_stack2blob(gen, attr_field(map_create_attr, inner_map_fd), 4,
542 stack_off(inner_map_fd));
543 close_inner_map_fd = true;
544 break;
545 default:
546 break;
547 }
548 /* conditionally update max_entries */
549 if (map_idx >= 0)
550 move_ctx2blob(gen, attr_field(map_create_attr, max_entries), 4,
551 sizeof(struct bpf_loader_ctx) +
552 sizeof(struct bpf_map_desc) * map_idx +
553 offsetof(struct bpf_map_desc, max_entries),
554 true /* check that max_entries != 0 */);
555 /* emit MAP_CREATE command */
556 emit_sys_bpf(gen, BPF_MAP_CREATE, map_create_attr, attr_size);
557 debug_ret(gen, "map_create %s idx %d type %d value_size %d value_btf_id %d",
558 map_name, map_idx, map_type, value_size,
559 map_attr->btf_value_type_id);
560 emit_check_err(gen);
561 /* remember map_fd in the stack, if successful */
562 if (map_idx < 0) {
563 /* This bpf_gen__map_create() function is called with map_idx >= 0
564 * for all maps that libbpf loading logic tracks.
565 * It's called with -1 to create an inner map.
566 */
567 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7,
568 stack_off(inner_map_fd)));
569 } else if (map_idx != gen->nr_maps) {
570 gen->error = -EDOM; /* internal bug */
571 return;
572 } else {
573 /* add_map_fd does gen->nr_maps++ */
574 idx = add_map_fd(gen);
575 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
576 0, 0, 0, blob_fd_array_off(gen, idx)));
577 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_1, BPF_REG_7, 0));
578 }
579 if (close_inner_map_fd)
580 emit_sys_close_stack(gen, stack_off(inner_map_fd));
581 }
582
emit_signature_match(struct bpf_gen * gen)583 static void emit_signature_match(struct bpf_gen *gen)
584 {
585 __s64 off;
586 int i;
587
588 for (i = 0; i < SHA256_DWORD_SIZE; i++) {
589 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX,
590 0, 0, 0, 0));
591 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_2, BPF_REG_1, i * sizeof(__u64)));
592 gen->hash_insn_offset[i] = gen->insn_cur - gen->insn_start;
593 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_3, 0, 0, 0, 0, 0));
594
595 off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 2;
596 if (is_simm16(off)) {
597 emit(gen, BPF_MOV64_IMM(BPF_REG_7, -EINVAL));
598 emit(gen, BPF_JMP_REG(BPF_JNE, BPF_REG_2, BPF_REG_3, off));
599 } else {
600 gen->error = -ERANGE;
601 }
602 }
603 }
604
bpf_gen__record_attach_target(struct bpf_gen * gen,const char * attach_name,enum bpf_attach_type type)605 void bpf_gen__record_attach_target(struct bpf_gen *gen, const char *attach_name,
606 enum bpf_attach_type type)
607 {
608 const char *prefix;
609 int kind, ret;
610
611 btf_get_kernel_prefix_kind(type, &prefix, &kind);
612 gen->attach_kind = kind;
613 ret = snprintf(gen->attach_target, sizeof(gen->attach_target), "%s%s",
614 prefix, attach_name);
615 if (ret >= sizeof(gen->attach_target))
616 gen->error = -ENOSPC;
617 }
618
emit_find_attach_target(struct bpf_gen * gen)619 static void emit_find_attach_target(struct bpf_gen *gen)
620 {
621 int name, len = strlen(gen->attach_target) + 1;
622
623 pr_debug("gen: find_attach_tgt %s %d\n", gen->attach_target, gen->attach_kind);
624 name = add_data(gen, gen->attach_target, len);
625
626 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
627 0, 0, 0, name));
628 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
629 emit(gen, BPF_MOV64_IMM(BPF_REG_3, gen->attach_kind));
630 emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0));
631 emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind));
632 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
633 debug_ret(gen, "find_by_name_kind(%s,%d)",
634 gen->attach_target, gen->attach_kind);
635 emit_check_err(gen);
636 /* if successful, btf_id is in lower 32-bit of R7 and
637 * btf_obj_fd is in upper 32-bit
638 */
639 }
640
bpf_gen__record_extern(struct bpf_gen * gen,const char * name,bool is_weak,bool is_typeless,bool is_ld64,int kind,int insn_idx)641 void bpf_gen__record_extern(struct bpf_gen *gen, const char *name, bool is_weak,
642 bool is_typeless, bool is_ld64, int kind, int insn_idx)
643 {
644 struct ksym_relo_desc *relo;
645
646 relo = libbpf_reallocarray(gen->relos, gen->relo_cnt + 1, sizeof(*relo));
647 if (!relo) {
648 gen->error = -ENOMEM;
649 return;
650 }
651 gen->relos = relo;
652 relo += gen->relo_cnt;
653 relo->name = name;
654 relo->is_weak = is_weak;
655 relo->is_typeless = is_typeless;
656 relo->is_ld64 = is_ld64;
657 relo->kind = kind;
658 relo->insn_idx = insn_idx;
659 gen->relo_cnt++;
660 }
661
662 /* returns existing ksym_desc with ref incremented, or inserts a new one */
get_ksym_desc(struct bpf_gen * gen,struct ksym_relo_desc * relo)663 static struct ksym_desc *get_ksym_desc(struct bpf_gen *gen, struct ksym_relo_desc *relo)
664 {
665 struct ksym_desc *kdesc;
666 int i;
667
668 for (i = 0; i < gen->nr_ksyms; i++) {
669 kdesc = &gen->ksyms[i];
670 if (kdesc->kind == relo->kind && kdesc->is_ld64 == relo->is_ld64 &&
671 !strcmp(kdesc->name, relo->name)) {
672 kdesc->ref++;
673 return kdesc;
674 }
675 }
676 kdesc = libbpf_reallocarray(gen->ksyms, gen->nr_ksyms + 1, sizeof(*kdesc));
677 if (!kdesc) {
678 gen->error = -ENOMEM;
679 return NULL;
680 }
681 gen->ksyms = kdesc;
682 kdesc = &gen->ksyms[gen->nr_ksyms++];
683 kdesc->name = relo->name;
684 kdesc->kind = relo->kind;
685 kdesc->ref = 1;
686 kdesc->off = 0;
687 kdesc->insn = 0;
688 kdesc->is_ld64 = relo->is_ld64;
689 return kdesc;
690 }
691
692 /* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7}
693 * Returns result in BPF_REG_7
694 */
emit_bpf_find_by_name_kind(struct bpf_gen * gen,struct ksym_relo_desc * relo)695 static void emit_bpf_find_by_name_kind(struct bpf_gen *gen, struct ksym_relo_desc *relo)
696 {
697 int name_off, len = strlen(relo->name) + 1;
698
699 name_off = add_data(gen, relo->name, len);
700 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
701 0, 0, 0, name_off));
702 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
703 emit(gen, BPF_MOV64_IMM(BPF_REG_3, relo->kind));
704 emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0));
705 emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind));
706 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
707 debug_ret(gen, "find_by_name_kind(%s,%d)", relo->name, relo->kind);
708 }
709
710 /* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7}
711 * Returns result in BPF_REG_7
712 * Returns u64 symbol addr in BPF_REG_9
713 */
emit_bpf_kallsyms_lookup_name(struct bpf_gen * gen,struct ksym_relo_desc * relo)714 static void emit_bpf_kallsyms_lookup_name(struct bpf_gen *gen, struct ksym_relo_desc *relo)
715 {
716 int name_off, len = strlen(relo->name) + 1, res_off;
717
718 name_off = add_data(gen, relo->name, len);
719 res_off = add_data(gen, NULL, 8); /* res is u64 */
720 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
721 0, 0, 0, name_off));
722 emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
723 emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0));
724 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_4, BPF_PSEUDO_MAP_IDX_VALUE,
725 0, 0, 0, res_off));
726 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_4));
727 emit(gen, BPF_EMIT_CALL(BPF_FUNC_kallsyms_lookup_name));
728 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_9, BPF_REG_7, 0));
729 emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
730 debug_ret(gen, "kallsyms_lookup_name(%s,%d)", relo->name, relo->kind);
731 }
732
733 /* Expects:
734 * BPF_REG_8 - pointer to instruction
735 *
736 * We need to reuse BTF fd for same symbol otherwise each relocation takes a new
737 * index, while kernel limits total kfunc BTFs to 256. For duplicate symbols,
738 * this would mean a new BTF fd index for each entry. By pairing symbol name
739 * with index, we get the insn->imm, insn->off pairing that kernel uses for
740 * kfunc_tab, which becomes the effective limit even though all of them may
741 * share same index in fd_array (such that kfunc_btf_tab has 1 element).
742 */
emit_relo_kfunc_btf(struct bpf_gen * gen,struct ksym_relo_desc * relo,int insn)743 static void emit_relo_kfunc_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn)
744 {
745 struct ksym_desc *kdesc;
746 int btf_fd_idx;
747
748 kdesc = get_ksym_desc(gen, relo);
749 if (!kdesc)
750 return;
751 /* try to copy from existing bpf_insn */
752 if (kdesc->ref > 1) {
753 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
754 kdesc->insn + offsetof(struct bpf_insn, imm));
755 move_blob2blob(gen, insn + offsetof(struct bpf_insn, off), 2,
756 kdesc->insn + offsetof(struct bpf_insn, off));
757 goto log;
758 }
759 /* remember insn offset, so we can copy BTF ID and FD later */
760 kdesc->insn = insn;
761 emit_bpf_find_by_name_kind(gen, relo);
762 if (!relo->is_weak)
763 emit_check_err(gen);
764 /* get index in fd_array to store BTF FD at */
765 btf_fd_idx = add_kfunc_btf_fd(gen);
766 if (btf_fd_idx > INT16_MAX) {
767 pr_warn("BTF fd off %d for kfunc %s exceeds INT16_MAX, cannot process relocation\n",
768 btf_fd_idx, relo->name);
769 gen->error = -E2BIG;
770 return;
771 }
772 kdesc->off = btf_fd_idx;
773 /* jump to success case */
774 emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3));
775 /* set value for imm, off as 0 */
776 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0));
777 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0));
778 /* skip success case for ret < 0 */
779 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 10));
780 /* store btf_id into insn[insn_idx].imm */
781 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm)));
782 /* obtain fd in BPF_REG_9 */
783 emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_7));
784 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32));
785 /* load fd_array slot pointer */
786 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
787 0, 0, 0, blob_fd_array_off(gen, btf_fd_idx)));
788 /* store BTF fd in slot, 0 for vmlinux */
789 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_9, 0));
790 /* jump to insn[insn_idx].off store if fd denotes module BTF */
791 emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_9, 0, 2));
792 /* set the default value for off */
793 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0));
794 /* skip BTF fd store for vmlinux BTF */
795 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1));
796 /* store index into insn[insn_idx].off */
797 emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), btf_fd_idx));
798 log:
799 if (!gen->log_level)
800 return;
801 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8,
802 offsetof(struct bpf_insn, imm)));
803 emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8,
804 offsetof(struct bpf_insn, off)));
805 debug_regs(gen, BPF_REG_7, BPF_REG_9, " func (%s:count=%d): imm: %%d, off: %%d",
806 relo->name, kdesc->ref);
807 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
808 0, 0, 0, blob_fd_array_off(gen, kdesc->off)));
809 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_9, BPF_REG_0, 0));
810 debug_regs(gen, BPF_REG_9, -1, " func (%s:count=%d): btf_fd",
811 relo->name, kdesc->ref);
812 }
813
emit_ksym_relo_log(struct bpf_gen * gen,struct ksym_relo_desc * relo,int ref)814 static void emit_ksym_relo_log(struct bpf_gen *gen, struct ksym_relo_desc *relo,
815 int ref)
816 {
817 if (!gen->log_level)
818 return;
819 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8,
820 offsetof(struct bpf_insn, imm)));
821 emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8, sizeof(struct bpf_insn) +
822 offsetof(struct bpf_insn, imm)));
823 debug_regs(gen, BPF_REG_7, BPF_REG_9, " var t=%d w=%d (%s:count=%d): imm[0]: %%d, imm[1]: %%d",
824 relo->is_typeless, relo->is_weak, relo->name, ref);
825 emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code)));
826 debug_regs(gen, BPF_REG_9, -1, " var t=%d w=%d (%s:count=%d): insn.reg",
827 relo->is_typeless, relo->is_weak, relo->name, ref);
828 }
829
830 /* Expects:
831 * BPF_REG_8 - pointer to instruction
832 */
emit_relo_ksym_typeless(struct bpf_gen * gen,struct ksym_relo_desc * relo,int insn)833 static void emit_relo_ksym_typeless(struct bpf_gen *gen,
834 struct ksym_relo_desc *relo, int insn)
835 {
836 struct ksym_desc *kdesc;
837
838 kdesc = get_ksym_desc(gen, relo);
839 if (!kdesc)
840 return;
841 /* try to copy from existing ldimm64 insn */
842 if (kdesc->ref > 1) {
843 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
844 kdesc->insn + offsetof(struct bpf_insn, imm));
845 move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4,
846 kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm));
847 goto log;
848 }
849 /* remember insn offset, so we can copy ksym addr later */
850 kdesc->insn = insn;
851 /* skip typeless ksym_desc in fd closing loop in cleanup_relos */
852 kdesc->typeless = true;
853 emit_bpf_kallsyms_lookup_name(gen, relo);
854 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_7, -ENOENT, 1));
855 emit_check_err(gen);
856 /* store lower half of addr into insn[insn_idx].imm */
857 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9, offsetof(struct bpf_insn, imm)));
858 /* store upper half of addr into insn[insn_idx + 1].imm */
859 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32));
860 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9,
861 sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)));
862 log:
863 emit_ksym_relo_log(gen, relo, kdesc->ref);
864 }
865
src_reg_mask(struct bpf_gen * gen)866 static __u32 src_reg_mask(struct bpf_gen *gen)
867 {
868 #if defined(__LITTLE_ENDIAN_BITFIELD) /* src_reg,dst_reg,... */
869 return gen->swapped_endian ? 0xf0 : 0x0f;
870 #elif defined(__BIG_ENDIAN_BITFIELD) /* dst_reg,src_reg,... */
871 return gen->swapped_endian ? 0x0f : 0xf0;
872 #else
873 #error "Unsupported bit endianness, cannot proceed"
874 #endif
875 }
876
877 /* Expects:
878 * BPF_REG_8 - pointer to instruction
879 */
emit_relo_ksym_btf(struct bpf_gen * gen,struct ksym_relo_desc * relo,int insn)880 static void emit_relo_ksym_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn)
881 {
882 struct ksym_desc *kdesc;
883 __u32 reg_mask;
884
885 kdesc = get_ksym_desc(gen, relo);
886 if (!kdesc)
887 return;
888 /* try to copy from existing ldimm64 insn */
889 if (kdesc->ref > 1) {
890 move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4,
891 kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm));
892 move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
893 kdesc->insn + offsetof(struct bpf_insn, imm));
894 /* jump over src_reg adjustment if imm (btf_id) is not 0, reuse BPF_REG_0 from move_blob2blob
895 * If btf_id is zero, clear BPF_PSEUDO_BTF_ID flag in src_reg of ld_imm64 insn
896 */
897 emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, 3));
898 goto clear_src_reg;
899 }
900 /* remember insn offset, so we can copy BTF ID and FD later */
901 kdesc->insn = insn;
902 emit_bpf_find_by_name_kind(gen, relo);
903 if (!relo->is_weak)
904 emit_check_err(gen);
905 /* jump to success case */
906 emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3));
907 /* set values for insn[insn_idx].imm, insn[insn_idx + 1].imm as 0 */
908 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0));
909 emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 0));
910 /* skip success case for ret < 0 */
911 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 4));
912 /* store btf_id into insn[insn_idx].imm */
913 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm)));
914 /* store btf_obj_fd into insn[insn_idx + 1].imm */
915 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32));
916 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7,
917 sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)));
918 /* skip src_reg adjustment */
919 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 3));
920 clear_src_reg:
921 /* clear bpf_object__relocate_data's src_reg assignment, otherwise we get a verifier failure */
922 reg_mask = src_reg_mask(gen);
923 emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code)));
924 emit(gen, BPF_ALU32_IMM(BPF_AND, BPF_REG_9, reg_mask));
925 emit(gen, BPF_STX_MEM(BPF_B, BPF_REG_8, BPF_REG_9, offsetofend(struct bpf_insn, code)));
926
927 emit_ksym_relo_log(gen, relo, kdesc->ref);
928 }
929
bpf_gen__record_relo_core(struct bpf_gen * gen,const struct bpf_core_relo * core_relo)930 void bpf_gen__record_relo_core(struct bpf_gen *gen,
931 const struct bpf_core_relo *core_relo)
932 {
933 struct bpf_core_relo *relos;
934
935 relos = libbpf_reallocarray(gen->core_relos, gen->core_relo_cnt + 1, sizeof(*relos));
936 if (!relos) {
937 gen->error = -ENOMEM;
938 return;
939 }
940 gen->core_relos = relos;
941 relos += gen->core_relo_cnt;
942 memcpy(relos, core_relo, sizeof(*relos));
943 gen->core_relo_cnt++;
944 }
945
emit_relo(struct bpf_gen * gen,struct ksym_relo_desc * relo,int insns)946 static void emit_relo(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insns)
947 {
948 int insn;
949
950 pr_debug("gen: emit_relo (%d): %s at %d %s\n",
951 relo->kind, relo->name, relo->insn_idx, relo->is_ld64 ? "ld64" : "call");
952 insn = insns + sizeof(struct bpf_insn) * relo->insn_idx;
953 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_8, BPF_PSEUDO_MAP_IDX_VALUE, 0, 0, 0, insn));
954 if (relo->is_ld64) {
955 if (relo->is_typeless)
956 emit_relo_ksym_typeless(gen, relo, insn);
957 else
958 emit_relo_ksym_btf(gen, relo, insn);
959 } else {
960 emit_relo_kfunc_btf(gen, relo, insn);
961 }
962 }
963
emit_relos(struct bpf_gen * gen,int insns)964 static void emit_relos(struct bpf_gen *gen, int insns)
965 {
966 int i;
967
968 for (i = 0; i < gen->relo_cnt; i++)
969 emit_relo(gen, gen->relos + i, insns);
970 }
971
cleanup_core_relo(struct bpf_gen * gen)972 static void cleanup_core_relo(struct bpf_gen *gen)
973 {
974 if (!gen->core_relo_cnt)
975 return;
976 free(gen->core_relos);
977 gen->core_relo_cnt = 0;
978 gen->core_relos = NULL;
979 }
980
cleanup_relos(struct bpf_gen * gen,int insns)981 static void cleanup_relos(struct bpf_gen *gen, int insns)
982 {
983 struct ksym_desc *kdesc;
984 int i, insn;
985
986 for (i = 0; i < gen->nr_ksyms; i++) {
987 kdesc = &gen->ksyms[i];
988 /* only close fds for typed ksyms and kfuncs */
989 if (kdesc->is_ld64 && !kdesc->typeless) {
990 /* close fd recorded in insn[insn_idx + 1].imm */
991 insn = kdesc->insn;
992 insn += sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm);
993 emit_sys_close_blob(gen, insn);
994 } else if (!kdesc->is_ld64) {
995 emit_sys_close_blob(gen, blob_fd_array_off(gen, kdesc->off));
996 if (kdesc->off < MAX_FD_ARRAY_SZ)
997 gen->nr_fd_array--;
998 }
999 }
1000 if (gen->nr_ksyms) {
1001 free(gen->ksyms);
1002 gen->nr_ksyms = 0;
1003 gen->ksyms = NULL;
1004 }
1005 if (gen->relo_cnt) {
1006 free(gen->relos);
1007 gen->relo_cnt = 0;
1008 gen->relos = NULL;
1009 }
1010 cleanup_core_relo(gen);
1011 }
1012
1013 /* Convert func, line, and core relo info blobs to target endianness */
info_blob_bswap(struct bpf_gen * gen,int func_info,int line_info,int core_relos,struct bpf_prog_load_opts * load_attr)1014 static void info_blob_bswap(struct bpf_gen *gen, int func_info, int line_info,
1015 int core_relos, struct bpf_prog_load_opts *load_attr)
1016 {
1017 struct bpf_func_info *fi = gen->data_start + func_info;
1018 struct bpf_line_info *li = gen->data_start + line_info;
1019 struct bpf_core_relo *cr = gen->data_start + core_relos;
1020 int i;
1021
1022 for (i = 0; i < load_attr->func_info_cnt; i++)
1023 bpf_func_info_bswap(fi++);
1024
1025 for (i = 0; i < load_attr->line_info_cnt; i++)
1026 bpf_line_info_bswap(li++);
1027
1028 for (i = 0; i < gen->core_relo_cnt; i++)
1029 bpf_core_relo_bswap(cr++);
1030 }
1031
bpf_gen__prog_load(struct bpf_gen * gen,enum bpf_prog_type prog_type,const char * prog_name,const char * license,struct bpf_insn * insns,size_t insn_cnt,struct bpf_prog_load_opts * load_attr,int prog_idx)1032 void bpf_gen__prog_load(struct bpf_gen *gen,
1033 enum bpf_prog_type prog_type, const char *prog_name,
1034 const char *license, struct bpf_insn *insns, size_t insn_cnt,
1035 struct bpf_prog_load_opts *load_attr, int prog_idx)
1036 {
1037 int func_info_tot_sz = load_attr->func_info_cnt *
1038 load_attr->func_info_rec_size;
1039 int line_info_tot_sz = load_attr->line_info_cnt *
1040 load_attr->line_info_rec_size;
1041 int core_relo_tot_sz = gen->core_relo_cnt *
1042 sizeof(struct bpf_core_relo);
1043 int prog_load_attr, license_off, insns_off, func_info, line_info, core_relos;
1044 int attr_size = offsetofend(union bpf_attr, core_relo_rec_size);
1045 union bpf_attr attr;
1046
1047 memset(&attr, 0, attr_size);
1048 /* add license string to blob of bytes */
1049 license_off = add_data(gen, license, strlen(license) + 1);
1050 /* add insns to blob of bytes */
1051 insns_off = add_data(gen, insns, insn_cnt * sizeof(struct bpf_insn));
1052 pr_debug("gen: prog_load: prog_idx %d type %d insn off %d insns_cnt %zd license off %d\n",
1053 prog_idx, prog_type, insns_off, insn_cnt, license_off);
1054
1055 /* convert blob insns to target endianness */
1056 if (gen->swapped_endian) {
1057 struct bpf_insn *insn = gen->data_start + insns_off;
1058 int i;
1059
1060 for (i = 0; i < insn_cnt; i++, insn++)
1061 bpf_insn_bswap(insn);
1062 }
1063
1064 attr.prog_type = tgt_endian(prog_type);
1065 attr.expected_attach_type = tgt_endian(load_attr->expected_attach_type);
1066 attr.attach_btf_id = tgt_endian(load_attr->attach_btf_id);
1067 attr.prog_ifindex = tgt_endian(load_attr->prog_ifindex);
1068 attr.kern_version = 0;
1069 attr.insn_cnt = tgt_endian((__u32)insn_cnt);
1070 attr.prog_flags = tgt_endian(load_attr->prog_flags);
1071
1072 attr.func_info_rec_size = tgt_endian(load_attr->func_info_rec_size);
1073 attr.func_info_cnt = tgt_endian(load_attr->func_info_cnt);
1074 func_info = add_data(gen, load_attr->func_info, func_info_tot_sz);
1075 pr_debug("gen: prog_load: func_info: off %d cnt %d rec size %d\n",
1076 func_info, load_attr->func_info_cnt,
1077 load_attr->func_info_rec_size);
1078
1079 attr.line_info_rec_size = tgt_endian(load_attr->line_info_rec_size);
1080 attr.line_info_cnt = tgt_endian(load_attr->line_info_cnt);
1081 line_info = add_data(gen, load_attr->line_info, line_info_tot_sz);
1082 pr_debug("gen: prog_load: line_info: off %d cnt %d rec size %d\n",
1083 line_info, load_attr->line_info_cnt,
1084 load_attr->line_info_rec_size);
1085
1086 attr.core_relo_rec_size = tgt_endian((__u32)sizeof(struct bpf_core_relo));
1087 attr.core_relo_cnt = tgt_endian(gen->core_relo_cnt);
1088 core_relos = add_data(gen, gen->core_relos, core_relo_tot_sz);
1089 pr_debug("gen: prog_load: core_relos: off %d cnt %d rec size %zd\n",
1090 core_relos, gen->core_relo_cnt,
1091 sizeof(struct bpf_core_relo));
1092
1093 /* convert all info blobs to target endianness */
1094 if (gen->swapped_endian)
1095 info_blob_bswap(gen, func_info, line_info, core_relos, load_attr);
1096
1097 libbpf_strlcpy(attr.prog_name, prog_name, sizeof(attr.prog_name));
1098 prog_load_attr = add_data(gen, &attr, attr_size);
1099 pr_debug("gen: prog_load: attr: off %d size %d\n",
1100 prog_load_attr, attr_size);
1101
1102 /* populate union bpf_attr with a pointer to license */
1103 emit_rel_store(gen, attr_field(prog_load_attr, license), license_off);
1104
1105 /* populate union bpf_attr with a pointer to instructions */
1106 emit_rel_store(gen, attr_field(prog_load_attr, insns), insns_off);
1107
1108 /* populate union bpf_attr with a pointer to func_info */
1109 emit_rel_store(gen, attr_field(prog_load_attr, func_info), func_info);
1110
1111 /* populate union bpf_attr with a pointer to line_info */
1112 emit_rel_store(gen, attr_field(prog_load_attr, line_info), line_info);
1113
1114 /* populate union bpf_attr with a pointer to core_relos */
1115 emit_rel_store(gen, attr_field(prog_load_attr, core_relos), core_relos);
1116
1117 /* populate union bpf_attr fd_array with a pointer to data where map_fds are saved */
1118 emit_rel_store(gen, attr_field(prog_load_attr, fd_array), gen->fd_array);
1119
1120 /* populate union bpf_attr with user provided log details */
1121 move_ctx2blob(gen, attr_field(prog_load_attr, log_level), 4,
1122 offsetof(struct bpf_loader_ctx, log_level), false);
1123 move_ctx2blob(gen, attr_field(prog_load_attr, log_size), 4,
1124 offsetof(struct bpf_loader_ctx, log_size), false);
1125 move_ctx2blob(gen, attr_field(prog_load_attr, log_buf), 8,
1126 offsetof(struct bpf_loader_ctx, log_buf), false);
1127 /* populate union bpf_attr with btf_fd saved in the stack earlier */
1128 move_stack2blob(gen, attr_field(prog_load_attr, prog_btf_fd), 4,
1129 stack_off(btf_fd));
1130 if (gen->attach_kind) {
1131 emit_find_attach_target(gen);
1132 /* populate union bpf_attr with btf_id and btf_obj_fd found by helper */
1133 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
1134 0, 0, 0, prog_load_attr));
1135 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7,
1136 offsetof(union bpf_attr, attach_btf_id)));
1137 emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32));
1138 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7,
1139 offsetof(union bpf_attr, attach_btf_obj_fd)));
1140 }
1141 emit_relos(gen, insns_off);
1142 /* emit PROG_LOAD command */
1143 emit_sys_bpf(gen, BPF_PROG_LOAD, prog_load_attr, attr_size);
1144 debug_ret(gen, "prog_load %s insn_cnt %d", attr.prog_name, attr.insn_cnt);
1145 /* successful or not, close btf module FDs used in extern ksyms and attach_btf_obj_fd */
1146 cleanup_relos(gen, insns_off);
1147 if (gen->attach_kind) {
1148 emit_sys_close_blob(gen,
1149 attr_field(prog_load_attr, attach_btf_obj_fd));
1150 gen->attach_kind = 0;
1151 }
1152 emit_check_err(gen);
1153 /* remember prog_fd in the stack, if successful */
1154 emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7,
1155 stack_off(prog_fd[gen->nr_progs])));
1156 gen->nr_progs++;
1157 }
1158
bpf_gen__map_update_elem(struct bpf_gen * gen,int map_idx,void * pvalue,__u32 value_size)1159 void bpf_gen__map_update_elem(struct bpf_gen *gen, int map_idx, void *pvalue,
1160 __u32 value_size)
1161 {
1162 int attr_size = offsetofend(union bpf_attr, flags);
1163 int map_update_attr, value, key;
1164 union bpf_attr attr;
1165 int zero = 0;
1166
1167 memset(&attr, 0, attr_size);
1168
1169 value = add_data(gen, pvalue, value_size);
1170 key = add_data(gen, &zero, sizeof(zero));
1171
1172 /* if (map_desc[map_idx].initial_value) {
1173 * if (ctx->flags & BPF_SKEL_KERNEL)
1174 * bpf_probe_read_kernel(value, value_size, initial_value);
1175 * else
1176 * bpf_copy_from_user(value, value_size, initial_value);
1177 * }
1178 */
1179 emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_3, BPF_REG_6,
1180 sizeof(struct bpf_loader_ctx) +
1181 sizeof(struct bpf_map_desc) * map_idx +
1182 offsetof(struct bpf_map_desc, initial_value)));
1183 emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_3, 0, 8));
1184 emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
1185 0, 0, 0, value));
1186 emit(gen, BPF_MOV64_IMM(BPF_REG_2, value_size));
1187 emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_0, BPF_REG_6,
1188 offsetof(struct bpf_loader_ctx, flags)));
1189 emit(gen, BPF_JMP_IMM(BPF_JSET, BPF_REG_0, BPF_SKEL_KERNEL, 2));
1190 emit(gen, BPF_EMIT_CALL(BPF_FUNC_copy_from_user));
1191 emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1));
1192 emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel));
1193
1194 map_update_attr = add_data(gen, &attr, attr_size);
1195 pr_debug("gen: map_update_elem: idx %d, value: off %d size %d, attr: off %d size %d\n",
1196 map_idx, value, value_size, map_update_attr, attr_size);
1197 move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4,
1198 blob_fd_array_off(gen, map_idx));
1199 emit_rel_store(gen, attr_field(map_update_attr, key), key);
1200 emit_rel_store(gen, attr_field(map_update_attr, value), value);
1201 /* emit MAP_UPDATE_ELEM command */
1202 emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size);
1203 debug_ret(gen, "update_elem idx %d value_size %d", map_idx, value_size);
1204 emit_check_err(gen);
1205 }
1206
bpf_gen__populate_outer_map(struct bpf_gen * gen,int outer_map_idx,int slot,int inner_map_idx)1207 void bpf_gen__populate_outer_map(struct bpf_gen *gen, int outer_map_idx, int slot,
1208 int inner_map_idx)
1209 {
1210 int attr_size = offsetofend(union bpf_attr, flags);
1211 int map_update_attr, key;
1212 union bpf_attr attr;
1213 int tgt_slot;
1214
1215 memset(&attr, 0, attr_size);
1216
1217 tgt_slot = tgt_endian(slot);
1218 key = add_data(gen, &tgt_slot, sizeof(tgt_slot));
1219
1220 map_update_attr = add_data(gen, &attr, attr_size);
1221 pr_debug("gen: populate_outer_map: outer %d key %d inner %d, attr: off %d size %d\n",
1222 outer_map_idx, slot, inner_map_idx, map_update_attr, attr_size);
1223 move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4,
1224 blob_fd_array_off(gen, outer_map_idx));
1225 emit_rel_store(gen, attr_field(map_update_attr, key), key);
1226 emit_rel_store(gen, attr_field(map_update_attr, value),
1227 blob_fd_array_off(gen, inner_map_idx));
1228
1229 /* emit MAP_UPDATE_ELEM command */
1230 emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size);
1231 debug_ret(gen, "populate_outer_map outer %d key %d inner %d",
1232 outer_map_idx, slot, inner_map_idx);
1233 emit_check_err(gen);
1234 }
1235
bpf_gen__map_freeze(struct bpf_gen * gen,int map_idx)1236 void bpf_gen__map_freeze(struct bpf_gen *gen, int map_idx)
1237 {
1238 int attr_size = offsetofend(union bpf_attr, map_fd);
1239 int map_freeze_attr;
1240 union bpf_attr attr;
1241
1242 memset(&attr, 0, attr_size);
1243 map_freeze_attr = add_data(gen, &attr, attr_size);
1244 pr_debug("gen: map_freeze: idx %d, attr: off %d size %d\n",
1245 map_idx, map_freeze_attr, attr_size);
1246 move_blob2blob(gen, attr_field(map_freeze_attr, map_fd), 4,
1247 blob_fd_array_off(gen, map_idx));
1248 /* emit MAP_FREEZE command */
1249 emit_sys_bpf(gen, BPF_MAP_FREEZE, map_freeze_attr, attr_size);
1250 debug_ret(gen, "map_freeze");
1251 emit_check_err(gen);
1252 }
1253