// SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
/* Copyright (c) 2021 Facebook */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <linux/filter.h>
#include <sys/param.h>
#include "btf.h"
#include "bpf.h"
#include "libbpf.h"
#include "libbpf_internal.h"
#include "hashmap.h"
#include "bpf_gen_internal.h"
#include "skel_internal.h"
#include <asm/byteorder.h>
#include "str_error.h"

#define MAX_USED_MAPS	64
#define MAX_USED_PROGS	32
#define MAX_KFUNC_DESCS 256
#define MAX_FD_ARRAY_SZ (MAX_USED_MAPS + MAX_KFUNC_DESCS)

/* The following structure describes the stack layout of the loader program.
 * In addition R6 contains the pointer to context.
 * R7 contains the result of the last sys_bpf command (typically error or FD).
 * R9 contains the result of the last sys_close command.
 *
 * Naming convention:
 * ctx - bpf program context
 * stack - bpf program stack
 * blob - bpf_attr-s, strings, insns, map data.
 *        All the bytes that loader prog will use for read/write.
 */
struct loader_stack {
	__u32 btf_fd;
	__u32 inner_map_fd;
	__u32 prog_fd[MAX_USED_PROGS];
};

#define stack_off(field) \
	(__s16)(-sizeof(struct loader_stack) + offsetof(struct loader_stack, field))
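/* For example, with MAX_USED_PROGS = 32 the structure above is 136 bytes, so
 * stack_off(btf_fd) is -136, stack_off(inner_map_fd) is -132 and
 * stack_off(prog_fd[0]) is -128: every slot lives at a negative offset from R10.
 */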

#define attr_field(attr, field) (attr + offsetof(union bpf_attr, field))

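/* Returns the blob offset of fd_array slot 'index'. Slots [0, MAX_USED_MAPS)
 * hold map FDs and the remaining slots hold kfunc BTF FDs, see add_map_fd()
 * and add_kfunc_btf_fd() below. E.g. with 4-byte FDs, index 1 maps to
 * gen->fd_array + 4.
 */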
static int blob_fd_array_off(struct bpf_gen *gen, int index)
{
	return gen->fd_array + index * sizeof(int);
}

static int realloc_insn_buf(struct bpf_gen *gen, __u32 size)
{
	size_t off = gen->insn_cur - gen->insn_start;
	void *insn_start;

	if (gen->error)
		return gen->error;
	if (size > INT32_MAX || off + size > INT32_MAX) {
		gen->error = -ERANGE;
		return -ERANGE;
	}
	insn_start = realloc(gen->insn_start, off + size);
	if (!insn_start) {
		gen->error = -ENOMEM;
		free(gen->insn_start);
		gen->insn_start = NULL;
		return -ENOMEM;
	}
	gen->insn_start = insn_start;
	gen->insn_cur = insn_start + off;
	return 0;
}

static int realloc_data_buf(struct bpf_gen *gen, __u32 size)
{
	size_t off = gen->data_cur - gen->data_start;
	void *data_start;

	if (gen->error)
		return gen->error;
	if (size > INT32_MAX || off + size > INT32_MAX) {
		gen->error = -ERANGE;
		return -ERANGE;
	}
	data_start = realloc(gen->data_start, off + size);
	if (!data_start) {
		gen->error = -ENOMEM;
		free(gen->data_start);
		gen->data_start = NULL;
		return -ENOMEM;
	}
	gen->data_start = data_start;
	gen->data_cur = data_start + off;
	return 0;
}

static void emit(struct bpf_gen *gen, struct bpf_insn insn)
{
	if (realloc_insn_buf(gen, sizeof(insn)))
		return;
	memcpy(gen->insn_cur, &insn, sizeof(insn));
	gen->insn_cur += sizeof(insn);
}

static void emit2(struct bpf_gen *gen, struct bpf_insn insn1, struct bpf_insn insn2)
{
	emit(gen, insn1);
	emit(gen, insn2);
}

static int add_data(struct bpf_gen *gen, const void *data, __u32 size);
static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off);
static void emit_signature_match(struct bpf_gen *gen);

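/* The prologue emitted below is, roughly, the following pseudo BPF asm:
 *   r6 = r1                      // save ctx pointer
 *   r1 = r10; r1 += -stack_sz    // r1 = &loader_stack
 *   r2 = stack_sz; r3 = 0
 *   call bpf_probe_read_kernel   // failed read from NULL zero-fills the stack
 *   goto skip_cleanup
 * cleanup:                       // target of emit_check_err() branches
 *   ... close every prog FD and map FD slot, r0 = r7, exit ...
 * skip_cleanup:
 */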
void bpf_gen__init(struct bpf_gen *gen, int log_level, int nr_progs, int nr_maps)
{
	size_t stack_sz = sizeof(struct loader_stack), nr_progs_sz;
	int i;

	gen->fd_array = add_data(gen, NULL, MAX_FD_ARRAY_SZ * sizeof(int));
	gen->log_level = log_level;
	/* save ctx pointer into R6 */
	emit(gen, BPF_MOV64_REG(BPF_REG_6, BPF_REG_1));

	/* bzero stack */
	emit(gen, BPF_MOV64_REG(BPF_REG_1, BPF_REG_10));
	emit(gen, BPF_ALU64_IMM(BPF_ADD, BPF_REG_1, -stack_sz));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, stack_sz));
	emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel));

	/* amount of stack actually used, only used to calculate iterations, not stack offset */
	nr_progs_sz = offsetof(struct loader_stack, prog_fd[nr_progs]);
	/* jump over cleanup code */
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0,
			      /* size of cleanup code below (including map fd cleanup) */
			      (nr_progs_sz / 4) * 3 + 2 +
			      /* 6 insns for emit_sys_close_blob,
			       * 6 insns for debug_regs in emit_sys_close_blob
			       */
			      nr_maps * (6 + (gen->log_level ? 6 : 0))));

	/* remember the label where all error branches will jump to */
	gen->cleanup_label = gen->insn_cur - gen->insn_start;
	/* emit cleanup code: close all temp FDs */
	for (i = 0; i < nr_progs_sz; i += 4) {
		emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, -stack_sz + i));
		emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0, 1));
		emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close));
	}
	for (i = 0; i < nr_maps; i++)
		emit_sys_close_blob(gen, blob_fd_array_off(gen, i));
	/* R7 contains the error code from sys_bpf. Copy it into R0 and exit. */
	emit(gen, BPF_MOV64_REG(BPF_REG_0, BPF_REG_7));
	emit(gen, BPF_EXIT_INSN());
	if (OPTS_GET(gen->opts, gen_hash, false))
		emit_signature_match(gen);
}

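/* Appends size bytes (zero-filled when data is NULL) to the data blob, padded
 * to a multiple of 8, and returns the blob offset of the new chunk. For
 * example, add_data(gen, "GPL", 4) copies the 4-byte string plus 4 bytes of
 * zero padding, while add_data(gen, NULL, 12) reserves 16 zeroed bytes.
 */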
static int add_data(struct bpf_gen *gen, const void *data, __u32 size)
{
	__u32 size8 = roundup(size, 8);
	__u64 zero = 0;
	void *prev;

	if (realloc_data_buf(gen, size8))
		return 0;
	prev = gen->data_cur;
	if (data) {
		memcpy(gen->data_cur, data, size);
		memcpy(gen->data_cur + size, &zero, size8 - size);
	} else {
		memset(gen->data_cur, 0, size8);
	}
	gen->data_cur += size8;
	return prev - gen->data_start;
}

/* Get index for map_fd/btf_fd slot in reserved fd_array, or in data relative
 * to start of fd_array. Caller can decide if it is usable or not.
 */
static int add_map_fd(struct bpf_gen *gen)
{
	if (gen->nr_maps == MAX_USED_MAPS) {
		pr_warn("Total number of maps exceeds %d\n", MAX_USED_MAPS);
		gen->error = -E2BIG;
		return 0;
	}
	return gen->nr_maps++;
}

static int add_kfunc_btf_fd(struct bpf_gen *gen)
{
	int cur;

	if (gen->nr_fd_array == MAX_KFUNC_DESCS) {
		cur = add_data(gen, NULL, sizeof(int));
		return (cur - gen->fd_array) / sizeof(int);
	}
	return MAX_USED_MAPS + gen->nr_fd_array++;
}

static int insn_bytes_to_bpf_size(__u32 sz)
{
	switch (sz) {
	case 8: return BPF_DW;
	case 4: return BPF_W;
	case 2: return BPF_H;
	case 1: return BPF_B;
	default: return -1;
	}
}

/* *(u64 *)(blob + off) = (u64)(void *)(blob + data) */
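/* Roughly, the emitted sequence is:
 *   r0 = <blob base> + data    // ld_imm64 with BPF_PSEUDO_MAP_IDX_VALUE,
 *   r1 = <blob base> + off     // relocated to real addresses at load time
 *   *(u64 *)(r1 + 0) = r0
 */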
static void emit_rel_store(struct bpf_gen *gen, int off, int data)
{
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, data));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, off));
	emit(gen, BPF_STX_MEM(BPF_DW, BPF_REG_1, BPF_REG_0, 0));
}

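/* The move_* helpers below copy a 1/2/4/8-byte scalar between the context
 * (R6), the loader stack (R10) and the data blob. For example,
 * move_stack2ctx(gen, ctx_off, 4, stack_off(prog_fd[0])) copies the first
 * prog FD saved on the stack into the context at ctx_off; see
 * bpf_gen__finish() for real usage.
 */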
static void move_blob2blob(struct bpf_gen *gen, int off, int size, int blob_off)
{
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, blob_off));
	emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_2, 0));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, off));
	emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
}

static void move_blob2ctx(struct bpf_gen *gen, int ctx_off, int size, int blob_off)
{
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, blob_off));
	emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_1, 0));
	emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off));
}

static void move_ctx2blob(struct bpf_gen *gen, int off, int size, int ctx_off,
				   bool check_non_zero)
{
	emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_6, ctx_off));
	if (check_non_zero)
		/* If value in ctx is zero don't update the blob.
		 * For example: when ctx->map.max_entries == 0, keep default max_entries from bpf.c
		 */
		emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_0, 0, 3));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, off));
	emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
}

static void move_stack2blob(struct bpf_gen *gen, int off, int size, int stack_off)
{
	emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, off));
	emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_1, BPF_REG_0, 0));
}

static void move_stack2ctx(struct bpf_gen *gen, int ctx_off, int size, int stack_off)
{
	emit(gen, BPF_LDX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_0, BPF_REG_10, stack_off));
	emit(gen, BPF_STX_MEM(insn_bytes_to_bpf_size(size), BPF_REG_6, BPF_REG_0, ctx_off));
}

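/* Roughly, the emitted sequence is:
 *   r1 = cmd
 *   r2 = <blob base> + attr    // union bpf_attr prepared in the blob
 *   r3 = attr_size
 *   call bpf_sys_bpf
 *   r7 = r0                    // result, consumed by emit_check_err()/debug_ret()
 */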
static void emit_sys_bpf(struct bpf_gen *gen, int cmd, int attr, int attr_size)
{
	emit(gen, BPF_MOV64_IMM(BPF_REG_1, cmd));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_2, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, attr));
	emit(gen, BPF_MOV64_IMM(BPF_REG_3, attr_size));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_bpf));
	/* remember the result in R7 */
	emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
}

static bool is_simm16(__s64 value)
{
	return value == (__s64)(__s16)value;
}

static void emit_check_err(struct bpf_gen *gen)
{
	__s64 off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 1;

	/* R7 contains result of last sys_bpf command.
	 * if (R7 < 0) goto cleanup;
	 */
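	/* off counts 8-byte insns relative to the insn after the branch, hence
	 * the division by 8 and the -1. E.g. a branch emitted 136 bytes past
	 * cleanup_label encodes off = -136 / 8 - 1 = -18, i.e. 17 insns back.
	 */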
	if (is_simm16(off)) {
		emit(gen, BPF_JMP_IMM(BPF_JSLT, BPF_REG_7, 0, off));
	} else {
		gen->error = -ERANGE;
		emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, -1));
	}
}

/* reg1 and reg2 should not be R1 - R5. They can be R0, R6 - R10 */
static void emit_debug(struct bpf_gen *gen, int reg1, int reg2,
		       const char *fmt, va_list args)
{
	char buf[1024];
	int addr, len, ret;

	if (!gen->log_level)
		return;
	ret = vsnprintf(buf, sizeof(buf), fmt, args);
	if (ret < 1024 - 7 && reg1 >= 0 && reg2 < 0)
		/* The special case to accommodate common debug_ret():
		 * to avoid specifying BPF_REG_7 and adding " r=%%d" to
		 * prints explicitly.
		 */
		strcat(buf, " r=%d");
	len = strlen(buf) + 1;
	addr = add_data(gen, buf, len);

	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, addr));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
	if (reg1 >= 0)
		emit(gen, BPF_MOV64_REG(BPF_REG_3, reg1));
	if (reg2 >= 0)
		emit(gen, BPF_MOV64_REG(BPF_REG_4, reg2));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_trace_printk));
}

static void debug_regs(struct bpf_gen *gen, int reg1, int reg2, const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	emit_debug(gen, reg1, reg2, fmt, args);
	va_end(args);
}

static void debug_ret(struct bpf_gen *gen, const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	emit_debug(gen, BPF_REG_7, -1, fmt, args);
	va_end(args);
}

static void __emit_sys_close(struct bpf_gen *gen)
{
	emit(gen, BPF_JMP_IMM(BPF_JSLE, BPF_REG_1, 0,
			      /* 2 is the number of the following insns;
			       * debug_regs adds 6 more insns when logging
			       * is enabled
			       */
			      2 + (gen->log_level ? 6 : 0)));
	emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_1));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_sys_close));
	debug_regs(gen, BPF_REG_9, BPF_REG_0, "close(%%d) = %%d");
}

static void emit_sys_close_stack(struct bpf_gen *gen, int stack_off)
{
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_10, stack_off));
	__emit_sys_close(gen);
}

static void emit_sys_close_blob(struct bpf_gen *gen, int blob_off)
{
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, blob_off));
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_1, BPF_REG_0, 0));
	__emit_sys_close(gen);
}

static int compute_sha_update_offsets(struct bpf_gen *gen);

int bpf_gen__finish(struct bpf_gen *gen, int nr_progs, int nr_maps)
{
	int i;

	if (nr_progs < gen->nr_progs || nr_maps != gen->nr_maps) {
		pr_warn("nr_progs %d/%d nr_maps %d/%d mismatch\n",
			nr_progs, gen->nr_progs, nr_maps, gen->nr_maps);
		gen->error = -EFAULT;
		return gen->error;
	}
	emit_sys_close_stack(gen, stack_off(btf_fd));
	for (i = 0; i < gen->nr_progs; i++)
		move_stack2ctx(gen,
			       sizeof(struct bpf_loader_ctx) +
			       sizeof(struct bpf_map_desc) * gen->nr_maps +
			       sizeof(struct bpf_prog_desc) * i +
			       offsetof(struct bpf_prog_desc, prog_fd), 4,
			       stack_off(prog_fd[i]));
	for (i = 0; i < gen->nr_maps; i++)
		move_blob2ctx(gen,
			      sizeof(struct bpf_loader_ctx) +
			      sizeof(struct bpf_map_desc) * i +
			      offsetof(struct bpf_map_desc, map_fd), 4,
			      blob_fd_array_off(gen, i));
	emit(gen, BPF_MOV64_IMM(BPF_REG_0, 0));
	emit(gen, BPF_EXIT_INSN());
	if (OPTS_GET(gen->opts, gen_hash, false)) {
		gen->error = compute_sha_update_offsets(gen);
		if (gen->error)
			return gen->error;
	}

	pr_debug("gen: finish %s\n", errstr(gen->error));
	if (!gen->error) {
		struct gen_loader_opts *opts = gen->opts;

		opts->insns = gen->insn_start;
		opts->insns_sz = gen->insn_cur - gen->insn_start;
		opts->data = gen->data_start;
		opts->data_sz = gen->data_cur - gen->data_start;

		/* use target endianness for embedded loader */
		if (gen->swapped_endian) {
			struct bpf_insn *insn = (struct bpf_insn *)opts->insns;
			int insn_cnt = opts->insns_sz / sizeof(struct bpf_insn);

			for (i = 0; i < insn_cnt; i++)
				bpf_insn_bswap(insn++);
		}
	}
	return gen->error;
}

void bpf_gen__free(struct bpf_gen *gen)
{
	if (!gen)
		return;
	free(gen->data_start);
	free(gen->insn_start);
	free(gen);
}

/*
 * Fields of bpf_attr are set to values in native byte-order before being
 * written to the target-bound data blob, and may need endian conversion.
 * This macro allows providing the correct value in situ more simply than
 * writing a separate converter for *all fields* of *all records* included
 * in union bpf_attr. Note that sizeof(rval) should match the assignment
 * target to avoid runtime problems.
 */
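/* Usage example: attr.max_entries = tgt_endian(max_entries); stores the value
 * byte-swapped only when the emitted loader targets the opposite endianness,
 * so e.g. a 4-byte 0x00000001 is written out as 0x01000000.
 */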
#define tgt_endian(rval) ({					\
	typeof(rval) _val = (rval);				\
	if (gen->swapped_endian) {				\
		switch (sizeof(_val)) {				\
		case 1: break;					\
		case 2: _val = bswap_16(_val); break;		\
		case 4: _val = bswap_32(_val); break;		\
		case 8: _val = bswap_64(_val); break;		\
		default: pr_warn("unsupported bswap size!\n");	\
		}						\
	}							\
	_val;							\
})

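/* Patch each 64-bit digest word into the ld_imm64 recorded by
 * emit_signature_match(): a BPF ld_imm64 spans two insns, with the low 32 bits
 * of the constant in insn[0].imm and the high 32 bits in insn[1].imm.
 */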
static int compute_sha_update_offsets(struct bpf_gen *gen)
{
	__u64 sha[SHA256_DWORD_SIZE];
	__u64 sha_dw;
	int i, err;

	err = libbpf_sha256(gen->data_start, gen->data_cur - gen->data_start, sha, SHA256_DIGEST_LENGTH);
	if (err < 0) {
		pr_warn("sha256 computation of the metadata failed\n");
		return err;
	}
	for (i = 0; i < SHA256_DWORD_SIZE; i++) {
		struct bpf_insn *insn =
			(struct bpf_insn *)(gen->insn_start + gen->hash_insn_offset[i]);
		sha_dw = tgt_endian(sha[i]);
		insn[0].imm = (__u32)sha_dw;
		insn[1].imm = sha_dw >> 32;
	}
	return 0;
}

void bpf_gen__load_btf(struct bpf_gen *gen, const void *btf_raw_data,
		       __u32 btf_raw_size)
{
	int attr_size = offsetofend(union bpf_attr, btf_log_level);
	int btf_data, btf_load_attr;
	union bpf_attr attr;

	memset(&attr, 0, attr_size);
	btf_data = add_data(gen, btf_raw_data, btf_raw_size);

	attr.btf_size = tgt_endian(btf_raw_size);
	btf_load_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: load_btf: off %d size %d, attr: off %d size %d\n",
		 btf_data, btf_raw_size, btf_load_attr, attr_size);

	/* populate union bpf_attr with user provided log details */
	move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_level), 4,
		      offsetof(struct bpf_loader_ctx, log_level), false);
	move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_size), 4,
		      offsetof(struct bpf_loader_ctx, log_size), false);
	move_ctx2blob(gen, attr_field(btf_load_attr, btf_log_buf), 8,
		      offsetof(struct bpf_loader_ctx, log_buf), false);
	/* populate union bpf_attr with a pointer to the BTF data */
	emit_rel_store(gen, attr_field(btf_load_attr, btf), btf_data);
	/* emit BTF_LOAD command */
	emit_sys_bpf(gen, BPF_BTF_LOAD, btf_load_attr, attr_size);
	debug_ret(gen, "btf_load size %d", btf_raw_size);
	emit_check_err(gen);
	/* remember btf_fd in the stack, if successful */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7, stack_off(btf_fd)));
}

void bpf_gen__map_create(struct bpf_gen *gen,
			 enum bpf_map_type map_type,
			 const char *map_name,
			 __u32 key_size, __u32 value_size, __u32 max_entries,
			 struct bpf_map_create_opts *map_attr, int map_idx)
{
	int attr_size = offsetofend(union bpf_attr, map_extra);
	bool close_inner_map_fd = false;
	int map_create_attr, idx;
	union bpf_attr attr;

	memset(&attr, 0, attr_size);
	attr.map_type = tgt_endian(map_type);
	attr.key_size = tgt_endian(key_size);
	attr.value_size = tgt_endian(value_size);
	attr.map_flags = tgt_endian(map_attr->map_flags);
	attr.map_extra = tgt_endian(map_attr->map_extra);
	if (map_name)
		libbpf_strlcpy(attr.map_name, map_name, sizeof(attr.map_name));
	attr.numa_node = tgt_endian(map_attr->numa_node);
	attr.map_ifindex = tgt_endian(map_attr->map_ifindex);
	attr.max_entries = tgt_endian(max_entries);
	attr.btf_key_type_id = tgt_endian(map_attr->btf_key_type_id);
	attr.btf_value_type_id = tgt_endian(map_attr->btf_value_type_id);

	map_create_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: map_create: %s idx %d type %d value_type_id %d, attr: off %d size %d\n",
		 map_name, map_idx, map_type, map_attr->btf_value_type_id,
		 map_create_attr, attr_size);

	if (map_attr->btf_value_type_id)
		/* populate union bpf_attr with btf_fd saved in the stack earlier */
		move_stack2blob(gen, attr_field(map_create_attr, btf_fd), 4,
				stack_off(btf_fd));
	switch (map_type) {
	case BPF_MAP_TYPE_ARRAY_OF_MAPS:
	case BPF_MAP_TYPE_HASH_OF_MAPS:
		move_stack2blob(gen, attr_field(map_create_attr, inner_map_fd), 4,
				stack_off(inner_map_fd));
		close_inner_map_fd = true;
		break;
	default:
		break;
	}
	/* conditionally update max_entries */
	if (map_idx >= 0)
		move_ctx2blob(gen, attr_field(map_create_attr, max_entries), 4,
			      sizeof(struct bpf_loader_ctx) +
			      sizeof(struct bpf_map_desc) * map_idx +
			      offsetof(struct bpf_map_desc, max_entries),
			      true /* check that max_entries != 0 */);
	/* emit MAP_CREATE command */
	emit_sys_bpf(gen, BPF_MAP_CREATE, map_create_attr, attr_size);
	debug_ret(gen, "map_create %s idx %d type %d value_size %d value_btf_id %d",
		  map_name, map_idx, map_type, value_size,
		  map_attr->btf_value_type_id);
	emit_check_err(gen);
	/* remember map_fd in the stack, if successful */
	if (map_idx < 0) {
		/* This bpf_gen__map_create() function is called with map_idx >= 0
		 * for all maps that libbpf loading logic tracks.
		 * It's called with -1 to create an inner map.
		 */
		emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7,
				      stack_off(inner_map_fd)));
	} else if (map_idx != gen->nr_maps) {
		gen->error = -EDOM; /* internal bug */
		return;
	} else {
		/* add_map_fd does gen->nr_maps++ */
		idx = add_map_fd(gen);
		emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
						 0, 0, 0, blob_fd_array_off(gen, idx)));
		emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_1, BPF_REG_7, 0));
	}
	if (close_inner_map_fd)
		emit_sys_close_stack(gen, stack_off(inner_map_fd));
}

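/* For each 8-byte word of the expected SHA-256 digest, the code emitted below
 * loads the word through the map at fd_array index 0 and compares it against
 * a 64-bit immediate that compute_sha_update_offsets() patches in once the
 * data blob is final; on mismatch R7 is set to -EINVAL and control jumps back
 * to the cleanup label.
 */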
static void emit_signature_match(struct bpf_gen *gen)
{
	__s64 off;
	int i;

	for (i = 0; i < SHA256_DWORD_SIZE; i++) {
		emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX,
						 0, 0, 0, 0));
		emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_2, BPF_REG_1, i * sizeof(__u64)));
		gen->hash_insn_offset[i] = gen->insn_cur - gen->insn_start;
		emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_3, 0, 0, 0, 0, 0));

		off = -(gen->insn_cur - gen->insn_start - gen->cleanup_label) / 8 - 1;
		if (is_simm16(off)) {
			emit(gen, BPF_MOV64_IMM(BPF_REG_7, -EINVAL));
			emit(gen, BPF_JMP_REG(BPF_JNE, BPF_REG_2, BPF_REG_3, off));
		} else {
			gen->error = -ERANGE;
			emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, -1));
		}
	}
}

void bpf_gen__record_attach_target(struct bpf_gen *gen, const char *attach_name,
				   enum bpf_attach_type type)
{
	const char *prefix;
	int kind, ret;

	btf_get_kernel_prefix_kind(type, &prefix, &kind);
	gen->attach_kind = kind;
	ret = snprintf(gen->attach_target, sizeof(gen->attach_target), "%s%s",
		       prefix, attach_name);
	if (ret >= sizeof(gen->attach_target))
		gen->error = -ENOSPC;
}

static void emit_find_attach_target(struct bpf_gen *gen)
{
	int name, len = strlen(gen->attach_target) + 1;

	pr_debug("gen: find_attach_tgt %s %d\n", gen->attach_target, gen->attach_kind);
	name = add_data(gen, gen->attach_target, len);

	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, name));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
	emit(gen, BPF_MOV64_IMM(BPF_REG_3, gen->attach_kind));
	emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind));
	emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
	debug_ret(gen, "find_by_name_kind(%s,%d)",
		  gen->attach_target, gen->attach_kind);
	emit_check_err(gen);
	/* if successful, btf_id is in lower 32-bit of R7 and
	 * btf_obj_fd is in upper 32-bit
	 */
}

void bpf_gen__record_extern(struct bpf_gen *gen, const char *name, bool is_weak,
			    bool is_typeless, bool is_ld64, int kind, int insn_idx)
{
	struct ksym_relo_desc *relo;

	relo = libbpf_reallocarray(gen->relos, gen->relo_cnt + 1, sizeof(*relo));
	if (!relo) {
		gen->error = -ENOMEM;
		return;
	}
	gen->relos = relo;
	relo += gen->relo_cnt;
	relo->name = name;
	relo->is_weak = is_weak;
	relo->is_typeless = is_typeless;
	relo->is_ld64 = is_ld64;
	relo->kind = kind;
	relo->insn_idx = insn_idx;
	gen->relo_cnt++;
}

/* returns existing ksym_desc with ref incremented, or inserts a new one */
static struct ksym_desc *get_ksym_desc(struct bpf_gen *gen, struct ksym_relo_desc *relo)
{
	struct ksym_desc *kdesc;
	int i;

	for (i = 0; i < gen->nr_ksyms; i++) {
		kdesc = &gen->ksyms[i];
		if (kdesc->kind == relo->kind && kdesc->is_ld64 == relo->is_ld64 &&
		    !strcmp(kdesc->name, relo->name)) {
			kdesc->ref++;
			return kdesc;
		}
	}
	kdesc = libbpf_reallocarray(gen->ksyms, gen->nr_ksyms + 1, sizeof(*kdesc));
	if (!kdesc) {
		gen->error = -ENOMEM;
		return NULL;
	}
	gen->ksyms = kdesc;
	kdesc = &gen->ksyms[gen->nr_ksyms++];
	kdesc->name = relo->name;
	kdesc->kind = relo->kind;
	kdesc->ref = 1;
	kdesc->off = 0;
	kdesc->insn = 0;
	kdesc->is_ld64 = relo->is_ld64;
	return kdesc;
}

/* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7}
 * Returns result in BPF_REG_7
 */
static void emit_bpf_find_by_name_kind(struct bpf_gen *gen, struct ksym_relo_desc *relo)
{
	int name_off, len = strlen(relo->name) + 1;

	name_off = add_data(gen, relo->name, len);
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, name_off));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
	emit(gen, BPF_MOV64_IMM(BPF_REG_3, relo->kind));
	emit(gen, BPF_MOV64_IMM(BPF_REG_4, 0));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_btf_find_by_name_kind));
	emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
	debug_ret(gen, "find_by_name_kind(%s,%d)", relo->name, relo->kind);
}

/* Overwrites BPF_REG_{0, 1, 2, 3, 4, 7}
 * Returns result in BPF_REG_7
 * Returns u64 symbol addr in BPF_REG_9
 */
static void emit_bpf_kallsyms_lookup_name(struct bpf_gen *gen, struct ksym_relo_desc *relo)
{
	int name_off, len = strlen(relo->name) + 1, res_off;

	name_off = add_data(gen, relo->name, len);
	res_off = add_data(gen, NULL, 8); /* res is u64 */
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, name_off));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, len));
	emit(gen, BPF_MOV64_IMM(BPF_REG_3, 0));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_4, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, res_off));
	emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_4));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_kallsyms_lookup_name));
	emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_9, BPF_REG_7, 0));
	emit(gen, BPF_MOV64_REG(BPF_REG_7, BPF_REG_0));
	debug_ret(gen, "kallsyms_lookup_name(%s,%d)", relo->name, relo->kind);
}

/* Expects:
 * BPF_REG_8 - pointer to instruction
 *
 * We need to reuse the BTF fd for the same symbol, otherwise each relocation
 * takes a new index, while the kernel limits total kfunc BTFs to 256. For
 * duplicate symbols, this would mean a new BTF fd index for each entry. By
 * pairing symbol name with index, we get the insn->imm, insn->off pairing
 * that the kernel uses for kfunc_tab, which becomes the effective limit even
 * though all of them may share the same index in fd_array (such that
 * kfunc_btf_tab has 1 element).
 */
static void emit_relo_kfunc_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn)
{
	struct ksym_desc *kdesc;
	int btf_fd_idx;

	kdesc = get_ksym_desc(gen, relo);
	if (!kdesc)
		return;
	/* try to copy from existing bpf_insn */
	if (kdesc->ref > 1) {
		move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
			       kdesc->insn + offsetof(struct bpf_insn, imm));
		move_blob2blob(gen, insn + offsetof(struct bpf_insn, off), 2,
			       kdesc->insn + offsetof(struct bpf_insn, off));
		goto log;
	}
	/* remember insn offset, so we can copy BTF ID and FD later */
	kdesc->insn = insn;
	emit_bpf_find_by_name_kind(gen, relo);
	if (!relo->is_weak)
		emit_check_err(gen);
	/* get index in fd_array to store BTF FD at */
	btf_fd_idx = add_kfunc_btf_fd(gen);
	if (btf_fd_idx > INT16_MAX) {
		pr_warn("BTF fd off %d for kfunc %s exceeds INT16_MAX, cannot process relocation\n",
			btf_fd_idx, relo->name);
		gen->error = -E2BIG;
		return;
	}
	kdesc->off = btf_fd_idx;
	/* jump to success case */
	emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3));
	/* set value for imm, off as 0 */
	emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0));
	emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0));
	/* skip success case for ret < 0 */
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 10));
	/* store btf_id into insn[insn_idx].imm */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm)));
	/* obtain fd in BPF_REG_9 */
	emit(gen, BPF_MOV64_REG(BPF_REG_9, BPF_REG_7));
	emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32));
	/* load fd_array slot pointer */
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, blob_fd_array_off(gen, btf_fd_idx)));
	/* store BTF fd in slot, 0 for vmlinux */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_9, 0));
	/* jump to insn[insn_idx].off store if fd denotes module BTF */
	emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_9, 0, 2));
	/* set the default value for off */
	emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), 0));
	/* skip BTF fd store for vmlinux BTF */
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1));
	/* store index into insn[insn_idx].off */
	emit(gen, BPF_ST_MEM(BPF_H, BPF_REG_8, offsetof(struct bpf_insn, off), btf_fd_idx));
log:
	if (!gen->log_level)
		return;
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8,
			      offsetof(struct bpf_insn, imm)));
	emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8,
			      offsetof(struct bpf_insn, off)));
	debug_regs(gen, BPF_REG_7, BPF_REG_9, " func (%s:count=%d): imm: %%d, off: %%d",
		   relo->name, kdesc->ref);
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, blob_fd_array_off(gen, kdesc->off)));
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_9, BPF_REG_0, 0));
	debug_regs(gen, BPF_REG_9, -1, " func (%s:count=%d): btf_fd",
		   relo->name, kdesc->ref);
}

static void emit_ksym_relo_log(struct bpf_gen *gen, struct ksym_relo_desc *relo,
			       int ref)
{
	if (!gen->log_level)
		return;
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_8,
			      offsetof(struct bpf_insn, imm)));
	emit(gen, BPF_LDX_MEM(BPF_H, BPF_REG_9, BPF_REG_8, sizeof(struct bpf_insn) +
			      offsetof(struct bpf_insn, imm)));
	debug_regs(gen, BPF_REG_7, BPF_REG_9, " var t=%d w=%d (%s:count=%d): imm[0]: %%d, imm[1]: %%d",
		   relo->is_typeless, relo->is_weak, relo->name, ref);
	emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code)));
	debug_regs(gen, BPF_REG_9, -1, " var t=%d w=%d (%s:count=%d): insn.reg",
		   relo->is_typeless, relo->is_weak, relo->name, ref);
}

/* Expects:
 * BPF_REG_8 - pointer to instruction
 */
static void emit_relo_ksym_typeless(struct bpf_gen *gen,
				    struct ksym_relo_desc *relo, int insn)
{
	struct ksym_desc *kdesc;

	kdesc = get_ksym_desc(gen, relo);
	if (!kdesc)
		return;
	/* try to copy from existing ldimm64 insn */
	if (kdesc->ref > 1) {
		move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
			       kdesc->insn + offsetof(struct bpf_insn, imm));
		move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4,
			       kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm));
		goto log;
	}
	/* remember insn offset, so we can copy ksym addr later */
	kdesc->insn = insn;
	/* skip typeless ksym_desc in fd closing loop in cleanup_relos */
	kdesc->typeless = true;
	emit_bpf_kallsyms_lookup_name(gen, relo);
	emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_7, -ENOENT, 1));
	emit_check_err(gen);
	/* store lower half of addr into insn[insn_idx].imm */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9, offsetof(struct bpf_insn, imm)));
	/* store upper half of addr into insn[insn_idx + 1].imm */
	emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_9, 32));
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_9,
		      sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)));
log:
	emit_ksym_relo_log(gen, relo, kdesc->ref);
}

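/* The returned mask is ANDed into the byte holding the dst_reg/src_reg
 * nibbles (see clear_src_reg in emit_relo_ksym_btf() below): it zeroes
 * src_reg, dropping BPF_PSEUDO_BTF_ID, while preserving dst_reg. Which nibble
 * src_reg occupies depends on the host's bitfield order and on whether the
 * emitted image is byte-swapped for an opposite-endian target.
 */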
static __u32 src_reg_mask(struct bpf_gen *gen)
{
#if defined(__LITTLE_ENDIAN_BITFIELD) /* src_reg,dst_reg,... */
	return gen->swapped_endian ? 0xf0 : 0x0f;
#elif defined(__BIG_ENDIAN_BITFIELD) /* dst_reg,src_reg,... */
	return gen->swapped_endian ? 0x0f : 0xf0;
#else
#error "Unsupported bit endianness, cannot proceed"
#endif
}

/* Expects:
 * BPF_REG_8 - pointer to instruction
 */
static void emit_relo_ksym_btf(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insn)
{
	struct ksym_desc *kdesc;
	__u32 reg_mask;

	kdesc = get_ksym_desc(gen, relo);
	if (!kdesc)
		return;
	/* try to copy from existing ldimm64 insn */
	if (kdesc->ref > 1) {
		move_blob2blob(gen, insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 4,
			       kdesc->insn + sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm));
		move_blob2blob(gen, insn + offsetof(struct bpf_insn, imm), 4,
			       kdesc->insn + offsetof(struct bpf_insn, imm));
		/* jump over src_reg adjustment if imm (btf_id) is not 0, reuse BPF_REG_0 from move_blob2blob
		 * If btf_id is zero, clear BPF_PSEUDO_BTF_ID flag in src_reg of ld_imm64 insn
		 */
		emit(gen, BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, 3));
		goto clear_src_reg;
	}
	/* remember insn offset, so we can copy BTF ID and FD later */
	kdesc->insn = insn;
	emit_bpf_find_by_name_kind(gen, relo);
	if (!relo->is_weak)
		emit_check_err(gen);
	/* jump to success case */
	emit(gen, BPF_JMP_IMM(BPF_JSGE, BPF_REG_7, 0, 3));
	/* set values for insn[insn_idx].imm, insn[insn_idx + 1].imm as 0 */
	emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, offsetof(struct bpf_insn, imm), 0));
	emit(gen, BPF_ST_MEM(BPF_W, BPF_REG_8, sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm), 0));
	/* skip success case for ret < 0 */
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 4));
	/* store btf_id into insn[insn_idx].imm */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7, offsetof(struct bpf_insn, imm)));
	/* store btf_obj_fd into insn[insn_idx + 1].imm */
	emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32));
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_8, BPF_REG_7,
			      sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm)));
	/* skip src_reg adjustment */
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 3));
clear_src_reg:
	/* clear bpf_object__relocate_data's src_reg assignment, otherwise we get a verifier failure */
	reg_mask = src_reg_mask(gen);
	emit(gen, BPF_LDX_MEM(BPF_B, BPF_REG_9, BPF_REG_8, offsetofend(struct bpf_insn, code)));
	emit(gen, BPF_ALU32_IMM(BPF_AND, BPF_REG_9, reg_mask));
	emit(gen, BPF_STX_MEM(BPF_B, BPF_REG_8, BPF_REG_9, offsetofend(struct bpf_insn, code)));

	emit_ksym_relo_log(gen, relo, kdesc->ref);
}

void bpf_gen__record_relo_core(struct bpf_gen *gen,
			       const struct bpf_core_relo *core_relo)
{
	struct bpf_core_relo *relos;

	relos = libbpf_reallocarray(gen->core_relos, gen->core_relo_cnt + 1, sizeof(*relos));
	if (!relos) {
		gen->error = -ENOMEM;
		return;
	}
	gen->core_relos = relos;
	relos += gen->core_relo_cnt;
	memcpy(relos, core_relo, sizeof(*relos));
	gen->core_relo_cnt++;
}

static void emit_relo(struct bpf_gen *gen, struct ksym_relo_desc *relo, int insns)
{
	int insn;

	pr_debug("gen: emit_relo (%d): %s at %d %s\n",
		 relo->kind, relo->name, relo->insn_idx, relo->is_ld64 ? "ld64" : "call");
	insn = insns + sizeof(struct bpf_insn) * relo->insn_idx;
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_8, BPF_PSEUDO_MAP_IDX_VALUE, 0, 0, 0, insn));
	if (relo->is_ld64) {
		if (relo->is_typeless)
			emit_relo_ksym_typeless(gen, relo, insn);
		else
			emit_relo_ksym_btf(gen, relo, insn);
	} else {
		emit_relo_kfunc_btf(gen, relo, insn);
	}
}

static void emit_relos(struct bpf_gen *gen, int insns)
{
	int i;

	for (i = 0; i < gen->relo_cnt; i++)
		emit_relo(gen, gen->relos + i, insns);
}

static void cleanup_core_relo(struct bpf_gen *gen)
{
	if (!gen->core_relo_cnt)
		return;
	free(gen->core_relos);
	gen->core_relo_cnt = 0;
	gen->core_relos = NULL;
}

static void cleanup_relos(struct bpf_gen *gen, int insns)
{
	struct ksym_desc *kdesc;
	int i, insn;

	for (i = 0; i < gen->nr_ksyms; i++) {
		kdesc = &gen->ksyms[i];
		/* only close fds for typed ksyms and kfuncs */
		if (kdesc->is_ld64 && !kdesc->typeless) {
			/* close fd recorded in insn[insn_idx + 1].imm */
			insn = kdesc->insn;
			insn += sizeof(struct bpf_insn) + offsetof(struct bpf_insn, imm);
			emit_sys_close_blob(gen, insn);
		} else if (!kdesc->is_ld64) {
			emit_sys_close_blob(gen, blob_fd_array_off(gen, kdesc->off));
			if (kdesc->off < MAX_FD_ARRAY_SZ)
				gen->nr_fd_array--;
		}
	}
	if (gen->nr_ksyms) {
		free(gen->ksyms);
		gen->nr_ksyms = 0;
		gen->ksyms = NULL;
	}
	if (gen->relo_cnt) {
		free(gen->relos);
		gen->relo_cnt = 0;
		gen->relos = NULL;
	}
	cleanup_core_relo(gen);
}

/* Convert func, line, and core relo info blobs to target endianness */
static void info_blob_bswap(struct bpf_gen *gen, int func_info, int line_info,
			    int core_relos, struct bpf_prog_load_opts *load_attr)
{
	struct bpf_func_info *fi = gen->data_start + func_info;
	struct bpf_line_info *li = gen->data_start + line_info;
	struct bpf_core_relo *cr = gen->data_start + core_relos;
	int i;

	for (i = 0; i < load_attr->func_info_cnt; i++)
		bpf_func_info_bswap(fi++);

	for (i = 0; i < load_attr->line_info_cnt; i++)
		bpf_line_info_bswap(li++);

	for (i = 0; i < gen->core_relo_cnt; i++)
		bpf_core_relo_bswap(cr++);
}

void bpf_gen__prog_load(struct bpf_gen *gen,
			enum bpf_prog_type prog_type, const char *prog_name,
			const char *license, struct bpf_insn *insns, size_t insn_cnt,
			struct bpf_prog_load_opts *load_attr, int prog_idx)
{
	int func_info_tot_sz = load_attr->func_info_cnt *
			       load_attr->func_info_rec_size;
	int line_info_tot_sz = load_attr->line_info_cnt *
			       load_attr->line_info_rec_size;
	int core_relo_tot_sz = gen->core_relo_cnt *
			       sizeof(struct bpf_core_relo);
	int prog_load_attr, license_off, insns_off, func_info, line_info, core_relos;
	int attr_size = offsetofend(union bpf_attr, core_relo_rec_size);
	union bpf_attr attr;

	memset(&attr, 0, attr_size);
	/* add license string to blob of bytes */
	license_off = add_data(gen, license, strlen(license) + 1);
	/* add insns to blob of bytes */
	insns_off = add_data(gen, insns, insn_cnt * sizeof(struct bpf_insn));
	pr_debug("gen: prog_load: prog_idx %d type %d insn off %d insns_cnt %zd license off %d\n",
		 prog_idx, prog_type, insns_off, insn_cnt, license_off);

	/* convert blob insns to target endianness */
	if (gen->swapped_endian) {
		struct bpf_insn *insn = gen->data_start + insns_off;
		int i;

		for (i = 0; i < insn_cnt; i++, insn++)
			bpf_insn_bswap(insn);
	}

	attr.prog_type = tgt_endian(prog_type);
	attr.expected_attach_type = tgt_endian(load_attr->expected_attach_type);
	attr.attach_btf_id = tgt_endian(load_attr->attach_btf_id);
	attr.prog_ifindex = tgt_endian(load_attr->prog_ifindex);
	attr.kern_version = 0;
	attr.insn_cnt = tgt_endian((__u32)insn_cnt);
	attr.prog_flags = tgt_endian(load_attr->prog_flags);

	attr.func_info_rec_size = tgt_endian(load_attr->func_info_rec_size);
	attr.func_info_cnt = tgt_endian(load_attr->func_info_cnt);
	func_info = add_data(gen, load_attr->func_info, func_info_tot_sz);
	pr_debug("gen: prog_load: func_info: off %d cnt %d rec size %d\n",
		 func_info, load_attr->func_info_cnt,
		 load_attr->func_info_rec_size);

	attr.line_info_rec_size = tgt_endian(load_attr->line_info_rec_size);
	attr.line_info_cnt = tgt_endian(load_attr->line_info_cnt);
	line_info = add_data(gen, load_attr->line_info, line_info_tot_sz);
	pr_debug("gen: prog_load: line_info: off %d cnt %d rec size %d\n",
		 line_info, load_attr->line_info_cnt,
		 load_attr->line_info_rec_size);

	attr.core_relo_rec_size = tgt_endian((__u32)sizeof(struct bpf_core_relo));
	attr.core_relo_cnt = tgt_endian(gen->core_relo_cnt);
	core_relos = add_data(gen, gen->core_relos, core_relo_tot_sz);
	pr_debug("gen: prog_load: core_relos: off %d cnt %d rec size %zd\n",
		 core_relos, gen->core_relo_cnt,
		 sizeof(struct bpf_core_relo));

	/* convert all info blobs to target endianness */
	if (gen->swapped_endian)
		info_blob_bswap(gen, func_info, line_info, core_relos, load_attr);

	libbpf_strlcpy(attr.prog_name, prog_name, sizeof(attr.prog_name));
	prog_load_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: prog_load: attr: off %d size %d\n",
		 prog_load_attr, attr_size);

	/* populate union bpf_attr with a pointer to license */
	emit_rel_store(gen, attr_field(prog_load_attr, license), license_off);

	/* populate union bpf_attr with a pointer to instructions */
	emit_rel_store(gen, attr_field(prog_load_attr, insns), insns_off);

	/* populate union bpf_attr with a pointer to func_info */
	emit_rel_store(gen, attr_field(prog_load_attr, func_info), func_info);

	/* populate union bpf_attr with a pointer to line_info */
	emit_rel_store(gen, attr_field(prog_load_attr, line_info), line_info);

	/* populate union bpf_attr with a pointer to core_relos */
	emit_rel_store(gen, attr_field(prog_load_attr, core_relos), core_relos);

	/* populate union bpf_attr fd_array with a pointer to data where map_fds are saved */
	emit_rel_store(gen, attr_field(prog_load_attr, fd_array), gen->fd_array);

	/* populate union bpf_attr with user provided log details */
	move_ctx2blob(gen, attr_field(prog_load_attr, log_level), 4,
		      offsetof(struct bpf_loader_ctx, log_level), false);
	move_ctx2blob(gen, attr_field(prog_load_attr, log_size), 4,
		      offsetof(struct bpf_loader_ctx, log_size), false);
	move_ctx2blob(gen, attr_field(prog_load_attr, log_buf), 8,
		      offsetof(struct bpf_loader_ctx, log_buf), false);
	/* populate union bpf_attr with btf_fd saved in the stack earlier */
	move_stack2blob(gen, attr_field(prog_load_attr, prog_btf_fd), 4,
			stack_off(btf_fd));
	if (gen->attach_kind) {
		emit_find_attach_target(gen);
		/* populate union bpf_attr with btf_id and btf_obj_fd found by helper */
		emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_0, BPF_PSEUDO_MAP_IDX_VALUE,
						 0, 0, 0, prog_load_attr));
		emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7,
				      offsetof(union bpf_attr, attach_btf_id)));
		emit(gen, BPF_ALU64_IMM(BPF_RSH, BPF_REG_7, 32));
		emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_0, BPF_REG_7,
				      offsetof(union bpf_attr, attach_btf_obj_fd)));
	}
	emit_relos(gen, insns_off);
	/* emit PROG_LOAD command */
	emit_sys_bpf(gen, BPF_PROG_LOAD, prog_load_attr, attr_size);
	debug_ret(gen, "prog_load %s insn_cnt %d", attr.prog_name, attr.insn_cnt);
	/* successful or not, close btf module FDs used in extern ksyms and attach_btf_obj_fd */
	cleanup_relos(gen, insns_off);
	if (gen->attach_kind) {
		emit_sys_close_blob(gen,
				    attr_field(prog_load_attr, attach_btf_obj_fd));
		gen->attach_kind = 0;
	}
	emit_check_err(gen);
	/* remember prog_fd in the stack, if successful */
	emit(gen, BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_7,
			      stack_off(prog_fd[gen->nr_progs])));
	gen->nr_progs++;
}

void bpf_gen__map_update_elem(struct bpf_gen *gen, int map_idx, void *pvalue,
			      __u32 value_size)
{
	int attr_size = offsetofend(union bpf_attr, flags);
	int map_update_attr, value, key;
	union bpf_attr attr;
	int zero = 0;

	memset(&attr, 0, attr_size);

	value = add_data(gen, pvalue, value_size);
	key = add_data(gen, &zero, sizeof(zero));

	/* if (map_desc[map_idx].initial_value) {
	 *    if (ctx->flags & BPF_SKEL_KERNEL)
	 *        bpf_probe_read_kernel(value, value_size, initial_value);
	 *    else
	 *        bpf_copy_from_user(value, value_size, initial_value);
	 * }
	 */
	emit(gen, BPF_LDX_MEM(BPF_DW, BPF_REG_3, BPF_REG_6,
			      sizeof(struct bpf_loader_ctx) +
			      sizeof(struct bpf_map_desc) * map_idx +
			      offsetof(struct bpf_map_desc, initial_value)));
	emit(gen, BPF_JMP_IMM(BPF_JEQ, BPF_REG_3, 0, 8));
	emit2(gen, BPF_LD_IMM64_RAW_FULL(BPF_REG_1, BPF_PSEUDO_MAP_IDX_VALUE,
					 0, 0, 0, value));
	emit(gen, BPF_MOV64_IMM(BPF_REG_2, value_size));
	emit(gen, BPF_LDX_MEM(BPF_W, BPF_REG_0, BPF_REG_6,
			      offsetof(struct bpf_loader_ctx, flags)));
	emit(gen, BPF_JMP_IMM(BPF_JSET, BPF_REG_0, BPF_SKEL_KERNEL, 2));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_copy_from_user));
	emit(gen, BPF_JMP_IMM(BPF_JA, 0, 0, 1));
	emit(gen, BPF_EMIT_CALL(BPF_FUNC_probe_read_kernel));

	map_update_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: map_update_elem: idx %d, value: off %d size %d, attr: off %d size %d\n",
		 map_idx, value, value_size, map_update_attr, attr_size);
	move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4,
		       blob_fd_array_off(gen, map_idx));
	emit_rel_store(gen, attr_field(map_update_attr, key), key);
	emit_rel_store(gen, attr_field(map_update_attr, value), value);
	/* emit MAP_UPDATE_ELEM command */
	emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size);
	debug_ret(gen, "update_elem idx %d value_size %d", map_idx, value_size);
	emit_check_err(gen);
}

void bpf_gen__populate_outer_map(struct bpf_gen *gen, int outer_map_idx, int slot,
				 int inner_map_idx)
{
	int attr_size = offsetofend(union bpf_attr, flags);
	int map_update_attr, key;
	union bpf_attr attr;
	int tgt_slot;

	memset(&attr, 0, attr_size);

	tgt_slot = tgt_endian(slot);
	key = add_data(gen, &tgt_slot, sizeof(tgt_slot));

	map_update_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: populate_outer_map: outer %d key %d inner %d, attr: off %d size %d\n",
		 outer_map_idx, slot, inner_map_idx, map_update_attr, attr_size);
	move_blob2blob(gen, attr_field(map_update_attr, map_fd), 4,
		       blob_fd_array_off(gen, outer_map_idx));
	emit_rel_store(gen, attr_field(map_update_attr, key), key);
	emit_rel_store(gen, attr_field(map_update_attr, value),
		       blob_fd_array_off(gen, inner_map_idx));

	/* emit MAP_UPDATE_ELEM command */
	emit_sys_bpf(gen, BPF_MAP_UPDATE_ELEM, map_update_attr, attr_size);
	debug_ret(gen, "populate_outer_map outer %d key %d inner %d",
		  outer_map_idx, slot, inner_map_idx);
	emit_check_err(gen);
}

void bpf_gen__map_freeze(struct bpf_gen *gen, int map_idx)
{
	int attr_size = offsetofend(union bpf_attr, map_fd);
	int map_freeze_attr;
	union bpf_attr attr;

	memset(&attr, 0, attr_size);
	map_freeze_attr = add_data(gen, &attr, attr_size);
	pr_debug("gen: map_freeze: idx %d, attr: off %d size %d\n",
		 map_idx, map_freeze_attr, attr_size);
	move_blob2blob(gen, attr_field(map_freeze_attr, map_fd), 4,
		       blob_fd_array_off(gen, map_idx));
	/* emit MAP_FREEZE command */
	emit_sys_bpf(gen, BPF_MAP_FREEZE, map_freeze_attr, attr_size);
	debug_ret(gen, "map_freeze");
	emit_check_err(gen);
}
1263