// SPDX-License-Identifier: GPL-2.0 #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "trace_helpers.h" #include #include #include #include "bpf/libbpf_internal.h" #define TRACEFS_PIPE "/sys/kernel/tracing/trace_pipe" #define DEBUGFS_PIPE "/sys/kernel/debug/tracing/trace_pipe" struct ksyms { struct ksym *syms; size_t sym_cap; size_t sym_cnt; }; static struct ksyms *ksyms; static pthread_mutex_t ksyms_mutex = PTHREAD_MUTEX_INITIALIZER; static int ksyms__add_symbol(struct ksyms *ksyms, const char *name, unsigned long addr) { void *tmp; tmp = strdup(name); if (!tmp) return -ENOMEM; ksyms->syms[ksyms->sym_cnt].addr = addr; ksyms->syms[ksyms->sym_cnt].name = tmp; ksyms->sym_cnt++; return 0; } void free_kallsyms_local(struct ksyms *ksyms) { unsigned int i; if (!ksyms) return; if (!ksyms->syms) { free(ksyms); return; } for (i = 0; i < ksyms->sym_cnt; i++) free(ksyms->syms[i].name); free(ksyms->syms); free(ksyms); } static struct ksyms *load_kallsyms_local_common(ksym_cmp_t cmp_cb) { FILE *f; char func[256], buf[256]; char symbol; void *addr; int ret; struct ksyms *ksyms; f = fopen("/proc/kallsyms", "r"); if (!f) return NULL; ksyms = calloc(1, sizeof(struct ksyms)); if (!ksyms) { fclose(f); return NULL; } while (fgets(buf, sizeof(buf), f)) { if (sscanf(buf, "%p %c %s", &addr, &symbol, func) != 3) break; if (!addr) continue; ret = libbpf_ensure_mem((void **) &ksyms->syms, &ksyms->sym_cap, sizeof(struct ksym), ksyms->sym_cnt + 1); if (ret) goto error; ret = ksyms__add_symbol(ksyms, func, (unsigned long)addr); if (ret) goto error; } fclose(f); qsort(ksyms->syms, ksyms->sym_cnt, sizeof(struct ksym), cmp_cb); return ksyms; error: fclose(f); free_kallsyms_local(ksyms); return NULL; } static int ksym_cmp(const void *p1, const void *p2) { return ((struct ksym *)p1)->addr - ((struct ksym *)p2)->addr; } struct ksyms *load_kallsyms_local(void) { return load_kallsyms_local_common(ksym_cmp); } struct ksyms *load_kallsyms_custom_local(ksym_cmp_t cmp_cb) { return load_kallsyms_local_common(cmp_cb); } int load_kallsyms(void) { pthread_mutex_lock(&ksyms_mutex); if (!ksyms) ksyms = load_kallsyms_local(); pthread_mutex_unlock(&ksyms_mutex); return ksyms ? 0 : 1; } struct ksym *ksym_search_local(struct ksyms *ksyms, long key) { int start = 0, end = ksyms->sym_cnt; int result; /* kallsyms not loaded. return NULL */ if (ksyms->sym_cnt <= 0) return NULL; while (start < end) { size_t mid = start + (end - start) / 2; result = key - ksyms->syms[mid].addr; if (result < 0) end = mid; else if (result > 0) start = mid + 1; else return &ksyms->syms[mid]; } if (start >= 1 && ksyms->syms[start - 1].addr < key && key < ksyms->syms[start].addr) /* valid ksym */ return &ksyms->syms[start - 1]; /* out of range. return _stext */ return &ksyms->syms[0]; } struct ksym *search_kallsyms_custom_local(struct ksyms *ksyms, const void *p, ksym_search_cmp_t cmp_cb) { int start = 0, mid, end = ksyms->sym_cnt; struct ksym *ks; int result; while (start < end) { mid = start + (end - start) / 2; ks = &ksyms->syms[mid]; result = cmp_cb(p, ks); if (result < 0) end = mid; else if (result > 0) start = mid + 1; else return ks; } return NULL; } struct ksym *ksym_search(long key) { if (!ksyms) return NULL; return ksym_search_local(ksyms, key); } long ksym_get_addr_local(struct ksyms *ksyms, const char *name) { int i; for (i = 0; i < ksyms->sym_cnt; i++) { if (strcmp(ksyms->syms[i].name, name) == 0) return ksyms->syms[i].addr; } return 0; } long ksym_get_addr(const char *name) { if (!ksyms) return 0; return ksym_get_addr_local(ksyms, name); } /* open kallsyms and read symbol addresses on the fly. Without caching all symbols, * this is faster than load + find. */ int kallsyms_find(const char *sym, unsigned long long *addr) { char type, name[500], *match; unsigned long long value; int err = 0; FILE *f; f = fopen("/proc/kallsyms", "r"); if (!f) return -EINVAL; while (fscanf(f, "%llx %c %499s%*[^\n]\n", &value, &type, name) > 0) { /* If CONFIG_LTO_CLANG_THIN is enabled, static variable/function * symbols could be promoted to global due to cross-file inlining. * For such cases, clang compiler will add .llvm. suffix * to those symbols to avoid potential naming conflict. * Let us ignore .llvm. suffix during symbol comparison. */ if (type == 'd') { match = strstr(name, ".llvm."); if (match) *match = '\0'; } if (strcmp(name, sym) == 0) { *addr = value; goto out; } } err = -ENOENT; out: fclose(f); return err; } #ifdef PROCMAP_QUERY int env_verbosity __weak = 0; static int procmap_query(int fd, const void *addr, __u32 query_flags, size_t *start, size_t *offset, int *flags) { char path_buf[PATH_MAX], build_id_buf[20]; struct procmap_query q; int err; memset(&q, 0, sizeof(q)); q.size = sizeof(q); q.query_flags = query_flags; q.query_addr = (__u64)addr; q.vma_name_addr = (__u64)path_buf; q.vma_name_size = sizeof(path_buf); q.build_id_addr = (__u64)build_id_buf; q.build_id_size = sizeof(build_id_buf); err = ioctl(fd, PROCMAP_QUERY, &q); if (err < 0) { err = -errno; if (err == -ENOTTY) return -EOPNOTSUPP; /* ioctl() not implemented yet */ if (err == -ENOENT) return -ESRCH; /* vma not found */ return err; } if (env_verbosity >= 1) { printf("VMA FOUND (addr %08lx): %08lx-%08lx %c%c%c%c %08lx %02x:%02x %ld %s (build ID: %s, %d bytes)\n", (long)addr, (long)q.vma_start, (long)q.vma_end, (q.vma_flags & PROCMAP_QUERY_VMA_READABLE) ? 'r' : '-', (q.vma_flags & PROCMAP_QUERY_VMA_WRITABLE) ? 'w' : '-', (q.vma_flags & PROCMAP_QUERY_VMA_EXECUTABLE) ? 'x' : '-', (q.vma_flags & PROCMAP_QUERY_VMA_SHARED) ? 's' : 'p', (long)q.vma_offset, q.dev_major, q.dev_minor, (long)q.inode, q.vma_name_size ? path_buf : "", q.build_id_size ? "YES" : "NO", q.build_id_size); } *start = q.vma_start; *offset = q.vma_offset; *flags = q.vma_flags; return 0; } #else static int procmap_query(int fd, const void *addr, __u32 query_flags, size_t *start, size_t *offset, int *flags) { return -EOPNOTSUPP; } #endif ssize_t get_uprobe_offset(const void *addr) { size_t start, base, end; FILE *f; char buf[256]; int err, flags; f = fopen("/proc/self/maps", "r"); if (!f) return -errno; /* requested executable VMA only */ err = procmap_query(fileno(f), addr, PROCMAP_QUERY_VMA_EXECUTABLE, &start, &base, &flags); if (err == -EOPNOTSUPP) { bool found = false; while (fscanf(f, "%zx-%zx %s %zx %*[^\n]\n", &start, &end, buf, &base) == 4) { if (buf[2] == 'x' && (uintptr_t)addr >= start && (uintptr_t)addr < end) { found = true; break; } } if (!found) { fclose(f); return -ESRCH; } } else if (err) { fclose(f); return err; } fclose(f); #if defined(__powerpc64__) && defined(_CALL_ELF) && _CALL_ELF == 2 #define OP_RT_RA_MASK 0xffff0000UL #define LIS_R2 0x3c400000UL #define ADDIS_R2_R12 0x3c4c0000UL #define ADDI_R2_R2 0x38420000UL /* * A PPC64 ABIv2 function may have a local and a global entry * point. We need to use the local entry point when patching * functions, so identify and step over the global entry point * sequence. * * The global entry point sequence is always of the form: * * addis r2,r12,XXXX * addi r2,r2,XXXX * * A linker optimisation may convert the addis to lis: * * lis r2,XXXX * addi r2,r2,XXXX */ { const __u32 *insn = (const __u32 *)(uintptr_t)addr; if ((((*insn & OP_RT_RA_MASK) == ADDIS_R2_R12) || ((*insn & OP_RT_RA_MASK) == LIS_R2)) && ((*(insn + 1) & OP_RT_RA_MASK) == ADDI_R2_R2)) return (uintptr_t)(insn + 2) - start + base; } #endif return (uintptr_t)addr - start + base; } ssize_t get_rel_offset(uintptr_t addr) { size_t start, end, offset; char buf[256]; FILE *f; int err, flags; f = fopen("/proc/self/maps", "r"); if (!f) return -errno; err = procmap_query(fileno(f), (const void *)addr, 0, &start, &offset, &flags); if (err == 0) { fclose(f); return (size_t)addr - start + offset; } else if (err != -EOPNOTSUPP) { fclose(f); return err; } else if (err) { while (fscanf(f, "%zx-%zx %s %zx %*[^\n]\n", &start, &end, buf, &offset) == 4) { if (addr >= start && addr < end) { fclose(f); return (size_t)addr - start + offset; } } } fclose(f); return -EINVAL; } static int parse_build_id_buf(const void *note_start, Elf32_Word note_size, char *build_id) { Elf32_Word note_offs = 0; while (note_offs + sizeof(Elf32_Nhdr) < note_size) { Elf32_Nhdr *nhdr = (Elf32_Nhdr *)(note_start + note_offs); if (nhdr->n_type == 3 && nhdr->n_namesz == sizeof("GNU") && !strcmp((char *)(nhdr + 1), "GNU") && nhdr->n_descsz > 0 && nhdr->n_descsz <= BPF_BUILD_ID_SIZE) { memcpy(build_id, note_start + note_offs + ALIGN(sizeof("GNU"), 4) + sizeof(Elf32_Nhdr), nhdr->n_descsz); memset(build_id + nhdr->n_descsz, 0, BPF_BUILD_ID_SIZE - nhdr->n_descsz); return (int) nhdr->n_descsz; } note_offs = note_offs + sizeof(Elf32_Nhdr) + ALIGN(nhdr->n_namesz, 4) + ALIGN(nhdr->n_descsz, 4); } return -ENOENT; } /* Reads binary from *path* file and returns it in the *build_id* buffer * with *size* which is expected to be at least BPF_BUILD_ID_SIZE bytes. * Returns size of build id on success. On error the error value is * returned. */ int read_build_id(const char *path, char *build_id, size_t size) { int fd, err = -EINVAL; Elf *elf = NULL; GElf_Ehdr ehdr; size_t max, i; if (size < BPF_BUILD_ID_SIZE) return -EINVAL; fd = open(path, O_RDONLY | O_CLOEXEC); if (fd < 0) return -errno; (void)elf_version(EV_CURRENT); elf = elf_begin(fd, ELF_C_READ_MMAP, NULL); if (!elf) goto out; if (elf_kind(elf) != ELF_K_ELF) goto out; if (!gelf_getehdr(elf, &ehdr)) goto out; for (i = 0; i < ehdr.e_phnum; i++) { GElf_Phdr mem, *phdr; char *data; phdr = gelf_getphdr(elf, i, &mem); if (!phdr) goto out; if (phdr->p_type != PT_NOTE) continue; data = elf_rawfile(elf, &max); if (!data) goto out; if (phdr->p_offset + phdr->p_memsz > max) goto out; err = parse_build_id_buf(data + phdr->p_offset, phdr->p_memsz, build_id); if (err > 0) break; } out: if (elf) elf_end(elf); close(fd); return err; } int read_trace_pipe_iter(void (*cb)(const char *str, void *data), void *data, int iter) { size_t buflen, n; char *buf = NULL; FILE *fp = NULL; if (access(TRACEFS_PIPE, F_OK) == 0) fp = fopen(TRACEFS_PIPE, "r"); else fp = fopen(DEBUGFS_PIPE, "r"); if (!fp) return -1; /* We do not want to wait forever when iter is specified. */ if (iter) fcntl(fileno(fp), F_SETFL, O_NONBLOCK); while ((n = getline(&buf, &buflen, fp) >= 0) || errno == EAGAIN) { if (n > 0) cb(buf, data); if (iter && !(--iter)) break; } free(buf); if (fp) fclose(fp); return 0; } static void trace_pipe_cb(const char *str, void *data) { printf("%s", str); } void read_trace_pipe(void) { read_trace_pipe_iter(trace_pipe_cb, NULL, 0); }