| // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause) |
| /* Copyright (c) 2024, Oracle and/or its affiliates. */ |
| |
| #ifndef _GNU_SOURCE |
| #define _GNU_SOURCE |
| #endif |
| |
| #ifdef __KERNEL__ |
| #include <linux/bpf.h> |
| #include <linux/bsearch.h> |
| #include <linux/btf.h> |
| #include <linux/sort.h> |
| #include <linux/string.h> |
| #include <linux/bpf_verifier.h> |
| |
| #define btf_type_by_id (struct btf_type *)btf_type_by_id |
| #define btf__type_cnt btf_nr_types |
| #define btf__base_btf btf_base_btf |
| #define btf__name_by_offset btf_name_by_offset |
| #define btf__str_by_offset btf_str_by_offset |
| #define btf_kflag btf_type_kflag |
| |
| #define calloc(nmemb, sz) kvcalloc(nmemb, sz, GFP_KERNEL | __GFP_NOWARN) |
| #define free(ptr) kvfree(ptr) |
| #define qsort(base, num, sz, cmp) sort(base, num, sz, cmp, NULL) |
| |
| #else |
| |
| #include "btf.h" |
| #include "bpf.h" |
| #include "libbpf.h" |
| #include "libbpf_internal.h" |
| |
| #endif /* __KERNEL__ */ |
| |
| struct btf; |
| |
| struct btf_relocate { |
| struct btf *btf; |
| const struct btf *base_btf; |
| const struct btf *dist_base_btf; |
| unsigned int nr_base_types; |
| unsigned int nr_split_types; |
| unsigned int nr_dist_base_types; |
| int dist_str_len; |
| int base_str_len; |
| __u32 *id_map; |
| __u32 *str_map; |
| }; |
| |
| /* Set temporarily in relocation id_map if distilled base struct/union is |
| * embedded in a split BTF struct/union; in such a case, size information must |
| * match between distilled base BTF and base BTF representation of type. |
| */ |
| #define BTF_IS_EMBEDDED ((__u32)-1) |
| |
| /* <name, size, id> triple used in sorting/searching distilled base BTF. */ |
| struct btf_name_info { |
| const char *name; |
| /* set when search requires a size match */ |
| bool needs_size: 1; |
| unsigned int size: 31; |
| __u32 id; |
| }; |
| |
| static int btf_relocate_rewrite_type_id(struct btf_relocate *r, __u32 i) |
| { |
| struct btf_type *t = btf_type_by_id(r->btf, i); |
| struct btf_field_iter it; |
| __u32 *id; |
| int err; |
| |
| err = btf_field_iter_init(&it, t, BTF_FIELD_ITER_IDS); |
| if (err) |
| return err; |
| |
| while ((id = btf_field_iter_next(&it))) |
| *id = r->id_map[*id]; |
| return 0; |
| } |
| |
| /* Simple string comparison used for sorting within BTF, since all distilled |
| * types are named. If strings match, and size is non-zero for both elements |
| * fall back to using size for ordering. |
| */ |
| static int cmp_btf_name_size(const void *n1, const void *n2) |
| { |
| const struct btf_name_info *ni1 = n1; |
| const struct btf_name_info *ni2 = n2; |
| int name_diff = strcmp(ni1->name, ni2->name); |
| |
| if (!name_diff && ni1->needs_size && ni2->needs_size) |
| return ni2->size - ni1->size; |
| return name_diff; |
| } |
| |
| /* Binary search with a small twist; find leftmost element that matches |
| * so that we can then iterate through all exact matches. So for example |
| * searching { "a", "bb", "bb", "c" } we would always match on the |
| * leftmost "bb". |
| */ |
| static struct btf_name_info *search_btf_name_size(struct btf_name_info *key, |
| struct btf_name_info *vals, |
| int nelems) |
| { |
| struct btf_name_info *ret = NULL; |
| int high = nelems - 1; |
| int low = 0; |
| |
| while (low <= high) { |
| int mid = (low + high)/2; |
| struct btf_name_info *val = &vals[mid]; |
| int diff = cmp_btf_name_size(key, val); |
| |
| if (diff == 0) |
| ret = val; |
| /* even if found, keep searching for leftmost match */ |
| if (diff <= 0) |
| high = mid - 1; |
| else |
| low = mid + 1; |
| } |
| return ret; |
| } |
| |
| /* If a member of a split BTF struct/union refers to a base BTF |
| * struct/union, mark that struct/union id temporarily in the id_map |
| * with BTF_IS_EMBEDDED. Members can be const/restrict/volatile/typedef |
| * reference types, but if a pointer is encountered, the type is no longer |
| * considered embedded. |
| */ |
| static int btf_mark_embedded_composite_type_ids(struct btf_relocate *r, __u32 i) |
| { |
| struct btf_type *t = btf_type_by_id(r->btf, i); |
| struct btf_field_iter it; |
| __u32 *id; |
| int err; |
| |
| if (!btf_is_composite(t)) |
| return 0; |
| |
| err = btf_field_iter_init(&it, t, BTF_FIELD_ITER_IDS); |
| if (err) |
| return err; |
| |
| while ((id = btf_field_iter_next(&it))) { |
| __u32 next_id = *id; |
| |
| while (next_id) { |
| t = btf_type_by_id(r->btf, next_id); |
| switch (btf_kind(t)) { |
| case BTF_KIND_CONST: |
| case BTF_KIND_RESTRICT: |
| case BTF_KIND_VOLATILE: |
| case BTF_KIND_TYPEDEF: |
| case BTF_KIND_TYPE_TAG: |
| next_id = t->type; |
| break; |
| case BTF_KIND_ARRAY: { |
| struct btf_array *a = btf_array(t); |
| |
| next_id = a->type; |
| break; |
| } |
| case BTF_KIND_STRUCT: |
| case BTF_KIND_UNION: |
| if (next_id < r->nr_dist_base_types) |
| r->id_map[next_id] = BTF_IS_EMBEDDED; |
| next_id = 0; |
| break; |
| default: |
| next_id = 0; |
| break; |
| } |
| } |
| } |
| |
| return 0; |
| } |
| |
| /* Build a map from distilled base BTF ids to base BTF ids. To do so, iterate |
| * through base BTF looking up distilled type (using binary search) equivalents. |
| */ |
| static int btf_relocate_map_distilled_base(struct btf_relocate *r) |
| { |
| struct btf_name_info *info, *info_end; |
| struct btf_type *base_t, *dist_t; |
| __u8 *base_name_cnt = NULL; |
| int err = 0; |
| __u32 id; |
| |
| /* generate a sort index array of name/type ids sorted by name for |
| * distilled base BTF to speed name-based lookups. |
| */ |
| info = calloc(r->nr_dist_base_types, sizeof(*info)); |
| if (!info) { |
| err = -ENOMEM; |
| goto done; |
| } |
| info_end = info + r->nr_dist_base_types; |
| for (id = 0; id < r->nr_dist_base_types; id++) { |
| dist_t = btf_type_by_id(r->dist_base_btf, id); |
| info[id].name = btf__name_by_offset(r->dist_base_btf, dist_t->name_off); |
| info[id].id = id; |
| info[id].size = dist_t->size; |
| info[id].needs_size = true; |
| } |
| qsort(info, r->nr_dist_base_types, sizeof(*info), cmp_btf_name_size); |
| |
| /* Mark distilled base struct/union members of split BTF structs/unions |
| * in id_map with BTF_IS_EMBEDDED; this signals that these types |
| * need to match both name and size, otherwise embedding the base |
| * struct/union in the split type is invalid. |
| */ |
| for (id = r->nr_dist_base_types; id < r->nr_split_types; id++) { |
| err = btf_mark_embedded_composite_type_ids(r, id); |
| if (err) |
| goto done; |
| } |
| |
| /* Collect name counts for composite types in base BTF. If multiple |
| * instances of a struct/union of the same name exist, we need to use |
| * size to determine which to map to since name alone is ambiguous. |
| */ |
| base_name_cnt = calloc(r->base_str_len, sizeof(*base_name_cnt)); |
| if (!base_name_cnt) { |
| err = -ENOMEM; |
| goto done; |
| } |
| for (id = 1; id < r->nr_base_types; id++) { |
| base_t = btf_type_by_id(r->base_btf, id); |
| if (!btf_is_composite(base_t) || !base_t->name_off) |
| continue; |
| if (base_name_cnt[base_t->name_off] < 255) |
| base_name_cnt[base_t->name_off]++; |
| } |
| |
| /* Now search base BTF for matching distilled base BTF types. */ |
| for (id = 1; id < r->nr_base_types; id++) { |
| struct btf_name_info *dist_info, base_info = {}; |
| int dist_kind, base_kind; |
| |
| base_t = btf_type_by_id(r->base_btf, id); |
| /* distilled base consists of named types only. */ |
| if (!base_t->name_off) |
| continue; |
| base_kind = btf_kind(base_t); |
| base_info.id = id; |
| base_info.name = btf__name_by_offset(r->base_btf, base_t->name_off); |
| switch (base_kind) { |
| case BTF_KIND_INT: |
| case BTF_KIND_FLOAT: |
| case BTF_KIND_ENUM: |
| case BTF_KIND_ENUM64: |
| /* These types should match both name and size */ |
| base_info.needs_size = true; |
| base_info.size = base_t->size; |
| break; |
| case BTF_KIND_FWD: |
| /* No size considerations for fwds. */ |
| break; |
| case BTF_KIND_STRUCT: |
| case BTF_KIND_UNION: |
| /* Size only needs to be used for struct/union if there |
| * are multiple types in base BTF with the same name. |
| * If there are multiple _distilled_ types with the same |
| * name (a very unlikely scenario), that doesn't matter |
| * unless corresponding _base_ types to match them are |
| * missing. |
| */ |
| base_info.needs_size = base_name_cnt[base_t->name_off] > 1; |
| base_info.size = base_t->size; |
| break; |
| default: |
| continue; |
| } |
| /* iterate over all matching distilled base types */ |
| for (dist_info = search_btf_name_size(&base_info, info, r->nr_dist_base_types); |
| dist_info != NULL && dist_info < info_end && |
| cmp_btf_name_size(&base_info, dist_info) == 0; |
| dist_info++) { |
| if (!dist_info->id || dist_info->id >= r->nr_dist_base_types) { |
| pr_warn("base BTF id [%d] maps to invalid distilled base BTF id [%d]\n", |
| id, dist_info->id); |
| err = -EINVAL; |
| goto done; |
| } |
| dist_t = btf_type_by_id(r->dist_base_btf, dist_info->id); |
| dist_kind = btf_kind(dist_t); |
| |
| /* Validate that the found distilled type is compatible. |
| * Do not error out on mismatch as another match may |
| * occur for an identically-named type. |
| */ |
| switch (dist_kind) { |
| case BTF_KIND_FWD: |
| switch (base_kind) { |
| case BTF_KIND_FWD: |
| if (btf_kflag(dist_t) != btf_kflag(base_t)) |
| continue; |
| break; |
| case BTF_KIND_STRUCT: |
| if (btf_kflag(base_t)) |
| continue; |
| break; |
| case BTF_KIND_UNION: |
| if (!btf_kflag(base_t)) |
| continue; |
| break; |
| default: |
| continue; |
| } |
| break; |
| case BTF_KIND_INT: |
| if (dist_kind != base_kind || |
| btf_int_encoding(base_t) != btf_int_encoding(dist_t)) |
| continue; |
| break; |
| case BTF_KIND_FLOAT: |
| if (dist_kind != base_kind) |
| continue; |
| break; |
| case BTF_KIND_ENUM: |
| /* ENUM and ENUM64 are encoded as sized ENUM in |
| * distilled base BTF. |
| */ |
| if (base_kind != dist_kind && base_kind != BTF_KIND_ENUM64) |
| continue; |
| break; |
| case BTF_KIND_STRUCT: |
| case BTF_KIND_UNION: |
| /* size verification is required for embedded |
| * struct/unions. |
| */ |
| if (r->id_map[dist_info->id] == BTF_IS_EMBEDDED && |
| base_t->size != dist_t->size) |
| continue; |
| break; |
| default: |
| continue; |
| } |
| if (r->id_map[dist_info->id] && |
| r->id_map[dist_info->id] != BTF_IS_EMBEDDED) { |
| /* we already have a match; this tells us that |
| * multiple base types of the same name |
| * have the same size, since for cases where |
| * multiple types have the same name we match |
| * on name and size. In this case, we have |
| * no way of determining which to relocate |
| * to in base BTF, so error out. |
| */ |
| pr_warn("distilled base BTF type '%s' [%u], size %u has multiple candidates of the same size (ids [%u, %u]) in base BTF\n", |
| base_info.name, dist_info->id, |
| base_t->size, id, r->id_map[dist_info->id]); |
| err = -EINVAL; |
| goto done; |
| } |
| /* map id and name */ |
| r->id_map[dist_info->id] = id; |
| r->str_map[dist_t->name_off] = base_t->name_off; |
| } |
| } |
| /* ensure all distilled BTF ids now have a mapping... */ |
| for (id = 1; id < r->nr_dist_base_types; id++) { |
| const char *name; |
| |
| if (r->id_map[id] && r->id_map[id] != BTF_IS_EMBEDDED) |
| continue; |
| dist_t = btf_type_by_id(r->dist_base_btf, id); |
| name = btf__name_by_offset(r->dist_base_btf, dist_t->name_off); |
| pr_warn("distilled base BTF type '%s' [%d] is not mapped to base BTF id\n", |
| name, id); |
| err = -EINVAL; |
| break; |
| } |
| done: |
| free(base_name_cnt); |
| free(info); |
| return err; |
| } |
| |
| /* distilled base should only have named int/float/enum/fwd/struct/union types. */ |
| static int btf_relocate_validate_distilled_base(struct btf_relocate *r) |
| { |
| unsigned int i; |
| |
| for (i = 1; i < r->nr_dist_base_types; i++) { |
| struct btf_type *t = btf_type_by_id(r->dist_base_btf, i); |
| int kind = btf_kind(t); |
| |
| switch (kind) { |
| case BTF_KIND_INT: |
| case BTF_KIND_FLOAT: |
| case BTF_KIND_ENUM: |
| case BTF_KIND_STRUCT: |
| case BTF_KIND_UNION: |
| case BTF_KIND_FWD: |
| if (t->name_off) |
| break; |
| pr_warn("type [%d], kind [%d] is invalid for distilled base BTF; it is anonymous\n", |
| i, kind); |
| return -EINVAL; |
| default: |
| pr_warn("type [%d] in distilled based BTF has unexpected kind [%d]\n", |
| i, kind); |
| return -EINVAL; |
| } |
| } |
| return 0; |
| } |
| |
| static int btf_relocate_rewrite_strs(struct btf_relocate *r, __u32 i) |
| { |
| struct btf_type *t = btf_type_by_id(r->btf, i); |
| struct btf_field_iter it; |
| __u32 *str_off; |
| int off, err; |
| |
| err = btf_field_iter_init(&it, t, BTF_FIELD_ITER_STRS); |
| if (err) |
| return err; |
| |
| while ((str_off = btf_field_iter_next(&it))) { |
| if (!*str_off) |
| continue; |
| if (*str_off >= r->dist_str_len) { |
| *str_off += r->base_str_len - r->dist_str_len; |
| } else { |
| off = r->str_map[*str_off]; |
| if (!off) { |
| pr_warn("string '%s' [offset %u] is not mapped to base BTF", |
| btf__str_by_offset(r->btf, off), *str_off); |
| return -ENOENT; |
| } |
| *str_off = off; |
| } |
| } |
| return 0; |
| } |
| |
| /* If successful, output of relocation is updated BTF with base BTF pointing |
| * at base_btf, and type ids, strings adjusted accordingly. |
| */ |
| int btf_relocate(struct btf *btf, const struct btf *base_btf, __u32 **id_map) |
| { |
| unsigned int nr_types = btf__type_cnt(btf); |
| const struct btf_header *dist_base_hdr; |
| const struct btf_header *base_hdr; |
| struct btf_relocate r = {}; |
| int err = 0; |
| __u32 id, i; |
| |
| r.dist_base_btf = btf__base_btf(btf); |
| if (!base_btf || r.dist_base_btf == base_btf) |
| return -EINVAL; |
| |
| r.nr_dist_base_types = btf__type_cnt(r.dist_base_btf); |
| r.nr_base_types = btf__type_cnt(base_btf); |
| r.nr_split_types = nr_types - r.nr_dist_base_types; |
| r.btf = btf; |
| r.base_btf = base_btf; |
| |
| r.id_map = calloc(nr_types, sizeof(*r.id_map)); |
| r.str_map = calloc(btf_header(r.dist_base_btf)->str_len, sizeof(*r.str_map)); |
| dist_base_hdr = btf_header(r.dist_base_btf); |
| base_hdr = btf_header(r.base_btf); |
| r.dist_str_len = dist_base_hdr->str_len; |
| r.base_str_len = base_hdr->str_len; |
| if (!r.id_map || !r.str_map) { |
| err = -ENOMEM; |
| goto err_out; |
| } |
| |
| err = btf_relocate_validate_distilled_base(&r); |
| if (err) |
| goto err_out; |
| |
| /* Split BTF ids need to be adjusted as base and distilled base |
| * have different numbers of types, changing the start id of split |
| * BTF. |
| */ |
| for (id = r.nr_dist_base_types; id < nr_types; id++) |
| r.id_map[id] = id + r.nr_base_types - r.nr_dist_base_types; |
| |
| /* Build a map from distilled base ids to actual base BTF ids; it is used |
| * to update split BTF id references. Also build a str_map mapping from |
| * distilled base BTF names to base BTF names. |
| */ |
| err = btf_relocate_map_distilled_base(&r); |
| if (err) |
| goto err_out; |
| |
| /* Next, rewrite type ids in split BTF, replacing split ids with updated |
| * ids based on number of types in base BTF, and base ids with |
| * relocated ids from base_btf. |
| */ |
| for (i = 0, id = r.nr_dist_base_types; i < r.nr_split_types; i++, id++) { |
| err = btf_relocate_rewrite_type_id(&r, id); |
| if (err) |
| goto err_out; |
| } |
| /* String offsets now need to be updated using the str_map. */ |
| for (i = 0; i < r.nr_split_types; i++) { |
| err = btf_relocate_rewrite_strs(&r, i + r.nr_dist_base_types); |
| if (err) |
| goto err_out; |
| } |
| /* Finally reset base BTF to be base_btf */ |
| btf_set_base_btf(btf, base_btf); |
| |
| if (id_map) { |
| *id_map = r.id_map; |
| r.id_map = NULL; |
| } |
| err_out: |
| free(r.id_map); |
| free(r.str_map); |
| return err; |
| } |