Commit 1afbcd94 authored by Alexei Starovoitov's avatar Alexei Starovoitov

Merge branch 'generalize-bpf-ksym'

Jiri Olsa says:

====================
this patchset adds trampoline and dispatcher objects
to be visible in /proc/kallsyms.

  $ sudo cat /proc/kallsyms | tail -20
  ...
  ffffffffa050f000 t bpf_prog_5a2b06eab81b8f51    [bpf]
  ffffffffa0511000 t bpf_prog_6deef7357e7b4530    [bpf]
  ffffffffa0542000 t bpf_trampoline_13832 [bpf]
  ffffffffa0548000 t bpf_prog_96f1b5bf4e4cc6dc_mutex_lock [bpf]
  ffffffffa0572000 t bpf_prog_d1c63e29ad82c4ab_bpf_prog1  [bpf]
  ffffffffa0585000 t bpf_prog_e314084d332a5338__dissect   [bpf]
  ffffffffa0587000 t bpf_prog_59785a79eac7e5d2_mutex_unlock       [bpf]
  ffffffffa0589000 t bpf_prog_d0db6e0cac050163_mutex_lock [bpf]
  ffffffffa058d000 t bpf_prog_d8f047721e4d8321_bpf_prog2  [bpf]
  ffffffffa05df000 t bpf_trampoline_25637 [bpf]
  ffffffffa05e3000 t bpf_prog_d8f047721e4d8321_bpf_prog2  [bpf]
  ffffffffa05e5000 t bpf_prog_3b185187f1855c4c    [bpf]
  ffffffffa05e7000 t bpf_prog_d8f047721e4d8321_bpf_prog2  [bpf]
  ffffffffa05eb000 t bpf_prog_93cebb259dd5c4b2_do_sys_open        [bpf]
  ffffffffa0677000 t bpf_dispatcher_xdp   [bpf]

v5 changes:
  - keeping just 1 bpf_tree for all the objects and adding flag
    to recognize bpf_objects when searching for exception tables [Alexei]
  - no need for is_bpf_image_address call in kernel_text_address [Alexei]
  - removed the bpf_image tree, because it's no longer needed

v4 changes:
  - add trampoline and dispatcher to kallsyms once the it's allocated [Alexei]
  - omit the symbols sorting for kallsyms [Alexei]
  - small title change in one patch [Song]
  - some function renames:
     bpf_get_prog_name to bpf_prog_ksym_set_name
     bpf_get_prog_addr_region to bpf_prog_ksym_set_addr
  - added acks to changelogs
  - I checked and there'll be conflict on perftool side with
    upcoming changes from Adrian Hunter (text poke events),
    so I think it's better if Arnaldo takes the perf changes
    via perf tree and we will solve all conflicts there

v3 changes:
  - use container_of directly in bpf_get_ksym_start  [Daniel]
  - add more changelog explanations for ksym addresses [Daniel]

v2 changes:
  - omit extra condition in __bpf_ksym_add for sorting code (Andrii)
  - rename bpf_kallsyms_tree_ops to bpf_ksym_tree (Andrii)
  - expose only executable code in kallsyms (Andrii)
  - use full trampoline key as its kallsyms id (Andrii)
  - explained the BPF_TRAMP_REPLACE case (Andrii)
  - small format changes in bpf_trampoline_link_prog/bpf_trampoline_unlink_prog (Andrii)
  - propagate error value in bpf_dispatcher_update and update kallsym if it's successful (Andrii)
  - get rid of __always_inline for bpf_ksym_tree callbacks (Andrii)
  - added KSYMBOL notification for bpf_image add/removal
  - added perf tools changes to properly display trampoline/dispatcher
====================
Signed-off-by: default avatarAlexei Starovoitov <ast@kernel.org>
parents 98868668 7ac88eba
...@@ -238,7 +238,11 @@ page_table_range_init(unsigned long start, unsigned long end, pgd_t *pgd_base) ...@@ -238,7 +238,11 @@ page_table_range_init(unsigned long start, unsigned long end, pgd_t *pgd_base)
} }
} }
static inline int is_kernel_text(unsigned long addr) /*
* The <linux/kallsyms.h> already defines is_kernel_text,
* using '__' prefix not to get in conflict.
*/
static inline int __is_kernel_text(unsigned long addr)
{ {
if (addr >= (unsigned long)_text && addr <= (unsigned long)__init_end) if (addr >= (unsigned long)_text && addr <= (unsigned long)__init_end)
return 1; return 1;
...@@ -328,8 +332,8 @@ kernel_physical_mapping_init(unsigned long start, ...@@ -328,8 +332,8 @@ kernel_physical_mapping_init(unsigned long start,
addr2 = (pfn + PTRS_PER_PTE-1) * PAGE_SIZE + addr2 = (pfn + PTRS_PER_PTE-1) * PAGE_SIZE +
PAGE_OFFSET + PAGE_SIZE-1; PAGE_OFFSET + PAGE_SIZE-1;
if (is_kernel_text(addr) || if (__is_kernel_text(addr) ||
is_kernel_text(addr2)) __is_kernel_text(addr2))
prot = PAGE_KERNEL_LARGE_EXEC; prot = PAGE_KERNEL_LARGE_EXEC;
pages_2m++; pages_2m++;
...@@ -354,7 +358,7 @@ kernel_physical_mapping_init(unsigned long start, ...@@ -354,7 +358,7 @@ kernel_physical_mapping_init(unsigned long start,
*/ */
pgprot_t init_prot = __pgprot(PTE_IDENT_ATTR); pgprot_t init_prot = __pgprot(PTE_IDENT_ATTR);
if (is_kernel_text(addr)) if (__is_kernel_text(addr))
prot = PAGE_KERNEL_EXEC; prot = PAGE_KERNEL_EXEC;
pages_4k++; pages_4k++;
...@@ -881,7 +885,7 @@ static void mark_nxdata_nx(void) ...@@ -881,7 +885,7 @@ static void mark_nxdata_nx(void)
*/ */
unsigned long start = PFN_ALIGN(_etext); unsigned long start = PFN_ALIGN(_etext);
/* /*
* This comes from is_kernel_text upper limit. Also HPAGE where used: * This comes from __is_kernel_text upper limit. Also HPAGE where used:
*/ */
unsigned long size = (((unsigned long)__init_end + HPAGE_SIZE) & HPAGE_MASK) - start; unsigned long size = (((unsigned long)__init_end + HPAGE_SIZE) & HPAGE_MASK) - start;
......
...@@ -18,6 +18,7 @@ ...@@ -18,6 +18,7 @@
#include <linux/refcount.h> #include <linux/refcount.h>
#include <linux/mutex.h> #include <linux/mutex.h>
#include <linux/module.h> #include <linux/module.h>
#include <linux/kallsyms.h>
struct bpf_verifier_env; struct bpf_verifier_env;
struct bpf_verifier_log; struct bpf_verifier_log;
...@@ -471,6 +472,15 @@ int arch_prepare_bpf_trampoline(void *image, void *image_end, ...@@ -471,6 +472,15 @@ int arch_prepare_bpf_trampoline(void *image, void *image_end,
u64 notrace __bpf_prog_enter(void); u64 notrace __bpf_prog_enter(void);
void notrace __bpf_prog_exit(struct bpf_prog *prog, u64 start); void notrace __bpf_prog_exit(struct bpf_prog *prog, u64 start);
struct bpf_ksym {
unsigned long start;
unsigned long end;
char name[KSYM_NAME_LEN];
struct list_head lnode;
struct latch_tree_node tnode;
bool prog;
};
enum bpf_tramp_prog_type { enum bpf_tramp_prog_type {
BPF_TRAMP_FENTRY, BPF_TRAMP_FENTRY,
BPF_TRAMP_FEXIT, BPF_TRAMP_FEXIT,
...@@ -503,6 +513,7 @@ struct bpf_trampoline { ...@@ -503,6 +513,7 @@ struct bpf_trampoline {
/* Executable image of trampoline */ /* Executable image of trampoline */
void *image; void *image;
u64 selector; u64 selector;
struct bpf_ksym ksym;
}; };
#define BPF_DISPATCHER_MAX 48 /* Fits in 2048B */ #define BPF_DISPATCHER_MAX 48 /* Fits in 2048B */
...@@ -520,9 +531,10 @@ struct bpf_dispatcher { ...@@ -520,9 +531,10 @@ struct bpf_dispatcher {
int num_progs; int num_progs;
void *image; void *image;
u32 image_off; u32 image_off;
struct bpf_ksym ksym;
}; };
static __always_inline unsigned int bpf_dispatcher_nopfunc( static __always_inline unsigned int bpf_dispatcher_nop_func(
const void *ctx, const void *ctx,
const struct bpf_insn *insnsi, const struct bpf_insn *insnsi,
unsigned int (*bpf_func)(const void *, unsigned int (*bpf_func)(const void *,
...@@ -535,17 +547,21 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key); ...@@ -535,17 +547,21 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key);
int bpf_trampoline_link_prog(struct bpf_prog *prog); int bpf_trampoline_link_prog(struct bpf_prog *prog);
int bpf_trampoline_unlink_prog(struct bpf_prog *prog); int bpf_trampoline_unlink_prog(struct bpf_prog *prog);
void bpf_trampoline_put(struct bpf_trampoline *tr); void bpf_trampoline_put(struct bpf_trampoline *tr);
#define BPF_DISPATCHER_INIT(name) { \ #define BPF_DISPATCHER_INIT(_name) { \
.mutex = __MUTEX_INITIALIZER(name.mutex), \ .mutex = __MUTEX_INITIALIZER(_name.mutex), \
.func = &name##func, \ .func = &_name##_func, \
.progs = {}, \ .progs = {}, \
.num_progs = 0, \ .num_progs = 0, \
.image = NULL, \ .image = NULL, \
.image_off = 0 \ .image_off = 0, \
.ksym = { \
.name = #_name, \
.lnode = LIST_HEAD_INIT(_name.ksym.lnode), \
}, \
} }
#define DEFINE_BPF_DISPATCHER(name) \ #define DEFINE_BPF_DISPATCHER(name) \
noinline unsigned int name##func( \ noinline unsigned int bpf_dispatcher_##name##_func( \
const void *ctx, \ const void *ctx, \
const struct bpf_insn *insnsi, \ const struct bpf_insn *insnsi, \
unsigned int (*bpf_func)(const void *, \ unsigned int (*bpf_func)(const void *, \
...@@ -553,26 +569,26 @@ void bpf_trampoline_put(struct bpf_trampoline *tr); ...@@ -553,26 +569,26 @@ void bpf_trampoline_put(struct bpf_trampoline *tr);
{ \ { \
return bpf_func(ctx, insnsi); \ return bpf_func(ctx, insnsi); \
} \ } \
EXPORT_SYMBOL(name##func); \ EXPORT_SYMBOL(bpf_dispatcher_##name##_func); \
struct bpf_dispatcher name = BPF_DISPATCHER_INIT(name); struct bpf_dispatcher bpf_dispatcher_##name = \
BPF_DISPATCHER_INIT(bpf_dispatcher_##name);
#define DECLARE_BPF_DISPATCHER(name) \ #define DECLARE_BPF_DISPATCHER(name) \
unsigned int name##func( \ unsigned int bpf_dispatcher_##name##_func( \
const void *ctx, \ const void *ctx, \
const struct bpf_insn *insnsi, \ const struct bpf_insn *insnsi, \
unsigned int (*bpf_func)(const void *, \ unsigned int (*bpf_func)(const void *, \
const struct bpf_insn *)); \ const struct bpf_insn *)); \
extern struct bpf_dispatcher name; extern struct bpf_dispatcher bpf_dispatcher_##name;
#define BPF_DISPATCHER_FUNC(name) name##func #define BPF_DISPATCHER_FUNC(name) bpf_dispatcher_##name##_func
#define BPF_DISPATCHER_PTR(name) (&name) #define BPF_DISPATCHER_PTR(name) (&bpf_dispatcher_##name)
void bpf_dispatcher_change_prog(struct bpf_dispatcher *d, struct bpf_prog *from, void bpf_dispatcher_change_prog(struct bpf_dispatcher *d, struct bpf_prog *from,
struct bpf_prog *to); struct bpf_prog *to);
struct bpf_image { /* Called only from JIT-enabled code, so there's no need for stubs. */
struct latch_tree_node tnode; void *bpf_jit_alloc_exec_page(void);
unsigned char data[]; void bpf_image_ksym_add(void *data, struct bpf_ksym *ksym);
}; void bpf_image_ksym_del(struct bpf_ksym *ksym);
#define BPF_IMAGE_SIZE (PAGE_SIZE - sizeof(struct bpf_image)) void bpf_ksym_add(struct bpf_ksym *ksym);
bool is_bpf_image_address(unsigned long address); void bpf_ksym_del(struct bpf_ksym *ksym);
void *bpf_image_alloc(void);
#else #else
static inline struct bpf_trampoline *bpf_trampoline_lookup(u64 key) static inline struct bpf_trampoline *bpf_trampoline_lookup(u64 key)
{ {
...@@ -589,7 +605,7 @@ static inline int bpf_trampoline_unlink_prog(struct bpf_prog *prog) ...@@ -589,7 +605,7 @@ static inline int bpf_trampoline_unlink_prog(struct bpf_prog *prog)
static inline void bpf_trampoline_put(struct bpf_trampoline *tr) {} static inline void bpf_trampoline_put(struct bpf_trampoline *tr) {}
#define DEFINE_BPF_DISPATCHER(name) #define DEFINE_BPF_DISPATCHER(name)
#define DECLARE_BPF_DISPATCHER(name) #define DECLARE_BPF_DISPATCHER(name)
#define BPF_DISPATCHER_FUNC(name) bpf_dispatcher_nopfunc #define BPF_DISPATCHER_FUNC(name) bpf_dispatcher_nop_func
#define BPF_DISPATCHER_PTR(name) NULL #define BPF_DISPATCHER_PTR(name) NULL
static inline void bpf_dispatcher_change_prog(struct bpf_dispatcher *d, static inline void bpf_dispatcher_change_prog(struct bpf_dispatcher *d,
struct bpf_prog *from, struct bpf_prog *from,
...@@ -650,8 +666,7 @@ struct bpf_prog_aux { ...@@ -650,8 +666,7 @@ struct bpf_prog_aux {
void *jit_data; /* JIT specific data. arch dependent */ void *jit_data; /* JIT specific data. arch dependent */
struct bpf_jit_poke_descriptor *poke_tab; struct bpf_jit_poke_descriptor *poke_tab;
u32 size_poke_tab; u32 size_poke_tab;
struct latch_tree_node ksym_tnode; struct bpf_ksym ksym;
struct list_head ksym_lnode;
const struct bpf_prog_ops *ops; const struct bpf_prog_ops *ops;
struct bpf_map **used_maps; struct bpf_map **used_maps;
struct bpf_prog *prog; struct bpf_prog *prog;
......
...@@ -577,7 +577,7 @@ DECLARE_STATIC_KEY_FALSE(bpf_stats_enabled_key); ...@@ -577,7 +577,7 @@ DECLARE_STATIC_KEY_FALSE(bpf_stats_enabled_key);
ret; }) ret; })
#define BPF_PROG_RUN(prog, ctx) \ #define BPF_PROG_RUN(prog, ctx) \
__BPF_PROG_RUN(prog, ctx, bpf_dispatcher_nopfunc) __BPF_PROG_RUN(prog, ctx, bpf_dispatcher_nop_func)
/* /*
* Use in preemptible and therefore migratable context to make sure that * Use in preemptible and therefore migratable context to make sure that
...@@ -596,7 +596,7 @@ static inline u32 bpf_prog_run_pin_on_cpu(const struct bpf_prog *prog, ...@@ -596,7 +596,7 @@ static inline u32 bpf_prog_run_pin_on_cpu(const struct bpf_prog *prog,
u32 ret; u32 ret;
migrate_disable(); migrate_disable();
ret = __BPF_PROG_RUN(prog, ctx, bpf_dispatcher_nopfunc); ret = __BPF_PROG_RUN(prog, ctx, bpf_dispatcher_nop_func);
migrate_enable(); migrate_enable();
return ret; return ret;
} }
...@@ -722,7 +722,7 @@ static inline u32 bpf_prog_run_clear_cb(const struct bpf_prog *prog, ...@@ -722,7 +722,7 @@ static inline u32 bpf_prog_run_clear_cb(const struct bpf_prog *prog,
return res; return res;
} }
DECLARE_BPF_DISPATCHER(bpf_dispatcher_xdp) DECLARE_BPF_DISPATCHER(xdp)
static __always_inline u32 bpf_prog_run_xdp(const struct bpf_prog *prog, static __always_inline u32 bpf_prog_run_xdp(const struct bpf_prog *prog,
struct xdp_buff *xdp) struct xdp_buff *xdp)
...@@ -733,8 +733,7 @@ static __always_inline u32 bpf_prog_run_xdp(const struct bpf_prog *prog, ...@@ -733,8 +733,7 @@ static __always_inline u32 bpf_prog_run_xdp(const struct bpf_prog *prog,
* already takes rcu_read_lock() when fetching the program, so * already takes rcu_read_lock() when fetching the program, so
* it's not necessary here anymore. * it's not necessary here anymore.
*/ */
return __BPF_PROG_RUN(prog, xdp, return __BPF_PROG_RUN(prog, xdp, BPF_DISPATCHER_FUNC(xdp));
BPF_DISPATCHER_FUNC(bpf_dispatcher_xdp));
} }
void bpf_prog_change_xdp(struct bpf_prog *prev_prog, struct bpf_prog *prog); void bpf_prog_change_xdp(struct bpf_prog *prev_prog, struct bpf_prog *prog);
...@@ -1084,7 +1083,6 @@ bpf_address_lookup(unsigned long addr, unsigned long *size, ...@@ -1084,7 +1083,6 @@ bpf_address_lookup(unsigned long addr, unsigned long *size,
void bpf_prog_kallsyms_add(struct bpf_prog *fp); void bpf_prog_kallsyms_add(struct bpf_prog *fp);
void bpf_prog_kallsyms_del(struct bpf_prog *fp); void bpf_prog_kallsyms_del(struct bpf_prog *fp);
void bpf_get_prog_name(const struct bpf_prog *prog, char *sym);
#else /* CONFIG_BPF_JIT */ #else /* CONFIG_BPF_JIT */
...@@ -1153,11 +1151,6 @@ static inline void bpf_prog_kallsyms_del(struct bpf_prog *fp) ...@@ -1153,11 +1151,6 @@ static inline void bpf_prog_kallsyms_del(struct bpf_prog *fp)
{ {
} }
static inline void bpf_get_prog_name(const struct bpf_prog *prog, char *sym)
{
sym[0] = '\0';
}
#endif /* CONFIG_BPF_JIT */ #endif /* CONFIG_BPF_JIT */
void bpf_prog_kallsyms_del_all(struct bpf_prog *fp); void bpf_prog_kallsyms_del_all(struct bpf_prog *fp);
......
...@@ -97,7 +97,7 @@ struct bpf_prog *bpf_prog_alloc_no_stats(unsigned int size, gfp_t gfp_extra_flag ...@@ -97,7 +97,7 @@ struct bpf_prog *bpf_prog_alloc_no_stats(unsigned int size, gfp_t gfp_extra_flag
fp->aux->prog = fp; fp->aux->prog = fp;
fp->jit_requested = ebpf_jit_enabled(); fp->jit_requested = ebpf_jit_enabled();
INIT_LIST_HEAD_RCU(&fp->aux->ksym_lnode); INIT_LIST_HEAD_RCU(&fp->aux->ksym.lnode);
return fp; return fp;
} }
...@@ -523,22 +523,22 @@ int bpf_jit_kallsyms __read_mostly = IS_BUILTIN(CONFIG_BPF_JIT_DEFAULT_ON); ...@@ -523,22 +523,22 @@ int bpf_jit_kallsyms __read_mostly = IS_BUILTIN(CONFIG_BPF_JIT_DEFAULT_ON);
int bpf_jit_harden __read_mostly; int bpf_jit_harden __read_mostly;
long bpf_jit_limit __read_mostly; long bpf_jit_limit __read_mostly;
static __always_inline void static void
bpf_get_prog_addr_region(const struct bpf_prog *prog, bpf_prog_ksym_set_addr(struct bpf_prog *prog)
unsigned long *symbol_start,
unsigned long *symbol_end)
{ {
const struct bpf_binary_header *hdr = bpf_jit_binary_hdr(prog); const struct bpf_binary_header *hdr = bpf_jit_binary_hdr(prog);
unsigned long addr = (unsigned long)hdr; unsigned long addr = (unsigned long)hdr;
WARN_ON_ONCE(!bpf_prog_ebpf_jited(prog)); WARN_ON_ONCE(!bpf_prog_ebpf_jited(prog));
*symbol_start = addr; prog->aux->ksym.start = (unsigned long) prog->bpf_func;
*symbol_end = addr + hdr->pages * PAGE_SIZE; prog->aux->ksym.end = addr + hdr->pages * PAGE_SIZE;
} }
void bpf_get_prog_name(const struct bpf_prog *prog, char *sym) static void
bpf_prog_ksym_set_name(struct bpf_prog *prog)
{ {
char *sym = prog->aux->ksym.name;
const char *end = sym + KSYM_NAME_LEN; const char *end = sym + KSYM_NAME_LEN;
const struct btf_type *type; const struct btf_type *type;
const char *func_name; const char *func_name;
...@@ -572,36 +572,27 @@ void bpf_get_prog_name(const struct bpf_prog *prog, char *sym) ...@@ -572,36 +572,27 @@ void bpf_get_prog_name(const struct bpf_prog *prog, char *sym)
*sym = 0; *sym = 0;
} }
static __always_inline unsigned long static unsigned long bpf_get_ksym_start(struct latch_tree_node *n)
bpf_get_prog_addr_start(struct latch_tree_node *n)
{ {
unsigned long symbol_start, symbol_end; return container_of(n, struct bpf_ksym, tnode)->start;
const struct bpf_prog_aux *aux;
aux = container_of(n, struct bpf_prog_aux, ksym_tnode);
bpf_get_prog_addr_region(aux->prog, &symbol_start, &symbol_end);
return symbol_start;
} }
static __always_inline bool bpf_tree_less(struct latch_tree_node *a, static __always_inline bool bpf_tree_less(struct latch_tree_node *a,
struct latch_tree_node *b) struct latch_tree_node *b)
{ {
return bpf_get_prog_addr_start(a) < bpf_get_prog_addr_start(b); return bpf_get_ksym_start(a) < bpf_get_ksym_start(b);
} }
static __always_inline int bpf_tree_comp(void *key, struct latch_tree_node *n) static __always_inline int bpf_tree_comp(void *key, struct latch_tree_node *n)
{ {
unsigned long val = (unsigned long)key; unsigned long val = (unsigned long)key;
unsigned long symbol_start, symbol_end; const struct bpf_ksym *ksym;
const struct bpf_prog_aux *aux;
aux = container_of(n, struct bpf_prog_aux, ksym_tnode); ksym = container_of(n, struct bpf_ksym, tnode);
bpf_get_prog_addr_region(aux->prog, &symbol_start, &symbol_end);
if (val < symbol_start) if (val < ksym->start)
return -1; return -1;
if (val >= symbol_end) if (val >= ksym->end)
return 1; return 1;
return 0; return 0;
...@@ -616,20 +607,29 @@ static DEFINE_SPINLOCK(bpf_lock); ...@@ -616,20 +607,29 @@ static DEFINE_SPINLOCK(bpf_lock);
static LIST_HEAD(bpf_kallsyms); static LIST_HEAD(bpf_kallsyms);
static struct latch_tree_root bpf_tree __cacheline_aligned; static struct latch_tree_root bpf_tree __cacheline_aligned;
static void bpf_prog_ksym_node_add(struct bpf_prog_aux *aux) void bpf_ksym_add(struct bpf_ksym *ksym)
{ {
WARN_ON_ONCE(!list_empty(&aux->ksym_lnode)); spin_lock_bh(&bpf_lock);
list_add_tail_rcu(&aux->ksym_lnode, &bpf_kallsyms); WARN_ON_ONCE(!list_empty(&ksym->lnode));
latch_tree_insert(&aux->ksym_tnode, &bpf_tree, &bpf_tree_ops); list_add_tail_rcu(&ksym->lnode, &bpf_kallsyms);
latch_tree_insert(&ksym->tnode, &bpf_tree, &bpf_tree_ops);
spin_unlock_bh(&bpf_lock);
} }
static void bpf_prog_ksym_node_del(struct bpf_prog_aux *aux) static void __bpf_ksym_del(struct bpf_ksym *ksym)
{ {
if (list_empty(&aux->ksym_lnode)) if (list_empty(&ksym->lnode))
return; return;
latch_tree_erase(&aux->ksym_tnode, &bpf_tree, &bpf_tree_ops); latch_tree_erase(&ksym->tnode, &bpf_tree, &bpf_tree_ops);
list_del_rcu(&aux->ksym_lnode); list_del_rcu(&ksym->lnode);
}
void bpf_ksym_del(struct bpf_ksym *ksym)
{
spin_lock_bh(&bpf_lock);
__bpf_ksym_del(ksym);
spin_unlock_bh(&bpf_lock);
} }
static bool bpf_prog_kallsyms_candidate(const struct bpf_prog *fp) static bool bpf_prog_kallsyms_candidate(const struct bpf_prog *fp)
...@@ -639,8 +639,8 @@ static bool bpf_prog_kallsyms_candidate(const struct bpf_prog *fp) ...@@ -639,8 +639,8 @@ static bool bpf_prog_kallsyms_candidate(const struct bpf_prog *fp)
static bool bpf_prog_kallsyms_verify_off(const struct bpf_prog *fp) static bool bpf_prog_kallsyms_verify_off(const struct bpf_prog *fp)
{ {
return list_empty(&fp->aux->ksym_lnode) || return list_empty(&fp->aux->ksym.lnode) ||
fp->aux->ksym_lnode.prev == LIST_POISON2; fp->aux->ksym.lnode.prev == LIST_POISON2;
} }
void bpf_prog_kallsyms_add(struct bpf_prog *fp) void bpf_prog_kallsyms_add(struct bpf_prog *fp)
...@@ -649,9 +649,11 @@ void bpf_prog_kallsyms_add(struct bpf_prog *fp) ...@@ -649,9 +649,11 @@ void bpf_prog_kallsyms_add(struct bpf_prog *fp)
!capable(CAP_SYS_ADMIN)) !capable(CAP_SYS_ADMIN))
return; return;
spin_lock_bh(&bpf_lock); bpf_prog_ksym_set_addr(fp);
bpf_prog_ksym_node_add(fp->aux); bpf_prog_ksym_set_name(fp);
spin_unlock_bh(&bpf_lock); fp->aux->ksym.prog = true;
bpf_ksym_add(&fp->aux->ksym);
} }
void bpf_prog_kallsyms_del(struct bpf_prog *fp) void bpf_prog_kallsyms_del(struct bpf_prog *fp)
...@@ -659,33 +661,30 @@ void bpf_prog_kallsyms_del(struct bpf_prog *fp) ...@@ -659,33 +661,30 @@ void bpf_prog_kallsyms_del(struct bpf_prog *fp)
if (!bpf_prog_kallsyms_candidate(fp)) if (!bpf_prog_kallsyms_candidate(fp))
return; return;
spin_lock_bh(&bpf_lock); bpf_ksym_del(&fp->aux->ksym);
bpf_prog_ksym_node_del(fp->aux);
spin_unlock_bh(&bpf_lock);
} }
static struct bpf_prog *bpf_prog_kallsyms_find(unsigned long addr) static struct bpf_ksym *bpf_ksym_find(unsigned long addr)
{ {
struct latch_tree_node *n; struct latch_tree_node *n;
n = latch_tree_find((void *)addr, &bpf_tree, &bpf_tree_ops); n = latch_tree_find((void *)addr, &bpf_tree, &bpf_tree_ops);
return n ? return n ? container_of(n, struct bpf_ksym, tnode) : NULL;
container_of(n, struct bpf_prog_aux, ksym_tnode)->prog :
NULL;
} }
const char *__bpf_address_lookup(unsigned long addr, unsigned long *size, const char *__bpf_address_lookup(unsigned long addr, unsigned long *size,
unsigned long *off, char *sym) unsigned long *off, char *sym)
{ {
unsigned long symbol_start, symbol_end; struct bpf_ksym *ksym;
struct bpf_prog *prog;
char *ret = NULL; char *ret = NULL;
rcu_read_lock(); rcu_read_lock();
prog = bpf_prog_kallsyms_find(addr); ksym = bpf_ksym_find(addr);
if (prog) { if (ksym) {
bpf_get_prog_addr_region(prog, &symbol_start, &symbol_end); unsigned long symbol_start = ksym->start;
bpf_get_prog_name(prog, sym); unsigned long symbol_end = ksym->end;
strncpy(sym, ksym->name, KSYM_NAME_LEN);
ret = sym; ret = sym;
if (size) if (size)
...@@ -703,19 +702,28 @@ bool is_bpf_text_address(unsigned long addr) ...@@ -703,19 +702,28 @@ bool is_bpf_text_address(unsigned long addr)
bool ret; bool ret;
rcu_read_lock(); rcu_read_lock();
ret = bpf_prog_kallsyms_find(addr) != NULL; ret = bpf_ksym_find(addr) != NULL;
rcu_read_unlock(); rcu_read_unlock();
return ret; return ret;
} }
static struct bpf_prog *bpf_prog_ksym_find(unsigned long addr)
{
struct bpf_ksym *ksym = bpf_ksym_find(addr);
return ksym && ksym->prog ?
container_of(ksym, struct bpf_prog_aux, ksym)->prog :
NULL;
}
const struct exception_table_entry *search_bpf_extables(unsigned long addr) const struct exception_table_entry *search_bpf_extables(unsigned long addr)
{ {
const struct exception_table_entry *e = NULL; const struct exception_table_entry *e = NULL;
struct bpf_prog *prog; struct bpf_prog *prog;
rcu_read_lock(); rcu_read_lock();
prog = bpf_prog_kallsyms_find(addr); prog = bpf_prog_ksym_find(addr);
if (!prog) if (!prog)
goto out; goto out;
if (!prog->aux->num_exentries) if (!prog->aux->num_exentries)
...@@ -730,7 +738,7 @@ const struct exception_table_entry *search_bpf_extables(unsigned long addr) ...@@ -730,7 +738,7 @@ const struct exception_table_entry *search_bpf_extables(unsigned long addr)
int bpf_get_kallsym(unsigned int symnum, unsigned long *value, char *type, int bpf_get_kallsym(unsigned int symnum, unsigned long *value, char *type,
char *sym) char *sym)
{ {
struct bpf_prog_aux *aux; struct bpf_ksym *ksym;
unsigned int it = 0; unsigned int it = 0;
int ret = -ERANGE; int ret = -ERANGE;
...@@ -738,13 +746,13 @@ int bpf_get_kallsym(unsigned int symnum, unsigned long *value, char *type, ...@@ -738,13 +746,13 @@ int bpf_get_kallsym(unsigned int symnum, unsigned long *value, char *type,
return ret; return ret;
rcu_read_lock(); rcu_read_lock();
list_for_each_entry_rcu(aux, &bpf_kallsyms, ksym_lnode) { list_for_each_entry_rcu(ksym, &bpf_kallsyms, lnode) {
if (it++ != symnum) if (it++ != symnum)
continue; continue;
bpf_get_prog_name(aux->prog, sym); strncpy(sym, ksym->name, KSYM_NAME_LEN);
*value = (unsigned long)aux->prog->bpf_func; *value = ksym->start;
*type = BPF_SYM_ELF_TYPE; *type = BPF_SYM_ELF_TYPE;
ret = 0; ret = 0;
......
...@@ -113,7 +113,7 @@ static void bpf_dispatcher_update(struct bpf_dispatcher *d, int prev_num_progs) ...@@ -113,7 +113,7 @@ static void bpf_dispatcher_update(struct bpf_dispatcher *d, int prev_num_progs)
noff = 0; noff = 0;
} else { } else {
old = d->image + d->image_off; old = d->image + d->image_off;
noff = d->image_off ^ (BPF_IMAGE_SIZE / 2); noff = d->image_off ^ (PAGE_SIZE / 2);
} }
new = d->num_progs ? d->image + noff : NULL; new = d->num_progs ? d->image + noff : NULL;
...@@ -140,9 +140,10 @@ void bpf_dispatcher_change_prog(struct bpf_dispatcher *d, struct bpf_prog *from, ...@@ -140,9 +140,10 @@ void bpf_dispatcher_change_prog(struct bpf_dispatcher *d, struct bpf_prog *from,
mutex_lock(&d->mutex); mutex_lock(&d->mutex);
if (!d->image) { if (!d->image) {
d->image = bpf_image_alloc(); d->image = bpf_jit_alloc_exec_page();
if (!d->image) if (!d->image)
goto out; goto out;
bpf_image_ksym_add(d->image, &d->ksym);
} }
prev_num_progs = d->num_progs; prev_num_progs = d->num_progs;
......
...@@ -5,6 +5,7 @@ ...@@ -5,6 +5,7 @@
#include <linux/filter.h> #include <linux/filter.h>
#include <linux/ftrace.h> #include <linux/ftrace.h>
#include <linux/rbtree_latch.h> #include <linux/rbtree_latch.h>
#include <linux/perf_event.h>
/* dummy _ops. The verifier will operate on target program's ops. */ /* dummy _ops. The verifier will operate on target program's ops. */
const struct bpf_verifier_ops bpf_extension_verifier_ops = { const struct bpf_verifier_ops bpf_extension_verifier_ops = {
...@@ -17,12 +18,11 @@ const struct bpf_prog_ops bpf_extension_prog_ops = { ...@@ -17,12 +18,11 @@ const struct bpf_prog_ops bpf_extension_prog_ops = {
#define TRAMPOLINE_TABLE_SIZE (1 << TRAMPOLINE_HASH_BITS) #define TRAMPOLINE_TABLE_SIZE (1 << TRAMPOLINE_HASH_BITS)
static struct hlist_head trampoline_table[TRAMPOLINE_TABLE_SIZE]; static struct hlist_head trampoline_table[TRAMPOLINE_TABLE_SIZE];
static struct latch_tree_root image_tree __cacheline_aligned;
/* serializes access to trampoline_table and image_tree */ /* serializes access to trampoline_table */
static DEFINE_MUTEX(trampoline_mutex); static DEFINE_MUTEX(trampoline_mutex);
static void *bpf_jit_alloc_exec_page(void) void *bpf_jit_alloc_exec_page(void)
{ {
void *image; void *image;
...@@ -38,62 +38,28 @@ static void *bpf_jit_alloc_exec_page(void) ...@@ -38,62 +38,28 @@ static void *bpf_jit_alloc_exec_page(void)
return image; return image;
} }
static __always_inline bool image_tree_less(struct latch_tree_node *a, void bpf_image_ksym_add(void *data, struct bpf_ksym *ksym)
struct latch_tree_node *b)
{ {
struct bpf_image *ia = container_of(a, struct bpf_image, tnode); ksym->start = (unsigned long) data;
struct bpf_image *ib = container_of(b, struct bpf_image, tnode); ksym->end = ksym->start + PAGE_SIZE;
bpf_ksym_add(ksym);
return ia < ib; perf_event_ksymbol(PERF_RECORD_KSYMBOL_TYPE_BPF, ksym->start,
} PAGE_SIZE, false, ksym->name);
static __always_inline int image_tree_comp(void *addr, struct latch_tree_node *n)
{
void *image = container_of(n, struct bpf_image, tnode);
if (addr < image)
return -1;
if (addr >= image + PAGE_SIZE)
return 1;
return 0;
}
static const struct latch_tree_ops image_tree_ops = {
.less = image_tree_less,
.comp = image_tree_comp,
};
static void *__bpf_image_alloc(bool lock)
{
struct bpf_image *image;
image = bpf_jit_alloc_exec_page();
if (!image)
return NULL;
if (lock)
mutex_lock(&trampoline_mutex);
latch_tree_insert(&image->tnode, &image_tree, &image_tree_ops);
if (lock)
mutex_unlock(&trampoline_mutex);
return image->data;
} }
void *bpf_image_alloc(void) void bpf_image_ksym_del(struct bpf_ksym *ksym)
{ {
return __bpf_image_alloc(true); bpf_ksym_del(ksym);
perf_event_ksymbol(PERF_RECORD_KSYMBOL_TYPE_BPF, ksym->start,
PAGE_SIZE, true, ksym->name);
} }
bool is_bpf_image_address(unsigned long addr) static void bpf_trampoline_ksym_add(struct bpf_trampoline *tr)
{ {
bool ret; struct bpf_ksym *ksym = &tr->ksym;
rcu_read_lock(); snprintf(ksym->name, KSYM_NAME_LEN, "bpf_trampoline_%llu", tr->key);
ret = latch_tree_find((void *) addr, &image_tree, &image_tree_ops) != NULL; bpf_image_ksym_add(tr->image, ksym);
rcu_read_unlock();
return ret;
} }
struct bpf_trampoline *bpf_trampoline_lookup(u64 key) struct bpf_trampoline *bpf_trampoline_lookup(u64 key)
...@@ -116,7 +82,7 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key) ...@@ -116,7 +82,7 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key)
goto out; goto out;
/* is_root was checked earlier. No need for bpf_jit_charge_modmem() */ /* is_root was checked earlier. No need for bpf_jit_charge_modmem() */
image = __bpf_image_alloc(false); image = bpf_jit_alloc_exec_page();
if (!image) { if (!image) {
kfree(tr); kfree(tr);
tr = NULL; tr = NULL;
...@@ -131,6 +97,8 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key) ...@@ -131,6 +97,8 @@ struct bpf_trampoline *bpf_trampoline_lookup(u64 key)
for (i = 0; i < BPF_TRAMP_MAX; i++) for (i = 0; i < BPF_TRAMP_MAX; i++)
INIT_HLIST_HEAD(&tr->progs_hlist[i]); INIT_HLIST_HEAD(&tr->progs_hlist[i]);
tr->image = image; tr->image = image;
INIT_LIST_HEAD_RCU(&tr->ksym.lnode);
bpf_trampoline_ksym_add(tr);
out: out:
mutex_unlock(&trampoline_mutex); mutex_unlock(&trampoline_mutex);
return tr; return tr;
...@@ -216,8 +184,8 @@ bpf_trampoline_get_progs(const struct bpf_trampoline *tr, int *total) ...@@ -216,8 +184,8 @@ bpf_trampoline_get_progs(const struct bpf_trampoline *tr, int *total)
static int bpf_trampoline_update(struct bpf_trampoline *tr) static int bpf_trampoline_update(struct bpf_trampoline *tr)
{ {
void *old_image = tr->image + ((tr->selector + 1) & 1) * BPF_IMAGE_SIZE/2; void *old_image = tr->image + ((tr->selector + 1) & 1) * PAGE_SIZE/2;
void *new_image = tr->image + (tr->selector & 1) * BPF_IMAGE_SIZE/2; void *new_image = tr->image + (tr->selector & 1) * PAGE_SIZE/2;
struct bpf_tramp_progs *tprogs; struct bpf_tramp_progs *tprogs;
u32 flags = BPF_TRAMP_F_RESTORE_REGS; u32 flags = BPF_TRAMP_F_RESTORE_REGS;
int err, total; int err, total;
...@@ -245,7 +213,7 @@ static int bpf_trampoline_update(struct bpf_trampoline *tr) ...@@ -245,7 +213,7 @@ static int bpf_trampoline_update(struct bpf_trampoline *tr)
synchronize_rcu_tasks(); synchronize_rcu_tasks();
err = arch_prepare_bpf_trampoline(new_image, new_image + BPF_IMAGE_SIZE / 2, err = arch_prepare_bpf_trampoline(new_image, new_image + PAGE_SIZE / 2,
&tr->func.model, flags, tprogs, &tr->func.model, flags, tprogs,
tr->func.addr); tr->func.addr);
if (err < 0) if (err < 0)
...@@ -356,8 +324,6 @@ int bpf_trampoline_unlink_prog(struct bpf_prog *prog) ...@@ -356,8 +324,6 @@ int bpf_trampoline_unlink_prog(struct bpf_prog *prog)
void bpf_trampoline_put(struct bpf_trampoline *tr) void bpf_trampoline_put(struct bpf_trampoline *tr)
{ {
struct bpf_image *image;
if (!tr) if (!tr)
return; return;
mutex_lock(&trampoline_mutex); mutex_lock(&trampoline_mutex);
...@@ -368,11 +334,10 @@ void bpf_trampoline_put(struct bpf_trampoline *tr) ...@@ -368,11 +334,10 @@ void bpf_trampoline_put(struct bpf_trampoline *tr)
goto out; goto out;
if (WARN_ON_ONCE(!hlist_empty(&tr->progs_hlist[BPF_TRAMP_FEXIT]))) if (WARN_ON_ONCE(!hlist_empty(&tr->progs_hlist[BPF_TRAMP_FEXIT])))
goto out; goto out;
image = container_of(tr->image, struct bpf_image, data); bpf_image_ksym_del(&tr->ksym);
latch_tree_erase(&image->tnode, &image_tree, &image_tree_ops);
/* wait for tasks to get out of trampoline before freeing it */ /* wait for tasks to get out of trampoline before freeing it */
synchronize_rcu_tasks(); synchronize_rcu_tasks();
bpf_jit_free_exec(image); bpf_jit_free_exec(tr->image);
hlist_del(&tr->hlist); hlist_del(&tr->hlist);
kfree(tr); kfree(tr);
out: out:
......
...@@ -8255,23 +8255,22 @@ static void perf_event_bpf_emit_ksymbols(struct bpf_prog *prog, ...@@ -8255,23 +8255,22 @@ static void perf_event_bpf_emit_ksymbols(struct bpf_prog *prog,
enum perf_bpf_event_type type) enum perf_bpf_event_type type)
{ {
bool unregister = type == PERF_BPF_EVENT_PROG_UNLOAD; bool unregister = type == PERF_BPF_EVENT_PROG_UNLOAD;
char sym[KSYM_NAME_LEN];
int i; int i;
if (prog->aux->func_cnt == 0) { if (prog->aux->func_cnt == 0) {
bpf_get_prog_name(prog, sym);
perf_event_ksymbol(PERF_RECORD_KSYMBOL_TYPE_BPF, perf_event_ksymbol(PERF_RECORD_KSYMBOL_TYPE_BPF,
(u64)(unsigned long)prog->bpf_func, (u64)(unsigned long)prog->bpf_func,
prog->jited_len, unregister, sym); prog->jited_len, unregister,
prog->aux->ksym.name);
} else { } else {
for (i = 0; i < prog->aux->func_cnt; i++) { for (i = 0; i < prog->aux->func_cnt; i++) {
struct bpf_prog *subprog = prog->aux->func[i]; struct bpf_prog *subprog = prog->aux->func[i];
bpf_get_prog_name(subprog, sym);
perf_event_ksymbol( perf_event_ksymbol(
PERF_RECORD_KSYMBOL_TYPE_BPF, PERF_RECORD_KSYMBOL_TYPE_BPF,
(u64)(unsigned long)subprog->bpf_func, (u64)(unsigned long)subprog->bpf_func,
subprog->jited_len, unregister, sym); subprog->jited_len, unregister,
prog->aux->ksym.name);
} }
} }
} }
......
...@@ -149,8 +149,6 @@ int kernel_text_address(unsigned long addr) ...@@ -149,8 +149,6 @@ int kernel_text_address(unsigned long addr)
goto out; goto out;
if (is_bpf_text_address(addr)) if (is_bpf_text_address(addr))
goto out; goto out;
if (is_bpf_image_address(addr))
goto out;
ret = 0; ret = 0;
out: out:
if (no_rcu) if (no_rcu)
......
...@@ -8859,10 +8859,9 @@ const struct bpf_prog_ops sk_reuseport_prog_ops = { ...@@ -8859,10 +8859,9 @@ const struct bpf_prog_ops sk_reuseport_prog_ops = {
}; };
#endif /* CONFIG_INET */ #endif /* CONFIG_INET */
DEFINE_BPF_DISPATCHER(bpf_dispatcher_xdp) DEFINE_BPF_DISPATCHER(xdp)
void bpf_prog_change_xdp(struct bpf_prog *prev_prog, struct bpf_prog *prog) void bpf_prog_change_xdp(struct bpf_prog *prev_prog, struct bpf_prog *prog)
{ {
bpf_dispatcher_change_prog(BPF_DISPATCHER_PTR(bpf_dispatcher_xdp), bpf_dispatcher_change_prog(BPF_DISPATCHER_PTR(xdp), prev_prog, prog);
prev_prog, prog);
} }
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment