Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 1 | /* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com |
| 2 | * |
| 3 | * This program is free software; you can redistribute it and/or |
| 4 | * modify it under the terms of version 2 of the GNU General Public |
| 5 | * License as published by the Free Software Foundation. |
| 6 | */ |
| 7 | #ifndef _LINUX_BPF_H |
| 8 | #define _LINUX_BPF_H 1 |
| 9 | |
| 10 | #include <uapi/linux/bpf.h> |
| 11 | #include <linux/workqueue.h> |
Alexei Starovoitov | db20fd2 | 2014-09-26 00:16:59 -0700 | [diff] [blame] | 12 | #include <linux/file.h> |
Alexei Starovoitov | b121d1e | 2016-03-07 21:57:13 -0800 | [diff] [blame] | 13 | #include <linux/percpu.h> |
Zi Shen Lim | 002245c | 2016-06-08 21:18:47 -0700 | [diff] [blame^] | 14 | #include <linux/err.h> |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 15 | |
| 16 | struct bpf_map; |
| 17 | |
| 18 | /* map is generic key/value storage optionally accessible by eBPF programs */ |
| 19 | struct bpf_map_ops { /* table of map callbacks; struct bpf_map points to one through its 'ops' member */ |
| 20 | /* funcs callable from userspace (via syscall) */ |
| 21 | struct bpf_map *(*map_alloc)(union bpf_attr *attr); |
| 22 | void (*map_free)(struct bpf_map *); |
Alexei Starovoitov | db20fd2 | 2014-09-26 00:16:59 -0700 | [diff] [blame] | 23 | int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key); |
| 24 | |
| 25 | /* funcs callable from userspace and from eBPF programs */ |
| 26 | void *(*map_lookup_elem)(struct bpf_map *map, void *key); |
Alexei Starovoitov | 3274f52 | 2014-11-13 17:36:44 -0800 | [diff] [blame] | 27 | int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags); |
Alexei Starovoitov | db20fd2 | 2014-09-26 00:16:59 -0700 | [diff] [blame] | 28 | int (*map_delete_elem)(struct bpf_map *map, void *key); |
Wang Nan | 2a36f0b | 2015-08-06 07:02:33 +0000 | [diff] [blame] | 29 | |
| 30 | /* funcs called by prog_array and perf_event_array map */ |
| 31 | void *(*map_fd_get_ptr) (struct bpf_map *map, int fd); /* takes a file descriptor, returns an untyped pointer */ |
| 32 | void (*map_fd_put_ptr) (void *ptr); /* NOTE(review): presumably releases a pointer obtained from map_fd_get_ptr - confirm */ |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 33 | }; |
| 34 | |
| 35 | struct bpf_map { /* generic map object: carries a type tag plus a pointer to its ops; embedded as 'map' in struct bpf_array */ |
| 36 | atomic_t refcnt; /* NOTE(review): presumably the overall reference count (cf. bpf_map_inc/bpf_map_put) - confirm */ |
| 37 | enum bpf_map_type map_type; |
| 38 | u32 key_size; /* NOTE(review): units presumably bytes - confirm */ |
| 39 | u32 value_size; /* NOTE(review): units presumably bytes - confirm */ |
| 40 | u32 max_entries; |
Alexei Starovoitov | 6c90598 | 2016-03-07 21:57:15 -0800 | [diff] [blame] | 41 | u32 map_flags; |
Alexei Starovoitov | aaac3ba | 2015-10-07 22:23:22 -0700 | [diff] [blame] | 42 | u32 pages; /* NOTE(review): presumably the page count used for memlock accounting (cf. bpf_map_precharge_memlock) - confirm */ |
| 43 | struct user_struct *user; |
Daniel Borkmann | a2c83ff | 2015-03-01 12:31:42 +0100 | [diff] [blame] | 44 | const struct bpf_map_ops *ops; /* callback table for this map; read-only through this pointer */ |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 45 | struct work_struct work; /* NOTE(review): presumably used to defer freeing to a workqueue - confirm */ |
Daniel Borkmann | c9da161 | 2015-11-24 21:28:15 +0100 | [diff] [blame] | 46 | atomic_t usercnt; /* NOTE(review): presumably the count managed by the *_with_uref helpers - confirm */ |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 47 | }; |
| 48 | |
| 49 | struct bpf_map_type_list { /* list entry pairing a map type with its ops; the argument type of bpf_register_map_type() */ |
| 50 | struct list_head list_node; |
Daniel Borkmann | a2c83ff | 2015-03-01 12:31:42 +0100 | [diff] [blame] | 51 | const struct bpf_map_ops *ops; |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 52 | enum bpf_map_type type; |
| 53 | }; |
| 54 | |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 55 | /* function argument constraints */ |
| 56 | enum bpf_arg_type { /* type of the arg1_type..arg5_type members of struct bpf_func_proto */ |
Daniel Borkmann | 80f1d68 | 2015-03-12 17:21:42 +0100 | [diff] [blame] | 57 | ARG_DONTCARE = 0, /* unused argument in helper function */ |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 58 | |
| 59 | /* the following constraints are used to prototype the |
| 60 | * bpf_map_lookup/update/delete_elem() functions |
| 61 | */ |
| 62 | ARG_CONST_MAP_PTR, /* const argument used as pointer to bpf_map */ |
| 63 | ARG_PTR_TO_MAP_KEY, /* pointer to stack used as map key */ |
| 64 | ARG_PTR_TO_MAP_VALUE, /* pointer to stack used as map value */ |
| 65 | |
| 66 | /* the following constraints are used to prototype bpf_memcmp() and other |
| 67 | * functions that access data on the eBPF program stack |
| 68 | */ |
| 69 | ARG_PTR_TO_STACK, /* any pointer to eBPF program stack */ |
Daniel Borkmann | 435faee1 | 2016-04-13 00:10:51 +0200 | [diff] [blame] | 70 | ARG_PTR_TO_RAW_STACK, /* any pointer to eBPF program stack; the area does not |
| 71 | * need to be initialized, the helper function must fill |
| 72 | * all bytes or clear them in the error case. |
| 73 | */ |
| 74 | |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 75 | ARG_CONST_STACK_SIZE, /* number of bytes accessed from stack */ |
Daniel Borkmann | 8e2fe1d9 | 2016-02-19 23:05:22 +0100 | [diff] [blame] | 76 | ARG_CONST_STACK_SIZE_OR_ZERO, /* number of bytes accessed from stack or 0 */ |
Daniel Borkmann | 80f1d68 | 2015-03-12 17:21:42 +0100 | [diff] [blame] | 77 | |
Alexei Starovoitov | 608cd71 | 2015-03-26 19:53:57 -0700 | [diff] [blame] | 78 | ARG_PTR_TO_CTX, /* pointer to context */ |
Daniel Borkmann | 80f1d68 | 2015-03-12 17:21:42 +0100 | [diff] [blame] | 79 | ARG_ANYTHING, /* any (initialized) argument is ok */ |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 80 | }; |
| 81 | |
| 82 | /* type of values returned from helper functions */ |
| 83 | enum bpf_return_type { /* type of the ret_type member of struct bpf_func_proto */ |
| 84 | RET_INTEGER, /* function returns integer */ |
| 85 | RET_VOID, /* function doesn't return anything */ |
| 86 | RET_PTR_TO_MAP_VALUE_OR_NULL, /* returns a pointer to map elem value or NULL */ |
| 87 | }; |
| 88 | |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 89 | /* eBPF function prototype used by the verifier to allow BPF_CALLs from eBPF programs |
| 90 | * to in-kernel helper functions and for adjusting the imm32 field in BPF_CALL |
| 91 | * instructions after verification |
| 92 | */ |
| 93 | struct bpf_func_proto { |
| 94 | u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); /* helper entry point: always five u64 arguments, u64 result */ |
| 95 | bool gpl_only; /* NOTE(review): presumably limits the helper to GPL-compatible programs - confirm */ |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 96 | enum bpf_return_type ret_type; /* what the helper returns (see enum bpf_return_type) */ |
| 97 | enum bpf_arg_type arg1_type; /* constraint on each of the five arguments (see enum bpf_arg_type) */ |
| 98 | enum bpf_arg_type arg2_type; |
| 99 | enum bpf_arg_type arg3_type; |
| 100 | enum bpf_arg_type arg4_type; |
| 101 | enum bpf_arg_type arg5_type; |
| 102 | }; |
| 103 | |
| 104 | /* bpf_context is an intentionally undefined structure. A pointer to bpf_context is |
| 105 | * the first argument to eBPF programs. |
| 106 | * For socket filters: 'struct bpf_context *' == 'struct sk_buff *' |
| 107 | */ |
| 108 | struct bpf_context; |
| 109 | |
| 110 | enum bpf_access_type { /* access kind passed to is_valid_access() and convert_ctx_access() in struct bpf_verifier_ops */ |
| 111 | BPF_READ = 1, |
| 112 | BPF_WRITE = 2 |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 113 | }; |
| 114 | |
Alexei Starovoitov | ff936a0 | 2015-10-07 10:55:41 -0700 | [diff] [blame] | 115 | struct bpf_prog; |
| 116 | |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 117 | struct bpf_verifier_ops { /* verifier callbacks; referenced from struct bpf_prog_type_list and struct bpf_prog_aux */ |
| 118 | /* return eBPF function prototype for verification */ |
| 119 | const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id); |
Alexei Starovoitov | 17a5267 | 2014-09-26 00:17:06 -0700 | [diff] [blame] | 120 | |
| 121 | /* return true if 'size' wide access at offset 'off' within bpf_context |
| 122 | * with 'type' (read or write) is allowed |
| 123 | */ |
| 124 | bool (*is_valid_access)(int off, int size, enum bpf_access_type type); |
Alexei Starovoitov | 9bac3d6 | 2015-03-13 11:57:42 -0700 | [diff] [blame] | 125 | |
Alexei Starovoitov | d691f9e | 2015-06-04 10:11:54 -0700 | [diff] [blame] | 126 | u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg, |
| 127 | int src_reg, int ctx_off, |
Alexei Starovoitov | ff936a0 | 2015-10-07 10:55:41 -0700 | [diff] [blame] | 128 | struct bpf_insn *insn, struct bpf_prog *prog); /* NOTE(review): presumably rewrites the context access at ctx_off into instruction(s) stored at insn and returns how many - confirm against the verifier */ |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 129 | }; |
| 130 | |
| 131 | struct bpf_prog_type_list { /* list entry pairing a program type with its verifier ops; the argument type of bpf_register_prog_type() */ |
| 132 | struct list_head list_node; |
Daniel Borkmann | a2c83ff | 2015-03-01 12:31:42 +0100 | [diff] [blame] | 133 | const struct bpf_verifier_ops *ops; |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 134 | enum bpf_prog_type type; |
| 135 | }; |
| 136 | |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 137 | struct bpf_prog_aux { /* auxiliary per-program data; holds a pointer to its struct bpf_prog in 'prog' */ |
| 138 | atomic_t refcnt; /* NOTE(review): presumably the program reference count (cf. bpf_prog_inc/bpf_prog_put) - confirm */ |
Daniel Borkmann | 24701ec | 2015-03-01 12:31:47 +0100 | [diff] [blame] | 139 | u32 used_map_cnt; /* NOTE(review): presumably the number of entries in used_maps - confirm */ |
Alexei Starovoitov | 32bbe00 | 2016-04-06 18:43:28 -0700 | [diff] [blame] | 140 | u32 max_ctx_offset; |
Daniel Borkmann | a2c83ff | 2015-03-01 12:31:42 +0100 | [diff] [blame] | 141 | const struct bpf_verifier_ops *ops; /* verifier callbacks for this program */ |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 142 | struct bpf_map **used_maps; /* array of map pointers */ |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 143 | struct bpf_prog *prog; |
Alexei Starovoitov | aaac3ba | 2015-10-07 22:23:22 -0700 | [diff] [blame] | 144 | struct user_struct *user; |
Alexei Starovoitov | abf2e7d | 2015-05-28 19:26:02 -0700 | [diff] [blame] | 145 | union { /* 'work' and 'rcu' share storage, so only one of them can be in use at a time */ |
| 146 | struct work_struct work; |
| 147 | struct rcu_head rcu; |
| 148 | }; |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 149 | }; |
| 150 | |
Alexei Starovoitov | 04fd61ab | 2015-05-19 16:59:03 -0700 | [diff] [blame] | 151 | struct bpf_array { /* array-style map: a struct bpf_map header followed by trailing element storage */ |
| 152 | struct bpf_map map; /* first member, so the struct starts with the generic map object */ |
| 153 | u32 elem_size; |
| 154 | /* 'ownership' of prog_array is claimed by the first program that |
| 155 | * is going to use this map or by the first program whose FD is stored |
| 156 | * in the map to make sure that all callers and callees have the same |
| 157 | * prog_type and JITed flag |
| 158 | */ |
| 159 | enum bpf_prog_type owner_prog_type; |
| 160 | bool owner_jited; |
| 161 | union { /* three zero-length, 8-byte-aligned views of the same trailing storage */ |
| 162 | char value[0] __aligned(8); /* raw bytes */ |
Wang Nan | 2a36f0b | 2015-08-06 07:02:33 +0000 | [diff] [blame] | 163 | void *ptrs[0] __aligned(8); /* plain pointers */ |
Alexei Starovoitov | a10423b | 2016-02-01 22:39:54 -0800 | [diff] [blame] | 164 | void __percpu *pptrs[0] __aligned(8); /* per-CPU pointers */ |
Alexei Starovoitov | 04fd61ab | 2015-05-19 16:59:03 -0700 | [diff] [blame] | 165 | }; |
| 166 | }; |
| 167 | #define MAX_TAIL_CALL_CNT 32 /* NOTE(review): presumably the cap on chained bpf_tail_call() invocations - confirm */ |
| 168 | |
| 169 | u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5); /* same five-u64 shape as the 'func' member of struct bpf_func_proto */ |
Alexei Starovoitov | 9940d67 | 2016-04-06 18:43:27 -0700 | [diff] [blame] | 170 | u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); /* same five-u64 shape as the 'func' member of struct bpf_func_proto */ |
Wang Nan | 2a36f0b | 2015-08-06 07:02:33 +0000 | [diff] [blame] | 171 | void bpf_fd_array_map_clear(struct bpf_map *map); |
Alexei Starovoitov | 04fd61ab | 2015-05-19 16:59:03 -0700 | [diff] [blame] | 172 | bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp); /* NOTE(review): presumably checks fp against owner_prog_type/owner_jited of the array - confirm */ |
Daniel Borkmann | bd570ff | 2016-04-18 21:01:24 +0200 | [diff] [blame] | 173 | |
Alexei Starovoitov | 0756ea3 | 2015-06-12 19:39:13 -0700 | [diff] [blame] | 174 | const struct bpf_func_proto *bpf_get_trace_printk_proto(void); /* accessor returning a helper prototype */ |
Daniel Borkmann | bd570ff | 2016-04-18 21:01:24 +0200 | [diff] [blame] | 175 | const struct bpf_func_proto *bpf_get_event_output_proto(void); /* accessor returning a helper prototype */ |
Alexei Starovoitov | 04fd61ab | 2015-05-19 16:59:03 -0700 | [diff] [blame] | 176 | |
Alexei Starovoitov | 89aa075 | 2014-12-01 15:06:35 -0800 | [diff] [blame] | 177 | #ifdef CONFIG_BPF_SYSCALL /* full API; the #else branch stubs only bpf_register_prog_type, bpf_prog_get and bpf_prog_put */ |
Alexei Starovoitov | b121d1e | 2016-03-07 21:57:13 -0800 | [diff] [blame] | 178 | DECLARE_PER_CPU(int, bpf_prog_active); /* per-CPU int, declared here only */ |
| 179 | |
Daniel Borkmann | 0fc174d | 2015-03-01 12:31:44 +0100 | [diff] [blame] | 180 | void bpf_register_prog_type(struct bpf_prog_type_list *tl); |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 181 | void bpf_register_map_type(struct bpf_map_type_list *tl); |
Daniel Borkmann | 0fc174d | 2015-03-01 12:31:44 +0100 | [diff] [blame] | 182 | |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 183 | struct bpf_prog *bpf_prog_get(u32 ufd); /* can return an ERR_PTR() value: the !CONFIG_BPF_SYSCALL stub returns ERR_PTR(-EOPNOTSUPP) */ |
Alexei Starovoitov | 92117d8 | 2016-04-27 18:56:20 -0700 | [diff] [blame] | 184 | struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog); |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 185 | void bpf_prog_put(struct bpf_prog *prog); |
Alexei Starovoitov | abf2e7d | 2015-05-28 19:26:02 -0700 | [diff] [blame] | 186 | void bpf_prog_put_rcu(struct bpf_prog *prog); |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 187 | |
Daniel Borkmann | c9da161 | 2015-11-24 21:28:15 +0100 | [diff] [blame] | 188 | struct bpf_map *bpf_map_get_with_uref(u32 ufd); |
Daniel Borkmann | c210129 | 2015-10-29 14:58:07 +0100 | [diff] [blame] | 189 | struct bpf_map *__bpf_map_get(struct fd f); /* takes an already-resolved struct fd by value, not a raw descriptor number */ |
Alexei Starovoitov | 92117d8 | 2016-04-27 18:56:20 -0700 | [diff] [blame] | 190 | struct bpf_map *bpf_map_inc(struct bpf_map *map, bool uref); /* NOTE(review): 'uref' presumably also bumps usercnt in struct bpf_map - confirm */ |
Daniel Borkmann | c9da161 | 2015-11-24 21:28:15 +0100 | [diff] [blame] | 191 | void bpf_map_put_with_uref(struct bpf_map *map); |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 192 | void bpf_map_put(struct bpf_map *map); |
Alexei Starovoitov | 6c90598 | 2016-03-07 21:57:15 -0800 | [diff] [blame] | 193 | int bpf_map_precharge_memlock(u32 pages); |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 194 | |
Alexei Starovoitov | 1be7f75 | 2015-10-07 22:23:21 -0700 | [diff] [blame] | 195 | extern int sysctl_unprivileged_bpf_disabled; |
| 196 | |
Daniel Borkmann | b219775 | 2015-10-29 14:58:09 +0100 | [diff] [blame] | 197 | int bpf_map_new_fd(struct bpf_map *map); |
| 198 | int bpf_prog_new_fd(struct bpf_prog *prog); |
| 199 | |
| 200 | int bpf_obj_pin_user(u32 ufd, const char __user *pathname); /* pathname is a user-space pointer (__user) */ |
| 201 | int bpf_obj_get_user(const char __user *pathname); /* pathname is a user-space pointer (__user) */ |
| 202 | |
Alexei Starovoitov | 15a07b3 | 2016-02-01 22:39:55 -0800 | [diff] [blame] | 203 | int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value); |
| 204 | int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value); |
| 205 | int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value, |
| 206 | u64 flags); |
| 207 | int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value, |
| 208 | u64 flags); |
Alexei Starovoitov | 557c0c6 | 2016-03-07 21:57:17 -0800 | [diff] [blame] | 209 | int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value); |
Alexei Starovoitov | 15a07b3 | 2016-02-01 22:39:55 -0800 | [diff] [blame] | 210 | |
| 211 | /* memcpy that is used with 8-byte aligned pointers, multiple-of-8 size and |
| 212 | * forced to use 'long' read/writes to try to atomically copy long counters. |
| 213 | * Best-effort only. No barriers here, since it _will_ race with concurrent |
| 214 | * updates from BPF programs. Called from bpf syscall and mostly used with |
| 215 | * size 8 or 16 bytes, so ask compiler to inline it. |
| 216 | */ |
| 217 | static inline void bpf_long_memcpy(void *dst, const void *src, u32 size) |
| 218 | { |
| 219 | const long *lsrc = src; |
| 220 | long *ldst = dst; |
| 221 | |
| 222 | size /= sizeof(long); /* byte count -> number of longs; a remainder smaller than sizeof(long) is not copied */ |
| 223 | while (size--) /* one long-sized load/store per iteration */ |
| 224 | *ldst++ = *lsrc++; |
| 225 | } |
| 226 | |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 227 | /* verify correctness of eBPF program */ |
Alexei Starovoitov | 9bac3d6 | 2015-03-13 11:57:42 -0700 | [diff] [blame] | 228 | int bpf_check(struct bpf_prog **fp, union bpf_attr *attr); |
Daniel Borkmann | 0fc174d | 2015-03-01 12:31:44 +0100 | [diff] [blame] | 229 | #else /* !CONFIG_BPF_SYSCALL: inline stubs for three functions only; the other declarations of the #ifdef branch have no fallback here */ |
| 230 | static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl) |
| 231 | { |
| 232 | } /* registration is a no-op */ |
| 233 | |
| 234 | static inline struct bpf_prog *bpf_prog_get(u32 ufd) |
| 235 | { |
| 236 | return ERR_PTR(-EOPNOTSUPP); /* never NULL: callers must test the result as an error pointer */ |
| 237 | } |
| 238 | |
| 239 | static inline void bpf_prog_put(struct bpf_prog *prog) |
| 240 | { |
| 241 | } /* nothing to release */ |
Daniel Borkmann | 61e021f | 2015-03-02 15:21:55 +0100 | [diff] [blame] | 242 | #endif /* CONFIG_BPF_SYSCALL */ |
Alexei Starovoitov | 09756af | 2014-09-26 00:17:00 -0700 | [diff] [blame] | 243 | |
Alexei Starovoitov | d0003ec | 2014-11-13 17:36:49 -0800 | [diff] [blame] | 244 | /* verifier prototypes (struct bpf_func_proto objects defined elsewhere) for helper functions called from eBPF programs; declared regardless of CONFIG_BPF_SYSCALL */ |
Daniel Borkmann | a2c83ff | 2015-03-01 12:31:42 +0100 | [diff] [blame] | 245 | extern const struct bpf_func_proto bpf_map_lookup_elem_proto; |
| 246 | extern const struct bpf_func_proto bpf_map_update_elem_proto; |
| 247 | extern const struct bpf_func_proto bpf_map_delete_elem_proto; |
Alexei Starovoitov | d0003ec | 2014-11-13 17:36:49 -0800 | [diff] [blame] | 248 | |
Daniel Borkmann | 03e69b5 | 2015-03-14 02:27:16 +0100 | [diff] [blame] | 249 | extern const struct bpf_func_proto bpf_get_prandom_u32_proto; |
Daniel Borkmann | c04167c | 2015-03-14 02:27:17 +0100 | [diff] [blame] | 250 | extern const struct bpf_func_proto bpf_get_smp_processor_id_proto; |
Alexei Starovoitov | 04fd61ab | 2015-05-19 16:59:03 -0700 | [diff] [blame] | 251 | extern const struct bpf_func_proto bpf_tail_call_proto; |
Daniel Borkmann | 17ca8cb | 2015-05-29 23:23:06 +0200 | [diff] [blame] | 252 | extern const struct bpf_func_proto bpf_ktime_get_ns_proto; |
Alexei Starovoitov | ffeedaf | 2015-06-12 19:39:12 -0700 | [diff] [blame] | 253 | extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto; |
| 254 | extern const struct bpf_func_proto bpf_get_current_uid_gid_proto; |
| 255 | extern const struct bpf_func_proto bpf_get_current_comm_proto; |
Alexei Starovoitov | 4e10df9 | 2015-07-20 20:34:18 -0700 | [diff] [blame] | 256 | extern const struct bpf_func_proto bpf_skb_vlan_push_proto; |
| 257 | extern const struct bpf_func_proto bpf_skb_vlan_pop_proto; |
Alexei Starovoitov | d5a3b1f | 2016-02-17 19:58:58 -0800 | [diff] [blame] | 258 | extern const struct bpf_func_proto bpf_get_stackid_proto; |
Daniel Borkmann | 03e69b5 | 2015-03-14 02:27:16 +0100 | [diff] [blame] | 259 | |
Daniel Borkmann | 3ad0040 | 2015-10-08 01:20:39 +0200 | [diff] [blame] | 260 | /* Helpers shared between cBPF and eBPF. */ |
| 261 | void bpf_user_rnd_init_once(void); |
| 262 | u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); /* same five-u64 shape as the 'func' member of struct bpf_func_proto */ |
| 263 | |
Alexei Starovoitov | 99c55f7 | 2014-09-26 00:16:57 -0700 | [diff] [blame] | 264 | #endif /* _LINUX_BPF_H */ |