blob: 909fc033173a7c893ffe7113f0e32568392b76ae [file] [log] [blame]
/* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 */
7#ifndef _LINUX_BPF_H
8#define _LINUX_BPF_H 1
9
10#include <uapi/linux/bpf.h>
Daniel Borkmann74451e662017-02-16 22:24:50 +010011
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070012#include <linux/workqueue.h>
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070013#include <linux/file.h>
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -080014#include <linux/percpu.h>
Zi Shen Lim002245c2016-06-08 21:18:47 -070015#include <linux/err.h>
Daniel Borkmann74451e662017-02-16 22:24:50 +010016#include <linux/rbtree_latch.h>
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070017
Daniel Borkmann3b1efb12016-06-15 22:47:14 +020018struct perf_event;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070019struct bpf_map;
20
21/* map is generic key/value storage optionally accesible by eBPF programs */
22struct bpf_map_ops {
23 /* funcs callable from userspace (via syscall) */
24 struct bpf_map *(*map_alloc)(union bpf_attr *attr);
Daniel Borkmann61d1b6a2016-06-15 22:47:12 +020025 void (*map_release)(struct bpf_map *map, struct file *map_file);
26 void (*map_free)(struct bpf_map *map);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070027 int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);
28
29 /* funcs callable from userspace and from eBPF programs */
30 void *(*map_lookup_elem)(struct bpf_map *map, void *key);
Alexei Starovoitov3274f522014-11-13 17:36:44 -080031 int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070032 int (*map_delete_elem)(struct bpf_map *map, void *key);
Wang Nan2a36f0b2015-08-06 07:02:33 +000033
34 /* funcs called by prog_array and perf_event_array map */
Daniel Borkmannd056a782016-06-15 22:47:13 +020035 void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
36 int fd);
37 void (*map_fd_put_ptr)(void *ptr);
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070038};
39
40struct bpf_map {
41 atomic_t refcnt;
42 enum bpf_map_type map_type;
43 u32 key_size;
44 u32 value_size;
45 u32 max_entries;
Alexei Starovoitov6c905982016-03-07 21:57:15 -080046 u32 map_flags;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -070047 u32 pages;
48 struct user_struct *user;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010049 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070050 struct work_struct work;
Daniel Borkmannc9da1612015-11-24 21:28:15 +010051 atomic_t usercnt;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070052};
53
54struct bpf_map_type_list {
55 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010056 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070057 enum bpf_map_type type;
58};
59
/* function argument constraints
 *
 * Used for the arg1_type..arg5_type members of struct bpf_func_proto.
 * Enumerators are numbered consecutively starting from ARG_DONTCARE == 0.
 */
enum bpf_arg_type {
	ARG_DONTCARE = 0,	/* unused argument in helper function */

	/* the following constraints used to prototype
	 * bpf_map_lookup/update/delete_elem() functions
	 */
	ARG_CONST_MAP_PTR,	/* const argument used as pointer to bpf_map */
	ARG_PTR_TO_MAP_KEY,	/* pointer to stack used as map key */
	ARG_PTR_TO_MAP_VALUE,	/* pointer to stack used as map value */

	/* the following constraints used to prototype bpf_memcmp() and other
	 * functions that access data on eBPF program stack
	 */
	ARG_PTR_TO_MEM,		/* pointer to valid memory (stack, packet, map value) */
	ARG_PTR_TO_UNINIT_MEM,	/* pointer to memory does not need to be initialized,
				 * helper function must fill all bytes or clear
				 * them in error case.
				 */

	ARG_CONST_SIZE,		/* number of bytes accessed from memory */
	ARG_CONST_SIZE_OR_ZERO,	/* number of bytes accessed from memory or 0 */

	ARG_PTR_TO_CTX,		/* pointer to context */
	ARG_ANYTHING,		/* any (initialized) argument is ok */
};
86
/* type of values returned from helper functions
 *
 * Used for the ret_type member of struct bpf_func_proto.
 */
enum bpf_return_type {
	RET_INTEGER,			/* function returns integer */
	RET_VOID,			/* function doesn't return anything */
	RET_PTR_TO_MAP_VALUE_OR_NULL,	/* returns a pointer to map elem value or NULL */
};
93
Alexei Starovoitov09756af2014-09-26 00:17:00 -070094/* eBPF function prototype used by verifier to allow BPF_CALLs from eBPF programs
95 * to in-kernel helper functions and for adjusting imm32 field in BPF_CALL
96 * instructions after verifying
97 */
98struct bpf_func_proto {
99 u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
100 bool gpl_only;
Daniel Borkmann36bbef52016-09-20 00:26:13 +0200101 bool pkt_access;
Alexei Starovoitov17a52672014-09-26 00:17:06 -0700102 enum bpf_return_type ret_type;
103 enum bpf_arg_type arg1_type;
104 enum bpf_arg_type arg2_type;
105 enum bpf_arg_type arg3_type;
106 enum bpf_arg_type arg4_type;
107 enum bpf_arg_type arg5_type;
108};
109
/* bpf_context is intentionally undefined structure. Pointer to bpf_context is
 * the first argument to eBPF programs.
 * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
 */
struct bpf_context;
115
/* Kind of memory access (read or write); passed to the is_valid_access()
 * and convert_ctx_access() callbacks of struct bpf_verifier_ops.
 */
enum bpf_access_type {
	BPF_READ = 1,
	BPF_WRITE = 2
};
120
/* types of values stored in eBPF registers */
enum bpf_reg_type {
	NOT_INIT = 0,		 /* nothing was written into register */
	UNKNOWN_VALUE,		 /* reg doesn't contain a valid pointer */
	PTR_TO_CTX,		 /* reg points to bpf_context */
	CONST_PTR_TO_MAP,	 /* reg points to struct bpf_map */
	PTR_TO_MAP_VALUE,	 /* reg points to map element value */
	PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
	FRAME_PTR,		 /* reg == frame_pointer */
	PTR_TO_STACK,		 /* reg == frame_pointer + imm */
	CONST_IMM,		 /* constant integer value */

	/* PTR_TO_PACKET represents:
	 * skb->data
	 * skb->data + imm
	 * skb->data + (u16) var
	 * skb->data + (u16) var + imm
	 * if (range > 0) then [ptr, ptr + range - off) is safe to access
	 * if (id > 0) means that some 'var' was added
	 * if (off > 0) means that 'imm' was added
	 */
	PTR_TO_PACKET,
	PTR_TO_PACKET_END,	 /* skb->data + headlen */

	/* PTR_TO_MAP_VALUE_ADJ is used for doing pointer math inside of a map
	 * elem value.  We only allow this if we can statically verify that
	 * accesses from this register are going to fall within the size of
	 * the map element.
	 */
	PTR_TO_MAP_VALUE_ADJ,
};
152
Alexei Starovoitovff936a02015-10-07 10:55:41 -0700153struct bpf_prog;
154
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700155struct bpf_verifier_ops {
156 /* return eBPF function prototype for verification */
157 const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
Alexei Starovoitov17a52672014-09-26 00:17:06 -0700158
159 /* return true if 'size' wide access at offset 'off' within bpf_context
160 * with 'type' (read or write) is allowed
161 */
Alexei Starovoitov19de99f2016-06-15 18:25:38 -0700162 bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
163 enum bpf_reg_type *reg_type);
Daniel Borkmann36bbef52016-09-20 00:26:13 +0200164 int (*gen_prologue)(struct bpf_insn *insn, bool direct_write,
165 const struct bpf_prog *prog);
Daniel Borkmann6b8cc1d2017-01-12 11:51:32 +0100166 u32 (*convert_ctx_access)(enum bpf_access_type type,
167 const struct bpf_insn *src,
168 struct bpf_insn *dst,
169 struct bpf_prog *prog);
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700170};
171
172struct bpf_prog_type_list {
173 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100174 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700175 enum bpf_prog_type type;
176};
177
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700178struct bpf_prog_aux {
179 atomic_t refcnt;
Daniel Borkmann24701ec2015-03-01 12:31:47 +0100180 u32 used_map_cnt;
Alexei Starovoitov32bbe002016-04-06 18:43:28 -0700181 u32 max_ctx_offset;
Daniel Borkmann74451e662017-02-16 22:24:50 +0100182 struct latch_tree_node ksym_tnode;
183 struct list_head ksym_lnode;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100184 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700185 struct bpf_map **used_maps;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700186 struct bpf_prog *prog;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -0700187 struct user_struct *user;
Alexei Starovoitovabf2e7d2015-05-28 19:26:02 -0700188 union {
189 struct work_struct work;
190 struct rcu_head rcu;
191 };
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700192};
193
Alexei Starovoitov04fd61ab2015-05-19 16:59:03 -0700194struct bpf_array {
195 struct bpf_map map;
196 u32 elem_size;
197 /* 'ownership' of prog_array is claimed by the first program that
198 * is going to use this map or by the first program which FD is stored
199 * in the map to make sure that all callers and callees have the same
200 * prog_type and JITed flag
201 */
202 enum bpf_prog_type owner_prog_type;
203 bool owner_jited;
204 union {
205 char value[0] __aligned(8);
Wang Nan2a36f0b2015-08-06 07:02:33 +0000206 void *ptrs[0] __aligned(8);
Alexei Starovoitova10423b2016-02-01 22:39:54 -0800207 void __percpu *pptrs[0] __aligned(8);
Alexei Starovoitov04fd61ab2015-05-19 16:59:03 -0700208 };
209};
Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200210
/* NOTE(review): presumably the upper bound on chained bpf_tail_call()
 * invocations -- confirm against the interpreter/JIT users of this macro.
 */
#define MAX_TAIL_CALL_CNT 32
212
Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200213struct bpf_event_entry {
214 struct perf_event *event;
215 struct file *perf_file;
216 struct file *map_file;
217 struct rcu_head rcu;
218};
219
Alexei Starovoitov04fd61ab2015-05-19 16:59:03 -0700220u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
Alexei Starovoitov9940d672016-04-06 18:43:27 -0700221u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200222
Alexei Starovoitov04fd61ab2015-05-19 16:59:03 -0700223bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);
Daniel Borkmannf1f77142017-01-13 23:38:15 +0100224int bpf_prog_calc_tag(struct bpf_prog *fp);
Daniel Borkmannbd570ff2016-04-18 21:01:24 +0200225
Alexei Starovoitov0756ea32015-06-12 19:39:13 -0700226const struct bpf_func_proto *bpf_get_trace_printk_proto(void);
Daniel Borkmann555c8a82016-07-14 18:08:05 +0200227
228typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
Daniel Borkmannaa7145c2016-07-22 01:19:42 +0200229 unsigned long off, unsigned long len);
Daniel Borkmann555c8a82016-07-14 18:08:05 +0200230
231u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
232 void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);
Alexei Starovoitov04fd61ab2015-05-19 16:59:03 -0700233
Alexei Starovoitov89aa0752014-12-01 15:06:35 -0800234#ifdef CONFIG_BPF_SYSCALL
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -0800235DECLARE_PER_CPU(int, bpf_prog_active);
236
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100237void bpf_register_prog_type(struct bpf_prog_type_list *tl);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100238void bpf_register_map_type(struct bpf_map_type_list *tl);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100239
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700240struct bpf_prog *bpf_prog_get(u32 ufd);
Daniel Borkmann113214b2016-06-30 17:24:44 +0200241struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100242struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog, int i);
Daniel Borkmannc5405942016-11-09 22:02:34 +0100243void bpf_prog_sub(struct bpf_prog *prog, int i);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100244struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100245void bpf_prog_put(struct bpf_prog *prog);
Daniel Borkmann5ccb0712016-12-18 01:52:58 +0100246int __bpf_prog_charge(struct user_struct *user, u32 pages);
247void __bpf_prog_uncharge(struct user_struct *user, u32 pages);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100248
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100249struct bpf_map *bpf_map_get_with_uref(u32 ufd);
Daniel Borkmannc2101292015-10-29 14:58:07 +0100250struct bpf_map *__bpf_map_get(struct fd f);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100251struct bpf_map * __must_check bpf_map_inc(struct bpf_map *map, bool uref);
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100252void bpf_map_put_with_uref(struct bpf_map *map);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100253void bpf_map_put(struct bpf_map *map);
Alexei Starovoitov6c905982016-03-07 21:57:15 -0800254int bpf_map_precharge_memlock(u32 pages);
Daniel Borkmannd407bd22017-01-18 15:14:17 +0100255void *bpf_map_area_alloc(size_t size);
256void bpf_map_area_free(void *base);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100257
Alexei Starovoitov1be7f752015-10-07 22:23:21 -0700258extern int sysctl_unprivileged_bpf_disabled;
259
Daniel Borkmannb2197752015-10-29 14:58:09 +0100260int bpf_map_new_fd(struct bpf_map *map);
261int bpf_prog_new_fd(struct bpf_prog *prog);
262
263int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
264int bpf_obj_get_user(const char __user *pathname);
265
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800266int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
267int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
268int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
269 u64 flags);
270int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
271 u64 flags);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200272
Alexei Starovoitov557c0c62016-03-07 21:57:17 -0800273int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800274
Daniel Borkmannd056a782016-06-15 22:47:13 +0200275int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
276 void *key, void *value, u64 map_flags);
277void bpf_fd_array_map_clear(struct bpf_map *map);
278
/* memcpy that is used with 8-byte aligned pointers, multiple-of-8 size and
 * forced to use 'long' read/writes to try to atomically copy long counters.
 * Best-effort only. No barriers here, since it _will_ race with concurrent
 * updates from BPF programs. Called from bpf syscall and mostly used with
 * size 8 or 16 bytes, so ask compiler to inline it.
 *
 * @dst:  destination buffer, written one 'long' at a time
 * @src:  source buffer, read one 'long' at a time
 * @size: length in bytes; only size / sizeof(long) whole words are copied,
 *        so a trailing remainder smaller than a 'long' is not copied
 */
static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
{
	const long *lsrc = src;
	long *ldst = dst;
	u32 nr_longs = size / sizeof(long);	/* whole words only */

	while (nr_longs--)
		*ldst++ = *lsrc++;
}
294
/* verify correctness of eBPF program */
int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100297#else
/* !CONFIG_BPF_SYSCALL stub: registering a program type does nothing */
static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl)
{
}
301
302static inline struct bpf_prog *bpf_prog_get(u32 ufd)
303{
304 return ERR_PTR(-EOPNOTSUPP);
305}
306
Daniel Borkmann113214b2016-06-30 17:24:44 +0200307static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
308 enum bpf_prog_type type)
309{
310 return ERR_PTR(-EOPNOTSUPP);
311}
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100312static inline struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog,
313 int i)
Brenden Blancocc2e0b32016-07-20 07:55:52 -0700314{
315 return ERR_PTR(-EOPNOTSUPP);
316}
Daniel Borkmann113214b2016-06-30 17:24:44 +0200317
/* !CONFIG_BPF_SYSCALL stub: does nothing */
static inline void bpf_prog_sub(struct bpf_prog *prog, int i)
{
}
321
/* !CONFIG_BPF_SYSCALL stub: does nothing */
static inline void bpf_prog_put(struct bpf_prog *prog)
{
}
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100325
326static inline struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog)
Alexei Starovoitovaa6a5f32016-09-01 18:37:24 -0700327{
328 return ERR_PTR(-EOPNOTSUPP);
329}
Daniel Borkmann5ccb0712016-12-18 01:52:58 +0100330
/* !CONFIG_BPF_SYSCALL stub: nothing is charged; always returns 0 */
static inline int __bpf_prog_charge(struct user_struct *user, u32 pages)
{
	return 0;
}
335
336static inline void __bpf_prog_uncharge(struct user_struct *user, u32 pages)
337{
338}
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100339#endif /* CONFIG_BPF_SYSCALL */
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700340
/* verifier prototypes for helper functions called from eBPF programs */
extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
extern const struct bpf_func_proto bpf_map_update_elem_proto;
extern const struct bpf_func_proto bpf_map_delete_elem_proto;

extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
extern const struct bpf_func_proto bpf_get_numa_node_id_proto;
extern const struct bpf_func_proto bpf_tail_call_proto;
extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
extern const struct bpf_func_proto bpf_get_current_comm_proto;
extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
extern const struct bpf_func_proto bpf_get_stackid_proto;
Daniel Borkmann03e69b52015-03-14 02:27:16 +0100357
Daniel Borkmann3ad00402015-10-08 01:20:39 +0200358/* Shared helpers among cBPF and eBPF. */
359void bpf_user_rnd_init_once(void);
360u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
361
Alexei Starovoitov99c55f72014-09-26 00:16:57 -0700362#endif /* _LINUX_BPF_H */