/* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 */
7#ifndef _LINUX_BPF_H
8#define _LINUX_BPF_H 1
9
10#include <uapi/linux/bpf.h>
11#include <linux/workqueue.h>
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070012#include <linux/file.h>
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -080013#include <linux/percpu.h>
Zi Shen Lim002245c2016-06-08 21:18:47 -070014#include <linux/err.h>
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070015
Daniel Borkmann3b1efb12016-06-15 22:47:14 +020016struct perf_event;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070017struct bpf_map;
18
19/* map is generic key/value storage optionally accesible by eBPF programs */
20struct bpf_map_ops {
21 /* funcs callable from userspace (via syscall) */
22 struct bpf_map *(*map_alloc)(union bpf_attr *attr);
Daniel Borkmann61d1b6a2016-06-15 22:47:12 +020023 void (*map_release)(struct bpf_map *map, struct file *map_file);
24 void (*map_free)(struct bpf_map *map);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070025 int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);
26
27 /* funcs callable from userspace and from eBPF programs */
28 void *(*map_lookup_elem)(struct bpf_map *map, void *key);
Alexei Starovoitov3274f522014-11-13 17:36:44 -080029 int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070030 int (*map_delete_elem)(struct bpf_map *map, void *key);
Wang Nan2a36f0b2015-08-06 07:02:33 +000031
32 /* funcs called by prog_array and perf_event_array map */
Daniel Borkmannd056a782016-06-15 22:47:13 +020033 void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
34 int fd);
35 void (*map_fd_put_ptr)(void *ptr);
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070036};
37
38struct bpf_map {
39 atomic_t refcnt;
40 enum bpf_map_type map_type;
41 u32 key_size;
42 u32 value_size;
43 u32 max_entries;
Alexei Starovoitov6c905982016-03-07 21:57:15 -080044 u32 map_flags;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -070045 u32 pages;
46 struct user_struct *user;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010047 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070048 struct work_struct work;
Daniel Borkmannc9da1612015-11-24 21:28:15 +010049 atomic_t usercnt;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070050};
51
52struct bpf_map_type_list {
53 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010054 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070055 enum bpf_map_type type;
56};
57
/* function argument constraints */
enum bpf_arg_type {
	ARG_DONTCARE = 0,	/* unused argument in helper function */

	/* the following constraints used to prototype
	 * bpf_map_lookup/update/delete_elem() functions
	 */
	ARG_CONST_MAP_PTR,	/* const argument used as pointer to bpf_map */
	ARG_PTR_TO_MAP_KEY,	/* pointer to stack used as map key */
	ARG_PTR_TO_MAP_VALUE,	/* pointer to stack used as map value */

	/* the following constraints used to prototype bpf_memcmp() and other
	 * functions that access data on eBPF program stack
	 */
	ARG_PTR_TO_STACK,	/* any pointer to eBPF program stack */
	ARG_PTR_TO_RAW_STACK,	/* any pointer to eBPF program stack, area does not
				 * need to be initialized, helper function must fill
				 * all bytes or clear them in error case.
				 */

	ARG_CONST_STACK_SIZE,	/* number of bytes accessed from stack */
	ARG_CONST_STACK_SIZE_OR_ZERO, /* number of bytes accessed from stack or 0 */

	ARG_PTR_TO_CTX,		/* pointer to context */
	ARG_ANYTHING,		/* any (initialized) argument is ok */
};

/* type of values returned from helper functions */
enum bpf_return_type {
	RET_INTEGER,			/* function returns integer */
	RET_VOID,			/* function doesn't return anything */
	RET_PTR_TO_MAP_VALUE_OR_NULL,	/* returns a pointer to map elem value or NULL */
};

Alexei Starovoitov09756af2014-09-26 00:17:00 -070092/* eBPF function prototype used by verifier to allow BPF_CALLs from eBPF programs
93 * to in-kernel helper functions and for adjusting imm32 field in BPF_CALL
94 * instructions after verifying
95 */
96struct bpf_func_proto {
97 u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
98 bool gpl_only;
Alexei Starovoitov17a52672014-09-26 00:17:06 -070099 enum bpf_return_type ret_type;
100 enum bpf_arg_type arg1_type;
101 enum bpf_arg_type arg2_type;
102 enum bpf_arg_type arg3_type;
103 enum bpf_arg_type arg4_type;
104 enum bpf_arg_type arg5_type;
105};
106
/* bpf_context is intentionally undefined structure. Pointer to bpf_context is
 * the first argument to eBPF programs.
 * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
 */
struct bpf_context;

/* Direction of a memory access; passed to the is_valid_access() and
 * convert_ctx_access() callbacks of struct bpf_verifier_ops.
 */
enum bpf_access_type {
	BPF_READ = 1,
	BPF_WRITE = 2
};

/* types of values stored in eBPF registers */
enum bpf_reg_type {
	NOT_INIT = 0,		 /* nothing was written into register */
	UNKNOWN_VALUE,		 /* reg doesn't contain a valid pointer */
	PTR_TO_CTX,		 /* reg points to bpf_context */
	CONST_PTR_TO_MAP,	 /* reg points to struct bpf_map */
	PTR_TO_MAP_VALUE,	 /* reg points to map element value */
	PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
	FRAME_PTR,		 /* reg == frame_pointer */
	PTR_TO_STACK,		 /* reg == frame_pointer + imm */
	CONST_IMM,		 /* constant integer value */

	/* PTR_TO_PACKET represents:
	 * skb->data
	 * skb->data + imm
	 * skb->data + (u16) var
	 * skb->data + (u16) var + imm
	 * if (range > 0) then [ptr, ptr + range - off) is safe to access
	 * if (id > 0) means that some 'var' was added
	 * if (off > 0) means that 'imm' was added
	 */
	PTR_TO_PACKET,
	PTR_TO_PACKET_END,	 /* skb->data + headlen */
};

Alexei Starovoitovff936a02015-10-07 10:55:41 -0700143struct bpf_prog;
144
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700145struct bpf_verifier_ops {
146 /* return eBPF function prototype for verification */
147 const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
Alexei Starovoitov17a52672014-09-26 00:17:06 -0700148
149 /* return true if 'size' wide access at offset 'off' within bpf_context
150 * with 'type' (read or write) is allowed
151 */
Alexei Starovoitov19de99f2016-06-15 18:25:38 -0700152 bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
153 enum bpf_reg_type *reg_type);
Alexei Starovoitov9bac3d62015-03-13 11:57:42 -0700154
Alexei Starovoitovd691f9e2015-06-04 10:11:54 -0700155 u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg,
156 int src_reg, int ctx_off,
Alexei Starovoitovff936a02015-10-07 10:55:41 -0700157 struct bpf_insn *insn, struct bpf_prog *prog);
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700158};
159
160struct bpf_prog_type_list {
161 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100162 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700163 enum bpf_prog_type type;
164};
165
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700166struct bpf_prog_aux {
167 atomic_t refcnt;
Daniel Borkmann24701ec2015-03-01 12:31:47 +0100168 u32 used_map_cnt;
Alexei Starovoitov32bbe002016-04-06 18:43:28 -0700169 u32 max_ctx_offset;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100170 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700171 struct bpf_map **used_maps;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700172 struct bpf_prog *prog;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -0700173 struct user_struct *user;
Alexei Starovoitovabf2e7d2015-05-28 19:26:02 -0700174 union {
175 struct work_struct work;
176 struct rcu_head rcu;
177 };
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700178};
179
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700180struct bpf_array {
181 struct bpf_map map;
182 u32 elem_size;
183 /* 'ownership' of prog_array is claimed by the first program that
184 * is going to use this map or by the first program which FD is stored
185 * in the map to make sure that all callers and callees have the same
186 * prog_type and JITed flag
187 */
188 enum bpf_prog_type owner_prog_type;
189 bool owner_jited;
190 union {
191 char value[0] __aligned(8);
Wang Nan2a36f0b2015-08-06 07:02:33 +0000192 void *ptrs[0] __aligned(8);
Alexei Starovoitova10423b2016-02-01 22:39:54 -0800193 void __percpu *pptrs[0] __aligned(8);
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700194 };
195};
Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200196
/* NOTE(review): presumably the upper bound on chained bpf_tail_call()
 * invocations - confirm against the interpreter/JITs.
 */
#define MAX_TAIL_CALL_CNT 32

Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200199struct bpf_event_entry {
200 struct perf_event *event;
201 struct file *perf_file;
202 struct file *map_file;
203 struct rcu_head rcu;
204};
205
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700206u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
Alexei Starovoitov9940d672016-04-06 18:43:27 -0700207u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200208
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700209bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);
Daniel Borkmannbd570ff2016-04-18 21:01:24 +0200210
Alexei Starovoitov0756ea32015-06-12 19:39:13 -0700211const struct bpf_func_proto *bpf_get_trace_printk_proto(void);
Daniel Borkmann555c8a82016-07-14 18:08:05 +0200212
213typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
214 unsigned long len);
215
216u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
217 void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700218
Alexei Starovoitov89aa0752014-12-01 15:06:35 -0800219#ifdef CONFIG_BPF_SYSCALL
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -0800220DECLARE_PER_CPU(int, bpf_prog_active);
221
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100222void bpf_register_prog_type(struct bpf_prog_type_list *tl);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100223void bpf_register_map_type(struct bpf_map_type_list *tl);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100224
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700225struct bpf_prog *bpf_prog_get(u32 ufd);
Daniel Borkmann113214b2016-06-30 17:24:44 +0200226struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
Alexei Starovoitov92117d82016-04-27 18:56:20 -0700227struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100228void bpf_prog_put(struct bpf_prog *prog);
229
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100230struct bpf_map *bpf_map_get_with_uref(u32 ufd);
Daniel Borkmannc2101292015-10-29 14:58:07 +0100231struct bpf_map *__bpf_map_get(struct fd f);
Alexei Starovoitov92117d82016-04-27 18:56:20 -0700232struct bpf_map *bpf_map_inc(struct bpf_map *map, bool uref);
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100233void bpf_map_put_with_uref(struct bpf_map *map);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100234void bpf_map_put(struct bpf_map *map);
Alexei Starovoitov6c905982016-03-07 21:57:15 -0800235int bpf_map_precharge_memlock(u32 pages);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100236
Alexei Starovoitov1be7f752015-10-07 22:23:21 -0700237extern int sysctl_unprivileged_bpf_disabled;
238
Daniel Borkmannb2197752015-10-29 14:58:09 +0100239int bpf_map_new_fd(struct bpf_map *map);
240int bpf_prog_new_fd(struct bpf_prog *prog);
241
242int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
243int bpf_obj_get_user(const char __user *pathname);
244
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800245int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
246int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
247int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
248 u64 flags);
249int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
250 u64 flags);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200251
Alexei Starovoitov557c0c62016-03-07 21:57:17 -0800252int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800253
Daniel Borkmannd056a782016-06-15 22:47:13 +0200254int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
255 void *key, void *value, u64 map_flags);
256void bpf_fd_array_map_clear(struct bpf_map *map);
257
/* memcpy that is used with 8-byte aligned pointers, a size that is a
 * multiple of 8 bytes, and forced to use 'long' read/writes to try to
 * atomically copy long counters.
 * Best-effort only. No barriers here, since it _will_ race with concurrent
 * updates from BPF programs. Called from bpf syscall and mostly used with
 * size 8 or 16 bytes, so ask compiler to inline it.
 *
 * @dst:  destination buffer
 * @src:  source buffer
 * @size: number of bytes to copy; only whole 'long' words are copied, so a
 *        remainder of size % sizeof(long) bytes is left untouched in @dst
 */
static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
{
	const long *lsrc = src;
	long *ldst = dst;

	/* turn the byte count into a count of 'long' words */
	size /= sizeof(long);
	while (size--)
		*ldst++ = *lsrc++;
}

Daniel Borkmann61e021f2015-03-02 15:21:55 +0100274/* verify correctness of eBPF program */
Alexei Starovoitov9bac3d62015-03-13 11:57:42 -0700275int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100276#else
/* Stub used when CONFIG_BPF_SYSCALL is not set: does nothing. */
static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl)
{
}

281static inline struct bpf_prog *bpf_prog_get(u32 ufd)
282{
283 return ERR_PTR(-EOPNOTSUPP);
284}
285
Daniel Borkmann113214b2016-06-30 17:24:44 +0200286static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
287 enum bpf_prog_type type)
288{
289 return ERR_PTR(-EOPNOTSUPP);
290}
291
/* Stub used when CONFIG_BPF_SYSCALL is not set: does nothing. */
static inline void bpf_prog_put(struct bpf_prog *prog)
{
}
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100295#endif /* CONFIG_BPF_SYSCALL */
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700296
Alexei Starovoitovd0003ec2014-11-13 17:36:49 -0800297/* verifier prototypes for helper functions called from eBPF programs */
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100298extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
299extern const struct bpf_func_proto bpf_map_update_elem_proto;
300extern const struct bpf_func_proto bpf_map_delete_elem_proto;
Alexei Starovoitovd0003ec2014-11-13 17:36:49 -0800301
Daniel Borkmann03e69b52015-03-14 02:27:16 +0100302extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
Daniel Borkmannc04167c2015-03-14 02:27:17 +0100303extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700304extern const struct bpf_func_proto bpf_tail_call_proto;
Daniel Borkmann17ca8cb2015-05-29 23:23:06 +0200305extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
Alexei Starovoitovffeedaf2015-06-12 19:39:12 -0700306extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
307extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
308extern const struct bpf_func_proto bpf_get_current_comm_proto;
Alexei Starovoitov4e10df92015-07-20 20:34:18 -0700309extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
310extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
Alexei Starovoitovd5a3b1f2016-02-17 19:58:58 -0800311extern const struct bpf_func_proto bpf_get_stackid_proto;
Daniel Borkmann03e69b52015-03-14 02:27:16 +0100312
Daniel Borkmann3ad00402015-10-08 01:20:39 +0200313/* Shared helpers among cBPF and eBPF. */
314void bpf_user_rnd_init_once(void);
315u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
316
Alexei Starovoitov99c55f72014-09-26 00:16:57 -0700317#endif /* _LINUX_BPF_H */