blob: 28cb5fa5af927dbe7237ce77f76d52f52642be4f [file] [log] [blame]
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +01001/*
2 * Berkeley Packet Filter based traffic classifier
3 *
4 * Might be used to classify traffic through flexible, user-defined and
5 * possibly JIT-ed BPF filters for traffic control as an alternative to
6 * ematches.
7 *
8 * (C) 2013 Daniel Borkmann <dborkman@redhat.com>
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License version 2 as
12 * published by the Free Software Foundation.
13 */
14
15#include <linux/module.h>
16#include <linux/types.h>
17#include <linux/skbuff.h>
18#include <linux/filter.h>
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010019#include <linux/bpf.h>
20
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010021#include <net/rtnetlink.h>
22#include <net/pkt_cls.h>
23#include <net/sock.h>
24
25MODULE_LICENSE("GPL");
26MODULE_AUTHOR("Daniel Borkmann <dborkman@redhat.com>");
27MODULE_DESCRIPTION("TC BPF based classifier");
28
/* Length limit applied to the TCA_BPF_NAME string attribute in bpf_policy. */
#define CLS_BPF_NAME_LEN	256

/* Bits of TCA_BPF_FLAGS_GEN that cls_bpf_modify_existing() will accept. */
#define CLS_BPF_SUPPORTED_GEN_FLAGS		\
	(TCA_CLS_FLAGS_SKIP_SW | TCA_CLS_FLAGS_SKIP_HW)
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010032
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010033struct cls_bpf_head {
34 struct list_head plist;
35 u32 hgen;
John Fastabend1f947bf2014-09-12 20:10:24 -070036 struct rcu_head rcu;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010037};
38
39struct cls_bpf_prog {
Alexei Starovoitov7ae457c2014-07-30 20:34:16 -070040 struct bpf_prog *filter;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010041 struct list_head link;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010042 struct tcf_result res;
Daniel Borkmann045efa82015-09-15 23:05:42 -070043 bool exts_integrated;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +010044 bool offloaded;
Jakub Kicinski0d01d452016-09-21 11:43:54 +010045 u32 gen_flags;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010046 struct tcf_exts exts;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010047 u32 handle;
Daniel Borkmann55556dd2016-11-26 01:28:05 +010048 u16 bpf_num_ops;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010049 struct sock_filter *bpf_ops;
50 const char *bpf_name;
John Fastabend1f947bf2014-09-12 20:10:24 -070051 struct tcf_proto *tp;
52 struct rcu_head rcu;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010053};
54
55static const struct nla_policy bpf_policy[TCA_BPF_MAX + 1] = {
56 [TCA_BPF_CLASSID] = { .type = NLA_U32 },
Daniel Borkmann045efa82015-09-15 23:05:42 -070057 [TCA_BPF_FLAGS] = { .type = NLA_U32 },
Jakub Kicinski0d01d452016-09-21 11:43:54 +010058 [TCA_BPF_FLAGS_GEN] = { .type = NLA_U32 },
Daniel Borkmanne2e9b652015-03-01 12:31:48 +010059 [TCA_BPF_FD] = { .type = NLA_U32 },
Jamal Hadi Salim5a7a5552016-09-18 08:45:33 -040060 [TCA_BPF_NAME] = { .type = NLA_NUL_STRING,
61 .len = CLS_BPF_NAME_LEN },
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010062 [TCA_BPF_OPS_LEN] = { .type = NLA_U16 },
63 [TCA_BPF_OPS] = { .type = NLA_BINARY,
64 .len = sizeof(struct sock_filter) * BPF_MAXINSNS },
65};
66
/*
 * Filter the return value of a direct-action program.
 *
 * The opcodes TC_ACT_OK, TC_ACT_SHOT, TC_ACT_STOLEN, TC_ACT_REDIRECT and
 * TC_ACT_UNSPEC are passed through unchanged; every other value is mapped
 * to TC_ACT_UNSPEC.
 */
static int cls_bpf_exec_opcode(int code)
{
	if (code == TC_ACT_OK || code == TC_ACT_SHOT ||
	    code == TC_ACT_STOLEN || code == TC_ACT_REDIRECT ||
	    code == TC_ACT_UNSPEC)
		return code;

	return TC_ACT_UNSPEC;
}
80
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010081static int cls_bpf_classify(struct sk_buff *skb, const struct tcf_proto *tp,
82 struct tcf_result *res)
83{
WANG Cong80dcbd12014-09-15 14:21:50 -070084 struct cls_bpf_head *head = rcu_dereference_bh(tp->root);
Daniel Borkmannfdc54322016-01-07 15:50:22 +010085 bool at_ingress = skb_at_tc_ingress(skb);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010086 struct cls_bpf_prog *prog;
Daniel Borkmann54720df2015-03-12 20:03:12 +010087 int ret = -1;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +010088
Daniel Borkmann54720df2015-03-12 20:03:12 +010089 /* Needed here for accessing maps. */
90 rcu_read_lock();
John Fastabend1f947bf2014-09-12 20:10:24 -070091 list_for_each_entry_rcu(prog, &head->plist, link) {
Alexei Starovoitov34312052015-06-04 10:11:53 -070092 int filter_res;
93
Daniel Borkmann045efa82015-09-15 23:05:42 -070094 qdisc_skb_cb(skb)->tc_classid = prog->res.classid;
95
Jakub Kicinskieadb4142016-09-21 11:43:55 +010096 if (tc_skip_sw(prog->gen_flags)) {
97 filter_res = prog->exts_integrated ? TC_ACT_UNSPEC : 0;
98 } else if (at_ingress) {
Alexei Starovoitov34312052015-06-04 10:11:53 -070099 /* It is safe to push/pull even if skb_shared() */
100 __skb_push(skb, skb->mac_len);
Alexei Starovoitovdb58ba42016-05-05 19:49:12 -0700101 bpf_compute_data_end(skb);
Alexei Starovoitov34312052015-06-04 10:11:53 -0700102 filter_res = BPF_PROG_RUN(prog->filter, skb);
103 __skb_pull(skb, skb->mac_len);
104 } else {
Alexei Starovoitovdb58ba42016-05-05 19:49:12 -0700105 bpf_compute_data_end(skb);
Alexei Starovoitov34312052015-06-04 10:11:53 -0700106 filter_res = BPF_PROG_RUN(prog->filter, skb);
107 }
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100108
Daniel Borkmann045efa82015-09-15 23:05:42 -0700109 if (prog->exts_integrated) {
Daniel Borkmann3a461da2016-03-15 22:41:22 +0100110 res->class = 0;
111 res->classid = TC_H_MAJ(prog->res.classid) |
112 qdisc_skb_cb(skb)->tc_classid;
Daniel Borkmann045efa82015-09-15 23:05:42 -0700113
114 ret = cls_bpf_exec_opcode(filter_res);
115 if (ret == TC_ACT_UNSPEC)
116 continue;
117 break;
118 }
119
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100120 if (filter_res == 0)
121 continue;
Daniel Borkmann3a461da2016-03-15 22:41:22 +0100122 if (filter_res != -1) {
123 res->class = 0;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100124 res->classid = filter_res;
Daniel Borkmann3a461da2016-03-15 22:41:22 +0100125 } else {
126 *res = prog->res;
127 }
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100128
129 ret = tcf_exts_exec(skb, &prog->exts, res);
130 if (ret < 0)
131 continue;
132
Daniel Borkmann54720df2015-03-12 20:03:12 +0100133 break;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100134 }
Daniel Borkmann54720df2015-03-12 20:03:12 +0100135 rcu_read_unlock();
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100136
Daniel Borkmann54720df2015-03-12 20:03:12 +0100137 return ret;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100138}
139
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100140static bool cls_bpf_is_ebpf(const struct cls_bpf_prog *prog)
141{
142 return !prog->bpf_ops;
143}
144
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100145static int cls_bpf_offload_cmd(struct tcf_proto *tp, struct cls_bpf_prog *prog,
146 enum tc_clsbpf_command cmd)
147{
148 struct net_device *dev = tp->q->dev_queue->dev;
149 struct tc_cls_bpf_offload bpf_offload = {};
150 struct tc_to_netdev offload;
151
152 offload.type = TC_SETUP_CLSBPF;
153 offload.cls_bpf = &bpf_offload;
154
155 bpf_offload.command = cmd;
156 bpf_offload.exts = &prog->exts;
157 bpf_offload.prog = prog->filter;
158 bpf_offload.name = prog->bpf_name;
159 bpf_offload.exts_integrated = prog->exts_integrated;
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100160 bpf_offload.gen_flags = prog->gen_flags;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100161
162 return dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
163 tp->protocol, &offload);
164}
165
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100166static int cls_bpf_offload(struct tcf_proto *tp, struct cls_bpf_prog *prog,
167 struct cls_bpf_prog *oldprog)
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100168{
169 struct net_device *dev = tp->q->dev_queue->dev;
170 struct cls_bpf_prog *obj = prog;
171 enum tc_clsbpf_command cmd;
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100172 bool skip_sw;
173 int ret;
174
175 skip_sw = tc_skip_sw(prog->gen_flags) ||
176 (oldprog && tc_skip_sw(oldprog->gen_flags));
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100177
178 if (oldprog && oldprog->offloaded) {
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100179 if (tc_should_offload(dev, tp, prog->gen_flags)) {
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100180 cmd = TC_CLSBPF_REPLACE;
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100181 } else if (!tc_skip_sw(prog->gen_flags)) {
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100182 obj = oldprog;
183 cmd = TC_CLSBPF_DESTROY;
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100184 } else {
185 return -EINVAL;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100186 }
187 } else {
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100188 if (!tc_should_offload(dev, tp, prog->gen_flags))
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100189 return skip_sw ? -EINVAL : 0;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100190 cmd = TC_CLSBPF_ADD;
191 }
192
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100193 ret = cls_bpf_offload_cmd(tp, obj, cmd);
194 if (ret)
195 return skip_sw ? ret : 0;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100196
197 obj->offloaded = true;
198 if (oldprog)
199 oldprog->offloaded = false;
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100200
201 return 0;
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100202}
203
204static void cls_bpf_stop_offload(struct tcf_proto *tp,
205 struct cls_bpf_prog *prog)
206{
207 int err;
208
209 if (!prog->offloaded)
210 return;
211
212 err = cls_bpf_offload_cmd(tp, prog, TC_CLSBPF_DESTROY);
213 if (err) {
214 pr_err("Stopping hardware offload failed: %d\n", err);
215 return;
216 }
217
218 prog->offloaded = false;
219}
220
Jakub Kicinski68d64062016-09-21 11:44:02 +0100221static void cls_bpf_offload_update_stats(struct tcf_proto *tp,
222 struct cls_bpf_prog *prog)
223{
224 if (!prog->offloaded)
225 return;
226
227 cls_bpf_offload_cmd(tp, prog, TC_CLSBPF_STATS);
228}
229
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100230static int cls_bpf_init(struct tcf_proto *tp)
231{
232 struct cls_bpf_head *head;
233
234 head = kzalloc(sizeof(*head), GFP_KERNEL);
235 if (head == NULL)
236 return -ENOBUFS;
237
John Fastabend1f947bf2014-09-12 20:10:24 -0700238 INIT_LIST_HEAD_RCU(&head->plist);
239 rcu_assign_pointer(tp->root, head);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100240
241 return 0;
242}
243
244static void cls_bpf_delete_prog(struct tcf_proto *tp, struct cls_bpf_prog *prog)
245{
WANG Cong18d02642014-09-25 10:26:37 -0700246 tcf_exts_destroy(&prog->exts);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100247
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100248 if (cls_bpf_is_ebpf(prog))
249 bpf_prog_put(prog->filter);
250 else
251 bpf_prog_destroy(prog->filter);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100252
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100253 kfree(prog->bpf_name);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100254 kfree(prog->bpf_ops);
255 kfree(prog);
256}
257
John Fastabend1f947bf2014-09-12 20:10:24 -0700258static void __cls_bpf_delete_prog(struct rcu_head *rcu)
259{
260 struct cls_bpf_prog *prog = container_of(rcu, struct cls_bpf_prog, rcu);
261
262 cls_bpf_delete_prog(prog->tp, prog);
263}
264
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100265static int cls_bpf_delete(struct tcf_proto *tp, unsigned long arg)
266{
Jiri Pirko472f5832014-12-02 18:00:32 +0100267 struct cls_bpf_prog *prog = (struct cls_bpf_prog *) arg;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100268
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100269 cls_bpf_stop_offload(tp, prog);
Jiri Pirko472f5832014-12-02 18:00:32 +0100270 list_del_rcu(&prog->link);
271 tcf_unbind_filter(tp, &prog->res);
272 call_rcu(&prog->rcu, __cls_bpf_delete_prog);
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100273
Jiri Pirko472f5832014-12-02 18:00:32 +0100274 return 0;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100275}
276
Cong Wang1e052be2015-03-06 11:47:59 -0800277static bool cls_bpf_destroy(struct tcf_proto *tp, bool force)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100278{
John Fastabend1f947bf2014-09-12 20:10:24 -0700279 struct cls_bpf_head *head = rtnl_dereference(tp->root);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100280 struct cls_bpf_prog *prog, *tmp;
281
Cong Wang1e052be2015-03-06 11:47:59 -0800282 if (!force && !list_empty(&head->plist))
283 return false;
284
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100285 list_for_each_entry_safe(prog, tmp, &head->plist, link) {
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100286 cls_bpf_stop_offload(tp, prog);
John Fastabend1f947bf2014-09-12 20:10:24 -0700287 list_del_rcu(&prog->link);
John Fastabend18cdb372014-10-05 21:28:52 -0700288 tcf_unbind_filter(tp, &prog->res);
John Fastabend1f947bf2014-09-12 20:10:24 -0700289 call_rcu(&prog->rcu, __cls_bpf_delete_prog);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100290 }
291
John Fastabend1f947bf2014-09-12 20:10:24 -0700292 RCU_INIT_POINTER(tp->root, NULL);
293 kfree_rcu(head, rcu);
Cong Wang1e052be2015-03-06 11:47:59 -0800294 return true;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100295}
296
297static unsigned long cls_bpf_get(struct tcf_proto *tp, u32 handle)
298{
John Fastabend1f947bf2014-09-12 20:10:24 -0700299 struct cls_bpf_head *head = rtnl_dereference(tp->root);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100300 struct cls_bpf_prog *prog;
301 unsigned long ret = 0UL;
302
303 if (head == NULL)
304 return 0UL;
305
Jiri Pirko3fe6b492014-12-02 18:00:33 +0100306 list_for_each_entry(prog, &head->plist, link) {
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100307 if (prog->handle == handle) {
308 ret = (unsigned long) prog;
309 break;
310 }
311 }
312
313 return ret;
314}
315
Daniel Borkmann045efa82015-09-15 23:05:42 -0700316static int cls_bpf_prog_from_ops(struct nlattr **tb, struct cls_bpf_prog *prog)
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100317{
318 struct sock_filter *bpf_ops;
319 struct sock_fprog_kern fprog_tmp;
320 struct bpf_prog *fp;
321 u16 bpf_size, bpf_num_ops;
322 int ret;
323
324 bpf_num_ops = nla_get_u16(tb[TCA_BPF_OPS_LEN]);
325 if (bpf_num_ops > BPF_MAXINSNS || bpf_num_ops == 0)
326 return -EINVAL;
327
328 bpf_size = bpf_num_ops * sizeof(*bpf_ops);
329 if (bpf_size != nla_len(tb[TCA_BPF_OPS]))
330 return -EINVAL;
331
332 bpf_ops = kzalloc(bpf_size, GFP_KERNEL);
333 if (bpf_ops == NULL)
334 return -ENOMEM;
335
336 memcpy(bpf_ops, nla_data(tb[TCA_BPF_OPS]), bpf_size);
337
338 fprog_tmp.len = bpf_num_ops;
339 fprog_tmp.filter = bpf_ops;
340
341 ret = bpf_prog_create(&fp, &fprog_tmp);
342 if (ret < 0) {
343 kfree(bpf_ops);
344 return ret;
345 }
346
347 prog->bpf_ops = bpf_ops;
348 prog->bpf_num_ops = bpf_num_ops;
349 prog->bpf_name = NULL;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100350 prog->filter = fp;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100351
352 return 0;
353}
354
Daniel Borkmannc46646d2015-09-30 01:41:51 +0200355static int cls_bpf_prog_from_efd(struct nlattr **tb, struct cls_bpf_prog *prog,
356 const struct tcf_proto *tp)
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100357{
358 struct bpf_prog *fp;
359 char *name = NULL;
360 u32 bpf_fd;
361
362 bpf_fd = nla_get_u32(tb[TCA_BPF_FD]);
363
Daniel Borkmann113214b2016-06-30 17:24:44 +0200364 fp = bpf_prog_get_type(bpf_fd, BPF_PROG_TYPE_SCHED_CLS);
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100365 if (IS_ERR(fp))
366 return PTR_ERR(fp);
367
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100368 if (tb[TCA_BPF_NAME]) {
Thomas Grafb15ca182016-10-26 10:53:16 +0200369 name = nla_memdup(tb[TCA_BPF_NAME], GFP_KERNEL);
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100370 if (!name) {
371 bpf_prog_put(fp);
372 return -ENOMEM;
373 }
374 }
375
376 prog->bpf_ops = NULL;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100377 prog->bpf_name = name;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100378 prog->filter = fp;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100379
Daniel Borkmann1f211a12016-01-07 22:29:47 +0100380 if (fp->dst_needed && !(tp->q->flags & TCQ_F_INGRESS))
Daniel Borkmannc46646d2015-09-30 01:41:51 +0200381 netif_keep_dst(qdisc_dev(tp->q));
382
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100383 return 0;
384}
385
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100386static int cls_bpf_modify_existing(struct net *net, struct tcf_proto *tp,
387 struct cls_bpf_prog *prog,
388 unsigned long base, struct nlattr **tb,
Cong Wang2f7ef2f2014-04-25 13:54:06 -0700389 struct nlattr *est, bool ovr)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100390{
Daniel Borkmann045efa82015-09-15 23:05:42 -0700391 bool is_bpf, is_ebpf, have_exts = false;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100392 struct tcf_exts exts;
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100393 u32 gen_flags = 0;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100394 int ret;
395
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100396 is_bpf = tb[TCA_BPF_OPS_LEN] && tb[TCA_BPF_OPS];
397 is_ebpf = tb[TCA_BPF_FD];
Daniel Borkmannef146fa2015-09-23 21:56:47 +0200398 if ((!is_bpf && !is_ebpf) || (is_bpf && is_ebpf))
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100399 return -EINVAL;
400
WANG Congb9a24bb2016-08-19 12:36:54 -0700401 ret = tcf_exts_init(&exts, TCA_BPF_ACT, TCA_BPF_POLICE);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100402 if (ret < 0)
403 return ret;
WANG Congb9a24bb2016-08-19 12:36:54 -0700404 ret = tcf_exts_validate(net, tp, tb, est, &exts, ovr);
405 if (ret < 0)
406 goto errout;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100407
Daniel Borkmann045efa82015-09-15 23:05:42 -0700408 if (tb[TCA_BPF_FLAGS]) {
409 u32 bpf_flags = nla_get_u32(tb[TCA_BPF_FLAGS]);
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100410
Daniel Borkmann045efa82015-09-15 23:05:42 -0700411 if (bpf_flags & ~TCA_BPF_FLAG_ACT_DIRECT) {
WANG Congb9a24bb2016-08-19 12:36:54 -0700412 ret = -EINVAL;
413 goto errout;
Daniel Borkmann045efa82015-09-15 23:05:42 -0700414 }
415
416 have_exts = bpf_flags & TCA_BPF_FLAG_ACT_DIRECT;
417 }
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100418 if (tb[TCA_BPF_FLAGS_GEN]) {
419 gen_flags = nla_get_u32(tb[TCA_BPF_FLAGS_GEN]);
420 if (gen_flags & ~CLS_BPF_SUPPORTED_GEN_FLAGS ||
421 !tc_flags_valid(gen_flags)) {
422 ret = -EINVAL;
423 goto errout;
424 }
425 }
Daniel Borkmann045efa82015-09-15 23:05:42 -0700426
Daniel Borkmann045efa82015-09-15 23:05:42 -0700427 prog->exts_integrated = have_exts;
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100428 prog->gen_flags = gen_flags;
Daniel Borkmann045efa82015-09-15 23:05:42 -0700429
430 ret = is_bpf ? cls_bpf_prog_from_ops(tb, prog) :
Daniel Borkmannc46646d2015-09-30 01:41:51 +0200431 cls_bpf_prog_from_efd(tb, prog, tp);
WANG Congb9a24bb2016-08-19 12:36:54 -0700432 if (ret < 0)
433 goto errout;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100434
Daniel Borkmannef146fa2015-09-23 21:56:47 +0200435 if (tb[TCA_BPF_CLASSID]) {
436 prog->res.classid = nla_get_u32(tb[TCA_BPF_CLASSID]);
437 tcf_bind_filter(tp, &prog->res, base);
438 }
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100439
Daniel Borkmannef146fa2015-09-23 21:56:47 +0200440 tcf_exts_change(tp, &prog->exts, &exts);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100441 return 0;
WANG Congb9a24bb2016-08-19 12:36:54 -0700442
443errout:
444 tcf_exts_destroy(&exts);
445 return ret;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100446}
447
448static u32 cls_bpf_grab_new_handle(struct tcf_proto *tp,
449 struct cls_bpf_head *head)
450{
451 unsigned int i = 0x80000000;
Daniel Borkmann3f2ab132015-01-22 10:41:02 +0100452 u32 handle;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100453
454 do {
455 if (++head->hgen == 0x7FFFFFFF)
456 head->hgen = 1;
457 } while (--i > 0 && cls_bpf_get(tp, head->hgen));
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100458
Daniel Borkmann3f2ab132015-01-22 10:41:02 +0100459 if (unlikely(i == 0)) {
460 pr_err("Insufficient number of handles\n");
461 handle = 0;
462 } else {
463 handle = head->hgen;
464 }
465
466 return handle;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100467}
468
469static int cls_bpf_change(struct net *net, struct sk_buff *in_skb,
470 struct tcf_proto *tp, unsigned long base,
471 u32 handle, struct nlattr **tca,
Cong Wang2f7ef2f2014-04-25 13:54:06 -0700472 unsigned long *arg, bool ovr)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100473{
John Fastabend1f947bf2014-09-12 20:10:24 -0700474 struct cls_bpf_head *head = rtnl_dereference(tp->root);
475 struct cls_bpf_prog *oldprog = (struct cls_bpf_prog *) *arg;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100476 struct nlattr *tb[TCA_BPF_MAX + 1];
John Fastabend1f947bf2014-09-12 20:10:24 -0700477 struct cls_bpf_prog *prog;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100478 int ret;
479
480 if (tca[TCA_OPTIONS] == NULL)
481 return -EINVAL;
482
483 ret = nla_parse_nested(tb, TCA_BPF_MAX, tca[TCA_OPTIONS], bpf_policy);
484 if (ret < 0)
485 return ret;
486
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100487 prog = kzalloc(sizeof(*prog), GFP_KERNEL);
John Fastabend1f947bf2014-09-12 20:10:24 -0700488 if (!prog)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100489 return -ENOBUFS;
490
WANG Congb9a24bb2016-08-19 12:36:54 -0700491 ret = tcf_exts_init(&prog->exts, TCA_BPF_ACT, TCA_BPF_POLICE);
492 if (ret < 0)
493 goto errout;
John Fastabend1f947bf2014-09-12 20:10:24 -0700494
495 if (oldprog) {
496 if (handle && oldprog->handle != handle) {
497 ret = -EINVAL;
498 goto errout;
499 }
500 }
501
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100502 if (handle == 0)
503 prog->handle = cls_bpf_grab_new_handle(tp, head);
504 else
505 prog->handle = handle;
506 if (prog->handle == 0) {
507 ret = -EINVAL;
508 goto errout;
509 }
510
Jamal Hadi Salim5a7a5552016-09-18 08:45:33 -0400511 ret = cls_bpf_modify_existing(net, tp, prog, base, tb, tca[TCA_RATE],
512 ovr);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100513 if (ret < 0)
514 goto errout;
515
Jakub Kicinskieadb4142016-09-21 11:43:55 +0100516 ret = cls_bpf_offload(tp, prog, oldprog);
517 if (ret) {
518 cls_bpf_delete_prog(tp, prog);
519 return ret;
520 }
Jakub Kicinski332ae8e2016-09-21 11:43:53 +0100521
John Fastabend1f947bf2014-09-12 20:10:24 -0700522 if (oldprog) {
Daniel Borkmannf6bfc462015-07-17 22:38:43 +0200523 list_replace_rcu(&oldprog->link, &prog->link);
John Fastabend18cdb372014-10-05 21:28:52 -0700524 tcf_unbind_filter(tp, &oldprog->res);
John Fastabend1f947bf2014-09-12 20:10:24 -0700525 call_rcu(&oldprog->rcu, __cls_bpf_delete_prog);
526 } else {
527 list_add_rcu(&prog->link, &head->plist);
528 }
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100529
530 *arg = (unsigned long) prog;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100531 return 0;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100532
WANG Congb9a24bb2016-08-19 12:36:54 -0700533errout:
534 tcf_exts_destroy(&prog->exts);
535 kfree(prog);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100536 return ret;
537}
538
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100539static int cls_bpf_dump_bpf_info(const struct cls_bpf_prog *prog,
540 struct sk_buff *skb)
541{
542 struct nlattr *nla;
543
544 if (nla_put_u16(skb, TCA_BPF_OPS_LEN, prog->bpf_num_ops))
545 return -EMSGSIZE;
546
547 nla = nla_reserve(skb, TCA_BPF_OPS, prog->bpf_num_ops *
548 sizeof(struct sock_filter));
549 if (nla == NULL)
550 return -EMSGSIZE;
551
552 memcpy(nla_data(nla), prog->bpf_ops, nla_len(nla));
553
554 return 0;
555}
556
557static int cls_bpf_dump_ebpf_info(const struct cls_bpf_prog *prog,
558 struct sk_buff *skb)
559{
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100560 if (prog->bpf_name &&
561 nla_put_string(skb, TCA_BPF_NAME, prog->bpf_name))
562 return -EMSGSIZE;
563
564 return 0;
565}
566
WANG Cong832d1d52014-01-09 16:14:01 -0800567static int cls_bpf_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100568 struct sk_buff *skb, struct tcmsg *tm)
569{
570 struct cls_bpf_prog *prog = (struct cls_bpf_prog *) fh;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100571 struct nlattr *nest;
Daniel Borkmannbf007d12015-09-23 21:56:46 +0200572 u32 bpf_flags = 0;
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100573 int ret;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100574
575 if (prog == NULL)
576 return skb->len;
577
578 tm->tcm_handle = prog->handle;
579
Jakub Kicinski68d64062016-09-21 11:44:02 +0100580 cls_bpf_offload_update_stats(tp, prog);
581
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100582 nest = nla_nest_start(skb, TCA_OPTIONS);
583 if (nest == NULL)
584 goto nla_put_failure;
585
Daniel Borkmannef146fa2015-09-23 21:56:47 +0200586 if (prog->res.classid &&
587 nla_put_u32(skb, TCA_BPF_CLASSID, prog->res.classid))
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100588 goto nla_put_failure;
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100589
Daniel Borkmanne2e9b652015-03-01 12:31:48 +0100590 if (cls_bpf_is_ebpf(prog))
591 ret = cls_bpf_dump_ebpf_info(prog, skb);
592 else
593 ret = cls_bpf_dump_bpf_info(prog, skb);
594 if (ret)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100595 goto nla_put_failure;
596
WANG Cong5da57f42013-12-15 20:15:07 -0800597 if (tcf_exts_dump(skb, &prog->exts) < 0)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100598 goto nla_put_failure;
599
Daniel Borkmannbf007d12015-09-23 21:56:46 +0200600 if (prog->exts_integrated)
601 bpf_flags |= TCA_BPF_FLAG_ACT_DIRECT;
602 if (bpf_flags && nla_put_u32(skb, TCA_BPF_FLAGS, bpf_flags))
603 goto nla_put_failure;
Jakub Kicinski0d01d452016-09-21 11:43:54 +0100604 if (prog->gen_flags &&
605 nla_put_u32(skb, TCA_BPF_FLAGS_GEN, prog->gen_flags))
606 goto nla_put_failure;
Daniel Borkmannbf007d12015-09-23 21:56:46 +0200607
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100608 nla_nest_end(skb, nest);
609
WANG Cong5da57f42013-12-15 20:15:07 -0800610 if (tcf_exts_dump_stats(skb, &prog->exts) < 0)
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100611 goto nla_put_failure;
612
613 return skb->len;
614
615nla_put_failure:
616 nla_nest_cancel(skb, nest);
617 return -1;
618}
619
620static void cls_bpf_walk(struct tcf_proto *tp, struct tcf_walker *arg)
621{
John Fastabend1f947bf2014-09-12 20:10:24 -0700622 struct cls_bpf_head *head = rtnl_dereference(tp->root);
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100623 struct cls_bpf_prog *prog;
624
Jiri Pirko3fe6b492014-12-02 18:00:33 +0100625 list_for_each_entry(prog, &head->plist, link) {
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100626 if (arg->count < arg->skip)
627 goto skip;
628 if (arg->fn(tp, (unsigned long) prog, arg) < 0) {
629 arg->stop = 1;
630 break;
631 }
632skip:
633 arg->count++;
634 }
635}
636
637static struct tcf_proto_ops cls_bpf_ops __read_mostly = {
638 .kind = "bpf",
639 .owner = THIS_MODULE,
640 .classify = cls_bpf_classify,
641 .init = cls_bpf_init,
642 .destroy = cls_bpf_destroy,
643 .get = cls_bpf_get,
Daniel Borkmann7d1d65c2013-10-28 16:43:02 +0100644 .change = cls_bpf_change,
645 .delete = cls_bpf_delete,
646 .walk = cls_bpf_walk,
647 .dump = cls_bpf_dump,
648};
649
650static int __init cls_bpf_init_mod(void)
651{
652 return register_tcf_proto_ops(&cls_bpf_ops);
653}
654
655static void __exit cls_bpf_exit_mod(void)
656{
657 unregister_tcf_proto_ops(&cls_bpf_ops);
658}
659
660module_init(cls_bpf_init_mod);
661module_exit(cls_bpf_exit_mod);