blob: 963e4bf0aab8ae23d999305208c757fbc0f49ebe [file] [log] [blame]
/*
 * net/sched/cls_api.c	Packet classifier API.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 *
 * Eduardo J. Blanco <ejbs@netlabs.com.uy> :990222: kmod support
 *
 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
18#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/string.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/errno.h>
Jiri Pirko33a48922017-02-09 14:38:57 +010022#include <linux/err.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/init.h>
25#include <linux/kmod.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090026#include <linux/slab.h>
Jiri Pirko48617382018-01-17 11:46:46 +010027#include <linux/idr.h>
Denis V. Lunevb8542722007-12-01 00:21:31 +110028#include <net/net_namespace.h>
29#include <net/sock.h>
Arnaldo Carvalho de Melodc5fc572007-03-25 23:06:12 -070030#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#include <net/pkt_sched.h>
32#include <net/pkt_cls.h>
33
Linus Torvalds1da177e2005-04-16 15:20:36 -070034/* The list of all installed classifier types */
WANG Cong36272872013-12-15 20:15:11 -080035static LIST_HEAD(tcf_proto_base);
Linus Torvalds1da177e2005-04-16 15:20:36 -070036
37/* Protects list of registered TC modules. It is pure SMP lock. */
38static DEFINE_RWLOCK(cls_mod_lock);
39
40/* Find classifier type by string name */
41
Jiri Pirko33a48922017-02-09 14:38:57 +010042static const struct tcf_proto_ops *tcf_proto_lookup_ops(const char *kind)
Linus Torvalds1da177e2005-04-16 15:20:36 -070043{
Eric Dumazetdcd76082013-12-20 10:04:18 -080044 const struct tcf_proto_ops *t, *res = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46 if (kind) {
47 read_lock(&cls_mod_lock);
WANG Cong36272872013-12-15 20:15:11 -080048 list_for_each_entry(t, &tcf_proto_base, head) {
Jiri Pirko33a48922017-02-09 14:38:57 +010049 if (strcmp(kind, t->kind) == 0) {
Eric Dumazetdcd76082013-12-20 10:04:18 -080050 if (try_module_get(t->owner))
51 res = t;
Linus Torvalds1da177e2005-04-16 15:20:36 -070052 break;
53 }
54 }
55 read_unlock(&cls_mod_lock);
56 }
Eric Dumazetdcd76082013-12-20 10:04:18 -080057 return res;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058}
59
60/* Register(unregister) new classifier type */
61
62int register_tcf_proto_ops(struct tcf_proto_ops *ops)
63{
WANG Cong36272872013-12-15 20:15:11 -080064 struct tcf_proto_ops *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -070065 int rc = -EEXIST;
66
67 write_lock(&cls_mod_lock);
WANG Cong36272872013-12-15 20:15:11 -080068 list_for_each_entry(t, &tcf_proto_base, head)
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 if (!strcmp(ops->kind, t->kind))
70 goto out;
71
WANG Cong36272872013-12-15 20:15:11 -080072 list_add_tail(&ops->head, &tcf_proto_base);
Linus Torvalds1da177e2005-04-16 15:20:36 -070073 rc = 0;
74out:
75 write_unlock(&cls_mod_lock);
76 return rc;
77}
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -080078EXPORT_SYMBOL(register_tcf_proto_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Cong Wang7aa00452017-10-26 18:24:28 -070080static struct workqueue_struct *tc_filter_wq;
81
Linus Torvalds1da177e2005-04-16 15:20:36 -070082int unregister_tcf_proto_ops(struct tcf_proto_ops *ops)
83{
WANG Cong36272872013-12-15 20:15:11 -080084 struct tcf_proto_ops *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -070085 int rc = -ENOENT;
86
Daniel Borkmannc78e1742015-05-20 17:13:33 +020087 /* Wait for outstanding call_rcu()s, if any, from a
88 * tcf_proto_ops's destroy() handler.
89 */
90 rcu_barrier();
Cong Wang7aa00452017-10-26 18:24:28 -070091 flush_workqueue(tc_filter_wq);
Daniel Borkmannc78e1742015-05-20 17:13:33 +020092
Linus Torvalds1da177e2005-04-16 15:20:36 -070093 write_lock(&cls_mod_lock);
Eric Dumazetdcd76082013-12-20 10:04:18 -080094 list_for_each_entry(t, &tcf_proto_base, head) {
95 if (t == ops) {
96 list_del(&t->head);
97 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070098 break;
Eric Dumazetdcd76082013-12-20 10:04:18 -080099 }
100 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 write_unlock(&cls_mod_lock);
102 return rc;
103}
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -0800104EXPORT_SYMBOL(unregister_tcf_proto_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105
Cong Wang7aa00452017-10-26 18:24:28 -0700106bool tcf_queue_work(struct work_struct *work)
107{
108 return queue_work(tc_filter_wq, work);
109}
110EXPORT_SYMBOL(tcf_queue_work);
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112/* Select new prio value from the range, managed by kernel. */
113
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -0800114static inline u32 tcf_auto_prio(struct tcf_proto *tp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115{
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -0800116 u32 first = TC_H_MAKE(0xC0000000U, 0U);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117
118 if (tp)
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000119 first = tp->prio - 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
Jiri Pirko79619732017-05-17 11:07:58 +0200121 return TC_H_MAJ(first);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122}
123
Jiri Pirko33a48922017-02-09 14:38:57 +0100124static struct tcf_proto *tcf_proto_create(const char *kind, u32 protocol,
Alexander Aringc35a4ac2018-01-18 11:20:50 -0500125 u32 prio, struct tcf_chain *chain,
126 struct netlink_ext_ack *extack)
Jiri Pirko33a48922017-02-09 14:38:57 +0100127{
128 struct tcf_proto *tp;
129 int err;
130
131 tp = kzalloc(sizeof(*tp), GFP_KERNEL);
132 if (!tp)
133 return ERR_PTR(-ENOBUFS);
134
135 err = -ENOENT;
136 tp->ops = tcf_proto_lookup_ops(kind);
137 if (!tp->ops) {
138#ifdef CONFIG_MODULES
139 rtnl_unlock();
140 request_module("cls_%s", kind);
141 rtnl_lock();
142 tp->ops = tcf_proto_lookup_ops(kind);
143 /* We dropped the RTNL semaphore in order to perform
144 * the module load. So, even if we succeeded in loading
145 * the module we have to replay the request. We indicate
146 * this using -EAGAIN.
147 */
148 if (tp->ops) {
149 module_put(tp->ops->owner);
150 err = -EAGAIN;
151 } else {
Alexander Aringc35a4ac2018-01-18 11:20:50 -0500152 NL_SET_ERR_MSG(extack, "TC classifier not found");
Jiri Pirko33a48922017-02-09 14:38:57 +0100153 err = -ENOENT;
154 }
Jiri Pirko33a48922017-02-09 14:38:57 +0100155#endif
Jiri Pirkod68d75f2018-05-11 17:45:32 +0200156 goto errout;
Jiri Pirko33a48922017-02-09 14:38:57 +0100157 }
158 tp->classify = tp->ops->classify;
159 tp->protocol = protocol;
160 tp->prio = prio;
Jiri Pirko5bc17012017-05-17 11:08:01 +0200161 tp->chain = chain;
Jiri Pirko33a48922017-02-09 14:38:57 +0100162
163 err = tp->ops->init(tp);
164 if (err) {
165 module_put(tp->ops->owner);
166 goto errout;
167 }
168 return tp;
169
170errout:
171 kfree(tp);
172 return ERR_PTR(err);
173}
174
Jakub Kicinski715df5e2018-01-24 12:54:13 -0800175static void tcf_proto_destroy(struct tcf_proto *tp,
176 struct netlink_ext_ack *extack)
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100177{
Jakub Kicinski715df5e2018-01-24 12:54:13 -0800178 tp->ops->destroy(tp, extack);
WANG Cong763dbf62017-04-19 14:21:21 -0700179 module_put(tp->ops->owner);
180 kfree_rcu(tp, rcu);
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100181}
182
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100183struct tcf_filter_chain_list_item {
184 struct list_head list;
185 tcf_chain_head_change_t *chain_head_change;
186 void *chain_head_change_priv;
187};
188
Jiri Pirko5bc17012017-05-17 11:08:01 +0200189static struct tcf_chain *tcf_chain_create(struct tcf_block *block,
190 u32 chain_index)
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200191{
Jiri Pirko5bc17012017-05-17 11:08:01 +0200192 struct tcf_chain *chain;
193
194 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
195 if (!chain)
196 return NULL;
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100197 INIT_LIST_HEAD(&chain->filter_chain_list);
Jiri Pirko5bc17012017-05-17 11:08:01 +0200198 list_add_tail(&chain->list, &block->chain_list);
199 chain->block = block;
200 chain->index = chain_index;
Cong Wange2ef7542017-09-11 16:33:31 -0700201 chain->refcnt = 1;
Jiri Pirko5bc17012017-05-17 11:08:01 +0200202 return chain;
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200203}
204
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100205static void tcf_chain_head_change_item(struct tcf_filter_chain_list_item *item,
206 struct tcf_proto *tp_head)
207{
208 if (item->chain_head_change)
209 item->chain_head_change(tp_head, item->chain_head_change_priv);
210}
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100211static void tcf_chain_head_change(struct tcf_chain *chain,
212 struct tcf_proto *tp_head)
213{
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100214 struct tcf_filter_chain_list_item *item;
215
216 list_for_each_entry(item, &chain->filter_chain_list, list)
217 tcf_chain_head_change_item(item, tp_head);
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100218}
219
Jiri Pirkof93e1cd2017-05-20 15:01:32 +0200220static void tcf_chain_flush(struct tcf_chain *chain)
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100221{
Roman Kapld7aa04a2017-11-20 22:21:13 +0100222 struct tcf_proto *tp = rtnl_dereference(chain->filter_chain);
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100223
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100224 tcf_chain_head_change(chain, NULL);
Roman Kapld7aa04a2017-11-20 22:21:13 +0100225 while (tp) {
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200226 RCU_INIT_POINTER(chain->filter_chain, tp->next);
Jakub Kicinski715df5e2018-01-24 12:54:13 -0800227 tcf_proto_destroy(tp, NULL);
Roman Kapld7aa04a2017-11-20 22:21:13 +0100228 tp = rtnl_dereference(chain->filter_chain);
229 tcf_chain_put(chain);
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100230 }
Jiri Pirkof93e1cd2017-05-20 15:01:32 +0200231}
232
233static void tcf_chain_destroy(struct tcf_chain *chain)
234{
Cong Wangefbf7892017-12-04 10:48:18 -0800235 struct tcf_block *block = chain->block;
236
Cong Wange2ef7542017-09-11 16:33:31 -0700237 list_del(&chain->list);
238 kfree(chain);
Cong Wangefbf7892017-12-04 10:48:18 -0800239 if (list_empty(&block->chain_list))
240 kfree(block);
Cong Wange2ef7542017-09-11 16:33:31 -0700241}
Jiri Pirko744a4cf2017-08-22 22:46:49 +0200242
Cong Wange2ef7542017-09-11 16:33:31 -0700243static void tcf_chain_hold(struct tcf_chain *chain)
244{
245 ++chain->refcnt;
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200246}
247
WANG Cong367a8ce2017-05-23 09:42:37 -0700248struct tcf_chain *tcf_chain_get(struct tcf_block *block, u32 chain_index,
249 bool create)
Jiri Pirko5bc17012017-05-17 11:08:01 +0200250{
251 struct tcf_chain *chain;
252
253 list_for_each_entry(chain, &block->chain_list, list) {
Cong Wange2ef7542017-09-11 16:33:31 -0700254 if (chain->index == chain_index) {
255 tcf_chain_hold(chain);
256 return chain;
257 }
Jiri Pirko5bc17012017-05-17 11:08:01 +0200258 }
Jiri Pirko80532382017-09-06 13:14:19 +0200259
Cong Wange2ef7542017-09-11 16:33:31 -0700260 return create ? tcf_chain_create(block, chain_index) : NULL;
Jiri Pirko5bc17012017-05-17 11:08:01 +0200261}
262EXPORT_SYMBOL(tcf_chain_get);
263
264void tcf_chain_put(struct tcf_chain *chain)
265{
Cong Wange2ef7542017-09-11 16:33:31 -0700266 if (--chain->refcnt == 0)
Jiri Pirko5bc17012017-05-17 11:08:01 +0200267 tcf_chain_destroy(chain);
268}
269EXPORT_SYMBOL(tcf_chain_put);
270
Jiri Pirkocaa72602018-01-17 11:46:50 +0100271static bool tcf_block_offload_in_use(struct tcf_block *block)
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200272{
Jiri Pirkocaa72602018-01-17 11:46:50 +0100273 return block->offloadcnt;
274}
275
276static int tcf_block_offload_cmd(struct tcf_block *block,
277 struct net_device *dev,
278 struct tcf_block_ext_info *ei,
279 enum tc_block_command command)
280{
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200281 struct tc_block_offload bo = {};
282
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200283 bo.command = command;
284 bo.binder_type = ei->binder_type;
285 bo.block = block;
Jiri Pirkocaa72602018-01-17 11:46:50 +0100286 return dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_BLOCK, &bo);
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200287}
288
Jiri Pirkocaa72602018-01-17 11:46:50 +0100289static int tcf_block_offload_bind(struct tcf_block *block, struct Qdisc *q,
290 struct tcf_block_ext_info *ei)
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200291{
Jiri Pirkocaa72602018-01-17 11:46:50 +0100292 struct net_device *dev = q->dev_queue->dev;
293 int err;
294
295 if (!dev->netdev_ops->ndo_setup_tc)
296 goto no_offload_dev_inc;
297
298 /* If tc offload feature is disabled and the block we try to bind
299 * to already has some offloaded filters, forbid to bind.
300 */
301 if (!tc_can_offload(dev) && tcf_block_offload_in_use(block))
302 return -EOPNOTSUPP;
303
304 err = tcf_block_offload_cmd(block, dev, ei, TC_BLOCK_BIND);
305 if (err == -EOPNOTSUPP)
306 goto no_offload_dev_inc;
307 return err;
308
309no_offload_dev_inc:
310 if (tcf_block_offload_in_use(block))
311 return -EOPNOTSUPP;
312 block->nooffloaddevcnt++;
313 return 0;
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200314}
315
316static void tcf_block_offload_unbind(struct tcf_block *block, struct Qdisc *q,
317 struct tcf_block_ext_info *ei)
318{
Jiri Pirkocaa72602018-01-17 11:46:50 +0100319 struct net_device *dev = q->dev_queue->dev;
320 int err;
321
322 if (!dev->netdev_ops->ndo_setup_tc)
323 goto no_offload_dev_dec;
324 err = tcf_block_offload_cmd(block, dev, ei, TC_BLOCK_UNBIND);
325 if (err == -EOPNOTSUPP)
326 goto no_offload_dev_dec;
327 return;
328
329no_offload_dev_dec:
330 WARN_ON(block->nooffloaddevcnt-- == 0);
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200331}
332
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100333static int
334tcf_chain_head_change_cb_add(struct tcf_chain *chain,
335 struct tcf_block_ext_info *ei,
336 struct netlink_ext_ack *extack)
337{
338 struct tcf_filter_chain_list_item *item;
339
340 item = kmalloc(sizeof(*item), GFP_KERNEL);
341 if (!item) {
342 NL_SET_ERR_MSG(extack, "Memory allocation for head change callback item failed");
343 return -ENOMEM;
344 }
345 item->chain_head_change = ei->chain_head_change;
346 item->chain_head_change_priv = ei->chain_head_change_priv;
347 if (chain->filter_chain)
348 tcf_chain_head_change_item(item, chain->filter_chain);
349 list_add(&item->list, &chain->filter_chain_list);
350 return 0;
351}
352
353static void
354tcf_chain_head_change_cb_del(struct tcf_chain *chain,
355 struct tcf_block_ext_info *ei)
356{
357 struct tcf_filter_chain_list_item *item;
358
359 list_for_each_entry(item, &chain->filter_chain_list, list) {
360 if ((!ei->chain_head_change && !ei->chain_head_change_priv) ||
361 (item->chain_head_change == ei->chain_head_change &&
362 item->chain_head_change_priv == ei->chain_head_change_priv)) {
363 tcf_chain_head_change_item(item, NULL);
364 list_del(&item->list);
365 kfree(item);
366 return;
367 }
368 }
369 WARN_ON(1);
370}
371
Jiri Pirko48617382018-01-17 11:46:46 +0100372struct tcf_net {
373 struct idr idr;
374};
375
376static unsigned int tcf_net_id;
377
378static int tcf_block_insert(struct tcf_block *block, struct net *net,
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100379 struct netlink_ext_ack *extack)
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100380{
Jiri Pirko48617382018-01-17 11:46:46 +0100381 struct tcf_net *tn = net_generic(net, tcf_net_id);
Jiri Pirko48617382018-01-17 11:46:46 +0100382
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100383 return idr_alloc_u32(&tn->idr, block, &block->index, block->index,
384 GFP_KERNEL);
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100385}
386
Jiri Pirko48617382018-01-17 11:46:46 +0100387static void tcf_block_remove(struct tcf_block *block, struct net *net)
Jiri Pirko6529eab2017-05-17 11:07:55 +0200388{
Jiri Pirko48617382018-01-17 11:46:46 +0100389 struct tcf_net *tn = net_generic(net, tcf_net_id);
390
Matthew Wilcox9c160942017-11-28 09:48:43 -0500391 idr_remove(&tn->idr, block->index);
Jiri Pirko48617382018-01-17 11:46:46 +0100392}
393
394static struct tcf_block *tcf_block_create(struct net *net, struct Qdisc *q,
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100395 u32 block_index,
Jiri Pirko48617382018-01-17 11:46:46 +0100396 struct netlink_ext_ack *extack)
397{
398 struct tcf_block *block;
Jiri Pirko5bc17012017-05-17 11:08:01 +0200399 struct tcf_chain *chain;
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200400 int err;
Jiri Pirko6529eab2017-05-17 11:07:55 +0200401
Jiri Pirko48617382018-01-17 11:46:46 +0100402 block = kzalloc(sizeof(*block), GFP_KERNEL);
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500403 if (!block) {
404 NL_SET_ERR_MSG(extack, "Memory allocation for block failed");
Jiri Pirko48617382018-01-17 11:46:46 +0100405 return ERR_PTR(-ENOMEM);
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500406 }
Jiri Pirko5bc17012017-05-17 11:08:01 +0200407 INIT_LIST_HEAD(&block->chain_list);
Jiri Pirkoacb67442017-10-19 15:50:31 +0200408 INIT_LIST_HEAD(&block->cb_list);
Jiri Pirkof36fe1c2018-01-17 11:46:48 +0100409 INIT_LIST_HEAD(&block->owner_list);
Jiri Pirkoacb67442017-10-19 15:50:31 +0200410
Jiri Pirko5bc17012017-05-17 11:08:01 +0200411 /* Create chain 0 by default, it has to be always present. */
412 chain = tcf_chain_create(block, 0);
413 if (!chain) {
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500414 NL_SET_ERR_MSG(extack, "Failed to create new tcf chain");
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200415 err = -ENOMEM;
416 goto err_chain_create;
417 }
Jiri Pirko48617382018-01-17 11:46:46 +0100418 block->refcnt = 1;
419 block->net = net;
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100420 block->index = block_index;
421
422 /* Don't store q pointer for blocks which are shared */
423 if (!tcf_block_shared(block))
424 block->q = q;
Jiri Pirko48617382018-01-17 11:46:46 +0100425 return block;
426
427err_chain_create:
428 kfree(block);
429 return ERR_PTR(err);
430}
431
432static struct tcf_block *tcf_block_lookup(struct net *net, u32 block_index)
433{
434 struct tcf_net *tn = net_generic(net, tcf_net_id);
435
Matthew Wilcox322d8842017-11-28 10:01:24 -0500436 return idr_find(&tn->idr, block_index);
Jiri Pirko48617382018-01-17 11:46:46 +0100437}
438
439static struct tcf_chain *tcf_block_chain_zero(struct tcf_block *block)
440{
441 return list_first_entry(&block->chain_list, struct tcf_chain, list);
442}
443
Jiri Pirkof36fe1c2018-01-17 11:46:48 +0100444struct tcf_block_owner_item {
445 struct list_head list;
446 struct Qdisc *q;
447 enum tcf_block_binder_type binder_type;
448};
449
450static void
451tcf_block_owner_netif_keep_dst(struct tcf_block *block,
452 struct Qdisc *q,
453 enum tcf_block_binder_type binder_type)
454{
455 if (block->keep_dst &&
456 binder_type != TCF_BLOCK_BINDER_TYPE_CLSACT_INGRESS &&
457 binder_type != TCF_BLOCK_BINDER_TYPE_CLSACT_EGRESS)
458 netif_keep_dst(qdisc_dev(q));
459}
460
461void tcf_block_netif_keep_dst(struct tcf_block *block)
462{
463 struct tcf_block_owner_item *item;
464
465 block->keep_dst = true;
466 list_for_each_entry(item, &block->owner_list, list)
467 tcf_block_owner_netif_keep_dst(block, item->q,
468 item->binder_type);
469}
470EXPORT_SYMBOL(tcf_block_netif_keep_dst);
471
472static int tcf_block_owner_add(struct tcf_block *block,
473 struct Qdisc *q,
474 enum tcf_block_binder_type binder_type)
475{
476 struct tcf_block_owner_item *item;
477
478 item = kmalloc(sizeof(*item), GFP_KERNEL);
479 if (!item)
480 return -ENOMEM;
481 item->q = q;
482 item->binder_type = binder_type;
483 list_add(&item->list, &block->owner_list);
484 return 0;
485}
486
487static void tcf_block_owner_del(struct tcf_block *block,
488 struct Qdisc *q,
489 enum tcf_block_binder_type binder_type)
490{
491 struct tcf_block_owner_item *item;
492
493 list_for_each_entry(item, &block->owner_list, list) {
494 if (item->q == q && item->binder_type == binder_type) {
495 list_del(&item->list);
496 kfree(item);
497 return;
498 }
499 }
500 WARN_ON(1);
501}
502
Jiri Pirko48617382018-01-17 11:46:46 +0100503int tcf_block_get_ext(struct tcf_block **p_block, struct Qdisc *q,
504 struct tcf_block_ext_info *ei,
505 struct netlink_ext_ack *extack)
506{
507 struct net *net = qdisc_net(q);
508 struct tcf_block *block = NULL;
509 bool created = false;
510 int err;
511
512 if (ei->block_index) {
513 /* block_index not 0 means the shared block is requested */
514 block = tcf_block_lookup(net, ei->block_index);
515 if (block)
516 block->refcnt++;
517 }
518
519 if (!block) {
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100520 block = tcf_block_create(net, q, ei->block_index, extack);
Jiri Pirko48617382018-01-17 11:46:46 +0100521 if (IS_ERR(block))
522 return PTR_ERR(block);
523 created = true;
Jiri Pirkobb047dd2018-02-13 12:00:16 +0100524 if (tcf_block_shared(block)) {
525 err = tcf_block_insert(block, net, extack);
Jiri Pirko48617382018-01-17 11:46:46 +0100526 if (err)
527 goto err_block_insert;
528 }
529 }
530
Jiri Pirkof36fe1c2018-01-17 11:46:48 +0100531 err = tcf_block_owner_add(block, q, ei->binder_type);
532 if (err)
533 goto err_block_owner_add;
534
535 tcf_block_owner_netif_keep_dst(block, q, ei->binder_type);
536
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100537 err = tcf_chain_head_change_cb_add(tcf_block_chain_zero(block),
538 ei, extack);
539 if (err)
540 goto err_chain_head_change_cb_add;
Jiri Pirkocaa72602018-01-17 11:46:50 +0100541
542 err = tcf_block_offload_bind(block, q, ei);
543 if (err)
544 goto err_block_offload_bind;
545
Jiri Pirko6529eab2017-05-17 11:07:55 +0200546 *p_block = block;
547 return 0;
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200548
Jiri Pirkocaa72602018-01-17 11:46:50 +0100549err_block_offload_bind:
550 tcf_chain_head_change_cb_del(tcf_block_chain_zero(block), ei);
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100551err_chain_head_change_cb_add:
Jiri Pirkof36fe1c2018-01-17 11:46:48 +0100552 tcf_block_owner_del(block, q, ei->binder_type);
553err_block_owner_add:
Jiri Pirko48617382018-01-17 11:46:46 +0100554 if (created) {
555 if (tcf_block_shared(block))
556 tcf_block_remove(block, net);
557err_block_insert:
558 kfree(tcf_block_chain_zero(block));
559 kfree(block);
560 } else {
561 block->refcnt--;
562 }
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200563 return err;
Jiri Pirko6529eab2017-05-17 11:07:55 +0200564}
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200565EXPORT_SYMBOL(tcf_block_get_ext);
566
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100567static void tcf_chain_head_change_dflt(struct tcf_proto *tp_head, void *priv)
568{
569 struct tcf_proto __rcu **p_filter_chain = priv;
570
571 rcu_assign_pointer(*p_filter_chain, tp_head);
572}
573
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200574int tcf_block_get(struct tcf_block **p_block,
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500575 struct tcf_proto __rcu **p_filter_chain, struct Qdisc *q,
576 struct netlink_ext_ack *extack)
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200577{
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100578 struct tcf_block_ext_info ei = {
579 .chain_head_change = tcf_chain_head_change_dflt,
580 .chain_head_change_priv = p_filter_chain,
581 };
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200582
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100583 WARN_ON(!p_filter_chain);
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500584 return tcf_block_get_ext(p_block, q, &ei, extack);
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200585}
Jiri Pirko6529eab2017-05-17 11:07:55 +0200586EXPORT_SYMBOL(tcf_block_get);
587
Cong Wang7aa00452017-10-26 18:24:28 -0700588/* XXX: Standalone actions are not allowed to jump to any chain, and bound
Roman Kapla60b3f52017-11-24 12:27:58 +0100589 * actions should be all removed after flushing.
Cong Wang7aa00452017-10-26 18:24:28 -0700590 */
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100591void tcf_block_put_ext(struct tcf_block *block, struct Qdisc *q,
David S. Millere1ea2f92017-10-30 14:10:01 +0900592 struct tcf_block_ext_info *ei)
Cong Wang7aa00452017-10-26 18:24:28 -0700593{
Cong Wangefbf7892017-12-04 10:48:18 -0800594 struct tcf_chain *chain, *tmp;
Cong Wang1697c4b2017-09-11 16:33:32 -0700595
David S. Millerc30abd52017-12-16 22:11:55 -0500596 if (!block)
597 return;
Jiri Pirkoa9b19442018-01-17 11:46:45 +0100598 tcf_chain_head_change_cb_del(tcf_block_chain_zero(block), ei);
Jiri Pirkof36fe1c2018-01-17 11:46:48 +0100599 tcf_block_owner_del(block, q, ei->binder_type);
Roman Kapla60b3f52017-11-24 12:27:58 +0100600
Jiri Pirko48617382018-01-17 11:46:46 +0100601 if (--block->refcnt == 0) {
602 if (tcf_block_shared(block))
603 tcf_block_remove(block, block->net);
604
605 /* Hold a refcnt for all chains, so that they don't disappear
606 * while we are iterating.
607 */
608 list_for_each_entry(chain, &block->chain_list, list)
609 tcf_chain_hold(chain);
610
611 list_for_each_entry(chain, &block->chain_list, list)
612 tcf_chain_flush(chain);
613 }
Cong Wang1697c4b2017-09-11 16:33:32 -0700614
Jiri Pirko4bb1b112017-11-02 15:07:01 +0100615 tcf_block_offload_unbind(block, q, ei);
616
Jiri Pirko48617382018-01-17 11:46:46 +0100617 if (block->refcnt == 0) {
618 /* At this point, all the chains should have refcnt >= 1. */
619 list_for_each_entry_safe(chain, tmp, &block->chain_list, list)
620 tcf_chain_put(chain);
Jiri Pirkodf45bf82017-12-08 19:27:27 +0100621
Jiri Pirko48617382018-01-17 11:46:46 +0100622 /* Finally, put chain 0 and allow block to be freed. */
623 tcf_chain_put(tcf_block_chain_zero(block));
624 }
Jiri Pirko6529eab2017-05-17 11:07:55 +0200625}
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200626EXPORT_SYMBOL(tcf_block_put_ext);
627
628void tcf_block_put(struct tcf_block *block)
629{
630 struct tcf_block_ext_info ei = {0, };
631
Jiri Pirko4853f122017-12-21 13:13:59 +0100632 if (!block)
633 return;
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100634 tcf_block_put_ext(block, block->q, &ei);
Jiri Pirko8c4083b2017-10-19 15:50:29 +0200635}
David S. Millere1ea2f92017-10-30 14:10:01 +0900636
Jiri Pirko6529eab2017-05-17 11:07:55 +0200637EXPORT_SYMBOL(tcf_block_put);
Jiri Pirkocf1facd2017-02-09 14:38:56 +0100638
Jiri Pirkoacb67442017-10-19 15:50:31 +0200639struct tcf_block_cb {
640 struct list_head list;
641 tc_setup_cb_t *cb;
642 void *cb_ident;
643 void *cb_priv;
644 unsigned int refcnt;
645};
646
647void *tcf_block_cb_priv(struct tcf_block_cb *block_cb)
648{
649 return block_cb->cb_priv;
650}
651EXPORT_SYMBOL(tcf_block_cb_priv);
652
653struct tcf_block_cb *tcf_block_cb_lookup(struct tcf_block *block,
654 tc_setup_cb_t *cb, void *cb_ident)
655{ struct tcf_block_cb *block_cb;
656
657 list_for_each_entry(block_cb, &block->cb_list, list)
658 if (block_cb->cb == cb && block_cb->cb_ident == cb_ident)
659 return block_cb;
660 return NULL;
661}
662EXPORT_SYMBOL(tcf_block_cb_lookup);
663
664void tcf_block_cb_incref(struct tcf_block_cb *block_cb)
665{
666 block_cb->refcnt++;
667}
668EXPORT_SYMBOL(tcf_block_cb_incref);
669
670unsigned int tcf_block_cb_decref(struct tcf_block_cb *block_cb)
671{
672 return --block_cb->refcnt;
673}
674EXPORT_SYMBOL(tcf_block_cb_decref);
675
676struct tcf_block_cb *__tcf_block_cb_register(struct tcf_block *block,
677 tc_setup_cb_t *cb, void *cb_ident,
678 void *cb_priv)
679{
680 struct tcf_block_cb *block_cb;
681
Jiri Pirkocaa72602018-01-17 11:46:50 +0100682 /* At this point, playback of previous block cb calls is not supported,
683 * so forbid to register to block which already has some offloaded
684 * filters present.
685 */
686 if (tcf_block_offload_in_use(block))
687 return ERR_PTR(-EOPNOTSUPP);
688
Jiri Pirkoacb67442017-10-19 15:50:31 +0200689 block_cb = kzalloc(sizeof(*block_cb), GFP_KERNEL);
690 if (!block_cb)
Jiri Pirkocaa72602018-01-17 11:46:50 +0100691 return ERR_PTR(-ENOMEM);
Jiri Pirkoacb67442017-10-19 15:50:31 +0200692 block_cb->cb = cb;
693 block_cb->cb_ident = cb_ident;
694 block_cb->cb_priv = cb_priv;
695 list_add(&block_cb->list, &block->cb_list);
696 return block_cb;
697}
698EXPORT_SYMBOL(__tcf_block_cb_register);
699
700int tcf_block_cb_register(struct tcf_block *block,
701 tc_setup_cb_t *cb, void *cb_ident,
702 void *cb_priv)
703{
704 struct tcf_block_cb *block_cb;
705
706 block_cb = __tcf_block_cb_register(block, cb, cb_ident, cb_priv);
Jiri Pirkocaa72602018-01-17 11:46:50 +0100707 return IS_ERR(block_cb) ? PTR_ERR(block_cb) : 0;
Jiri Pirkoacb67442017-10-19 15:50:31 +0200708}
709EXPORT_SYMBOL(tcf_block_cb_register);
710
711void __tcf_block_cb_unregister(struct tcf_block_cb *block_cb)
712{
713 list_del(&block_cb->list);
714 kfree(block_cb);
715}
716EXPORT_SYMBOL(__tcf_block_cb_unregister);
717
718void tcf_block_cb_unregister(struct tcf_block *block,
719 tc_setup_cb_t *cb, void *cb_ident)
720{
721 struct tcf_block_cb *block_cb;
722
723 block_cb = tcf_block_cb_lookup(block, cb, cb_ident);
724 if (!block_cb)
725 return;
726 __tcf_block_cb_unregister(block_cb);
727}
728EXPORT_SYMBOL(tcf_block_cb_unregister);
729
730static int tcf_block_cb_call(struct tcf_block *block, enum tc_setup_type type,
731 void *type_data, bool err_stop)
732{
733 struct tcf_block_cb *block_cb;
734 int ok_count = 0;
735 int err;
736
Jiri Pirkocaa72602018-01-17 11:46:50 +0100737 /* Make sure all netdevs sharing this block are offload-capable. */
738 if (block->nooffloaddevcnt && err_stop)
739 return -EOPNOTSUPP;
740
Jiri Pirkoacb67442017-10-19 15:50:31 +0200741 list_for_each_entry(block_cb, &block->cb_list, list) {
742 err = block_cb->cb(type, type_data, block_cb->cb_priv);
743 if (err) {
744 if (err_stop)
745 return err;
746 } else {
747 ok_count++;
748 }
749 }
750 return ok_count;
751}
752
Jiri Pirko87d83092017-05-17 11:07:54 +0200753/* Main classifier routine: scans classifier chain attached
754 * to this qdisc, (optionally) tests for protocol and asks
755 * specific classifiers.
756 */
757int tcf_classify(struct sk_buff *skb, const struct tcf_proto *tp,
758 struct tcf_result *res, bool compat_mode)
759{
760 __be16 protocol = tc_skb_protocol(skb);
761#ifdef CONFIG_NET_CLS_ACT
762 const int max_reclassify_loop = 4;
Jiri Pirkoee538dc2017-05-23 09:11:59 +0200763 const struct tcf_proto *orig_tp = tp;
764 const struct tcf_proto *first_tp;
Jiri Pirko87d83092017-05-17 11:07:54 +0200765 int limit = 0;
766
767reclassify:
768#endif
769 for (; tp; tp = rcu_dereference_bh(tp->next)) {
770 int err;
771
772 if (tp->protocol != protocol &&
773 tp->protocol != htons(ETH_P_ALL))
774 continue;
775
776 err = tp->classify(skb, tp, res);
777#ifdef CONFIG_NET_CLS_ACT
Jiri Pirkodb505142017-05-17 11:08:03 +0200778 if (unlikely(err == TC_ACT_RECLASSIFY && !compat_mode)) {
Jiri Pirkoee538dc2017-05-23 09:11:59 +0200779 first_tp = orig_tp;
Jiri Pirko87d83092017-05-17 11:07:54 +0200780 goto reset;
Jiri Pirkodb505142017-05-17 11:08:03 +0200781 } else if (unlikely(TC_ACT_EXT_CMP(err, TC_ACT_GOTO_CHAIN))) {
Jiri Pirkoee538dc2017-05-23 09:11:59 +0200782 first_tp = res->goto_tp;
Jiri Pirkodb505142017-05-17 11:08:03 +0200783 goto reset;
784 }
Jiri Pirko87d83092017-05-17 11:07:54 +0200785#endif
786 if (err >= 0)
787 return err;
788 }
789
790 return TC_ACT_UNSPEC; /* signal: continue lookup */
791#ifdef CONFIG_NET_CLS_ACT
792reset:
793 if (unlikely(limit++ >= max_reclassify_loop)) {
Jiri Pirko9d3aaff2018-01-17 11:46:47 +0100794 net_notice_ratelimited("%u: reclassify loop, rule prio %u, protocol %02x\n",
795 tp->chain->block->index,
796 tp->prio & 0xffff,
Jiri Pirko87d83092017-05-17 11:07:54 +0200797 ntohs(tp->protocol));
798 return TC_ACT_SHOT;
799 }
800
Jiri Pirkoee538dc2017-05-23 09:11:59 +0200801 tp = first_tp;
Jiri Pirko87d83092017-05-17 11:07:54 +0200802 protocol = tc_skb_protocol(skb);
803 goto reclassify;
804#endif
805}
806EXPORT_SYMBOL(tcf_classify);
807
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200808struct tcf_chain_info {
809 struct tcf_proto __rcu **pprev;
810 struct tcf_proto __rcu *next;
811};
812
813static struct tcf_proto *tcf_chain_tp_prev(struct tcf_chain_info *chain_info)
814{
815 return rtnl_dereference(*chain_info->pprev);
816}
817
818static void tcf_chain_tp_insert(struct tcf_chain *chain,
819 struct tcf_chain_info *chain_info,
820 struct tcf_proto *tp)
821{
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100822 if (*chain_info->pprev == chain->filter_chain)
823 tcf_chain_head_change(chain, tp);
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200824 RCU_INIT_POINTER(tp->next, tcf_chain_tp_prev(chain_info));
825 rcu_assign_pointer(*chain_info->pprev, tp);
Cong Wange2ef7542017-09-11 16:33:31 -0700826 tcf_chain_hold(chain);
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200827}
828
829static void tcf_chain_tp_remove(struct tcf_chain *chain,
830 struct tcf_chain_info *chain_info,
831 struct tcf_proto *tp)
832{
833 struct tcf_proto *next = rtnl_dereference(chain_info->next);
834
Jiri Pirkoc7eb7d72017-11-03 11:46:24 +0100835 if (tp == chain->filter_chain)
836 tcf_chain_head_change(chain, next);
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200837 RCU_INIT_POINTER(*chain_info->pprev, next);
Cong Wange2ef7542017-09-11 16:33:31 -0700838 tcf_chain_put(chain);
Jiri Pirko2190d1d2017-05-17 11:07:59 +0200839}
840
841static struct tcf_proto *tcf_chain_tp_find(struct tcf_chain *chain,
842 struct tcf_chain_info *chain_info,
843 u32 protocol, u32 prio,
844 bool prio_allocate)
845{
846 struct tcf_proto **pprev;
847 struct tcf_proto *tp;
848
849 /* Check the chain for existence of proto-tcf with this priority */
850 for (pprev = &chain->filter_chain;
851 (tp = rtnl_dereference(*pprev)); pprev = &tp->next) {
852 if (tp->prio >= prio) {
853 if (tp->prio == prio) {
854 if (prio_allocate ||
855 (tp->protocol != protocol && protocol))
856 return ERR_PTR(-EINVAL);
857 } else {
858 tp = NULL;
859 }
860 break;
861 }
862 }
863 chain_info->pprev = pprev;
864 chain_info->next = tp ? tp->next : NULL;
865 return tp;
866}
867
WANG Cong71203712017-08-07 15:26:50 -0700868static int tcf_fill_node(struct net *net, struct sk_buff *skb,
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100869 struct tcf_proto *tp, struct tcf_block *block,
870 struct Qdisc *q, u32 parent, void *fh,
871 u32 portid, u32 seq, u16 flags, int event)
WANG Cong71203712017-08-07 15:26:50 -0700872{
873 struct tcmsg *tcm;
874 struct nlmsghdr *nlh;
875 unsigned char *b = skb_tail_pointer(skb);
876
877 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*tcm), flags);
878 if (!nlh)
879 goto out_nlmsg_trim;
880 tcm = nlmsg_data(nlh);
881 tcm->tcm_family = AF_UNSPEC;
882 tcm->tcm__pad1 = 0;
883 tcm->tcm__pad2 = 0;
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100884 if (q) {
885 tcm->tcm_ifindex = qdisc_dev(q)->ifindex;
886 tcm->tcm_parent = parent;
887 } else {
888 tcm->tcm_ifindex = TCM_IFINDEX_MAGIC_BLOCK;
889 tcm->tcm_block_index = block->index;
890 }
WANG Cong71203712017-08-07 15:26:50 -0700891 tcm->tcm_info = TC_H_MAKE(tp->prio, tp->protocol);
892 if (nla_put_string(skb, TCA_KIND, tp->ops->kind))
893 goto nla_put_failure;
894 if (nla_put_u32(skb, TCA_CHAIN, tp->chain->index))
895 goto nla_put_failure;
896 if (!fh) {
897 tcm->tcm_handle = 0;
898 } else {
899 if (tp->ops->dump && tp->ops->dump(net, tp, fh, skb, tcm) < 0)
900 goto nla_put_failure;
901 }
902 nlh->nlmsg_len = skb_tail_pointer(skb) - b;
903 return skb->len;
904
905out_nlmsg_trim:
906nla_put_failure:
907 nlmsg_trim(skb, b);
908 return -1;
909}
910
911static int tfilter_notify(struct net *net, struct sk_buff *oskb,
912 struct nlmsghdr *n, struct tcf_proto *tp,
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100913 struct tcf_block *block, struct Qdisc *q,
914 u32 parent, void *fh, int event, bool unicast)
WANG Cong71203712017-08-07 15:26:50 -0700915{
916 struct sk_buff *skb;
917 u32 portid = oskb ? NETLINK_CB(oskb).portid : 0;
918
919 skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
920 if (!skb)
921 return -ENOBUFS;
922
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100923 if (tcf_fill_node(net, skb, tp, block, q, parent, fh, portid,
924 n->nlmsg_seq, n->nlmsg_flags, event) <= 0) {
WANG Cong71203712017-08-07 15:26:50 -0700925 kfree_skb(skb);
926 return -EINVAL;
927 }
928
929 if (unicast)
930 return netlink_unicast(net->rtnl, skb, portid, MSG_DONTWAIT);
931
932 return rtnetlink_send(skb, net, portid, RTNLGRP_TC,
933 n->nlmsg_flags & NLM_F_ECHO);
934}
935
936static int tfilter_del_notify(struct net *net, struct sk_buff *oskb,
937 struct nlmsghdr *n, struct tcf_proto *tp,
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100938 struct tcf_block *block, struct Qdisc *q,
Alexander Aringc35a4ac2018-01-18 11:20:50 -0500939 u32 parent, void *fh, bool unicast, bool *last,
940 struct netlink_ext_ack *extack)
WANG Cong71203712017-08-07 15:26:50 -0700941{
942 struct sk_buff *skb;
943 u32 portid = oskb ? NETLINK_CB(oskb).portid : 0;
944 int err;
945
946 skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
947 if (!skb)
948 return -ENOBUFS;
949
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100950 if (tcf_fill_node(net, skb, tp, block, q, parent, fh, portid,
951 n->nlmsg_seq, n->nlmsg_flags, RTM_DELTFILTER) <= 0) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -0500952 NL_SET_ERR_MSG(extack, "Failed to build del event notification");
WANG Cong71203712017-08-07 15:26:50 -0700953 kfree_skb(skb);
954 return -EINVAL;
955 }
956
Alexander Aring571acf22018-01-18 11:20:53 -0500957 err = tp->ops->delete(tp, fh, last, extack);
WANG Cong71203712017-08-07 15:26:50 -0700958 if (err) {
959 kfree_skb(skb);
960 return err;
961 }
962
963 if (unicast)
964 return netlink_unicast(net->rtnl, skb, portid, MSG_DONTWAIT);
965
Alexander Aringc35a4ac2018-01-18 11:20:50 -0500966 err = rtnetlink_send(skb, net, portid, RTNLGRP_TC,
967 n->nlmsg_flags & NLM_F_ECHO);
968 if (err < 0)
969 NL_SET_ERR_MSG(extack, "Failed to send filter delete notification");
970 return err;
WANG Cong71203712017-08-07 15:26:50 -0700971}
972
973static void tfilter_notify_chain(struct net *net, struct sk_buff *oskb,
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100974 struct tcf_block *block, struct Qdisc *q,
975 u32 parent, struct nlmsghdr *n,
WANG Cong71203712017-08-07 15:26:50 -0700976 struct tcf_chain *chain, int event)
977{
978 struct tcf_proto *tp;
979
980 for (tp = rtnl_dereference(chain->filter_chain);
981 tp; tp = rtnl_dereference(tp->next))
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100982 tfilter_notify(net, oskb, n, tp, block,
983 q, parent, 0, event, false);
WANG Cong71203712017-08-07 15:26:50 -0700984}
985
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986/* Add/change/delete/get a filter node */
987
David Ahernc21ef3e2017-04-16 09:48:24 -0700988static int tc_ctl_tfilter(struct sk_buff *skb, struct nlmsghdr *n,
989 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700990{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900991 struct net *net = sock_net(skb->sk);
Patrick McHardyadd93b62008-01-22 22:11:33 -0800992 struct nlattr *tca[TCA_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 struct tcmsg *t;
994 u32 protocol;
995 u32 prio;
Jiri Pirko9d36d9e2017-05-17 11:07:57 +0200996 bool prio_allocate;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997 u32 parent;
Jiri Pirko5bc17012017-05-17 11:08:01 +0200998 u32 chain_index;
Jiri Pirko7960d1d2018-01-17 11:46:51 +0100999 struct Qdisc *q = NULL;
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001000 struct tcf_chain_info chain_info;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001001 struct tcf_chain *chain = NULL;
Jiri Pirko6529eab2017-05-17 11:07:55 +02001002 struct tcf_block *block;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003 struct tcf_proto *tp;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001004 unsigned long cl;
WANG Cong8113c092017-08-04 21:31:43 -07001005 void *fh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001006 int err;
Daniel Borkmann628185c2016-12-21 18:04:11 +01001007 int tp_created;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008
Stéphane Graber4e8bbb82014-04-30 11:25:43 -04001009 if ((n->nlmsg_type != RTM_GETTFILTER) &&
David S. Miller5f013c9b2014-05-12 13:19:14 -04001010 !netlink_ns_capable(skb, net->user_ns, CAP_NET_ADMIN))
Eric W. Biedermandfc47ef2012-11-16 03:03:00 +00001011 return -EPERM;
Hong zhi guode179c82013-03-25 17:36:33 +00001012
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013replay:
Daniel Borkmann628185c2016-12-21 18:04:11 +01001014 tp_created = 0;
1015
David Ahernc21ef3e2017-04-16 09:48:24 -07001016 err = nlmsg_parse(n, sizeof(*t), tca, TCA_MAX, NULL, extack);
Hong zhi guode179c82013-03-25 17:36:33 +00001017 if (err < 0)
1018 return err;
1019
David S. Miller942b8162012-06-26 21:48:50 -07001020 t = nlmsg_data(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001021 protocol = TC_H_MIN(t->tcm_info);
1022 prio = TC_H_MAJ(t->tcm_info);
Jiri Pirko9d36d9e2017-05-17 11:07:57 +02001023 prio_allocate = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001024 parent = t->tcm_parent;
1025 cl = 0;
1026
1027 if (prio == 0) {
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001028 switch (n->nlmsg_type) {
1029 case RTM_DELTFILTER:
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001030 if (protocol || t->tcm_handle || tca[TCA_KIND]) {
1031 NL_SET_ERR_MSG(extack, "Cannot flush filters with protocol, handle or kind set");
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001032 return -ENOENT;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001033 }
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001034 break;
1035 case RTM_NEWTFILTER:
1036 /* If no priority is provided by the user,
1037 * we allocate one.
1038 */
1039 if (n->nlmsg_flags & NLM_F_CREATE) {
1040 prio = TC_H_MAKE(0x80000000U, 0U);
Jiri Pirko9d36d9e2017-05-17 11:07:57 +02001041 prio_allocate = true;
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001042 break;
1043 }
1044 /* fall-through */
1045 default:
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001046 NL_SET_ERR_MSG(extack, "Invalid filter command with priority of zero");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047 return -ENOENT;
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001048 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049 }
1050
1051 /* Find head of filter chain. */
1052
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001053 if (t->tcm_ifindex == TCM_IFINDEX_MAGIC_BLOCK) {
1054 block = tcf_block_lookup(net, t->tcm_block_index);
1055 if (!block) {
1056 NL_SET_ERR_MSG(extack, "Block of given index was not found");
1057 err = -EINVAL;
1058 goto errout;
1059 }
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001060 } else {
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001061 const struct Qdisc_class_ops *cops;
1062 struct net_device *dev;
1063
1064 /* Find link */
1065 dev = __dev_get_by_index(net, t->tcm_ifindex);
1066 if (!dev)
1067 return -ENODEV;
1068
1069 /* Find qdisc */
1070 if (!parent) {
1071 q = dev->qdisc;
1072 parent = q->handle;
1073 } else {
1074 q = qdisc_lookup(dev, TC_H_MAJ(t->tcm_parent));
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001075 if (!q) {
1076 NL_SET_ERR_MSG(extack, "Parent Qdisc doesn't exists");
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001077 return -EINVAL;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001078 }
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001079 }
1080
1081 /* Is it classful? */
1082 cops = q->ops->cl_ops;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001083 if (!cops) {
1084 NL_SET_ERR_MSG(extack, "Qdisc not classful");
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001085 return -EINVAL;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001086 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001087
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001088 if (!cops->tcf_block) {
1089 NL_SET_ERR_MSG(extack, "Class doesn't support blocks");
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001090 return -EOPNOTSUPP;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001091 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001092
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001093 /* Do we search for filter, attached to class? */
1094 if (TC_H_MIN(parent)) {
1095 cl = cops->find(q, parent);
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001096 if (cl == 0) {
1097 NL_SET_ERR_MSG(extack, "Specified class doesn't exist");
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001098 return -ENOENT;
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001099 }
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001100 }
Patrick McHardy71ebe5e2009-09-04 06:41:15 +00001101
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001102 /* And the last stroke */
1103 block = cops->tcf_block(q, cl, extack);
1104 if (!block) {
1105 err = -EINVAL;
1106 goto errout;
1107 }
1108 if (tcf_block_shared(block)) {
1109 NL_SET_ERR_MSG(extack, "This filter block is shared. Please use the block index to manipulate the filters");
1110 err = -EOPNOTSUPP;
1111 goto errout;
1112 }
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001113 }
Jiri Pirko5bc17012017-05-17 11:08:01 +02001114
1115 chain_index = tca[TCA_CHAIN] ? nla_get_u32(tca[TCA_CHAIN]) : 0;
1116 if (chain_index > TC_ACT_EXT_VAL_MASK) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001117 NL_SET_ERR_MSG(extack, "Specified chain index exceeds upper limit");
Jiri Pirko5bc17012017-05-17 11:08:01 +02001118 err = -EINVAL;
1119 goto errout;
1120 }
WANG Cong367a8ce2017-05-23 09:42:37 -07001121 chain = tcf_chain_get(block, chain_index,
1122 n->nlmsg_type == RTM_NEWTFILTER);
Jiri Pirko5bc17012017-05-17 11:08:01 +02001123 if (!chain) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001124 NL_SET_ERR_MSG(extack, "Cannot find specified filter chain");
WANG Cong367a8ce2017-05-23 09:42:37 -07001125 err = n->nlmsg_type == RTM_NEWTFILTER ? -ENOMEM : -EINVAL;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001126 goto errout;
1127 }
Jiri Pirko6529eab2017-05-17 11:07:55 +02001128
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001129 if (n->nlmsg_type == RTM_DELTFILTER && prio == 0) {
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001130 tfilter_notify_chain(net, skb, block, q, parent, n,
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001131 chain, RTM_DELTFILTER);
Jiri Pirkof93e1cd2017-05-20 15:01:32 +02001132 tcf_chain_flush(chain);
Daniel Borkmannea7f8272016-06-10 23:10:22 +02001133 err = 0;
1134 goto errout;
1135 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001137 tp = tcf_chain_tp_find(chain, &chain_info, protocol,
1138 prio, prio_allocate);
1139 if (IS_ERR(tp)) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001140 NL_SET_ERR_MSG(extack, "Filter with specified priority/protocol not found");
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001141 err = PTR_ERR(tp);
1142 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143 }
1144
1145 if (tp == NULL) {
1146 /* Proto-tcf does not exist, create new one */
1147
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001148 if (tca[TCA_KIND] == NULL || !protocol) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001149 NL_SET_ERR_MSG(extack, "Filter kind and protocol must be specified");
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001150 err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001151 goto errout;
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001152 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001153
Eric Dumazetcc7ec452011-01-19 19:26:56 +00001154 if (n->nlmsg_type != RTM_NEWTFILTER ||
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001155 !(n->nlmsg_flags & NLM_F_CREATE)) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001156 NL_SET_ERR_MSG(extack, "Need both RTM_NEWTFILTER and NLM_F_CREATE to create a new filter");
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001157 err = -ENOENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 goto errout;
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001159 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160
Jiri Pirko9d36d9e2017-05-17 11:07:57 +02001161 if (prio_allocate)
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001162 prio = tcf_auto_prio(tcf_chain_tp_prev(&chain_info));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163
Jiri Pirko33a48922017-02-09 14:38:57 +01001164 tp = tcf_proto_create(nla_data(tca[TCA_KIND]),
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001165 protocol, prio, chain, extack);
Jiri Pirko33a48922017-02-09 14:38:57 +01001166 if (IS_ERR(tp)) {
1167 err = PTR_ERR(tp);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 goto errout;
1169 }
Minoru Usui12186be2009-06-02 02:17:34 -07001170 tp_created = 1;
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001171 } else if (tca[TCA_KIND] && nla_strcmp(tca[TCA_KIND], tp->ops->kind)) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001172 NL_SET_ERR_MSG(extack, "Specified filter kind does not match existing one");
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001173 err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 goto errout;
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001175 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001176
1177 fh = tp->ops->get(tp, t->tcm_handle);
1178
WANG Cong8113c092017-08-04 21:31:43 -07001179 if (!fh) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180 if (n->nlmsg_type == RTM_DELTFILTER && t->tcm_handle == 0) {
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001181 tcf_chain_tp_remove(chain, &chain_info, tp);
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001182 tfilter_notify(net, skb, n, tp, block, q, parent, fh,
Eric Dumazetfa59b272016-10-09 20:25:55 -07001183 RTM_DELTFILTER, false);
Jakub Kicinski715df5e2018-01-24 12:54:13 -08001184 tcf_proto_destroy(tp, extack);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001185 err = 0;
1186 goto errout;
1187 }
1188
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001189 if (n->nlmsg_type != RTM_NEWTFILTER ||
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001190 !(n->nlmsg_flags & NLM_F_CREATE)) {
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001191 NL_SET_ERR_MSG(extack, "Need both RTM_NEWTFILTER and NLM_F_CREATE to create a new filter");
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001192 err = -ENOENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193 goto errout;
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001194 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195 } else {
WANG Cong763dbf62017-04-19 14:21:21 -07001196 bool last;
1197
Linus Torvalds1da177e2005-04-16 15:20:36 -07001198 switch (n->nlmsg_type) {
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +09001199 case RTM_NEWTFILTER:
Minoru Usui12186be2009-06-02 02:17:34 -07001200 if (n->nlmsg_flags & NLM_F_EXCL) {
1201 if (tp_created)
Jakub Kicinski715df5e2018-01-24 12:54:13 -08001202 tcf_proto_destroy(tp, NULL);
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001203 NL_SET_ERR_MSG(extack, "Filter already exists");
Jiri Pirko6bb16e72017-02-09 14:38:58 +01001204 err = -EEXIST;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001205 goto errout;
Minoru Usui12186be2009-06-02 02:17:34 -07001206 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207 break;
1208 case RTM_DELTFILTER:
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001209 err = tfilter_del_notify(net, skb, n, tp, block,
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001210 q, parent, fh, false, &last,
1211 extack);
Jiri Pirko40c81b22017-02-09 14:39:00 +01001212 if (err)
1213 goto errout;
WANG Cong763dbf62017-04-19 14:21:21 -07001214 if (last) {
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001215 tcf_chain_tp_remove(chain, &chain_info, tp);
Jakub Kicinski715df5e2018-01-24 12:54:13 -08001216 tcf_proto_destroy(tp, extack);
WANG Cong763dbf62017-04-19 14:21:21 -07001217 }
Jiri Pirkod7cf52c2017-02-14 16:27:13 +01001218 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001219 case RTM_GETTFILTER:
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001220 err = tfilter_notify(net, skb, n, tp, block, q, parent,
1221 fh, RTM_NEWTFILTER, true);
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001222 if (err < 0)
1223 NL_SET_ERR_MSG(extack, "Failed to send filter notify message");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001224 goto errout;
1225 default:
Alexander Aringc35a4ac2018-01-18 11:20:50 -05001226 NL_SET_ERR_MSG(extack, "Invalid netlink message type");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227 err = -EINVAL;
1228 goto errout;
1229 }
1230 }
1231
Cong Wang2f7ef2f2014-04-25 13:54:06 -07001232 err = tp->ops->change(net, skb, tp, cl, t->tcm_handle, tca, &fh,
Alexander Aring7306db32018-01-18 11:20:51 -05001233 n->nlmsg_flags & NLM_F_CREATE ? TCA_ACT_NOREPLACE : TCA_ACT_REPLACE,
1234 extack);
Minoru Usui12186be2009-06-02 02:17:34 -07001235 if (err == 0) {
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001236 if (tp_created)
1237 tcf_chain_tp_insert(chain, &chain_info, tp);
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001238 tfilter_notify(net, skb, n, tp, block, q, parent, fh,
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001239 RTM_NEWTFILTER, false);
Minoru Usui12186be2009-06-02 02:17:34 -07001240 } else {
1241 if (tp_created)
Jakub Kicinski715df5e2018-01-24 12:54:13 -08001242 tcf_proto_destroy(tp, NULL);
Minoru Usui12186be2009-06-02 02:17:34 -07001243 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244
1245errout:
Jiri Pirko5bc17012017-05-17 11:08:01 +02001246 if (chain)
1247 tcf_chain_put(chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248 if (err == -EAGAIN)
1249 /* Replay the request. */
1250 goto replay;
1251 return err;
1252}
1253
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001254struct tcf_dump_args {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001255 struct tcf_walker w;
1256 struct sk_buff *skb;
1257 struct netlink_callback *cb;
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001258 struct tcf_block *block;
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001259 struct Qdisc *q;
1260 u32 parent;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261};
1262
WANG Cong8113c092017-08-04 21:31:43 -07001263static int tcf_node_dump(struct tcf_proto *tp, void *n, struct tcf_walker *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001264{
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001265 struct tcf_dump_args *a = (void *)arg;
WANG Cong832d1d52014-01-09 16:14:01 -08001266 struct net *net = sock_net(a->skb->sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001268 return tcf_fill_node(net, a->skb, tp, a->block, a->q, a->parent,
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001269 n, NETLINK_CB(a->cb->skb).portid,
Jamal Hadi Salim5a7a5552016-09-18 08:45:33 -04001270 a->cb->nlh->nlmsg_seq, NLM_F_MULTI,
1271 RTM_NEWTFILTER);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001272}
1273
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001274static bool tcf_chain_dump(struct tcf_chain *chain, struct Qdisc *q, u32 parent,
1275 struct sk_buff *skb, struct netlink_callback *cb,
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001276 long index_start, long *p_index)
1277{
1278 struct net *net = sock_net(skb->sk);
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001279 struct tcf_block *block = chain->block;
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001280 struct tcmsg *tcm = nlmsg_data(cb->nlh);
1281 struct tcf_dump_args arg;
1282 struct tcf_proto *tp;
1283
1284 for (tp = rtnl_dereference(chain->filter_chain);
1285 tp; tp = rtnl_dereference(tp->next), (*p_index)++) {
1286 if (*p_index < index_start)
1287 continue;
1288 if (TC_H_MAJ(tcm->tcm_info) &&
1289 TC_H_MAJ(tcm->tcm_info) != tp->prio)
1290 continue;
1291 if (TC_H_MIN(tcm->tcm_info) &&
1292 TC_H_MIN(tcm->tcm_info) != tp->protocol)
1293 continue;
1294 if (*p_index > index_start)
1295 memset(&cb->args[1], 0,
1296 sizeof(cb->args) - sizeof(cb->args[0]));
1297 if (cb->args[1] == 0) {
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001298 if (tcf_fill_node(net, skb, tp, block, q, parent, 0,
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001299 NETLINK_CB(cb->skb).portid,
1300 cb->nlh->nlmsg_seq, NLM_F_MULTI,
1301 RTM_NEWTFILTER) <= 0)
Jiri Pirko5bc17012017-05-17 11:08:01 +02001302 return false;
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001303
1304 cb->args[1] = 1;
1305 }
1306 if (!tp->ops->walk)
1307 continue;
1308 arg.w.fn = tcf_node_dump;
1309 arg.skb = skb;
1310 arg.cb = cb;
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001311 arg.block = block;
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001312 arg.q = q;
1313 arg.parent = parent;
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001314 arg.w.stop = 0;
1315 arg.w.skip = cb->args[1] - 1;
1316 arg.w.count = 0;
1317 tp->ops->walk(tp, &arg.w);
1318 cb->args[1] = arg.w.count + 1;
1319 if (arg.w.stop)
Jiri Pirko5bc17012017-05-17 11:08:01 +02001320 return false;
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001321 }
Jiri Pirko5bc17012017-05-17 11:08:01 +02001322 return true;
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001323}
1324
Eric Dumazetbd27a872009-11-05 20:57:26 -08001325/* called with RTNL */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001326static int tc_dump_tfilter(struct sk_buff *skb, struct netlink_callback *cb)
1327{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001328 struct net *net = sock_net(skb->sk);
Jiri Pirko5bc17012017-05-17 11:08:01 +02001329 struct nlattr *tca[TCA_MAX + 1];
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001330 struct Qdisc *q = NULL;
Jiri Pirko6529eab2017-05-17 11:07:55 +02001331 struct tcf_block *block;
Jiri Pirko2190d1d2017-05-17 11:07:59 +02001332 struct tcf_chain *chain;
David S. Miller942b8162012-06-26 21:48:50 -07001333 struct tcmsg *tcm = nlmsg_data(cb->nlh);
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001334 long index_start;
1335 long index;
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001336 u32 parent;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001337 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338
Hong zhi guo573ce262013-03-27 06:47:04 +00001339 if (nlmsg_len(cb->nlh) < sizeof(*tcm))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 return skb->len;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001341
1342 err = nlmsg_parse(cb->nlh, sizeof(*tcm), tca, TCA_MAX, NULL, NULL);
1343 if (err)
1344 return err;
1345
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001346 if (tcm->tcm_ifindex == TCM_IFINDEX_MAGIC_BLOCK) {
1347 block = tcf_block_lookup(net, tcm->tcm_block_index);
1348 if (!block)
WANG Cong143976c2017-08-24 16:51:29 -07001349 goto out;
Jiri Pirkod680b352018-01-18 16:14:49 +01001350 /* If we work with block index, q is NULL and parent value
1351 * will never be used in the following code. The check
1352 * in tcf_fill_node prevents it. However, compiler does not
1353 * see that far, so set parent to zero to silence the warning
1354 * about parent being uninitialized.
1355 */
1356 parent = 0;
Jiri Pirko7960d1d2018-01-17 11:46:51 +01001357 } else {
1358 const struct Qdisc_class_ops *cops;
1359 struct net_device *dev;
1360 unsigned long cl = 0;
1361
1362 dev = __dev_get_by_index(net, tcm->tcm_ifindex);
1363 if (!dev)
1364 return skb->len;
1365
1366 parent = tcm->tcm_parent;
1367 if (!parent) {
1368 q = dev->qdisc;
1369 parent = q->handle;
1370 } else {
1371 q = qdisc_lookup(dev, TC_H_MAJ(tcm->tcm_parent));
1372 }
1373 if (!q)
1374 goto out;
1375 cops = q->ops->cl_ops;
1376 if (!cops)
1377 goto out;
1378 if (!cops->tcf_block)
1379 goto out;
1380 if (TC_H_MIN(tcm->tcm_parent)) {
1381 cl = cops->find(q, tcm->tcm_parent);
1382 if (cl == 0)
1383 goto out;
1384 }
1385 block = cops->tcf_block(q, cl, NULL);
1386 if (!block)
1387 goto out;
1388 if (tcf_block_shared(block))
1389 q = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001390 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001391
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001392 index_start = cb->args[0];
1393 index = 0;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001394
1395 list_for_each_entry(chain, &block->chain_list, list) {
1396 if (tca[TCA_CHAIN] &&
1397 nla_get_u32(tca[TCA_CHAIN]) != chain->index)
1398 continue;
Jiri Pirkoa10fa202017-10-13 14:01:05 +02001399 if (!tcf_chain_dump(chain, q, parent, skb, cb,
Roman Kapl5ae437a2018-02-19 21:32:51 +01001400 index_start, &index)) {
1401 err = -EMSGSIZE;
Jiri Pirko5bc17012017-05-17 11:08:01 +02001402 break;
Roman Kapl5ae437a2018-02-19 21:32:51 +01001403 }
Jiri Pirko5bc17012017-05-17 11:08:01 +02001404 }
1405
Jiri Pirkoacb31fa2017-05-17 11:08:00 +02001406 cb->args[0] = index;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001407
Linus Torvalds1da177e2005-04-16 15:20:36 -07001408out:
Roman Kapl5ae437a2018-02-19 21:32:51 +01001409 /* If we did no progress, the error (EMSGSIZE) is real */
1410 if (skb->len == 0 && err)
1411 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001412 return skb->len;
1413}
1414
/*
 * Unbind and destroy every action attached to @exts and free the action
 * array.  Asserts that RTNL is held.  Does nothing when
 * CONFIG_NET_CLS_ACT is not enabled.
 */
void tcf_exts_destroy(struct tcf_exts *exts)
{
#ifdef CONFIG_NET_CLS_ACT
	LIST_HEAD(act_list);

	ASSERT_RTNL();

	/* Gather the actions on a temporary list and destroy them. */
	tcf_exts_to_list(exts, &act_list);
	tcf_action_destroy(&act_list, TCA_ACT_UNBIND);

	kfree(exts->actions);
	exts->nr_actions = 0;
#endif
}
EXPORT_SYMBOL(tcf_exts_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001428
Benjamin LaHaisec1b52732013-01-14 05:15:39 +00001429int tcf_exts_validate(struct net *net, struct tcf_proto *tp, struct nlattr **tb,
Alexander Aring50a56192018-01-18 11:20:52 -05001430 struct nlattr *rate_tlv, struct tcf_exts *exts, bool ovr,
1431 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001432{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001433#ifdef CONFIG_NET_CLS_ACT
1434 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001435 struct tc_action *act;
Roman Mashakd04e6992018-03-08 16:59:17 -05001436 size_t attr_size = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001437
WANG Cong5da57f42013-12-15 20:15:07 -08001438 if (exts->police && tb[exts->police]) {
Jiri Pirko9fb9f252017-05-17 11:08:02 +02001439 act = tcf_action_init_1(net, tp, tb[exts->police],
1440 rate_tlv, "police", ovr,
Alexander Aringaea0d722018-02-15 10:54:54 -05001441 TCA_ACT_BIND, extack);
Patrick McHardyab27cfb2008-01-23 20:33:13 -08001442 if (IS_ERR(act))
1443 return PTR_ERR(act);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444
WANG Cong33be6272013-12-15 20:15:05 -08001445 act->type = exts->type = TCA_OLD_COMPAT;
WANG Cong22dc13c2016-08-13 22:35:00 -07001446 exts->actions[0] = act;
1447 exts->nr_actions = 1;
WANG Cong5da57f42013-12-15 20:15:07 -08001448 } else if (exts->action && tb[exts->action]) {
WANG Cong22dc13c2016-08-13 22:35:00 -07001449 LIST_HEAD(actions);
1450 int err, i = 0;
1451
Jiri Pirko9fb9f252017-05-17 11:08:02 +02001452 err = tcf_action_init(net, tp, tb[exts->action],
1453 rate_tlv, NULL, ovr, TCA_ACT_BIND,
Roman Mashakd04e6992018-03-08 16:59:17 -05001454 &actions, &attr_size, extack);
WANG Cong33be6272013-12-15 20:15:05 -08001455 if (err)
1456 return err;
WANG Cong22dc13c2016-08-13 22:35:00 -07001457 list_for_each_entry(act, &actions, list)
1458 exts->actions[i++] = act;
1459 exts->nr_actions = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001460 }
Cong Wange4b95c42017-11-06 13:47:19 -08001461 exts->net = net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001463#else
WANG Cong5da57f42013-12-15 20:15:07 -08001464 if ((exts->action && tb[exts->action]) ||
Alexander Aring50a56192018-01-18 11:20:52 -05001465 (exts->police && tb[exts->police])) {
1466 NL_SET_ERR_MSG(extack, "Classifier actions are not supported per compile options (CONFIG_NET_CLS_ACT)");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467 return -EOPNOTSUPP;
Alexander Aring50a56192018-01-18 11:20:52 -05001468 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001469#endif
1470
1471 return 0;
1472}
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001473EXPORT_SYMBOL(tcf_exts_validate);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001474
/*
 * Replace the contents of @dst with those of @src and destroy what @dst
 * held before.  Does nothing when CONFIG_NET_CLS_ACT is not enabled.
 */
void tcf_exts_change(struct tcf_exts *dst, struct tcf_exts *src)
{
#ifdef CONFIG_NET_CLS_ACT
	/* Keep a copy of the previous contents so they can be torn down
	 * after @dst has been overwritten.
	 */
	struct tcf_exts stale = *dst;

	*dst = *src;
	tcf_exts_destroy(&stale);
#endif
}
EXPORT_SYMBOL(tcf_exts_change);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001485
WANG Cong22dc13c2016-08-13 22:35:00 -07001486#ifdef CONFIG_NET_CLS_ACT
1487static struct tc_action *tcf_exts_first_act(struct tcf_exts *exts)
1488{
1489 if (exts->nr_actions == 0)
1490 return NULL;
1491 else
1492 return exts->actions[0];
1493}
1494#endif
WANG Cong33be6272013-12-15 20:15:05 -08001495
/*
 * tcf_exts_dump - emit the actions of @exts into @skb as a nested attribute
 * @skb: message buffer being filled
 * @exts: extension set to dump
 *
 * Nothing is emitted when @exts has no action attribute type configured or
 * holds no actions.  Otherwise the actions are written either as a list
 * nested under exts->action, or, for TCA_OLD_COMPAT extensions with a police
 * attribute type, as a single old-style action nested under exts->police.
 *
 * Returns 0 on success (including the nothing-to-dump case) and -1 when the
 * nest could not be started or an action failed to dump; in that case the
 * partially written nest is cancelled.  Always returns 0 without
 * CONFIG_NET_CLS_ACT.
 */
int tcf_exts_dump(struct sk_buff *skb, struct tcf_exts *exts)
{
#ifdef CONFIG_NET_CLS_ACT
	struct nlattr *nest;

	if (!exts->action || !tcf_exts_has_actions(exts))
		return 0;

	/*
	 * Both the old and the new way of entering tc data must keep
	 * working, even with a newer iproute2, hence the two dump formats.
	 */
	if (exts->type != TCA_OLD_COMPAT) {
		LIST_HEAD(actions);

		nest = nla_nest_start(skb, exts->action);
		if (!nest)
			goto nla_put_failure;

		tcf_exts_to_list(exts, &actions);
		if (tcf_action_dump(skb, &actions, 0, 0) < 0)
			goto nla_put_failure;
		nla_nest_end(skb, nest);
		return 0;
	}

	if (exts->police) {
		struct tc_action *act = tcf_exts_first_act(exts);

		nest = nla_nest_start(skb, exts->police);
		if (!nest || !act)
			goto nla_put_failure;
		if (tcf_action_dump_old(skb, act, 0, 0) < 0)
			goto nla_put_failure;
		nla_nest_end(skb, nest);
	}
	return 0;

nla_put_failure:
	/* nest has been assigned (possibly NULL) on every path reaching here */
	nla_nest_cancel(skb, nest);
	return -1;
#else
	return 0;
#endif
}
EXPORT_SYMBOL(tcf_exts_dump);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001538
Stephen Hemmingeraa767bf2008-01-21 02:26:41 -08001539
/*
 * tcf_exts_dump_stats - copy the statistics of the first action into @skb
 * @skb: message buffer being filled
 * @exts: extension set whose first action is reported
 *
 * Returns -1 if tcf_action_copy_stats() fails for the first action, and 0
 * otherwise, including when @exts holds no actions or CONFIG_NET_CLS_ACT is
 * not set.
 */
int tcf_exts_dump_stats(struct sk_buff *skb, struct tcf_exts *exts)
{
#ifdef CONFIG_NET_CLS_ACT
	struct tc_action *first = tcf_exts_first_act(exts);

	if (!first)
		return 0;
	if (tcf_action_copy_stats(skb, first, 1) < 0)
		return -1;
#endif
	return 0;
}
EXPORT_SYMBOL(tcf_exts_dump_stats);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001550
Jiri Pirko717503b2017-10-11 09:41:09 +02001551static int tc_exts_setup_cb_egdev_call(struct tcf_exts *exts,
1552 enum tc_setup_type type,
1553 void *type_data, bool err_stop)
Jiri Pirkob3f55bd2017-10-11 09:41:08 +02001554{
1555 int ok_count = 0;
1556#ifdef CONFIG_NET_CLS_ACT
1557 const struct tc_action *a;
1558 struct net_device *dev;
Or Gerlitz9d452ce2017-10-24 08:58:02 +03001559 int i, ret;
Jiri Pirkob3f55bd2017-10-11 09:41:08 +02001560
1561 if (!tcf_exts_has_actions(exts))
1562 return 0;
1563
Or Gerlitz9d452ce2017-10-24 08:58:02 +03001564 for (i = 0; i < exts->nr_actions; i++) {
1565 a = exts->actions[i];
Jiri Pirkob3f55bd2017-10-11 09:41:08 +02001566 if (!a->ops->get_dev)
1567 continue;
1568 dev = a->ops->get_dev(a);
Jiri Pirko7612fb02017-11-01 11:47:40 +01001569 if (!dev)
Jiri Pirkob3f55bd2017-10-11 09:41:08 +02001570 continue;
1571 ret = tc_setup_cb_egdev_call(dev, type, type_data, err_stop);
1572 if (ret < 0)
1573 return ret;
1574 ok_count += ret;
1575 }
1576#endif
1577 return ok_count;
1578}
Jiri Pirko717503b2017-10-11 09:41:09 +02001579
Jiri Pirko208c0f42017-10-19 15:50:32 +02001580int tc_setup_cb_call(struct tcf_block *block, struct tcf_exts *exts,
1581 enum tc_setup_type type, void *type_data, bool err_stop)
Jiri Pirko717503b2017-10-11 09:41:09 +02001582{
Jiri Pirko208c0f42017-10-19 15:50:32 +02001583 int ok_count;
1584 int ret;
1585
1586 ret = tcf_block_cb_call(block, type, type_data, err_stop);
1587 if (ret < 0)
1588 return ret;
1589 ok_count = ret;
1590
1591 if (!exts)
1592 return ok_count;
1593 ret = tc_exts_setup_cb_egdev_call(exts, type, type_data, err_stop);
1594 if (ret < 0)
1595 return ret;
1596 ok_count += ret;
1597
1598 return ok_count;
Jiri Pirko717503b2017-10-11 09:41:09 +02001599}
1600EXPORT_SYMBOL(tc_setup_cb_call);
Jiri Pirkob3f55bd2017-10-11 09:41:08 +02001601
Jiri Pirko48617382018-01-17 11:46:46 +01001602static __net_init int tcf_net_init(struct net *net)
1603{
1604 struct tcf_net *tn = net_generic(net, tcf_net_id);
1605
1606 idr_init(&tn->idr);
1607 return 0;
1608}
1609
1610static void __net_exit tcf_net_exit(struct net *net)
1611{
1612 struct tcf_net *tn = net_generic(net, tcf_net_id);
1613
1614 idr_destroy(&tn->idr);
1615}
1616
1617static struct pernet_operations tcf_net_ops = {
1618 .init = tcf_net_init,
1619 .exit = tcf_net_exit,
1620 .id = &tcf_net_id,
1621 .size = sizeof(struct tcf_net),
1622};
1623
Linus Torvalds1da177e2005-04-16 15:20:36 -07001624static int __init tc_filter_init(void)
1625{
Jiri Pirko48617382018-01-17 11:46:46 +01001626 int err;
1627
Cong Wang7aa00452017-10-26 18:24:28 -07001628 tc_filter_wq = alloc_ordered_workqueue("tc_filter_workqueue", 0);
1629 if (!tc_filter_wq)
1630 return -ENOMEM;
1631
Jiri Pirko48617382018-01-17 11:46:46 +01001632 err = register_pernet_subsys(&tcf_net_ops);
1633 if (err)
1634 goto err_register_pernet_subsys;
1635
Florian Westphalb97bac62017-08-09 20:41:48 +02001636 rtnl_register(PF_UNSPEC, RTM_NEWTFILTER, tc_ctl_tfilter, NULL, 0);
1637 rtnl_register(PF_UNSPEC, RTM_DELTFILTER, tc_ctl_tfilter, NULL, 0);
Thomas Graf82623c02007-03-22 11:56:22 -07001638 rtnl_register(PF_UNSPEC, RTM_GETTFILTER, tc_ctl_tfilter,
Florian Westphalb97bac62017-08-09 20:41:48 +02001639 tc_dump_tfilter, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001640
Linus Torvalds1da177e2005-04-16 15:20:36 -07001641 return 0;
Jiri Pirko48617382018-01-17 11:46:46 +01001642
1643err_register_pernet_subsys:
1644 destroy_workqueue(tc_filter_wq);
1645 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001646}
1647
1648subsys_initcall(tc_filter_init);