blob: e282e7382117a54cc6147d3e427f8e5c1fa5bf5c [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (c) 2008, Intel Corporation.
 *
 * Author: Alexander Duyck <alexander.h.duyck@intel.com>
 */
7
8#include <linux/module.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09009#include <linux/slab.h>
Alexander Duyck92651942008-09-12 16:29:34 -070010#include <linux/types.h>
11#include <linux/kernel.h>
12#include <linux/string.h>
13#include <linux/errno.h>
14#include <linux/skbuff.h>
15#include <net/netlink.h>
16#include <net/pkt_sched.h>
Jiri Pirkocf1facd2017-02-09 14:38:56 +010017#include <net/pkt_cls.h>
Alexander Duyck92651942008-09-12 16:29:34 -070018
19struct multiq_sched_data {
20 u16 bands;
21 u16 max_bands;
22 u16 curband;
John Fastabend25d8c0d2014-09-12 20:05:27 -070023 struct tcf_proto __rcu *filter_list;
Jiri Pirko6529eab2017-05-17 11:07:55 +020024 struct tcf_block *block;
Alexander Duyck92651942008-09-12 16:29:34 -070025 struct Qdisc **queues;
26};
27
28
29static struct Qdisc *
30multiq_classify(struct sk_buff *skb, struct Qdisc *sch, int *qerr)
31{
32 struct multiq_sched_data *q = qdisc_priv(sch);
33 u32 band;
34 struct tcf_result res;
John Fastabend25d8c0d2014-09-12 20:05:27 -070035 struct tcf_proto *fl = rcu_dereference_bh(q->filter_list);
Alexander Duyck92651942008-09-12 16:29:34 -070036 int err;
37
38 *qerr = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;
Davide Caratti3aa26052021-07-28 20:08:00 +020039 err = tcf_classify(skb, NULL, fl, &res, false);
Alexander Duyck92651942008-09-12 16:29:34 -070040#ifdef CONFIG_NET_CLS_ACT
41 switch (err) {
42 case TC_ACT_STOLEN:
43 case TC_ACT_QUEUED:
Jiri Pirkoe25ea212017-06-06 14:12:02 +020044 case TC_ACT_TRAP:
Alexander Duyck92651942008-09-12 16:29:34 -070045 *qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;
Gustavo A. R. Silva964201d2020-07-07 12:21:38 -050046 fallthrough;
Alexander Duyck92651942008-09-12 16:29:34 -070047 case TC_ACT_SHOT:
48 return NULL;
49 }
50#endif
51 band = skb_get_queue_mapping(skb);
52
53 if (band >= q->bands)
54 return q->queues[0];
55
56 return q->queues[band];
57}
58
59static int
Petr Machataac5c66f2020-07-14 20:03:08 +030060multiq_enqueue(struct sk_buff *skb, struct Qdisc *sch,
Eric Dumazet520ac302016-06-21 23:16:49 -070061 struct sk_buff **to_free)
Alexander Duyck92651942008-09-12 16:29:34 -070062{
63 struct Qdisc *qdisc;
64 int ret;
65
66 qdisc = multiq_classify(skb, sch, &ret);
67#ifdef CONFIG_NET_CLS_ACT
68 if (qdisc == NULL) {
69
70 if (ret & __NET_XMIT_BYPASS)
John Fastabend25331d62014-09-28 11:53:29 -070071 qdisc_qstats_drop(sch);
Eric Dumazet520ac302016-06-21 23:16:49 -070072 __qdisc_drop(skb, to_free);
Alexander Duyck92651942008-09-12 16:29:34 -070073 return ret;
74 }
75#endif
76
Petr Machataac5c66f2020-07-14 20:03:08 +030077 ret = qdisc_enqueue(skb, qdisc, to_free);
Alexander Duyck92651942008-09-12 16:29:34 -070078 if (ret == NET_XMIT_SUCCESS) {
Alexander Duyck92651942008-09-12 16:29:34 -070079 sch->q.qlen++;
80 return NET_XMIT_SUCCESS;
81 }
82 if (net_xmit_drop_count(ret))
John Fastabend25331d62014-09-28 11:53:29 -070083 qdisc_qstats_drop(sch);
Alexander Duyck92651942008-09-12 16:29:34 -070084 return ret;
85}
86
Alexander Duyck92651942008-09-12 16:29:34 -070087static struct sk_buff *multiq_dequeue(struct Qdisc *sch)
88{
89 struct multiq_sched_data *q = qdisc_priv(sch);
90 struct Qdisc *qdisc;
91 struct sk_buff *skb;
92 int band;
93
94 for (band = 0; band < q->bands; band++) {
95 /* cycle through bands to ensure fairness */
96 q->curband++;
97 if (q->curband >= q->bands)
98 q->curband = 0;
99
100 /* Check that target subqueue is available before
Jarek Poplawskif30ab412008-11-13 22:56:30 -0800101 * pulling an skb to avoid head-of-line blocking.
Alexander Duyck92651942008-09-12 16:29:34 -0700102 */
Tom Herbert734664982011-11-28 16:32:44 +0000103 if (!netif_xmit_stopped(
104 netdev_get_tx_queue(qdisc_dev(sch), q->curband))) {
Alexander Duyck92651942008-09-12 16:29:34 -0700105 qdisc = q->queues[q->curband];
106 skb = qdisc->dequeue(qdisc);
107 if (skb) {
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800108 qdisc_bstats_update(sch, skb);
Alexander Duyck92651942008-09-12 16:29:34 -0700109 sch->q.qlen--;
110 return skb;
111 }
112 }
113 }
114 return NULL;
115
116}
117
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700118static struct sk_buff *multiq_peek(struct Qdisc *sch)
119{
120 struct multiq_sched_data *q = qdisc_priv(sch);
121 unsigned int curband = q->curband;
122 struct Qdisc *qdisc;
123 struct sk_buff *skb;
124 int band;
125
126 for (band = 0; band < q->bands; band++) {
127 /* cycle through bands to ensure fairness */
128 curband++;
129 if (curband >= q->bands)
130 curband = 0;
131
132 /* Check that target subqueue is available before
Jarek Poplawskif30ab412008-11-13 22:56:30 -0800133 * pulling an skb to avoid head-of-line blocking.
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700134 */
Tom Herbert734664982011-11-28 16:32:44 +0000135 if (!netif_xmit_stopped(
136 netdev_get_tx_queue(qdisc_dev(sch), curband))) {
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700137 qdisc = q->queues[curband];
138 skb = qdisc->ops->peek(qdisc);
139 if (skb)
140 return skb;
141 }
142 }
143 return NULL;
144
145}
146
Alexander Duyck92651942008-09-12 16:29:34 -0700147static void
148multiq_reset(struct Qdisc *sch)
149{
150 u16 band;
151 struct multiq_sched_data *q = qdisc_priv(sch);
152
153 for (band = 0; band < q->bands; band++)
154 qdisc_reset(q->queues[band]);
155 sch->q.qlen = 0;
156 q->curband = 0;
157}
158
159static void
160multiq_destroy(struct Qdisc *sch)
161{
162 int band;
163 struct multiq_sched_data *q = qdisc_priv(sch);
164
Jiri Pirko6529eab2017-05-17 11:07:55 +0200165 tcf_block_put(q->block);
Alexander Duyck92651942008-09-12 16:29:34 -0700166 for (band = 0; band < q->bands; band++)
Vlad Buslov86bd4462018-09-24 19:22:50 +0300167 qdisc_put(q->queues[band]);
Alexander Duyck92651942008-09-12 16:29:34 -0700168
169 kfree(q->queues);
170}
171
Alexander Aring20307212017-12-20 12:35:14 -0500172static int multiq_tune(struct Qdisc *sch, struct nlattr *opt,
173 struct netlink_ext_ack *extack)
Alexander Duyck92651942008-09-12 16:29:34 -0700174{
175 struct multiq_sched_data *q = qdisc_priv(sch);
176 struct tc_multiq_qopt *qopt;
Vlad Buslovc2999f72019-09-24 18:51:17 +0300177 struct Qdisc **removed;
178 int i, n_removed = 0;
Alexander Duyck92651942008-09-12 16:29:34 -0700179
180 if (!netif_is_multiqueue(qdisc_dev(sch)))
Jarek Poplawski149490f2009-02-10 00:11:21 -0800181 return -EOPNOTSUPP;
Alexander Duyck92651942008-09-12 16:29:34 -0700182 if (nla_len(opt) < sizeof(*qopt))
183 return -EINVAL;
184
185 qopt = nla_data(opt);
186
187 qopt->bands = qdisc_dev(sch)->real_num_tx_queues;
188
Vlad Buslovc2999f72019-09-24 18:51:17 +0300189 removed = kmalloc(sizeof(*removed) * (q->max_bands - q->bands),
190 GFP_KERNEL);
191 if (!removed)
192 return -ENOMEM;
193
Alexander Duyck92651942008-09-12 16:29:34 -0700194 sch_tree_lock(sch);
195 q->bands = qopt->bands;
196 for (i = q->bands; i < q->max_bands; i++) {
Alexander Duyckf07d1502008-09-12 17:57:23 -0700197 if (q->queues[i] != &noop_qdisc) {
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800198 struct Qdisc *child = q->queues[i];
Paolo Abenie5f0e8f2019-03-28 16:53:13 +0100199
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800200 q->queues[i] = &noop_qdisc;
Vlad Buslovc2999f72019-09-24 18:51:17 +0300201 qdisc_purge_queue(child);
202 removed[n_removed++] = child;
Alexander Duyck92651942008-09-12 16:29:34 -0700203 }
204 }
205
206 sch_tree_unlock(sch);
207
Vlad Buslovc2999f72019-09-24 18:51:17 +0300208 for (i = 0; i < n_removed; i++)
209 qdisc_put(removed[i]);
210 kfree(removed);
211
Alexander Duyck92651942008-09-12 16:29:34 -0700212 for (i = 0; i < q->bands; i++) {
213 if (q->queues[i] == &noop_qdisc) {
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800214 struct Qdisc *child, *old;
Changli Gao3511c912010-10-16 13:04:08 +0000215 child = qdisc_create_dflt(sch->dev_queue,
Alexander Duyck92651942008-09-12 16:29:34 -0700216 &pfifo_qdisc_ops,
217 TC_H_MAKE(sch->handle,
Alexander Aringa38a98822017-12-20 12:35:21 -0500218 i + 1), extack);
Alexander Duyck92651942008-09-12 16:29:34 -0700219 if (child) {
220 sch_tree_lock(sch);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800221 old = q->queues[i];
222 q->queues[i] = child;
Jiri Kosina49b49972017-03-08 16:03:32 +0100223 if (child != &noop_qdisc)
224 qdisc_hash_add(child, true);
Alexander Duyck92651942008-09-12 16:29:34 -0700225
Vlad Buslovc2999f72019-09-24 18:51:17 +0300226 if (old != &noop_qdisc)
227 qdisc_purge_queue(old);
Alexander Duyck92651942008-09-12 16:29:34 -0700228 sch_tree_unlock(sch);
Vlad Buslovc2999f72019-09-24 18:51:17 +0300229 qdisc_put(old);
Alexander Duyck92651942008-09-12 16:29:34 -0700230 }
231 }
232 }
233 return 0;
234}
235
Alexander Aringe63d7df2017-12-20 12:35:13 -0500236static int multiq_init(struct Qdisc *sch, struct nlattr *opt,
237 struct netlink_ext_ack *extack)
Alexander Duyck92651942008-09-12 16:29:34 -0700238{
239 struct multiq_sched_data *q = qdisc_priv(sch);
Alexander Duyckf07d1502008-09-12 17:57:23 -0700240 int i, err;
Alexander Duyck92651942008-09-12 16:29:34 -0700241
242 q->queues = NULL;
243
Alexander Aringac8ef4a2017-12-20 12:35:11 -0500244 if (!opt)
Alexander Duyck92651942008-09-12 16:29:34 -0700245 return -EINVAL;
246
Alexander Aring8d1a77f2017-12-20 12:35:19 -0500247 err = tcf_block_get(&q->block, &q->filter_list, sch, extack);
Jiri Pirko6529eab2017-05-17 11:07:55 +0200248 if (err)
249 return err;
250
Alexander Duyck92651942008-09-12 16:29:34 -0700251 q->max_bands = qdisc_dev(sch)->num_tx_queues;
252
253 q->queues = kcalloc(q->max_bands, sizeof(struct Qdisc *), GFP_KERNEL);
254 if (!q->queues)
255 return -ENOBUFS;
256 for (i = 0; i < q->max_bands; i++)
257 q->queues[i] = &noop_qdisc;
258
Alexander Aring20307212017-12-20 12:35:14 -0500259 return multiq_tune(sch, opt, extack);
Alexander Duyck92651942008-09-12 16:29:34 -0700260}
261
262static int multiq_dump(struct Qdisc *sch, struct sk_buff *skb)
263{
264 struct multiq_sched_data *q = qdisc_priv(sch);
265 unsigned char *b = skb_tail_pointer(skb);
266 struct tc_multiq_qopt opt;
267
268 opt.bands = q->bands;
269 opt.max_bands = q->max_bands;
270
David S. Miller1b34ec42012-03-29 05:11:39 -0400271 if (nla_put(skb, TCA_OPTIONS, sizeof(opt), &opt))
272 goto nla_put_failure;
Alexander Duyck92651942008-09-12 16:29:34 -0700273
274 return skb->len;
275
276nla_put_failure:
277 nlmsg_trim(skb, b);
278 return -1;
279}
280
281static int multiq_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
Alexander Aring653d6fd2017-12-20 12:35:17 -0500282 struct Qdisc **old, struct netlink_ext_ack *extack)
Alexander Duyck92651942008-09-12 16:29:34 -0700283{
284 struct multiq_sched_data *q = qdisc_priv(sch);
285 unsigned long band = arg - 1;
286
Alexander Duyck92651942008-09-12 16:29:34 -0700287 if (new == NULL)
288 new = &noop_qdisc;
289
WANG Cong86a79962016-02-25 14:55:00 -0800290 *old = qdisc_replace(sch, new, &q->queues[band]);
Alexander Duyck92651942008-09-12 16:29:34 -0700291 return 0;
292}
293
294static struct Qdisc *
295multiq_leaf(struct Qdisc *sch, unsigned long arg)
296{
297 struct multiq_sched_data *q = qdisc_priv(sch);
298 unsigned long band = arg - 1;
299
Alexander Duyck92651942008-09-12 16:29:34 -0700300 return q->queues[band];
301}
302
WANG Cong143976c2017-08-24 16:51:29 -0700303static unsigned long multiq_find(struct Qdisc *sch, u32 classid)
Alexander Duyck92651942008-09-12 16:29:34 -0700304{
305 struct multiq_sched_data *q = qdisc_priv(sch);
306 unsigned long band = TC_H_MIN(classid);
307
308 if (band - 1 >= q->bands)
309 return 0;
310 return band;
311}
312
313static unsigned long multiq_bind(struct Qdisc *sch, unsigned long parent,
314 u32 classid)
315{
WANG Cong143976c2017-08-24 16:51:29 -0700316 return multiq_find(sch, classid);
Alexander Duyck92651942008-09-12 16:29:34 -0700317}
318
319
/* unbind_tcf hook: intentionally empty, nothing to undo for multiq_bind(). */
static void multiq_unbind(struct Qdisc *q, unsigned long cl)
{
}
323
Alexander Duyck92651942008-09-12 16:29:34 -0700324static int multiq_dump_class(struct Qdisc *sch, unsigned long cl,
325 struct sk_buff *skb, struct tcmsg *tcm)
326{
327 struct multiq_sched_data *q = qdisc_priv(sch);
328
Alexander Duyck92651942008-09-12 16:29:34 -0700329 tcm->tcm_handle |= TC_H_MIN(cl);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000330 tcm->tcm_info = q->queues[cl - 1]->handle;
Alexander Duyck92651942008-09-12 16:29:34 -0700331 return 0;
332}
333
334static int multiq_dump_class_stats(struct Qdisc *sch, unsigned long cl,
335 struct gnet_dump *d)
336{
337 struct multiq_sched_data *q = qdisc_priv(sch);
338 struct Qdisc *cl_q;
339
340 cl_q = q->queues[cl - 1];
Eric Dumazetedb09eb2016-06-06 09:37:16 -0700341 if (gnet_stats_copy_basic(qdisc_root_sleeping_running(sch),
Dust Li14e54ab2019-11-28 14:29:09 +0800342 d, cl_q->cpu_bstats, &cl_q->bstats) < 0 ||
Paolo Abeni5dd431b2019-03-28 16:53:12 +0100343 qdisc_qstats_copy(d, cl_q) < 0)
Alexander Duyck92651942008-09-12 16:29:34 -0700344 return -1;
345
346 return 0;
347}
348
349static void multiq_walk(struct Qdisc *sch, struct qdisc_walker *arg)
350{
351 struct multiq_sched_data *q = qdisc_priv(sch);
352 int band;
353
354 if (arg->stop)
355 return;
356
357 for (band = 0; band < q->bands; band++) {
358 if (arg->count < arg->skip) {
359 arg->count++;
360 continue;
361 }
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000362 if (arg->fn(sch, band + 1, arg) < 0) {
Alexander Duyck92651942008-09-12 16:29:34 -0700363 arg->stop = 1;
364 break;
365 }
366 arg->count++;
367 }
368}
369
Alexander Aringcbaacc42017-12-20 12:35:16 -0500370static struct tcf_block *multiq_tcf_block(struct Qdisc *sch, unsigned long cl,
371 struct netlink_ext_ack *extack)
Alexander Duyck92651942008-09-12 16:29:34 -0700372{
373 struct multiq_sched_data *q = qdisc_priv(sch);
374
375 if (cl)
376 return NULL;
Jiri Pirko6529eab2017-05-17 11:07:55 +0200377 return q->block;
Alexander Duyck92651942008-09-12 16:29:34 -0700378}
379
380static const struct Qdisc_class_ops multiq_class_ops = {
381 .graft = multiq_graft,
382 .leaf = multiq_leaf,
WANG Cong143976c2017-08-24 16:51:29 -0700383 .find = multiq_find,
Alexander Duyck92651942008-09-12 16:29:34 -0700384 .walk = multiq_walk,
Jiri Pirko6529eab2017-05-17 11:07:55 +0200385 .tcf_block = multiq_tcf_block,
Alexander Duyck92651942008-09-12 16:29:34 -0700386 .bind_tcf = multiq_bind,
WANG Cong143976c2017-08-24 16:51:29 -0700387 .unbind_tcf = multiq_unbind,
Alexander Duyck92651942008-09-12 16:29:34 -0700388 .dump = multiq_dump_class,
389 .dump_stats = multiq_dump_class_stats,
390};
391
392static struct Qdisc_ops multiq_qdisc_ops __read_mostly = {
393 .next = NULL,
394 .cl_ops = &multiq_class_ops,
395 .id = "multiq",
396 .priv_size = sizeof(struct multiq_sched_data),
397 .enqueue = multiq_enqueue,
398 .dequeue = multiq_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700399 .peek = multiq_peek,
Alexander Duyck92651942008-09-12 16:29:34 -0700400 .init = multiq_init,
401 .reset = multiq_reset,
402 .destroy = multiq_destroy,
403 .change = multiq_tune,
404 .dump = multiq_dump,
405 .owner = THIS_MODULE,
406};
407
408static int __init multiq_module_init(void)
409{
410 return register_qdisc(&multiq_qdisc_ops);
411}
412
413static void __exit multiq_module_exit(void)
414{
415 unregister_qdisc(&multiq_qdisc_ops);
416}
417
418module_init(multiq_module_init)
419module_exit(multiq_module_exit)
420
421MODULE_LICENSE("GPL");