blob: e9ccf7daea7d84eeefe5e872b3497a6f0edc7ea9 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * net/sched/cls_rsvp.h Template file for RSVPv[46] classifiers.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 */
11
12/*
13 Compared to the general packet classification problem,
14 RSVP needs only several relatively simple rules:
15
16 * (dst, protocol) are always specified,
17 so that we are able to hash them.
18 * src may be exact, or may be wildcard, so that
19 we can keep a hash table plus one wildcard entry.
20 * source port (or flow label) is important only if src is given.
21
22 IMPLEMENTATION.
23
24 We use a two level hash table: The top level is keyed by
25 destination address and protocol ID, every bucket contains a list
26 of "rsvp sessions", identified by destination address, protocol and
27 DPI(="Destination Port ID"): triple (key, mask, offset).
28
29 Every bucket has a smaller hash table keyed by source address
30 (cf. RSVP flowspec) and one wildcard entry for wildcard reservations.
31 Every bucket is again a list of "RSVP flows", selected by
32 source address and SPI(="Source Port ID" here rather than
33 "security parameter index"): triple (key, mask, offset).
34
35
36 NOTE 1. All the packets with IPv6 extension headers (but AH and ESP)
37 and all fragmented packets go to the best-effort traffic class.
38
39
40 NOTE 2. Two "port id"'s seems to be redundant, rfc2207 requires
41 only one "Generalized Port Identifier". So that for classic
42 ah, esp (and udp,tcp) both *pi should coincide or one of them
43 should be wildcard.
44
45 At first sight, this redundancy is just a waste of CPU
46 resources. But DPI and SPI add the possibility to assign different
47 priorities to GPIs. Look also at note 4 about tunnels below.
48
49
50 NOTE 3. One complication is the case of tunneled packets.
51 We implement it as follows: if the first lookup
52 matches a special session with "tunnelhdr" value not zero,
53 flowid doesn't contain the true flow ID, but the tunnel ID (1...255).
54 In this case, we pull tunnelhdr bytes and restart lookup
55 with tunnel ID added to the list of keys. Simple and stupid 8)8)
56 It's enough for PIMREG and IPIP.
57
58
59 NOTE 4. Two GPIs make it possible to parse even GRE packets.
60 F.e. DPI can select ETH_P_IP (and necessary flags to make
61 tunnelhdr correct) in GRE protocol field and SPI matches
62 GRE key. Is it not nice? 8)8)
63
64
65 Well, as result, despite its simplicity, we get a pretty
66 powerful classification engine. */
67
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Eric Dumazetcc7ec452011-01-19 19:26:56 +000069struct rsvp_head {
Linus Torvalds1da177e2005-04-16 15:20:36 -070070 u32 tmap[256/32];
71 u32 hgenerator;
72 u8 tgenerator;
John Fastabendb929d862014-09-12 20:09:49 -070073 struct rsvp_session __rcu *ht[256];
74 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075};
76
Eric Dumazetcc7ec452011-01-19 19:26:56 +000077struct rsvp_session {
John Fastabendb929d862014-09-12 20:09:49 -070078 struct rsvp_session __rcu *next;
79 __be32 dst[RSVP_DST_LEN];
80 struct tc_rsvp_gpi dpi;
81 u8 protocol;
82 u8 tunnelid;
Linus Torvalds1da177e2005-04-16 15:20:36 -070083 /* 16 (src,sport) hash slots, and one wildcard source slot */
John Fastabendb929d862014-09-12 20:09:49 -070084 struct rsvp_filter __rcu *ht[16 + 1];
85 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070086};
87
88
Eric Dumazetcc7ec452011-01-19 19:26:56 +000089struct rsvp_filter {
John Fastabendb929d862014-09-12 20:09:49 -070090 struct rsvp_filter __rcu *next;
91 __be32 src[RSVP_DST_LEN];
92 struct tc_rsvp_gpi spi;
93 u8 tunnelhdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -070094
John Fastabendb929d862014-09-12 20:09:49 -070095 struct tcf_result res;
96 struct tcf_exts exts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
John Fastabendb929d862014-09-12 20:09:49 -070098 u32 handle;
99 struct rsvp_session *sess;
Cong Wangaaa908f2018-05-23 15:26:53 -0700100 struct rcu_work rwork;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101};
102
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000103static inline unsigned int hash_dst(__be32 *dst, u8 protocol, u8 tunnelid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000105 unsigned int h = (__force __u32)dst[RSVP_DST_LEN - 1];
106
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 h ^= h>>16;
108 h ^= h>>8;
109 return (h ^ protocol ^ tunnelid) & 0xFF;
110}
111
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000112static inline unsigned int hash_src(__be32 *src)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000114 unsigned int h = (__force __u32)src[RSVP_DST_LEN-1];
115
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116 h ^= h>>16;
117 h ^= h>>8;
118 h ^= h>>4;
119 return h & 0xF;
120}
121
/*
 * Run the extensions of the current filter `f` on `skb`.  A positive verdict
 * is returned from the enclosing function, a negative one moves on to the
 * next filter of the enclosing loop, and zero falls through.
 *
 * This is deliberately a bare brace block and not do { } while (0): the
 * `continue` has to act on the caller's loop.
 */
#define RSVP_APPLY_RESULT()					\
{								\
	int verdict = tcf_exts_exec(skb, &f->exts, res);	\
	if (verdict > 0)					\
		return verdict;					\
	if (verdict < 0)					\
		continue;					\
}
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900130
Eric Dumazetdc7f9f62011-07-05 23:25:42 +0000131static int rsvp_classify(struct sk_buff *skb, const struct tcf_proto *tp,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 struct tcf_result *res)
133{
John Fastabendb929d862014-09-12 20:09:49 -0700134 struct rsvp_head *head = rcu_dereference_bh(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 struct rsvp_session *s;
136 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000137 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800138 __be32 *dst, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 u8 protocol;
140 u8 tunnelid = 0;
141 u8 *xprt;
142#if RSVP_DST_LEN == 4
Changli Gao12dc96d2010-08-04 04:55:40 +0000143 struct ipv6hdr *nhptr;
144
145 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
146 return -1;
147 nhptr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148#else
Changli Gao12dc96d2010-08-04 04:55:40 +0000149 struct iphdr *nhptr;
150
151 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
152 return -1;
153 nhptr = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155restart:
156
157#if RSVP_DST_LEN == 4
158 src = &nhptr->saddr.s6_addr32[0];
159 dst = &nhptr->daddr.s6_addr32[0];
160 protocol = nhptr->nexthdr;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000161 xprt = ((u8 *)nhptr) + sizeof(struct ipv6hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162#else
163 src = &nhptr->saddr;
164 dst = &nhptr->daddr;
165 protocol = nhptr->protocol;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000166 xprt = ((u8 *)nhptr) + (nhptr->ihl<<2);
Paul Gortmaker56f8a752011-06-21 20:33:34 -0700167 if (ip_is_fragment(nhptr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 return -1;
169#endif
170
171 h1 = hash_dst(dst, protocol, tunnelid);
172 h2 = hash_src(src);
173
John Fastabendb929d862014-09-12 20:09:49 -0700174 for (s = rcu_dereference_bh(head->ht[h1]); s;
175 s = rcu_dereference_bh(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000176 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN - 1] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800178 !(s->dpi.mask &
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000179 (*(u32 *)(xprt + s->dpi.offset) ^ s->dpi.key)) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800181 dst[0] == s->dst[0] &&
182 dst[1] == s->dst[1] &&
183 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800185 tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186
John Fastabendb929d862014-09-12 20:09:49 -0700187 for (f = rcu_dereference_bh(s->ht[h2]); f;
188 f = rcu_dereference_bh(f->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000189 if (src[RSVP_DST_LEN-1] == f->src[RSVP_DST_LEN - 1] &&
190 !(f->spi.mask & (*(u32 *)(xprt + f->spi.offset) ^ f->spi.key))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700191#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800192 &&
193 src[0] == f->src[0] &&
194 src[1] == f->src[1] &&
195 src[2] == f->src[2]
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196#endif
197 ) {
198 *res = f->res;
199 RSVP_APPLY_RESULT();
200
201matched:
202 if (f->tunnelhdr == 0)
203 return 0;
204
205 tunnelid = f->res.classid;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000206 nhptr = (void *)(xprt + f->tunnelhdr - sizeof(*nhptr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207 goto restart;
208 }
209 }
210
211 /* And wildcard bucket... */
John Fastabendb929d862014-09-12 20:09:49 -0700212 for (f = rcu_dereference_bh(s->ht[16]); f;
213 f = rcu_dereference_bh(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214 *res = f->res;
215 RSVP_APPLY_RESULT();
216 goto matched;
217 }
218 return -1;
219 }
220 }
221 return -1;
222}
223
John Fastabend53dfd502014-09-26 10:02:50 -0700224static void rsvp_replace(struct tcf_proto *tp, struct rsvp_filter *n, u32 h)
225{
226 struct rsvp_head *head = rtnl_dereference(tp->root);
227 struct rsvp_session *s;
228 struct rsvp_filter __rcu **ins;
229 struct rsvp_filter *pins;
230 unsigned int h1 = h & 0xFF;
231 unsigned int h2 = (h >> 8) & 0xFF;
232
233 for (s = rtnl_dereference(head->ht[h1]); s;
234 s = rtnl_dereference(s->next)) {
235 for (ins = &s->ht[h2], pins = rtnl_dereference(*ins); ;
236 ins = &pins->next, pins = rtnl_dereference(*ins)) {
237 if (pins->handle == h) {
238 RCU_INIT_POINTER(n->next, pins->next);
239 rcu_assign_pointer(*ins, n);
240 return;
241 }
242 }
243 }
244
245 /* Something went wrong if we are trying to replace a non-existant
246 * node. Mind as well halt instead of silently failing.
247 */
248 BUG_ON(1);
249}
250
WANG Cong8113c092017-08-04 21:31:43 -0700251static void *rsvp_get(struct tcf_proto *tp, u32 handle)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252{
John Fastabendb929d862014-09-12 20:09:49 -0700253 struct rsvp_head *head = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254 struct rsvp_session *s;
255 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000256 unsigned int h1 = handle & 0xFF;
257 unsigned int h2 = (handle >> 8) & 0xFF;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
259 if (h2 > 16)
WANG Cong8113c092017-08-04 21:31:43 -0700260 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261
John Fastabendb929d862014-09-12 20:09:49 -0700262 for (s = rtnl_dereference(head->ht[h1]); s;
263 s = rtnl_dereference(s->next)) {
264 for (f = rtnl_dereference(s->ht[h2]); f;
265 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 if (f->handle == handle)
WANG Cong8113c092017-08-04 21:31:43 -0700267 return f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268 }
269 }
WANG Cong8113c092017-08-04 21:31:43 -0700270 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271}
272
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273static int rsvp_init(struct tcf_proto *tp)
274{
275 struct rsvp_head *data;
276
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700277 data = kzalloc(sizeof(struct rsvp_head), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278 if (data) {
John Fastabendb929d862014-09-12 20:09:49 -0700279 rcu_assign_pointer(tp->root, data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280 return 0;
281 }
282 return -ENOBUFS;
283}
284
Cong Wang96585062017-11-06 13:47:28 -0800285static void __rsvp_delete_filter(struct rsvp_filter *f)
286{
287 tcf_exts_destroy(&f->exts);
288 tcf_exts_put_net(&f->exts);
289 kfree(f);
290}
291
Cong Wangd4f84a42017-10-26 18:24:38 -0700292static void rsvp_delete_filter_work(struct work_struct *work)
293{
Cong Wangaaa908f2018-05-23 15:26:53 -0700294 struct rsvp_filter *f = container_of(to_rcu_work(work),
295 struct rsvp_filter,
296 rwork);
Cong Wangd4f84a42017-10-26 18:24:38 -0700297 rtnl_lock();
Cong Wang96585062017-11-06 13:47:28 -0800298 __rsvp_delete_filter(f);
Cong Wangd4f84a42017-10-26 18:24:38 -0700299 rtnl_unlock();
300}
301
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700302static void rsvp_delete_filter(struct tcf_proto *tp, struct rsvp_filter *f)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303{
304 tcf_unbind_filter(tp, &f->res);
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700305 /* all classifiers are required to call tcf_exts_destroy() after rcu
306 * grace period, since converted-to-rcu actions are relying on that
307 * in cleanup() callback
308 */
Cong Wang96585062017-11-06 13:47:28 -0800309 if (tcf_exts_get_net(&f->exts))
Cong Wangaaa908f2018-05-23 15:26:53 -0700310 tcf_queue_work(&f->rwork, rsvp_delete_filter_work);
Cong Wang96585062017-11-06 13:47:28 -0800311 else
312 __rsvp_delete_filter(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313}
314
Jakub Kicinski715df5e2018-01-24 12:54:13 -0800315static void rsvp_destroy(struct tcf_proto *tp, struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316{
John Fastabendb929d862014-09-12 20:09:49 -0700317 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318 int h1, h2;
319
320 if (data == NULL)
WANG Cong763dbf62017-04-19 14:21:21 -0700321 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000323 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700324 struct rsvp_session *s;
325
John Fastabendb929d862014-09-12 20:09:49 -0700326 while ((s = rtnl_dereference(data->ht[h1])) != NULL) {
327 RCU_INIT_POINTER(data->ht[h1], s->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000329 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 struct rsvp_filter *f;
331
John Fastabendb929d862014-09-12 20:09:49 -0700332 while ((f = rtnl_dereference(s->ht[h2])) != NULL) {
333 rcu_assign_pointer(s->ht[h2], f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334 rsvp_delete_filter(tp, f);
335 }
336 }
John Fastabendb929d862014-09-12 20:09:49 -0700337 kfree_rcu(s, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338 }
339 }
John Fastabendb929d862014-09-12 20:09:49 -0700340 kfree_rcu(data, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341}
342
Alexander Aring571acf22018-01-18 11:20:53 -0500343static int rsvp_delete(struct tcf_proto *tp, void *arg, bool *last,
344 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345{
John Fastabendb929d862014-09-12 20:09:49 -0700346 struct rsvp_head *head = rtnl_dereference(tp->root);
WANG Cong8113c092017-08-04 21:31:43 -0700347 struct rsvp_filter *nfp, *f = arg;
John Fastabendb929d862014-09-12 20:09:49 -0700348 struct rsvp_filter __rcu **fp;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000349 unsigned int h = f->handle;
John Fastabendb929d862014-09-12 20:09:49 -0700350 struct rsvp_session __rcu **sp;
351 struct rsvp_session *nsp, *s = f->sess;
WANG Cong763dbf62017-04-19 14:21:21 -0700352 int i, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353
John Fastabendb929d862014-09-12 20:09:49 -0700354 fp = &s->ht[(h >> 8) & 0xFF];
355 for (nfp = rtnl_dereference(*fp); nfp;
356 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
357 if (nfp == f) {
358 RCU_INIT_POINTER(*fp, f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359 rsvp_delete_filter(tp, f);
360
361 /* Strip tree */
362
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000363 for (i = 0; i <= 16; i++)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364 if (s->ht[i])
WANG Cong763dbf62017-04-19 14:21:21 -0700365 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366
367 /* OK, session has no flows */
John Fastabendb929d862014-09-12 20:09:49 -0700368 sp = &head->ht[h & 0xFF];
369 for (nsp = rtnl_dereference(*sp); nsp;
370 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
371 if (nsp == s) {
372 RCU_INIT_POINTER(*sp, s->next);
373 kfree_rcu(s, rcu);
WANG Cong763dbf62017-04-19 14:21:21 -0700374 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375 }
376 }
377
WANG Cong763dbf62017-04-19 14:21:21 -0700378 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 }
380 }
WANG Cong763dbf62017-04-19 14:21:21 -0700381
382out:
383 *last = true;
384 for (h1 = 0; h1 < 256; h1++) {
385 if (rcu_access_pointer(head->ht[h1])) {
386 *last = false;
387 break;
388 }
389 }
390
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391 return 0;
392}
393
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000394static unsigned int gen_handle(struct tcf_proto *tp, unsigned salt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395{
John Fastabendb929d862014-09-12 20:09:49 -0700396 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 int i = 0xFFFF;
398
399 while (i-- > 0) {
400 u32 h;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000401
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402 if ((data->hgenerator += 0x10000) == 0)
403 data->hgenerator = 0x10000;
404 h = data->hgenerator|salt;
Josh Hunt230cfd22017-09-10 15:48:50 -0400405 if (!rsvp_get(tp, h))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 return h;
407 }
408 return 0;
409}
410
411static int tunnel_bts(struct rsvp_head *data)
412{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000413 int n = data->tgenerator >> 5;
414 u32 b = 1 << (data->tgenerator & 0x1F);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900415
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000416 if (data->tmap[n] & b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 return 0;
418 data->tmap[n] |= b;
419 return 1;
420}
421
422static void tunnel_recycle(struct rsvp_head *data)
423{
John Fastabendb929d862014-09-12 20:09:49 -0700424 struct rsvp_session __rcu **sht = data->ht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425 u32 tmap[256/32];
426 int h1, h2;
427
428 memset(tmap, 0, sizeof(tmap));
429
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000430 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431 struct rsvp_session *s;
John Fastabendb929d862014-09-12 20:09:49 -0700432 for (s = rtnl_dereference(sht[h1]); s;
433 s = rtnl_dereference(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000434 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 struct rsvp_filter *f;
436
John Fastabendb929d862014-09-12 20:09:49 -0700437 for (f = rtnl_dereference(s->ht[h2]); f;
438 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439 if (f->tunnelhdr == 0)
440 continue;
441 data->tgenerator = f->res.classid;
442 tunnel_bts(data);
443 }
444 }
445 }
446 }
447
448 memcpy(data->tmap, tmap, sizeof(tmap));
449}
450
451static u32 gen_tunnel(struct rsvp_head *data)
452{
453 int i, k;
454
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000455 for (k = 0; k < 2; k++) {
456 for (i = 255; i > 0; i--) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 if (++data->tgenerator == 0)
458 data->tgenerator = 1;
459 if (tunnel_bts(data))
460 return data->tgenerator;
461 }
462 tunnel_recycle(data);
463 }
464 return 0;
465}
466
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800467static const struct nla_policy rsvp_policy[TCA_RSVP_MAX + 1] = {
468 [TCA_RSVP_CLASSID] = { .type = NLA_U32 },
469 [TCA_RSVP_DST] = { .type = NLA_BINARY,
470 .len = RSVP_DST_LEN * sizeof(u32) },
471 [TCA_RSVP_SRC] = { .type = NLA_BINARY,
472 .len = RSVP_DST_LEN * sizeof(u32) },
473 [TCA_RSVP_PINFO] = { .len = sizeof(struct tc_rsvp_pinfo) },
474};
475
Benjamin LaHaisec1b52732013-01-14 05:15:39 +0000476static int rsvp_change(struct net *net, struct sk_buff *in_skb,
Eric W. Biedermanaf4c6642012-05-25 13:42:45 -0600477 struct tcf_proto *tp, unsigned long base,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478 u32 handle,
Patrick McHardyadd93b62008-01-22 22:11:33 -0800479 struct nlattr **tca,
Alexander Aring7306db32018-01-18 11:20:51 -0500480 void **arg, bool ovr, struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481{
John Fastabendb929d862014-09-12 20:09:49 -0700482 struct rsvp_head *data = rtnl_dereference(tp->root);
483 struct rsvp_filter *f, *nfp;
484 struct rsvp_filter __rcu **fp;
485 struct rsvp_session *nsp, *s;
486 struct rsvp_session __rcu **sp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487 struct tc_rsvp_pinfo *pinfo = NULL;
Igor Maravić27e95a82011-08-30 03:12:55 +0000488 struct nlattr *opt = tca[TCA_OPTIONS];
Patrick McHardyadd93b62008-01-22 22:11:33 -0800489 struct nlattr *tb[TCA_RSVP_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490 struct tcf_exts e;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000491 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800492 __be32 *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493 int err;
494
495 if (opt == NULL)
496 return handle ? -EINVAL : 0;
497
Johannes Bergfceb6432017-04-12 14:34:07 +0200498 err = nla_parse_nested(tb, TCA_RSVP_MAX, opt, rsvp_policy, NULL);
Patrick McHardycee63722008-01-23 20:33:32 -0800499 if (err < 0)
500 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501
WANG Congb9a24bb2016-08-19 12:36:54 -0700502 err = tcf_exts_init(&e, TCA_RSVP_ACT, TCA_RSVP_POLICE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503 if (err < 0)
504 return err;
Alexander Aring50a56192018-01-18 11:20:52 -0500505 err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr, extack);
WANG Congb9a24bb2016-08-19 12:36:54 -0700506 if (err < 0)
507 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508
WANG Cong8113c092017-08-04 21:31:43 -0700509 f = *arg;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000510 if (f) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 /* Node exists: adjust only classid */
John Fastabend53dfd502014-09-26 10:02:50 -0700512 struct rsvp_filter *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513
514 if (f->handle != handle && handle)
515 goto errout2;
John Fastabend53dfd502014-09-26 10:02:50 -0700516
517 n = kmemdup(f, sizeof(*f), GFP_KERNEL);
518 if (!n) {
519 err = -ENOMEM;
520 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 }
522
WANG Congb9a24bb2016-08-19 12:36:54 -0700523 err = tcf_exts_init(&n->exts, TCA_RSVP_ACT, TCA_RSVP_POLICE);
524 if (err < 0) {
525 kfree(n);
526 goto errout2;
527 }
John Fastabend53dfd502014-09-26 10:02:50 -0700528
529 if (tb[TCA_RSVP_CLASSID]) {
530 n->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
531 tcf_bind_filter(tp, &n->res, base);
532 }
533
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200534 tcf_exts_change(&n->exts, &e);
John Fastabend53dfd502014-09-26 10:02:50 -0700535 rsvp_replace(tp, n, handle);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 return 0;
537 }
538
539 /* Now more serious part... */
540 err = -EINVAL;
541 if (handle)
542 goto errout2;
Igor Maravić27e95a82011-08-30 03:12:55 +0000543 if (tb[TCA_RSVP_DST] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 goto errout2;
545
546 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700547 f = kzalloc(sizeof(struct rsvp_filter), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548 if (f == NULL)
549 goto errout2;
550
WANG Congb9a24bb2016-08-19 12:36:54 -0700551 err = tcf_exts_init(&f->exts, TCA_RSVP_ACT, TCA_RSVP_POLICE);
552 if (err < 0)
553 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554 h2 = 16;
Igor Maravić27e95a82011-08-30 03:12:55 +0000555 if (tb[TCA_RSVP_SRC]) {
556 memcpy(f->src, nla_data(tb[TCA_RSVP_SRC]), sizeof(f->src));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 h2 = hash_src(f->src);
558 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000559 if (tb[TCA_RSVP_PINFO]) {
560 pinfo = nla_data(tb[TCA_RSVP_PINFO]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 f->spi = pinfo->spi;
562 f->tunnelhdr = pinfo->tunnelhdr;
563 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000564 if (tb[TCA_RSVP_CLASSID])
565 f->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700566
Igor Maravić27e95a82011-08-30 03:12:55 +0000567 dst = nla_data(tb[TCA_RSVP_DST]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 h1 = hash_dst(dst, pinfo ? pinfo->protocol : 0, pinfo ? pinfo->tunnelid : 0);
569
570 err = -ENOMEM;
571 if ((f->handle = gen_handle(tp, h1 | (h2<<8))) == 0)
572 goto errout;
573
574 if (f->tunnelhdr) {
575 err = -EINVAL;
576 if (f->res.classid > 255)
577 goto errout;
578
579 err = -ENOMEM;
580 if (f->res.classid == 0 &&
581 (f->res.classid = gen_tunnel(data)) == 0)
582 goto errout;
583 }
584
John Fastabendb929d862014-09-12 20:09:49 -0700585 for (sp = &data->ht[h1];
586 (s = rtnl_dereference(*sp)) != NULL;
587 sp = &s->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN-1] &&
589 pinfo && pinfo->protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800590 memcmp(&pinfo->dpi, &s->dpi, sizeof(s->dpi)) == 0 &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800592 dst[0] == s->dst[0] &&
593 dst[1] == s->dst[1] &&
594 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800596 pinfo->tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597
598insert:
599 /* OK, we found appropriate session */
600
601 fp = &s->ht[h2];
602
603 f->sess = s;
604 if (f->tunnelhdr == 0)
605 tcf_bind_filter(tp, &f->res, base);
606
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200607 tcf_exts_change(&f->exts, &e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700608
John Fastabendb929d862014-09-12 20:09:49 -0700609 fp = &s->ht[h2];
610 for (nfp = rtnl_dereference(*fp); nfp;
611 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
612 __u32 mask = nfp->spi.mask & f->spi.mask;
613
614 if (mask != f->spi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700615 break;
John Fastabendb929d862014-09-12 20:09:49 -0700616 }
617 RCU_INIT_POINTER(f->next, nfp);
618 rcu_assign_pointer(*fp, f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619
WANG Cong8113c092017-08-04 21:31:43 -0700620 *arg = f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621 return 0;
622 }
623 }
624
625 /* No session found. Create new one. */
626
627 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700628 s = kzalloc(sizeof(struct rsvp_session), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700629 if (s == NULL)
630 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631 memcpy(s->dst, dst, sizeof(s->dst));
632
633 if (pinfo) {
634 s->dpi = pinfo->dpi;
635 s->protocol = pinfo->protocol;
636 s->tunnelid = pinfo->tunnelid;
637 }
John Fastabendb929d862014-09-12 20:09:49 -0700638 sp = &data->ht[h1];
639 for (nsp = rtnl_dereference(*sp); nsp;
640 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
641 if ((nsp->dpi.mask & s->dpi.mask) != s->dpi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700642 break;
643 }
John Fastabendb929d862014-09-12 20:09:49 -0700644 RCU_INIT_POINTER(s->next, nsp);
645 rcu_assign_pointer(*sp, s);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900646
Linus Torvalds1da177e2005-04-16 15:20:36 -0700647 goto insert;
648
649errout:
WANG Congb9a24bb2016-08-19 12:36:54 -0700650 tcf_exts_destroy(&f->exts);
Jesper Juhla51482b2005-11-08 09:41:34 -0800651 kfree(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652errout2:
WANG Cong18d02642014-09-25 10:26:37 -0700653 tcf_exts_destroy(&e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700654 return err;
655}
656
657static void rsvp_walk(struct tcf_proto *tp, struct tcf_walker *arg)
658{
John Fastabendb929d862014-09-12 20:09:49 -0700659 struct rsvp_head *head = rtnl_dereference(tp->root);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000660 unsigned int h, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700661
662 if (arg->stop)
663 return;
664
665 for (h = 0; h < 256; h++) {
666 struct rsvp_session *s;
667
John Fastabendb929d862014-09-12 20:09:49 -0700668 for (s = rtnl_dereference(head->ht[h]); s;
669 s = rtnl_dereference(s->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670 for (h1 = 0; h1 <= 16; h1++) {
671 struct rsvp_filter *f;
672
John Fastabendb929d862014-09-12 20:09:49 -0700673 for (f = rtnl_dereference(s->ht[h1]); f;
674 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 if (arg->count < arg->skip) {
676 arg->count++;
677 continue;
678 }
WANG Cong8113c092017-08-04 21:31:43 -0700679 if (arg->fn(tp, f, arg) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700680 arg->stop = 1;
681 return;
682 }
683 arg->count++;
684 }
685 }
686 }
687 }
688}
689
WANG Cong8113c092017-08-04 21:31:43 -0700690static int rsvp_dump(struct net *net, struct tcf_proto *tp, void *fh,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691 struct sk_buff *skb, struct tcmsg *t)
692{
WANG Cong8113c092017-08-04 21:31:43 -0700693 struct rsvp_filter *f = fh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 struct rsvp_session *s;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800695 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696 struct tc_rsvp_pinfo pinfo;
697
698 if (f == NULL)
699 return skb->len;
700 s = f->sess;
701
702 t->tcm_handle = f->handle;
703
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800704 nest = nla_nest_start(skb, TCA_OPTIONS);
705 if (nest == NULL)
706 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707
David S. Miller1b34ec42012-03-29 05:11:39 -0400708 if (nla_put(skb, TCA_RSVP_DST, sizeof(s->dst), &s->dst))
709 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 pinfo.dpi = s->dpi;
711 pinfo.spi = f->spi;
712 pinfo.protocol = s->protocol;
713 pinfo.tunnelid = s->tunnelid;
714 pinfo.tunnelhdr = f->tunnelhdr;
Patrick McHardy8a470772005-06-28 12:56:45 -0700715 pinfo.pad = 0;
David S. Miller1b34ec42012-03-29 05:11:39 -0400716 if (nla_put(skb, TCA_RSVP_PINFO, sizeof(pinfo), &pinfo))
717 goto nla_put_failure;
718 if (f->res.classid &&
719 nla_put_u32(skb, TCA_RSVP_CLASSID, f->res.classid))
720 goto nla_put_failure;
721 if (((f->handle >> 8) & 0xFF) != 16 &&
722 nla_put(skb, TCA_RSVP_SRC, sizeof(f->src), f->src))
723 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724
WANG Cong5da57f42013-12-15 20:15:07 -0800725 if (tcf_exts_dump(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800726 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800728 nla_nest_end(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729
WANG Cong5da57f42013-12-15 20:15:07 -0800730 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800731 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 return skb->len;
733
Patrick McHardyadd93b62008-01-22 22:11:33 -0800734nla_put_failure:
Jiri Pirko6ea3b442014-12-09 22:23:29 +0100735 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736 return -1;
737}
738
Cong Wang07d79fc2017-08-30 14:30:36 -0700739static void rsvp_bind_class(void *fh, u32 classid, unsigned long cl)
740{
741 struct rsvp_filter *f = fh;
742
743 if (f && f->res.classid == classid)
744 f->res.class = cl;
745}
746
Igor Maravić27e95a82011-08-30 03:12:55 +0000747static struct tcf_proto_ops RSVP_OPS __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748 .kind = RSVP_ID,
749 .classify = rsvp_classify,
750 .init = rsvp_init,
751 .destroy = rsvp_destroy,
752 .get = rsvp_get,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753 .change = rsvp_change,
754 .delete = rsvp_delete,
755 .walk = rsvp_walk,
756 .dump = rsvp_dump,
Cong Wang07d79fc2017-08-30 14:30:36 -0700757 .bind_class = rsvp_bind_class,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758 .owner = THIS_MODULE,
759};
760
761static int __init init_rsvp(void)
762{
763 return register_tcf_proto_ops(&RSVP_OPS);
764}
765
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900766static void __exit exit_rsvp(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767{
768 unregister_tcf_proto_ops(&RSVP_OPS);
769}
770
771module_init(init_rsvp)
772module_exit(exit_rsvp)