blob: d36949d9382c41dda54d12269fe1e8ff9c7e397f [file] [log] [blame]
Thomas Gleixner2874c5f2019-05-27 08:55:01 +02001/* SPDX-License-Identifier: GPL-2.0-or-later */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
3 * net/sched/cls_rsvp.h Template file for RSVPv[46] classifiers.
4 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07005 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
6 */
7
8/*
9 Comparing to general packet classification problem,
10 RSVP needs only several relatively simple rules:
11
12 * (dst, protocol) are always specified,
13 so that we are able to hash them.
14 * src may be exact, or may be wildcard, so that
15 we can keep a hash table plus one wildcard entry.
16 * source port (or flow label) is important only if src is given.
17
18 IMPLEMENTATION.
19
20 We use a two level hash table: The top level is keyed by
21 destination address and protocol ID, every bucket contains a list
22 of "rsvp sessions", identified by destination address, protocol and
23 DPI(="Destination Port ID"): triple (key, mask, offset).
24
25 Every bucket has a smaller hash table keyed by source address
26 (cf. RSVP flowspec) and one wildcard entry for wildcard reservations.
27 Every bucket is again a list of "RSVP flows", selected by
28 source address and SPI(="Source Port ID" here rather than
29 "security parameter index"): triple (key, mask, offset).
30
31
32 NOTE 1. All the packets with IPv6 extension headers (but AH and ESP)
33 and all fragmented packets go to the best-effort traffic class.
34
35
36 NOTE 2. Two "port id"'s seem to be redundant, rfc2207 requires
37 only one "Generalized Port Identifier". So that for classic
38 ah, esp (and udp,tcp) both *pi should coincide or one of them
39 should be wildcard.
40
41 At first sight, this redundancy is just a waste of CPU
42 resources. But DPI and SPI add the possibility to assign different
43 priorities to GPIs. Look also at note 4 about tunnels below.
44
45
46 NOTE 3. One complication is the case of tunneled packets.
47 We implement it as follows: if the first lookup
48 matches a special session with "tunnelhdr" value not zero,
49 flowid doesn't contain the true flow ID, but the tunnel ID (1...255).
50 In this case, we pull tunnelhdr bytes and restart lookup
51 with tunnel ID added to the list of keys. Simple and stupid 8)8)
52 It's enough for PIMREG and IPIP.
53
54
55 NOTE 4. Two GPIs make it possible to parse even GRE packets.
56 F.e. DPI can select ETH_P_IP (and necessary flags to make
57 tunnelhdr correct) in GRE protocol field and SPI matches
58 GRE key. Is it not nice? 8)8)
59
60
61 Well, as a result, despite its simplicity, we get a pretty
62 powerful classification engine. */
63
Linus Torvalds1da177e2005-04-16 15:20:36 -070064
Eric Dumazetcc7ec452011-01-19 19:26:56 +000065struct rsvp_head {
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 u32 tmap[256/32];
67 u32 hgenerator;
68 u8 tgenerator;
John Fastabendb929d862014-09-12 20:09:49 -070069 struct rsvp_session __rcu *ht[256];
70 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070071};
72
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073struct rsvp_session {
John Fastabendb929d862014-09-12 20:09:49 -070074 struct rsvp_session __rcu *next;
75 __be32 dst[RSVP_DST_LEN];
76 struct tc_rsvp_gpi dpi;
77 u8 protocol;
78 u8 tunnelid;
Linus Torvalds1da177e2005-04-16 15:20:36 -070079 /* 16 (src,sport) hash slots, and one wildcard source slot */
John Fastabendb929d862014-09-12 20:09:49 -070080 struct rsvp_filter __rcu *ht[16 + 1];
81 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082};
83
84
Eric Dumazetcc7ec452011-01-19 19:26:56 +000085struct rsvp_filter {
John Fastabendb929d862014-09-12 20:09:49 -070086 struct rsvp_filter __rcu *next;
87 __be32 src[RSVP_DST_LEN];
88 struct tc_rsvp_gpi spi;
89 u8 tunnelhdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -070090
John Fastabendb929d862014-09-12 20:09:49 -070091 struct tcf_result res;
92 struct tcf_exts exts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
John Fastabendb929d862014-09-12 20:09:49 -070094 u32 handle;
95 struct rsvp_session *sess;
Cong Wangaaa908f2018-05-23 15:26:53 -070096 struct rcu_work rwork;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097};
98
Eric Dumazetcc7ec452011-01-19 19:26:56 +000099static inline unsigned int hash_dst(__be32 *dst, u8 protocol, u8 tunnelid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000101 unsigned int h = (__force __u32)dst[RSVP_DST_LEN - 1];
102
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103 h ^= h>>16;
104 h ^= h>>8;
105 return (h ^ protocol ^ tunnelid) & 0xFF;
106}
107
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000108static inline unsigned int hash_src(__be32 *src)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000110 unsigned int h = (__force __u32)src[RSVP_DST_LEN-1];
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 h ^= h>>16;
113 h ^= h>>8;
114 h ^= h>>4;
115 return h & 0xF;
116}
117
/*
 * Run the extensions of the filter `f` on `skb`.  Expects `skb`, `f` and
 * `res` to be in scope at the expansion site, inside a loop:
 *   - positive result: returned from the enclosing function;
 *   - negative result: `continue` the enclosing loop (try the next filter);
 *   - zero: fall through.
 *
 * This is intentionally a bare brace block and not do { } while (0): the
 * `continue` has to act on the caller's loop.
 */
#define RSVP_APPLY_RESULT()					\
{								\
	int r = tcf_exts_exec(skb, &f->exts, res);		\
	if (r > 0)						\
		return r;					\
	if (r < 0)						\
		continue;					\
}
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900126
Eric Dumazetdc7f9f62011-07-05 23:25:42 +0000127static int rsvp_classify(struct sk_buff *skb, const struct tcf_proto *tp,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128 struct tcf_result *res)
129{
John Fastabendb929d862014-09-12 20:09:49 -0700130 struct rsvp_head *head = rcu_dereference_bh(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 struct rsvp_session *s;
132 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000133 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800134 __be32 *dst, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 u8 protocol;
136 u8 tunnelid = 0;
137 u8 *xprt;
138#if RSVP_DST_LEN == 4
Changli Gao12dc96d2010-08-04 04:55:40 +0000139 struct ipv6hdr *nhptr;
140
141 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
142 return -1;
143 nhptr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144#else
Changli Gao12dc96d2010-08-04 04:55:40 +0000145 struct iphdr *nhptr;
146
147 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
148 return -1;
149 nhptr = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151restart:
152
153#if RSVP_DST_LEN == 4
154 src = &nhptr->saddr.s6_addr32[0];
155 dst = &nhptr->daddr.s6_addr32[0];
156 protocol = nhptr->nexthdr;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000157 xprt = ((u8 *)nhptr) + sizeof(struct ipv6hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158#else
159 src = &nhptr->saddr;
160 dst = &nhptr->daddr;
161 protocol = nhptr->protocol;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000162 xprt = ((u8 *)nhptr) + (nhptr->ihl<<2);
Paul Gortmaker56f8a752011-06-21 20:33:34 -0700163 if (ip_is_fragment(nhptr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 return -1;
165#endif
166
167 h1 = hash_dst(dst, protocol, tunnelid);
168 h2 = hash_src(src);
169
John Fastabendb929d862014-09-12 20:09:49 -0700170 for (s = rcu_dereference_bh(head->ht[h1]); s;
171 s = rcu_dereference_bh(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000172 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN - 1] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800174 !(s->dpi.mask &
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000175 (*(u32 *)(xprt + s->dpi.offset) ^ s->dpi.key)) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800177 dst[0] == s->dst[0] &&
178 dst[1] == s->dst[1] &&
179 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800181 tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182
John Fastabendb929d862014-09-12 20:09:49 -0700183 for (f = rcu_dereference_bh(s->ht[h2]); f;
184 f = rcu_dereference_bh(f->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000185 if (src[RSVP_DST_LEN-1] == f->src[RSVP_DST_LEN - 1] &&
186 !(f->spi.mask & (*(u32 *)(xprt + f->spi.offset) ^ f->spi.key))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800188 &&
189 src[0] == f->src[0] &&
190 src[1] == f->src[1] &&
191 src[2] == f->src[2]
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192#endif
193 ) {
194 *res = f->res;
195 RSVP_APPLY_RESULT();
196
197matched:
198 if (f->tunnelhdr == 0)
199 return 0;
200
201 tunnelid = f->res.classid;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000202 nhptr = (void *)(xprt + f->tunnelhdr - sizeof(*nhptr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 goto restart;
204 }
205 }
206
207 /* And wildcard bucket... */
John Fastabendb929d862014-09-12 20:09:49 -0700208 for (f = rcu_dereference_bh(s->ht[16]); f;
209 f = rcu_dereference_bh(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210 *res = f->res;
211 RSVP_APPLY_RESULT();
212 goto matched;
213 }
214 return -1;
215 }
216 }
217 return -1;
218}
219
John Fastabend53dfd502014-09-26 10:02:50 -0700220static void rsvp_replace(struct tcf_proto *tp, struct rsvp_filter *n, u32 h)
221{
222 struct rsvp_head *head = rtnl_dereference(tp->root);
223 struct rsvp_session *s;
224 struct rsvp_filter __rcu **ins;
225 struct rsvp_filter *pins;
226 unsigned int h1 = h & 0xFF;
227 unsigned int h2 = (h >> 8) & 0xFF;
228
229 for (s = rtnl_dereference(head->ht[h1]); s;
230 s = rtnl_dereference(s->next)) {
231 for (ins = &s->ht[h2], pins = rtnl_dereference(*ins); ;
232 ins = &pins->next, pins = rtnl_dereference(*ins)) {
233 if (pins->handle == h) {
234 RCU_INIT_POINTER(n->next, pins->next);
235 rcu_assign_pointer(*ins, n);
236 return;
237 }
238 }
239 }
240
241 /* Something went wrong if we are trying to replace a non-existant
242 * node. Mind as well halt instead of silently failing.
243 */
244 BUG_ON(1);
245}
246
WANG Cong8113c092017-08-04 21:31:43 -0700247static void *rsvp_get(struct tcf_proto *tp, u32 handle)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248{
John Fastabendb929d862014-09-12 20:09:49 -0700249 struct rsvp_head *head = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 struct rsvp_session *s;
251 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000252 unsigned int h1 = handle & 0xFF;
253 unsigned int h2 = (handle >> 8) & 0xFF;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
255 if (h2 > 16)
WANG Cong8113c092017-08-04 21:31:43 -0700256 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
John Fastabendb929d862014-09-12 20:09:49 -0700258 for (s = rtnl_dereference(head->ht[h1]); s;
259 s = rtnl_dereference(s->next)) {
260 for (f = rtnl_dereference(s->ht[h2]); f;
261 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 if (f->handle == handle)
WANG Cong8113c092017-08-04 21:31:43 -0700263 return f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264 }
265 }
WANG Cong8113c092017-08-04 21:31:43 -0700266 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267}
268
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269static int rsvp_init(struct tcf_proto *tp)
270{
271 struct rsvp_head *data;
272
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700273 data = kzalloc(sizeof(struct rsvp_head), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 if (data) {
John Fastabendb929d862014-09-12 20:09:49 -0700275 rcu_assign_pointer(tp->root, data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 return 0;
277 }
278 return -ENOBUFS;
279}
280
Cong Wang96585062017-11-06 13:47:28 -0800281static void __rsvp_delete_filter(struct rsvp_filter *f)
282{
283 tcf_exts_destroy(&f->exts);
284 tcf_exts_put_net(&f->exts);
285 kfree(f);
286}
287
Cong Wangd4f84a42017-10-26 18:24:38 -0700288static void rsvp_delete_filter_work(struct work_struct *work)
289{
Cong Wangaaa908f2018-05-23 15:26:53 -0700290 struct rsvp_filter *f = container_of(to_rcu_work(work),
291 struct rsvp_filter,
292 rwork);
Cong Wangd4f84a42017-10-26 18:24:38 -0700293 rtnl_lock();
Cong Wang96585062017-11-06 13:47:28 -0800294 __rsvp_delete_filter(f);
Cong Wangd4f84a42017-10-26 18:24:38 -0700295 rtnl_unlock();
296}
297
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700298static void rsvp_delete_filter(struct tcf_proto *tp, struct rsvp_filter *f)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299{
300 tcf_unbind_filter(tp, &f->res);
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700301 /* all classifiers are required to call tcf_exts_destroy() after rcu
302 * grace period, since converted-to-rcu actions are relying on that
303 * in cleanup() callback
304 */
Cong Wang96585062017-11-06 13:47:28 -0800305 if (tcf_exts_get_net(&f->exts))
Cong Wangaaa908f2018-05-23 15:26:53 -0700306 tcf_queue_work(&f->rwork, rsvp_delete_filter_work);
Cong Wang96585062017-11-06 13:47:28 -0800307 else
308 __rsvp_delete_filter(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309}
310
Vlad Buslov12db03b2019-02-11 10:55:45 +0200311static void rsvp_destroy(struct tcf_proto *tp, bool rtnl_held,
312 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313{
John Fastabendb929d862014-09-12 20:09:49 -0700314 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 int h1, h2;
316
317 if (data == NULL)
WANG Cong763dbf62017-04-19 14:21:21 -0700318 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000320 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321 struct rsvp_session *s;
322
John Fastabendb929d862014-09-12 20:09:49 -0700323 while ((s = rtnl_dereference(data->ht[h1])) != NULL) {
324 RCU_INIT_POINTER(data->ht[h1], s->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000326 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 struct rsvp_filter *f;
328
John Fastabendb929d862014-09-12 20:09:49 -0700329 while ((f = rtnl_dereference(s->ht[h2])) != NULL) {
330 rcu_assign_pointer(s->ht[h2], f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 rsvp_delete_filter(tp, f);
332 }
333 }
John Fastabendb929d862014-09-12 20:09:49 -0700334 kfree_rcu(s, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 }
336 }
John Fastabendb929d862014-09-12 20:09:49 -0700337 kfree_rcu(data, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338}
339
Alexander Aring571acf22018-01-18 11:20:53 -0500340static int rsvp_delete(struct tcf_proto *tp, void *arg, bool *last,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200341 bool rtnl_held, struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342{
John Fastabendb929d862014-09-12 20:09:49 -0700343 struct rsvp_head *head = rtnl_dereference(tp->root);
WANG Cong8113c092017-08-04 21:31:43 -0700344 struct rsvp_filter *nfp, *f = arg;
John Fastabendb929d862014-09-12 20:09:49 -0700345 struct rsvp_filter __rcu **fp;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000346 unsigned int h = f->handle;
John Fastabendb929d862014-09-12 20:09:49 -0700347 struct rsvp_session __rcu **sp;
348 struct rsvp_session *nsp, *s = f->sess;
WANG Cong763dbf62017-04-19 14:21:21 -0700349 int i, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350
John Fastabendb929d862014-09-12 20:09:49 -0700351 fp = &s->ht[(h >> 8) & 0xFF];
352 for (nfp = rtnl_dereference(*fp); nfp;
353 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
354 if (nfp == f) {
355 RCU_INIT_POINTER(*fp, f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 rsvp_delete_filter(tp, f);
357
358 /* Strip tree */
359
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000360 for (i = 0; i <= 16; i++)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361 if (s->ht[i])
WANG Cong763dbf62017-04-19 14:21:21 -0700362 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363
364 /* OK, session has no flows */
John Fastabendb929d862014-09-12 20:09:49 -0700365 sp = &head->ht[h & 0xFF];
366 for (nsp = rtnl_dereference(*sp); nsp;
367 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
368 if (nsp == s) {
369 RCU_INIT_POINTER(*sp, s->next);
370 kfree_rcu(s, rcu);
WANG Cong763dbf62017-04-19 14:21:21 -0700371 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 }
373 }
374
WANG Cong763dbf62017-04-19 14:21:21 -0700375 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 }
377 }
WANG Cong763dbf62017-04-19 14:21:21 -0700378
379out:
380 *last = true;
381 for (h1 = 0; h1 < 256; h1++) {
382 if (rcu_access_pointer(head->ht[h1])) {
383 *last = false;
384 break;
385 }
386 }
387
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388 return 0;
389}
390
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000391static unsigned int gen_handle(struct tcf_proto *tp, unsigned salt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392{
John Fastabendb929d862014-09-12 20:09:49 -0700393 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 int i = 0xFFFF;
395
396 while (i-- > 0) {
397 u32 h;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if ((data->hgenerator += 0x10000) == 0)
400 data->hgenerator = 0x10000;
401 h = data->hgenerator|salt;
Josh Hunt230cfd22017-09-10 15:48:50 -0400402 if (!rsvp_get(tp, h))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403 return h;
404 }
405 return 0;
406}
407
408static int tunnel_bts(struct rsvp_head *data)
409{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000410 int n = data->tgenerator >> 5;
411 u32 b = 1 << (data->tgenerator & 0x1F);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900412
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000413 if (data->tmap[n] & b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 return 0;
415 data->tmap[n] |= b;
416 return 1;
417}
418
419static void tunnel_recycle(struct rsvp_head *data)
420{
John Fastabendb929d862014-09-12 20:09:49 -0700421 struct rsvp_session __rcu **sht = data->ht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 u32 tmap[256/32];
423 int h1, h2;
424
425 memset(tmap, 0, sizeof(tmap));
426
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000427 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 struct rsvp_session *s;
John Fastabendb929d862014-09-12 20:09:49 -0700429 for (s = rtnl_dereference(sht[h1]); s;
430 s = rtnl_dereference(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000431 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432 struct rsvp_filter *f;
433
John Fastabendb929d862014-09-12 20:09:49 -0700434 for (f = rtnl_dereference(s->ht[h2]); f;
435 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700436 if (f->tunnelhdr == 0)
437 continue;
438 data->tgenerator = f->res.classid;
439 tunnel_bts(data);
440 }
441 }
442 }
443 }
444
445 memcpy(data->tmap, tmap, sizeof(tmap));
446}
447
448static u32 gen_tunnel(struct rsvp_head *data)
449{
450 int i, k;
451
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000452 for (k = 0; k < 2; k++) {
453 for (i = 255; i > 0; i--) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 if (++data->tgenerator == 0)
455 data->tgenerator = 1;
456 if (tunnel_bts(data))
457 return data->tgenerator;
458 }
459 tunnel_recycle(data);
460 }
461 return 0;
462}
463
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800464static const struct nla_policy rsvp_policy[TCA_RSVP_MAX + 1] = {
465 [TCA_RSVP_CLASSID] = { .type = NLA_U32 },
Eric Dumazetcb3c0e62020-01-31 15:27:04 -0800466 [TCA_RSVP_DST] = { .len = RSVP_DST_LEN * sizeof(u32) },
467 [TCA_RSVP_SRC] = { .len = RSVP_DST_LEN * sizeof(u32) },
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800468 [TCA_RSVP_PINFO] = { .len = sizeof(struct tc_rsvp_pinfo) },
469};
470
Benjamin LaHaisec1b52732013-01-14 05:15:39 +0000471static int rsvp_change(struct net *net, struct sk_buff *in_skb,
Eric W. Biedermanaf4c6642012-05-25 13:42:45 -0600472 struct tcf_proto *tp, unsigned long base,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473 u32 handle,
Patrick McHardyadd93b62008-01-22 22:11:33 -0800474 struct nlattr **tca,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200475 void **arg, bool ovr, bool rtnl_held,
476 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700477{
John Fastabendb929d862014-09-12 20:09:49 -0700478 struct rsvp_head *data = rtnl_dereference(tp->root);
479 struct rsvp_filter *f, *nfp;
480 struct rsvp_filter __rcu **fp;
481 struct rsvp_session *nsp, *s;
482 struct rsvp_session __rcu **sp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483 struct tc_rsvp_pinfo *pinfo = NULL;
Igor Maravić27e95a82011-08-30 03:12:55 +0000484 struct nlattr *opt = tca[TCA_OPTIONS];
Patrick McHardyadd93b62008-01-22 22:11:33 -0800485 struct nlattr *tb[TCA_RSVP_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700486 struct tcf_exts e;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000487 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800488 __be32 *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700489 int err;
490
491 if (opt == NULL)
492 return handle ? -EINVAL : 0;
493
Johannes Berg8cb08172019-04-26 14:07:28 +0200494 err = nla_parse_nested_deprecated(tb, TCA_RSVP_MAX, opt, rsvp_policy,
495 NULL);
Patrick McHardycee63722008-01-23 20:33:32 -0800496 if (err < 0)
497 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498
Cong Wang14215102019-02-20 21:37:42 -0800499 err = tcf_exts_init(&e, net, TCA_RSVP_ACT, TCA_RSVP_POLICE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 if (err < 0)
501 return err;
Vlad Buslovec6743a2019-02-11 10:55:43 +0200502 err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr, true,
503 extack);
WANG Congb9a24bb2016-08-19 12:36:54 -0700504 if (err < 0)
505 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506
WANG Cong8113c092017-08-04 21:31:43 -0700507 f = *arg;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000508 if (f) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700509 /* Node exists: adjust only classid */
John Fastabend53dfd502014-09-26 10:02:50 -0700510 struct rsvp_filter *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511
512 if (f->handle != handle && handle)
513 goto errout2;
John Fastabend53dfd502014-09-26 10:02:50 -0700514
515 n = kmemdup(f, sizeof(*f), GFP_KERNEL);
516 if (!n) {
517 err = -ENOMEM;
518 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519 }
520
Cong Wang14215102019-02-20 21:37:42 -0800521 err = tcf_exts_init(&n->exts, net, TCA_RSVP_ACT,
522 TCA_RSVP_POLICE);
WANG Congb9a24bb2016-08-19 12:36:54 -0700523 if (err < 0) {
524 kfree(n);
525 goto errout2;
526 }
John Fastabend53dfd502014-09-26 10:02:50 -0700527
528 if (tb[TCA_RSVP_CLASSID]) {
529 n->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
530 tcf_bind_filter(tp, &n->res, base);
531 }
532
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200533 tcf_exts_change(&n->exts, &e);
John Fastabend53dfd502014-09-26 10:02:50 -0700534 rsvp_replace(tp, n, handle);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535 return 0;
536 }
537
538 /* Now more serious part... */
539 err = -EINVAL;
540 if (handle)
541 goto errout2;
Igor Maravić27e95a82011-08-30 03:12:55 +0000542 if (tb[TCA_RSVP_DST] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700543 goto errout2;
544
545 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700546 f = kzalloc(sizeof(struct rsvp_filter), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 if (f == NULL)
548 goto errout2;
549
Cong Wang14215102019-02-20 21:37:42 -0800550 err = tcf_exts_init(&f->exts, net, TCA_RSVP_ACT, TCA_RSVP_POLICE);
WANG Congb9a24bb2016-08-19 12:36:54 -0700551 if (err < 0)
552 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553 h2 = 16;
Igor Maravić27e95a82011-08-30 03:12:55 +0000554 if (tb[TCA_RSVP_SRC]) {
555 memcpy(f->src, nla_data(tb[TCA_RSVP_SRC]), sizeof(f->src));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700556 h2 = hash_src(f->src);
557 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000558 if (tb[TCA_RSVP_PINFO]) {
559 pinfo = nla_data(tb[TCA_RSVP_PINFO]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700560 f->spi = pinfo->spi;
561 f->tunnelhdr = pinfo->tunnelhdr;
562 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000563 if (tb[TCA_RSVP_CLASSID])
564 f->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565
Igor Maravić27e95a82011-08-30 03:12:55 +0000566 dst = nla_data(tb[TCA_RSVP_DST]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567 h1 = hash_dst(dst, pinfo ? pinfo->protocol : 0, pinfo ? pinfo->tunnelid : 0);
568
569 err = -ENOMEM;
570 if ((f->handle = gen_handle(tp, h1 | (h2<<8))) == 0)
571 goto errout;
572
573 if (f->tunnelhdr) {
574 err = -EINVAL;
575 if (f->res.classid > 255)
576 goto errout;
577
578 err = -ENOMEM;
579 if (f->res.classid == 0 &&
580 (f->res.classid = gen_tunnel(data)) == 0)
581 goto errout;
582 }
583
John Fastabendb929d862014-09-12 20:09:49 -0700584 for (sp = &data->ht[h1];
585 (s = rtnl_dereference(*sp)) != NULL;
586 sp = &s->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN-1] &&
588 pinfo && pinfo->protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800589 memcmp(&pinfo->dpi, &s->dpi, sizeof(s->dpi)) == 0 &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700590#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800591 dst[0] == s->dst[0] &&
592 dst[1] == s->dst[1] &&
593 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800595 pinfo->tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596
597insert:
598 /* OK, we found appropriate session */
599
600 fp = &s->ht[h2];
601
602 f->sess = s;
603 if (f->tunnelhdr == 0)
604 tcf_bind_filter(tp, &f->res, base);
605
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200606 tcf_exts_change(&f->exts, &e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607
John Fastabendb929d862014-09-12 20:09:49 -0700608 fp = &s->ht[h2];
609 for (nfp = rtnl_dereference(*fp); nfp;
610 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
611 __u32 mask = nfp->spi.mask & f->spi.mask;
612
613 if (mask != f->spi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700614 break;
John Fastabendb929d862014-09-12 20:09:49 -0700615 }
616 RCU_INIT_POINTER(f->next, nfp);
617 rcu_assign_pointer(*fp, f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618
WANG Cong8113c092017-08-04 21:31:43 -0700619 *arg = f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700620 return 0;
621 }
622 }
623
624 /* No session found. Create new one. */
625
626 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700627 s = kzalloc(sizeof(struct rsvp_session), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700628 if (s == NULL)
629 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630 memcpy(s->dst, dst, sizeof(s->dst));
631
632 if (pinfo) {
633 s->dpi = pinfo->dpi;
634 s->protocol = pinfo->protocol;
635 s->tunnelid = pinfo->tunnelid;
636 }
John Fastabendb929d862014-09-12 20:09:49 -0700637 sp = &data->ht[h1];
638 for (nsp = rtnl_dereference(*sp); nsp;
639 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
640 if ((nsp->dpi.mask & s->dpi.mask) != s->dpi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700641 break;
642 }
John Fastabendb929d862014-09-12 20:09:49 -0700643 RCU_INIT_POINTER(s->next, nsp);
644 rcu_assign_pointer(*sp, s);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900645
Linus Torvalds1da177e2005-04-16 15:20:36 -0700646 goto insert;
647
648errout:
WANG Congb9a24bb2016-08-19 12:36:54 -0700649 tcf_exts_destroy(&f->exts);
Jesper Juhla51482b2005-11-08 09:41:34 -0800650 kfree(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651errout2:
WANG Cong18d02642014-09-25 10:26:37 -0700652 tcf_exts_destroy(&e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700653 return err;
654}
655
Vlad Buslov12db03b2019-02-11 10:55:45 +0200656static void rsvp_walk(struct tcf_proto *tp, struct tcf_walker *arg,
657 bool rtnl_held)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700658{
John Fastabendb929d862014-09-12 20:09:49 -0700659 struct rsvp_head *head = rtnl_dereference(tp->root);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000660 unsigned int h, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700661
662 if (arg->stop)
663 return;
664
665 for (h = 0; h < 256; h++) {
666 struct rsvp_session *s;
667
John Fastabendb929d862014-09-12 20:09:49 -0700668 for (s = rtnl_dereference(head->ht[h]); s;
669 s = rtnl_dereference(s->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670 for (h1 = 0; h1 <= 16; h1++) {
671 struct rsvp_filter *f;
672
John Fastabendb929d862014-09-12 20:09:49 -0700673 for (f = rtnl_dereference(s->ht[h1]); f;
674 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 if (arg->count < arg->skip) {
676 arg->count++;
677 continue;
678 }
WANG Cong8113c092017-08-04 21:31:43 -0700679 if (arg->fn(tp, f, arg) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700680 arg->stop = 1;
681 return;
682 }
683 arg->count++;
684 }
685 }
686 }
687 }
688}
689
WANG Cong8113c092017-08-04 21:31:43 -0700690static int rsvp_dump(struct net *net, struct tcf_proto *tp, void *fh,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200691 struct sk_buff *skb, struct tcmsg *t, bool rtnl_held)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692{
WANG Cong8113c092017-08-04 21:31:43 -0700693 struct rsvp_filter *f = fh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 struct rsvp_session *s;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800695 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696 struct tc_rsvp_pinfo pinfo;
697
698 if (f == NULL)
699 return skb->len;
700 s = f->sess;
701
702 t->tcm_handle = f->handle;
703
Michal Kubecekae0be8d2019-04-26 11:13:06 +0200704 nest = nla_nest_start_noflag(skb, TCA_OPTIONS);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800705 if (nest == NULL)
706 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707
David S. Miller1b34ec42012-03-29 05:11:39 -0400708 if (nla_put(skb, TCA_RSVP_DST, sizeof(s->dst), &s->dst))
709 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 pinfo.dpi = s->dpi;
711 pinfo.spi = f->spi;
712 pinfo.protocol = s->protocol;
713 pinfo.tunnelid = s->tunnelid;
714 pinfo.tunnelhdr = f->tunnelhdr;
Patrick McHardy8a470772005-06-28 12:56:45 -0700715 pinfo.pad = 0;
David S. Miller1b34ec42012-03-29 05:11:39 -0400716 if (nla_put(skb, TCA_RSVP_PINFO, sizeof(pinfo), &pinfo))
717 goto nla_put_failure;
718 if (f->res.classid &&
719 nla_put_u32(skb, TCA_RSVP_CLASSID, f->res.classid))
720 goto nla_put_failure;
721 if (((f->handle >> 8) & 0xFF) != 16 &&
722 nla_put(skb, TCA_RSVP_SRC, sizeof(f->src), f->src))
723 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724
WANG Cong5da57f42013-12-15 20:15:07 -0800725 if (tcf_exts_dump(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800726 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800728 nla_nest_end(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729
WANG Cong5da57f42013-12-15 20:15:07 -0800730 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800731 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 return skb->len;
733
Patrick McHardyadd93b62008-01-22 22:11:33 -0800734nla_put_failure:
Jiri Pirko6ea3b442014-12-09 22:23:29 +0100735 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736 return -1;
737}
738
Cong Wang2e24cd72020-01-23 16:26:18 -0800739static void rsvp_bind_class(void *fh, u32 classid, unsigned long cl, void *q,
740 unsigned long base)
Cong Wang07d79fc2017-08-30 14:30:36 -0700741{
742 struct rsvp_filter *f = fh;
743
Cong Wang2e24cd72020-01-23 16:26:18 -0800744 if (f && f->res.classid == classid) {
745 if (cl)
746 __tcf_bind_filter(q, &f->res, base);
747 else
748 __tcf_unbind_filter(q, &f->res);
749 }
Cong Wang07d79fc2017-08-30 14:30:36 -0700750}
751
Igor Maravić27e95a82011-08-30 03:12:55 +0000752static struct tcf_proto_ops RSVP_OPS __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753 .kind = RSVP_ID,
754 .classify = rsvp_classify,
755 .init = rsvp_init,
756 .destroy = rsvp_destroy,
757 .get = rsvp_get,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758 .change = rsvp_change,
759 .delete = rsvp_delete,
760 .walk = rsvp_walk,
761 .dump = rsvp_dump,
Cong Wang07d79fc2017-08-30 14:30:36 -0700762 .bind_class = rsvp_bind_class,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763 .owner = THIS_MODULE,
764};
765
766static int __init init_rsvp(void)
767{
768 return register_tcf_proto_ops(&RSVP_OPS);
769}
770
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900771static void __exit exit_rsvp(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772{
773 unregister_tcf_proto_ops(&RSVP_OPS);
774}
775
/* Hook the entry and exit points into the module loader. */
module_init(init_rsvp);
module_exit(exit_rsvp);