blob: 5cd9d6b143c44bf250ca1e53c384e3cf3fab57d2 [file] [log] [blame]
Thomas Gleixner2874c5f2019-05-27 08:55:01 +02001/* SPDX-License-Identifier: GPL-2.0-or-later */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
3 * net/sched/cls_rsvp.h Template file for RSVPv[46] classifiers.
4 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07005 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
6 */
7
8/*
   Compared to the general packet classification problem,
   RSVP needs only a few relatively simple rules:
Linus Torvalds1da177e2005-04-16 15:20:36 -070011
12 * (dst, protocol) are always specified,
13 so that we are able to hash them.
14 * src may be exact, or may be wildcard, so that
15 we can keep a hash table plus one wildcard entry.
16 * source port (or flow label) is important only if src is given.
17
18 IMPLEMENTATION.
19
20 We use a two level hash table: The top level is keyed by
21 destination address and protocol ID, every bucket contains a list
22 of "rsvp sessions", identified by destination address, protocol and
23 DPI(="Destination Port ID"): triple (key, mask, offset).
24
25 Every bucket has a smaller hash table keyed by source address
26 (cf. RSVP flowspec) and one wildcard entry for wildcard reservations.
27 Every bucket is again a list of "RSVP flows", selected by
28 source address and SPI(="Source Port ID" here rather than
29 "security parameter index"): triple (key, mask, offset).
30
31
32 NOTE 1. All the packets with IPv6 extension headers (but AH and ESP)
33 and all fragmented packets go to the best-effort traffic class.
34
35
   NOTE 2. Having two "port IDs" seems redundant: RFC 2207 requires
   only one "Generalized Port Identifier" (GPI). So for classic
   AH, ESP (and UDP, TCP) both *pi should coincide, or one of them
   should be a wildcard.
40
41 At first sight, this redundancy is just a waste of CPU
42 resources. But DPI and SPI add the possibility to assign different
43 priorities to GPIs. Look also at note 4 about tunnels below.
44
45
   NOTE 3. One complication is the case of tunneled packets.
   We implement it as follows: if the first lookup
   matches a special session with a non-zero "tunnelhdr" value,
   flowid doesn't contain the true flow ID, but the tunnel ID (1...255).
   In this case, we pull tunnelhdr bytes and restart the lookup
   with the tunnel ID added to the list of keys. Simple and stupid 8)8)
   It's enough for PIMREG and IPIP.
53
54
55 NOTE 4. Two GPIs make it possible to parse even GRE packets.
56 F.e. DPI can select ETH_P_IP (and necessary flags to make
57 tunnelhdr correct) in GRE protocol field and SPI matches
58 GRE key. Is it not nice? 8)8)
59
60
   Well, as a result, despite its simplicity, we get a pretty
   powerful classification engine.  */
63
Linus Torvalds1da177e2005-04-16 15:20:36 -070064
Eric Dumazetcc7ec452011-01-19 19:26:56 +000065struct rsvp_head {
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 u32 tmap[256/32];
67 u32 hgenerator;
68 u8 tgenerator;
John Fastabendb929d862014-09-12 20:09:49 -070069 struct rsvp_session __rcu *ht[256];
70 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070071};
72
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073struct rsvp_session {
John Fastabendb929d862014-09-12 20:09:49 -070074 struct rsvp_session __rcu *next;
75 __be32 dst[RSVP_DST_LEN];
76 struct tc_rsvp_gpi dpi;
77 u8 protocol;
78 u8 tunnelid;
Linus Torvalds1da177e2005-04-16 15:20:36 -070079 /* 16 (src,sport) hash slots, and one wildcard source slot */
John Fastabendb929d862014-09-12 20:09:49 -070080 struct rsvp_filter __rcu *ht[16 + 1];
81 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082};
83
84
Eric Dumazetcc7ec452011-01-19 19:26:56 +000085struct rsvp_filter {
John Fastabendb929d862014-09-12 20:09:49 -070086 struct rsvp_filter __rcu *next;
87 __be32 src[RSVP_DST_LEN];
88 struct tc_rsvp_gpi spi;
89 u8 tunnelhdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -070090
John Fastabendb929d862014-09-12 20:09:49 -070091 struct tcf_result res;
92 struct tcf_exts exts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
John Fastabendb929d862014-09-12 20:09:49 -070094 u32 handle;
95 struct rsvp_session *sess;
Cong Wangaaa908f2018-05-23 15:26:53 -070096 struct rcu_work rwork;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097};
98
Eric Dumazetcc7ec452011-01-19 19:26:56 +000099static inline unsigned int hash_dst(__be32 *dst, u8 protocol, u8 tunnelid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000101 unsigned int h = (__force __u32)dst[RSVP_DST_LEN - 1];
102
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103 h ^= h>>16;
104 h ^= h>>8;
105 return (h ^ protocol ^ tunnelid) & 0xFF;
106}
107
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000108static inline unsigned int hash_src(__be32 *src)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000110 unsigned int h = (__force __u32)src[RSVP_DST_LEN-1];
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 h ^= h>>16;
113 h ^= h>>8;
114 h ^= h>>4;
115 return h & 0xF;
116}
117
/* Run the extensions of the candidate filter 'f' from inside a lookup loop.
 * A negative verdict moves on to the next candidate, a positive one is
 * returned to the caller of the enclosing function, zero falls through.
 * Must stay a bare brace block: 'continue' has to reach the caller's loop.
 */
#define RSVP_APPLY_RESULT()					\
{								\
	int verdict = tcf_exts_exec(skb, &f->exts, res);	\
								\
	if (verdict < 0)					\
		continue;					\
	if (verdict > 0)					\
		return verdict;					\
}
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900126
Eric Dumazetdc7f9f62011-07-05 23:25:42 +0000127static int rsvp_classify(struct sk_buff *skb, const struct tcf_proto *tp,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128 struct tcf_result *res)
129{
John Fastabendb929d862014-09-12 20:09:49 -0700130 struct rsvp_head *head = rcu_dereference_bh(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 struct rsvp_session *s;
132 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000133 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800134 __be32 *dst, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 u8 protocol;
136 u8 tunnelid = 0;
137 u8 *xprt;
138#if RSVP_DST_LEN == 4
Changli Gao12dc96d2010-08-04 04:55:40 +0000139 struct ipv6hdr *nhptr;
140
141 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
142 return -1;
143 nhptr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144#else
Changli Gao12dc96d2010-08-04 04:55:40 +0000145 struct iphdr *nhptr;
146
147 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
148 return -1;
149 nhptr = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151restart:
152
153#if RSVP_DST_LEN == 4
154 src = &nhptr->saddr.s6_addr32[0];
155 dst = &nhptr->daddr.s6_addr32[0];
156 protocol = nhptr->nexthdr;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000157 xprt = ((u8 *)nhptr) + sizeof(struct ipv6hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158#else
159 src = &nhptr->saddr;
160 dst = &nhptr->daddr;
161 protocol = nhptr->protocol;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000162 xprt = ((u8 *)nhptr) + (nhptr->ihl<<2);
Paul Gortmaker56f8a752011-06-21 20:33:34 -0700163 if (ip_is_fragment(nhptr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 return -1;
165#endif
166
167 h1 = hash_dst(dst, protocol, tunnelid);
168 h2 = hash_src(src);
169
John Fastabendb929d862014-09-12 20:09:49 -0700170 for (s = rcu_dereference_bh(head->ht[h1]); s;
171 s = rcu_dereference_bh(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000172 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN - 1] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800174 !(s->dpi.mask &
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000175 (*(u32 *)(xprt + s->dpi.offset) ^ s->dpi.key)) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800177 dst[0] == s->dst[0] &&
178 dst[1] == s->dst[1] &&
179 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800181 tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182
John Fastabendb929d862014-09-12 20:09:49 -0700183 for (f = rcu_dereference_bh(s->ht[h2]); f;
184 f = rcu_dereference_bh(f->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000185 if (src[RSVP_DST_LEN-1] == f->src[RSVP_DST_LEN - 1] &&
186 !(f->spi.mask & (*(u32 *)(xprt + f->spi.offset) ^ f->spi.key))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800188 &&
189 src[0] == f->src[0] &&
190 src[1] == f->src[1] &&
191 src[2] == f->src[2]
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192#endif
193 ) {
194 *res = f->res;
195 RSVP_APPLY_RESULT();
196
197matched:
198 if (f->tunnelhdr == 0)
199 return 0;
200
201 tunnelid = f->res.classid;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000202 nhptr = (void *)(xprt + f->tunnelhdr - sizeof(*nhptr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 goto restart;
204 }
205 }
206
207 /* And wildcard bucket... */
John Fastabendb929d862014-09-12 20:09:49 -0700208 for (f = rcu_dereference_bh(s->ht[16]); f;
209 f = rcu_dereference_bh(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210 *res = f->res;
211 RSVP_APPLY_RESULT();
212 goto matched;
213 }
214 return -1;
215 }
216 }
217 return -1;
218}
219
John Fastabend53dfd502014-09-26 10:02:50 -0700220static void rsvp_replace(struct tcf_proto *tp, struct rsvp_filter *n, u32 h)
221{
222 struct rsvp_head *head = rtnl_dereference(tp->root);
223 struct rsvp_session *s;
224 struct rsvp_filter __rcu **ins;
225 struct rsvp_filter *pins;
226 unsigned int h1 = h & 0xFF;
227 unsigned int h2 = (h >> 8) & 0xFF;
228
229 for (s = rtnl_dereference(head->ht[h1]); s;
230 s = rtnl_dereference(s->next)) {
231 for (ins = &s->ht[h2], pins = rtnl_dereference(*ins); ;
232 ins = &pins->next, pins = rtnl_dereference(*ins)) {
233 if (pins->handle == h) {
234 RCU_INIT_POINTER(n->next, pins->next);
235 rcu_assign_pointer(*ins, n);
236 return;
237 }
238 }
239 }
240
Menglong Donge5a4b172020-11-09 02:02:17 -0500241 /* Something went wrong if we are trying to replace a non-existent
John Fastabend53dfd502014-09-26 10:02:50 -0700242 * node. Mind as well halt instead of silently failing.
243 */
244 BUG_ON(1);
245}
246
WANG Cong8113c092017-08-04 21:31:43 -0700247static void *rsvp_get(struct tcf_proto *tp, u32 handle)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248{
John Fastabendb929d862014-09-12 20:09:49 -0700249 struct rsvp_head *head = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 struct rsvp_session *s;
251 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000252 unsigned int h1 = handle & 0xFF;
253 unsigned int h2 = (handle >> 8) & 0xFF;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
255 if (h2 > 16)
WANG Cong8113c092017-08-04 21:31:43 -0700256 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
John Fastabendb929d862014-09-12 20:09:49 -0700258 for (s = rtnl_dereference(head->ht[h1]); s;
259 s = rtnl_dereference(s->next)) {
260 for (f = rtnl_dereference(s->ht[h2]); f;
261 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 if (f->handle == handle)
WANG Cong8113c092017-08-04 21:31:43 -0700263 return f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264 }
265 }
WANG Cong8113c092017-08-04 21:31:43 -0700266 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267}
268
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269static int rsvp_init(struct tcf_proto *tp)
270{
271 struct rsvp_head *data;
272
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700273 data = kzalloc(sizeof(struct rsvp_head), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 if (data) {
John Fastabendb929d862014-09-12 20:09:49 -0700275 rcu_assign_pointer(tp->root, data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 return 0;
277 }
278 return -ENOBUFS;
279}
280
Cong Wang96585062017-11-06 13:47:28 -0800281static void __rsvp_delete_filter(struct rsvp_filter *f)
282{
283 tcf_exts_destroy(&f->exts);
284 tcf_exts_put_net(&f->exts);
285 kfree(f);
286}
287
Cong Wangd4f84a42017-10-26 18:24:38 -0700288static void rsvp_delete_filter_work(struct work_struct *work)
289{
Cong Wangaaa908f2018-05-23 15:26:53 -0700290 struct rsvp_filter *f = container_of(to_rcu_work(work),
291 struct rsvp_filter,
292 rwork);
Cong Wangd4f84a42017-10-26 18:24:38 -0700293 rtnl_lock();
Cong Wang96585062017-11-06 13:47:28 -0800294 __rsvp_delete_filter(f);
Cong Wangd4f84a42017-10-26 18:24:38 -0700295 rtnl_unlock();
296}
297
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700298static void rsvp_delete_filter(struct tcf_proto *tp, struct rsvp_filter *f)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299{
300 tcf_unbind_filter(tp, &f->res);
Alexei Starovoitov9e528d82015-08-25 20:06:34 -0700301 /* all classifiers are required to call tcf_exts_destroy() after rcu
302 * grace period, since converted-to-rcu actions are relying on that
303 * in cleanup() callback
304 */
Cong Wang96585062017-11-06 13:47:28 -0800305 if (tcf_exts_get_net(&f->exts))
Cong Wangaaa908f2018-05-23 15:26:53 -0700306 tcf_queue_work(&f->rwork, rsvp_delete_filter_work);
Cong Wang96585062017-11-06 13:47:28 -0800307 else
308 __rsvp_delete_filter(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309}
310
Vlad Buslov12db03b2019-02-11 10:55:45 +0200311static void rsvp_destroy(struct tcf_proto *tp, bool rtnl_held,
312 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313{
John Fastabendb929d862014-09-12 20:09:49 -0700314 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 int h1, h2;
316
317 if (data == NULL)
WANG Cong763dbf62017-04-19 14:21:21 -0700318 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000320 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321 struct rsvp_session *s;
322
John Fastabendb929d862014-09-12 20:09:49 -0700323 while ((s = rtnl_dereference(data->ht[h1])) != NULL) {
324 RCU_INIT_POINTER(data->ht[h1], s->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000326 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 struct rsvp_filter *f;
328
John Fastabendb929d862014-09-12 20:09:49 -0700329 while ((f = rtnl_dereference(s->ht[h2])) != NULL) {
330 rcu_assign_pointer(s->ht[h2], f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 rsvp_delete_filter(tp, f);
332 }
333 }
John Fastabendb929d862014-09-12 20:09:49 -0700334 kfree_rcu(s, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 }
336 }
John Fastabendb929d862014-09-12 20:09:49 -0700337 kfree_rcu(data, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338}
339
Alexander Aring571acf22018-01-18 11:20:53 -0500340static int rsvp_delete(struct tcf_proto *tp, void *arg, bool *last,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200341 bool rtnl_held, struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342{
John Fastabendb929d862014-09-12 20:09:49 -0700343 struct rsvp_head *head = rtnl_dereference(tp->root);
WANG Cong8113c092017-08-04 21:31:43 -0700344 struct rsvp_filter *nfp, *f = arg;
John Fastabendb929d862014-09-12 20:09:49 -0700345 struct rsvp_filter __rcu **fp;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000346 unsigned int h = f->handle;
John Fastabendb929d862014-09-12 20:09:49 -0700347 struct rsvp_session __rcu **sp;
348 struct rsvp_session *nsp, *s = f->sess;
WANG Cong763dbf62017-04-19 14:21:21 -0700349 int i, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350
John Fastabendb929d862014-09-12 20:09:49 -0700351 fp = &s->ht[(h >> 8) & 0xFF];
352 for (nfp = rtnl_dereference(*fp); nfp;
353 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
354 if (nfp == f) {
355 RCU_INIT_POINTER(*fp, f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 rsvp_delete_filter(tp, f);
357
358 /* Strip tree */
359
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000360 for (i = 0; i <= 16; i++)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361 if (s->ht[i])
WANG Cong763dbf62017-04-19 14:21:21 -0700362 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363
364 /* OK, session has no flows */
John Fastabendb929d862014-09-12 20:09:49 -0700365 sp = &head->ht[h & 0xFF];
366 for (nsp = rtnl_dereference(*sp); nsp;
367 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
368 if (nsp == s) {
369 RCU_INIT_POINTER(*sp, s->next);
370 kfree_rcu(s, rcu);
WANG Cong763dbf62017-04-19 14:21:21 -0700371 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 }
373 }
374
WANG Cong763dbf62017-04-19 14:21:21 -0700375 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 }
377 }
WANG Cong763dbf62017-04-19 14:21:21 -0700378
379out:
380 *last = true;
381 for (h1 = 0; h1 < 256; h1++) {
382 if (rcu_access_pointer(head->ht[h1])) {
383 *last = false;
384 break;
385 }
386 }
387
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388 return 0;
389}
390
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000391static unsigned int gen_handle(struct tcf_proto *tp, unsigned salt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392{
John Fastabendb929d862014-09-12 20:09:49 -0700393 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 int i = 0xFFFF;
395
396 while (i-- > 0) {
397 u32 h;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if ((data->hgenerator += 0x10000) == 0)
400 data->hgenerator = 0x10000;
401 h = data->hgenerator|salt;
Josh Hunt230cfd22017-09-10 15:48:50 -0400402 if (!rsvp_get(tp, h))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403 return h;
404 }
405 return 0;
406}
407
408static int tunnel_bts(struct rsvp_head *data)
409{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000410 int n = data->tgenerator >> 5;
411 u32 b = 1 << (data->tgenerator & 0x1F);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900412
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000413 if (data->tmap[n] & b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 return 0;
415 data->tmap[n] |= b;
416 return 1;
417}
418
419static void tunnel_recycle(struct rsvp_head *data)
420{
John Fastabendb929d862014-09-12 20:09:49 -0700421 struct rsvp_session __rcu **sht = data->ht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 u32 tmap[256/32];
423 int h1, h2;
424
425 memset(tmap, 0, sizeof(tmap));
426
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000427 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 struct rsvp_session *s;
John Fastabendb929d862014-09-12 20:09:49 -0700429 for (s = rtnl_dereference(sht[h1]); s;
430 s = rtnl_dereference(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000431 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432 struct rsvp_filter *f;
433
John Fastabendb929d862014-09-12 20:09:49 -0700434 for (f = rtnl_dereference(s->ht[h2]); f;
435 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700436 if (f->tunnelhdr == 0)
437 continue;
438 data->tgenerator = f->res.classid;
439 tunnel_bts(data);
440 }
441 }
442 }
443 }
444
445 memcpy(data->tmap, tmap, sizeof(tmap));
446}
447
448static u32 gen_tunnel(struct rsvp_head *data)
449{
450 int i, k;
451
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000452 for (k = 0; k < 2; k++) {
453 for (i = 255; i > 0; i--) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 if (++data->tgenerator == 0)
455 data->tgenerator = 1;
456 if (tunnel_bts(data))
457 return data->tgenerator;
458 }
459 tunnel_recycle(data);
460 }
461 return 0;
462}
463
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800464static const struct nla_policy rsvp_policy[TCA_RSVP_MAX + 1] = {
465 [TCA_RSVP_CLASSID] = { .type = NLA_U32 },
Eric Dumazetcb3c0e62020-01-31 15:27:04 -0800466 [TCA_RSVP_DST] = { .len = RSVP_DST_LEN * sizeof(u32) },
467 [TCA_RSVP_SRC] = { .len = RSVP_DST_LEN * sizeof(u32) },
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800468 [TCA_RSVP_PINFO] = { .len = sizeof(struct tc_rsvp_pinfo) },
469};
470
Benjamin LaHaisec1b52732013-01-14 05:15:39 +0000471static int rsvp_change(struct net *net, struct sk_buff *in_skb,
Eric W. Biedermanaf4c6642012-05-25 13:42:45 -0600472 struct tcf_proto *tp, unsigned long base,
Cong Wang695176b2021-07-29 16:12:14 -0700473 u32 handle, struct nlattr **tca,
474 void **arg, u32 flags,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200475 struct netlink_ext_ack *extack)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700476{
John Fastabendb929d862014-09-12 20:09:49 -0700477 struct rsvp_head *data = rtnl_dereference(tp->root);
478 struct rsvp_filter *f, *nfp;
479 struct rsvp_filter __rcu **fp;
480 struct rsvp_session *nsp, *s;
481 struct rsvp_session __rcu **sp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482 struct tc_rsvp_pinfo *pinfo = NULL;
Igor Maravić27e95a82011-08-30 03:12:55 +0000483 struct nlattr *opt = tca[TCA_OPTIONS];
Patrick McHardyadd93b62008-01-22 22:11:33 -0800484 struct nlattr *tb[TCA_RSVP_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700485 struct tcf_exts e;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000486 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800487 __be32 *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700488 int err;
489
490 if (opt == NULL)
491 return handle ? -EINVAL : 0;
492
Johannes Berg8cb08172019-04-26 14:07:28 +0200493 err = nla_parse_nested_deprecated(tb, TCA_RSVP_MAX, opt, rsvp_policy,
494 NULL);
Patrick McHardycee63722008-01-23 20:33:32 -0800495 if (err < 0)
496 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497
Cong Wang14215102019-02-20 21:37:42 -0800498 err = tcf_exts_init(&e, net, TCA_RSVP_ACT, TCA_RSVP_POLICE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 if (err < 0)
500 return err;
Cong Wang695176b2021-07-29 16:12:14 -0700501 err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, flags,
Vlad Buslovec6743a2019-02-11 10:55:43 +0200502 extack);
WANG Congb9a24bb2016-08-19 12:36:54 -0700503 if (err < 0)
504 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
WANG Cong8113c092017-08-04 21:31:43 -0700506 f = *arg;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000507 if (f) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 /* Node exists: adjust only classid */
John Fastabend53dfd502014-09-26 10:02:50 -0700509 struct rsvp_filter *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
511 if (f->handle != handle && handle)
512 goto errout2;
John Fastabend53dfd502014-09-26 10:02:50 -0700513
514 n = kmemdup(f, sizeof(*f), GFP_KERNEL);
515 if (!n) {
516 err = -ENOMEM;
517 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700518 }
519
Cong Wang14215102019-02-20 21:37:42 -0800520 err = tcf_exts_init(&n->exts, net, TCA_RSVP_ACT,
521 TCA_RSVP_POLICE);
WANG Congb9a24bb2016-08-19 12:36:54 -0700522 if (err < 0) {
523 kfree(n);
524 goto errout2;
525 }
John Fastabend53dfd502014-09-26 10:02:50 -0700526
527 if (tb[TCA_RSVP_CLASSID]) {
528 n->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
529 tcf_bind_filter(tp, &n->res, base);
530 }
531
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200532 tcf_exts_change(&n->exts, &e);
John Fastabend53dfd502014-09-26 10:02:50 -0700533 rsvp_replace(tp, n, handle);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 return 0;
535 }
536
537 /* Now more serious part... */
538 err = -EINVAL;
539 if (handle)
540 goto errout2;
Igor Maravić27e95a82011-08-30 03:12:55 +0000541 if (tb[TCA_RSVP_DST] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542 goto errout2;
543
544 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700545 f = kzalloc(sizeof(struct rsvp_filter), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546 if (f == NULL)
547 goto errout2;
548
Cong Wang14215102019-02-20 21:37:42 -0800549 err = tcf_exts_init(&f->exts, net, TCA_RSVP_ACT, TCA_RSVP_POLICE);
WANG Congb9a24bb2016-08-19 12:36:54 -0700550 if (err < 0)
551 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552 h2 = 16;
Igor Maravić27e95a82011-08-30 03:12:55 +0000553 if (tb[TCA_RSVP_SRC]) {
554 memcpy(f->src, nla_data(tb[TCA_RSVP_SRC]), sizeof(f->src));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 h2 = hash_src(f->src);
556 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000557 if (tb[TCA_RSVP_PINFO]) {
558 pinfo = nla_data(tb[TCA_RSVP_PINFO]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 f->spi = pinfo->spi;
560 f->tunnelhdr = pinfo->tunnelhdr;
561 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000562 if (tb[TCA_RSVP_CLASSID])
563 f->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700564
Igor Maravić27e95a82011-08-30 03:12:55 +0000565 dst = nla_data(tb[TCA_RSVP_DST]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700566 h1 = hash_dst(dst, pinfo ? pinfo->protocol : 0, pinfo ? pinfo->tunnelid : 0);
567
568 err = -ENOMEM;
569 if ((f->handle = gen_handle(tp, h1 | (h2<<8))) == 0)
570 goto errout;
571
572 if (f->tunnelhdr) {
573 err = -EINVAL;
574 if (f->res.classid > 255)
575 goto errout;
576
577 err = -ENOMEM;
578 if (f->res.classid == 0 &&
579 (f->res.classid = gen_tunnel(data)) == 0)
580 goto errout;
581 }
582
John Fastabendb929d862014-09-12 20:09:49 -0700583 for (sp = &data->ht[h1];
584 (s = rtnl_dereference(*sp)) != NULL;
585 sp = &s->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN-1] &&
587 pinfo && pinfo->protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800588 memcmp(&pinfo->dpi, &s->dpi, sizeof(s->dpi)) == 0 &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800590 dst[0] == s->dst[0] &&
591 dst[1] == s->dst[1] &&
592 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800594 pinfo->tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595
596insert:
597 /* OK, we found appropriate session */
598
599 fp = &s->ht[h2];
600
601 f->sess = s;
602 if (f->tunnelhdr == 0)
603 tcf_bind_filter(tp, &f->res, base);
604
Jiri Pirko9b0d4442017-08-04 14:29:15 +0200605 tcf_exts_change(&f->exts, &e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606
John Fastabendb929d862014-09-12 20:09:49 -0700607 fp = &s->ht[h2];
608 for (nfp = rtnl_dereference(*fp); nfp;
609 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
610 __u32 mask = nfp->spi.mask & f->spi.mask;
611
612 if (mask != f->spi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 break;
John Fastabendb929d862014-09-12 20:09:49 -0700614 }
615 RCU_INIT_POINTER(f->next, nfp);
616 rcu_assign_pointer(*fp, f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700617
WANG Cong8113c092017-08-04 21:31:43 -0700618 *arg = f;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 return 0;
620 }
621 }
622
623 /* No session found. Create new one. */
624
625 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700626 s = kzalloc(sizeof(struct rsvp_session), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627 if (s == NULL)
628 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700629 memcpy(s->dst, dst, sizeof(s->dst));
630
631 if (pinfo) {
632 s->dpi = pinfo->dpi;
633 s->protocol = pinfo->protocol;
634 s->tunnelid = pinfo->tunnelid;
635 }
John Fastabendb929d862014-09-12 20:09:49 -0700636 sp = &data->ht[h1];
637 for (nsp = rtnl_dereference(*sp); nsp;
638 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
639 if ((nsp->dpi.mask & s->dpi.mask) != s->dpi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 break;
641 }
John Fastabendb929d862014-09-12 20:09:49 -0700642 RCU_INIT_POINTER(s->next, nsp);
643 rcu_assign_pointer(*sp, s);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900644
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645 goto insert;
646
647errout:
WANG Congb9a24bb2016-08-19 12:36:54 -0700648 tcf_exts_destroy(&f->exts);
Jesper Juhla51482b2005-11-08 09:41:34 -0800649 kfree(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700650errout2:
WANG Cong18d02642014-09-25 10:26:37 -0700651 tcf_exts_destroy(&e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 return err;
653}
654
Vlad Buslov12db03b2019-02-11 10:55:45 +0200655static void rsvp_walk(struct tcf_proto *tp, struct tcf_walker *arg,
656 bool rtnl_held)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700657{
John Fastabendb929d862014-09-12 20:09:49 -0700658 struct rsvp_head *head = rtnl_dereference(tp->root);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000659 unsigned int h, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660
661 if (arg->stop)
662 return;
663
664 for (h = 0; h < 256; h++) {
665 struct rsvp_session *s;
666
John Fastabendb929d862014-09-12 20:09:49 -0700667 for (s = rtnl_dereference(head->ht[h]); s;
668 s = rtnl_dereference(s->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669 for (h1 = 0; h1 <= 16; h1++) {
670 struct rsvp_filter *f;
671
John Fastabendb929d862014-09-12 20:09:49 -0700672 for (f = rtnl_dereference(s->ht[h1]); f;
673 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700674 if (arg->count < arg->skip) {
675 arg->count++;
676 continue;
677 }
WANG Cong8113c092017-08-04 21:31:43 -0700678 if (arg->fn(tp, f, arg) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679 arg->stop = 1;
680 return;
681 }
682 arg->count++;
683 }
684 }
685 }
686 }
687}
688
WANG Cong8113c092017-08-04 21:31:43 -0700689static int rsvp_dump(struct net *net, struct tcf_proto *tp, void *fh,
Vlad Buslov12db03b2019-02-11 10:55:45 +0200690 struct sk_buff *skb, struct tcmsg *t, bool rtnl_held)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691{
WANG Cong8113c092017-08-04 21:31:43 -0700692 struct rsvp_filter *f = fh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700693 struct rsvp_session *s;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800694 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695 struct tc_rsvp_pinfo pinfo;
696
697 if (f == NULL)
698 return skb->len;
699 s = f->sess;
700
701 t->tcm_handle = f->handle;
702
Michal Kubecekae0be8d2019-04-26 11:13:06 +0200703 nest = nla_nest_start_noflag(skb, TCA_OPTIONS);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800704 if (nest == NULL)
705 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706
David S. Miller1b34ec42012-03-29 05:11:39 -0400707 if (nla_put(skb, TCA_RSVP_DST, sizeof(s->dst), &s->dst))
708 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700709 pinfo.dpi = s->dpi;
710 pinfo.spi = f->spi;
711 pinfo.protocol = s->protocol;
712 pinfo.tunnelid = s->tunnelid;
713 pinfo.tunnelhdr = f->tunnelhdr;
Patrick McHardy8a470772005-06-28 12:56:45 -0700714 pinfo.pad = 0;
David S. Miller1b34ec42012-03-29 05:11:39 -0400715 if (nla_put(skb, TCA_RSVP_PINFO, sizeof(pinfo), &pinfo))
716 goto nla_put_failure;
717 if (f->res.classid &&
718 nla_put_u32(skb, TCA_RSVP_CLASSID, f->res.classid))
719 goto nla_put_failure;
720 if (((f->handle >> 8) & 0xFF) != 16 &&
721 nla_put(skb, TCA_RSVP_SRC, sizeof(f->src), f->src))
722 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723
WANG Cong5da57f42013-12-15 20:15:07 -0800724 if (tcf_exts_dump(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800725 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800727 nla_nest_end(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728
WANG Cong5da57f42013-12-15 20:15:07 -0800729 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800730 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731 return skb->len;
732
Patrick McHardyadd93b62008-01-22 22:11:33 -0800733nla_put_failure:
Jiri Pirko6ea3b442014-12-09 22:23:29 +0100734 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735 return -1;
736}
737
Cong Wang2e24cd72020-01-23 16:26:18 -0800738static void rsvp_bind_class(void *fh, u32 classid, unsigned long cl, void *q,
739 unsigned long base)
Cong Wang07d79fc2017-08-30 14:30:36 -0700740{
741 struct rsvp_filter *f = fh;
742
Cong Wang2e24cd72020-01-23 16:26:18 -0800743 if (f && f->res.classid == classid) {
744 if (cl)
745 __tcf_bind_filter(q, &f->res, base);
746 else
747 __tcf_unbind_filter(q, &f->res);
748 }
Cong Wang07d79fc2017-08-30 14:30:36 -0700749}
750
Igor Maravić27e95a82011-08-30 03:12:55 +0000751static struct tcf_proto_ops RSVP_OPS __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752 .kind = RSVP_ID,
753 .classify = rsvp_classify,
754 .init = rsvp_init,
755 .destroy = rsvp_destroy,
756 .get = rsvp_get,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700757 .change = rsvp_change,
758 .delete = rsvp_delete,
759 .walk = rsvp_walk,
760 .dump = rsvp_dump,
Cong Wang07d79fc2017-08-30 14:30:36 -0700761 .bind_class = rsvp_bind_class,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762 .owner = THIS_MODULE,
763};
764
765static int __init init_rsvp(void)
766{
767 return register_tcf_proto_ops(&RSVP_OPS);
768}
769
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900770static void __exit exit_rsvp(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771{
772 unregister_tcf_proto_ops(&RSVP_OPS);
773}
774
/* Hook the registration helpers into module load and unload. */
module_init(init_rsvp);
module_exit(exit_rsvp);