/*
 *		inet fragments management
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 *		Authors:	Pavel Emelyanov <xemul@openvz.org>
 *				Started as consolidation of ipv4/ip_fragment.c,
 *				ipv6/reassembly.c and ipv6 nf conntrack reassembly
 */

#include <linux/list.h>
#include <linux/spinlock.h>
#include <linux/module.h>
#include <linux/timer.h>
#include <linux/mm.h>
#include <linux/random.h>
#include <linux/skbuff.h>
#include <linux/rtnetlink.h>
#include <linux/slab.h>

#include <net/sock.h>
#include <net/inet_frag.h>
#include <net/inet_ecn.h>

#define INETFRAGS_EVICT_BUCKETS   128
#define INETFRAGS_EVICT_MAX	  512

/* don't rebuild inetfrag table with new secret more often than this */
#define INETFRAGS_MIN_REBUILD_INTERVAL (5 * HZ)

/* Given the OR values of all fragments, apply RFC 3168 5.3 requirements
 * Value : 0xff if frame should be dropped.
 *         0 or INET_ECN_CE value, to be ORed into the final iph->tos field
 */
const u8 ip_frag_ecn_table[16] = {
	/* at least one fragment had CE, and others ECT_0 or ECT_1 */
	[IPFRAG_ECN_CE | IPFRAG_ECN_ECT_0]			= INET_ECN_CE,
	[IPFRAG_ECN_CE | IPFRAG_ECN_ECT_1]			= INET_ECN_CE,
	[IPFRAG_ECN_CE | IPFRAG_ECN_ECT_0 | IPFRAG_ECN_ECT_1]	= INET_ECN_CE,

	/* invalid combinations : drop frame */
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_CE] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_ECT_0] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_ECT_1] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_ECT_0 | IPFRAG_ECN_ECT_1] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_CE | IPFRAG_ECN_ECT_0] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_CE | IPFRAG_ECN_ECT_1] = 0xff,
	[IPFRAG_ECN_NOT_ECT | IPFRAG_ECN_CE | IPFRAG_ECN_ECT_0 | IPFRAG_ECN_ECT_1] = 0xff,
};
EXPORT_SYMBOL(ip_frag_ecn_table);

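/* Usage sketch (illustrative; the real callers live in the per-protocol
 * reassemblers, e.g. ipv4/ip_fragment.c).  A reassembler ORs together the
 * IPFRAG_ECN_* bit of every fragment it queues, then consults the table
 * once when the datagram is complete:
 *
 *	u8 ecn = ip_frag_ecn_table[qp->ecn];
 *
 *	if (ecn == 0xff)
 *		... drop the reassembled datagram ...
 *	else
 *		iph->tos |= ecn;
 *
 * (qp->ecn stands for whatever field the caller accumulates the bits in.)
 */
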
static unsigned int
inet_frag_hashfn(const struct inet_frags *f, const struct inet_frag_queue *q)
{
	return f->hashfn(q) & (INETFRAGS_HASHSZ - 1);
}

static bool inet_frag_may_rebuild(struct inet_frags *f)
{
	return time_after(jiffies,
			  f->last_rebuild_jiffies + INETFRAGS_MIN_REBUILD_INTERVAL);
}

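/* Re-seed the hash secret and move every queue to the bucket it now
 * hashes to.  Rate-limited by INETFRAGS_MIN_REBUILD_INTERVAL; this is
 * the defence against hash chains being deliberately grown past
 * INETFRAGS_MAXDEPTH by someone who can predict the hash.
 */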
static void inet_frag_secret_rebuild(struct inet_frags *f)
{
	int i;

	write_seqlock_bh(&f->rnd_seqlock);

	if (!inet_frag_may_rebuild(f))
		goto out;

	get_random_bytes(&f->rnd, sizeof(u32));

	for (i = 0; i < INETFRAGS_HASHSZ; i++) {
		struct inet_frag_bucket *hb;
		struct inet_frag_queue *q;
		struct hlist_node *n;

		hb = &f->hash[i];
		spin_lock(&hb->chain_lock);

		hlist_for_each_entry_safe(q, n, &hb->chain, list) {
			unsigned int hval = inet_frag_hashfn(f, q);

			if (hval != i) {
				struct inet_frag_bucket *hb_dest;

				hlist_del(&q->list);

				/* Relink to new hash chain. */
				hb_dest = &f->hash[hval];

				/* This is the only place where we take
				 * another chain_lock while already holding
				 * one.  As this will not run concurrently,
				 * we cannot deadlock on hb_dest below: if it
				 * is already locked, it will be released
				 * soon, since no other caller can be waiting
				 * for the hb lock that we've taken above.
				 */
				spin_lock_nested(&hb_dest->chain_lock,
						 SINGLE_DEPTH_NESTING);
				hlist_add_head(&q->list, &hb_dest->chain);
				spin_unlock(&hb_dest->chain_lock);
			}
		}
		spin_unlock(&hb->chain_lock);
	}

	f->rebuild = false;
	f->last_rebuild_jiffies = jiffies;
out:
	write_sequnlock_bh(&f->rnd_seqlock);
}

static bool inet_fragq_should_evict(const struct inet_frag_queue *q)
{
	return q->net->low_thresh == 0 ||
	       frag_mem_limit(q->net) >= q->net->low_thresh;
}

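/* Collect the evictable queues of one bucket onto a private list under
 * the chain lock, then run their expire callbacks outside the lock.
 * Queues whose timer we cannot cancel are already being expired and are
 * left alone.
 */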
static unsigned int
inet_evict_bucket(struct inet_frags *f, struct inet_frag_bucket *hb)
{
	struct inet_frag_queue *fq;
	struct hlist_node *n;
	unsigned int evicted = 0;
	HLIST_HEAD(expired);

	spin_lock(&hb->chain_lock);

	hlist_for_each_entry_safe(fq, n, &hb->chain, list) {
		if (!inet_fragq_should_evict(fq))
			continue;

		if (!del_timer(&fq->timer))
			continue;

		fq->flags |= INET_FRAG_EVICTED;
		hlist_add_head(&fq->list_evictor, &expired);
		++evicted;
	}

	spin_unlock(&hb->chain_lock);

	hlist_for_each_entry_safe(fq, n, &expired, list_evictor)
		f->frag_expire((unsigned long) fq);

	return evicted;
}

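/* Eviction work: walk up to INETFRAGS_EVICT_BUCKETS buckets per run,
 * stopping early once more than INETFRAGS_EVICT_MAX queues have been
 * evicted, and remember where to resume so successive runs cycle
 * through the whole table.  Also performs the deferred secret rebuild
 * requested by inet_frag_find().
 */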
static void inet_frag_worker(struct work_struct *work)
{
	unsigned int budget = INETFRAGS_EVICT_BUCKETS;
	unsigned int i, evicted = 0;
	struct inet_frags *f;

	f = container_of(work, struct inet_frags, frags_work);

	BUILD_BUG_ON(INETFRAGS_EVICT_BUCKETS >= INETFRAGS_HASHSZ);

	local_bh_disable();

	for (i = ACCESS_ONCE(f->next_bucket); budget; --budget) {
		evicted += inet_evict_bucket(f, &f->hash[i]);
		i = (i + 1) & (INETFRAGS_HASHSZ - 1);
		if (evicted > INETFRAGS_EVICT_MAX)
			break;
	}

	f->next_bucket = i;

	local_bh_enable();

	if (f->rebuild && inet_frag_may_rebuild(f))
		inet_frag_secret_rebuild(f);
}

static void inet_frag_schedule_worker(struct inet_frags *f)
{
	if (unlikely(!work_pending(&f->frags_work)))
		schedule_work(&f->frags_work);
}

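/* One-time setup for a protocol family (ipv4, ipv6, nf conntrack
 * reassembly): hash buckets, the eviction work item, the seqlock
 * protecting the hash secret, and the kmem cache the queues are
 * allocated from.
 */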
int inet_frags_init(struct inet_frags *f)
{
	int i;

	INIT_WORK(&f->frags_work, inet_frag_worker);

	for (i = 0; i < INETFRAGS_HASHSZ; i++) {
		struct inet_frag_bucket *hb = &f->hash[i];

		spin_lock_init(&hb->chain_lock);
		INIT_HLIST_HEAD(&hb->chain);
	}

	seqlock_init(&f->rnd_seqlock);
	f->last_rebuild_jiffies = 0;
	f->frags_cachep = kmem_cache_create(f->frags_cache_name, f->qsize, 0, 0,
					    NULL);
	if (!f->frags_cachep)
		return -ENOMEM;

	return 0;
}
EXPORT_SYMBOL(inet_frags_init);

void inet_frags_init_net(struct netns_frags *nf)
{
	init_frag_mem_limit(nf);
}
EXPORT_SYMBOL(inet_frags_init_net);

void inet_frags_fini(struct inet_frags *f)
{
	cancel_work_sync(&f->frags_work);
	kmem_cache_destroy(f->frags_cachep);
}
EXPORT_SYMBOL(inet_frags_fini);

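/* Tear-down for a dying netns: force low_thresh to 0 so every queue is
 * eligible for eviction, sweep all buckets, and retry if either a
 * concurrent secret rebuild moved queues under us or the per-netns
 * memory counter shows queues still in flight.
 */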
void inet_frags_exit_net(struct netns_frags *nf, struct inet_frags *f)
{
	unsigned int seq;
	int i;

	nf->low_thresh = 0;

evict_again:
	local_bh_disable();
	seq = read_seqbegin(&f->rnd_seqlock);

	for (i = 0; i < INETFRAGS_HASHSZ; i++)
		inet_evict_bucket(f, &f->hash[i]);

	local_bh_enable();
	cond_resched();

	if (read_seqretry(&f->rnd_seqlock, seq) ||
	    percpu_counter_sum(&nf->mem))
		goto evict_again;

	percpu_counter_destroy(&nf->mem);
}
EXPORT_SYMBOL(inet_frags_exit_net);

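/* Map fq to its bucket under the current hash secret and return the
 * bucket with its chain_lock held.  If the secret was rebuilt while we
 * were hashing (seqlock retry), drop the lock and start over so we
 * never operate on a stale bucket.
 */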
static struct inet_frag_bucket *
get_frag_bucket_locked(struct inet_frag_queue *fq, struct inet_frags *f)
__acquires(hb->chain_lock)
{
	struct inet_frag_bucket *hb;
	unsigned int seq, hash;

 restart:
	seq = read_seqbegin(&f->rnd_seqlock);

	hash = inet_frag_hashfn(f, fq);
	hb = &f->hash[hash];

	spin_lock(&hb->chain_lock);
	if (read_seqretry(&f->rnd_seqlock, seq)) {
		spin_unlock(&hb->chain_lock);
		goto restart;
	}

	return hb;
}

static inline void fq_unlink(struct inet_frag_queue *fq, struct inet_frags *f)
{
	struct inet_frag_bucket *hb;

	hb = get_frag_bucket_locked(fq, f);
	hlist_del(&fq->list);
	fq->flags |= INET_FRAG_COMPLETE;
	spin_unlock(&hb->chain_lock);
}

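/* Stop the expiry timer and unlink the queue from its hash chain,
 * dropping the reference each of them held.  The caller's own reference
 * is untouched; the queue is freed once that, too, is put.
 */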
void inet_frag_kill(struct inet_frag_queue *fq, struct inet_frags *f)
{
	if (del_timer(&fq->timer))
		atomic_dec(&fq->refcnt);

	if (!(fq->flags & INET_FRAG_COMPLETE)) {
		fq_unlink(fq, f);
		atomic_dec(&fq->refcnt);
	}
}
EXPORT_SYMBOL(inet_frag_kill);

static inline void frag_kfree_skb(struct netns_frags *nf, struct inet_frags *f,
				  struct sk_buff *skb)
{
	if (f->skb_free)
		f->skb_free(skb);
	kfree_skb(skb);
}

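/* Final destruction: free every queued skb, run the per-protocol
 * destructor, return the queue to its kmem cache, and give the
 * accounted memory (skb truesizes plus the queue object itself) back
 * to the per-netns counter.  Only legal once the queue is
 * INET_FRAG_COMPLETE and its timer is no longer pending.
 */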
void inet_frag_destroy(struct inet_frag_queue *q, struct inet_frags *f)
{
	struct sk_buff *fp;
	struct netns_frags *nf;
	unsigned int sum, sum_truesize = 0;

	WARN_ON(!(q->flags & INET_FRAG_COMPLETE));
	WARN_ON(del_timer(&q->timer) != 0);

	/* Release all fragment data. */
	fp = q->fragments;
	nf = q->net;
	while (fp) {
		struct sk_buff *xp = fp->next;

		sum_truesize += fp->truesize;
		frag_kfree_skb(nf, f, fp);
		fp = xp;
	}
	sum = sum_truesize + f->qsize;

	if (f->destructor)
		f->destructor(q);
	kmem_cache_free(f->frags_cachep, q);

	sub_frag_mem_limit(nf, sum);
}
EXPORT_SYMBOL(inet_frag_destroy);

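/* Publish a freshly allocated queue in the hash table.  If another CPU
 * interned an equivalent queue while we were setting ours up, the
 * existing one wins: we take a reference on it, mark ours complete and
 * drop it, and hand the winner back to the caller.
 */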
static struct inet_frag_queue *inet_frag_intern(struct netns_frags *nf,
						struct inet_frag_queue *qp_in,
						struct inet_frags *f,
						void *arg)
{
	struct inet_frag_bucket *hb = get_frag_bucket_locked(qp_in, f);
	struct inet_frag_queue *qp;

#ifdef CONFIG_SMP
	/* On SMP we must recheck the hash chain, because an equivalent
	 * entry could have been created on another cpu before we
	 * acquired the hash bucket lock.
	 */
	hlist_for_each_entry(qp, &hb->chain, list) {
		if (qp->net == nf && f->match(qp, arg)) {
			atomic_inc(&qp->refcnt);
			spin_unlock(&hb->chain_lock);
			qp_in->flags |= INET_FRAG_COMPLETE;
			inet_frag_put(qp_in, f);
			return qp;
		}
	}
#endif
	qp = qp_in;
	if (!mod_timer(&qp->timer, jiffies + nf->timeout))
		atomic_inc(&qp->refcnt);

	atomic_inc(&qp->refcnt);
	hlist_add_head(&qp->list, &hb->chain);

	spin_unlock(&hb->chain_lock);

	return qp;
}

static struct inet_frag_queue *inet_frag_alloc(struct netns_frags *nf,
					       struct inet_frags *f,
					       void *arg)
{
	struct inet_frag_queue *q;

	if (frag_mem_limit(nf) > nf->high_thresh) {
		inet_frag_schedule_worker(f);
		return NULL;
	}

	q = kmem_cache_zalloc(f->frags_cachep, GFP_ATOMIC);
	if (!q)
		return NULL;

	q->net = nf;
	f->constructor(q, arg);
	add_frag_mem_limit(nf, f->qsize);

	setup_timer(&q->timer, f->frag_expire, (unsigned long)q);
	spin_lock_init(&q->lock);
	atomic_set(&q->refcnt, 1);

	return q;
}

static struct inet_frag_queue *inet_frag_create(struct netns_frags *nf,
						struct inet_frags *f,
						void *arg)
{
	struct inet_frag_queue *q;

	q = inet_frag_alloc(nf, f, arg);
	if (!q)
		return NULL;

	return inet_frag_intern(nf, q, f, arg);
}

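/* Look up the queue matching @key in the @hash bucket, creating and
 * interning a new one if none exists and the chain is still shorter
 * than INETFRAGS_MAXDEPTH.  On an overlong chain we instead request a
 * secret rebuild and return ERR_PTR(-ENOBUFS), so callers must check
 * the result for both NULL (allocation failure) and IS_ERR(); see
 * inet_frag_maybe_warn_overflow() below.
 */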
struct inet_frag_queue *inet_frag_find(struct netns_frags *nf,
				       struct inet_frags *f, void *key,
				       unsigned int hash)
{
	struct inet_frag_bucket *hb;
	struct inet_frag_queue *q;
	int depth = 0;

	if (frag_mem_limit(nf) > nf->low_thresh)
		inet_frag_schedule_worker(f);

	hash &= (INETFRAGS_HASHSZ - 1);
	hb = &f->hash[hash];

	spin_lock(&hb->chain_lock);
	hlist_for_each_entry(q, &hb->chain, list) {
		if (q->net == nf && f->match(q, key)) {
			atomic_inc(&q->refcnt);
			spin_unlock(&hb->chain_lock);
			return q;
		}
		depth++;
	}
	spin_unlock(&hb->chain_lock);

	if (depth <= INETFRAGS_MAXDEPTH)
		return inet_frag_create(nf, f, key);

	if (inet_frag_may_rebuild(f)) {
		if (!f->rebuild)
			f->rebuild = true;
		inet_frag_schedule_worker(f);
	}

	return ERR_PTR(-ENOBUFS);
}
EXPORT_SYMBOL(inet_frag_find);

void inet_frag_maybe_warn_overflow(struct inet_frag_queue *q,
				   const char *prefix)
{
	static const char msg[] = "inet_frag_find: Fragment hash bucket"
		" list length grew over limit " __stringify(INETFRAGS_MAXDEPTH)
		". Dropping fragment.\n";

	if (PTR_ERR(q) == -ENOBUFS)
		net_dbg_ratelimited("%s%s", prefix, msg);
}
EXPORT_SYMBOL(inet_frag_maybe_warn_overflow);