blob: b08c7cb5c9d6cf96da17646db74542b409a3910b [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/* SCTP kernel reference Implementation
2 * Copyright (c) 1999-2000 Cisco, Inc.
3 * Copyright (c) 1999-2001 Motorola, Inc.
4 * Copyright (c) 2001-2003 International Business Machines, Corp.
5 * Copyright (c) 2001 Intel Corp.
6 * Copyright (c) 2001 Nokia, Inc.
7 * Copyright (c) 2001 La Monte H.P. Yarroll
8 *
9 * This file is part of the SCTP kernel reference Implementation
10 *
11 * These functions handle all input from the IP layer into SCTP.
12 *
13 * The SCTP reference implementation is free software;
14 * you can redistribute it and/or modify it under the terms of
15 * the GNU General Public License as published by
16 * the Free Software Foundation; either version 2, or (at your option)
17 * any later version.
18 *
19 * The SCTP reference implementation is distributed in the hope that it
20 * will be useful, but WITHOUT ANY WARRANTY; without even the implied
21 * ************************
22 * warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
23 * See the GNU General Public License for more details.
24 *
25 * You should have received a copy of the GNU General Public License
26 * along with GNU CC; see the file COPYING. If not, write to
27 * the Free Software Foundation, 59 Temple Place - Suite 330,
28 * Boston, MA 02111-1307, USA.
29 *
30 * Please send any bug reports or fixes you make to the
31 * email address(es):
32 * lksctp developers <lksctp-developers@lists.sourceforge.net>
33 *
34 * Or submit a bug report through the following website:
35 * http://www.sf.net/projects/lksctp
36 *
37 * Written or modified by:
38 * La Monte H.P. Yarroll <piggy@acm.org>
39 * Karl Knutson <karl@athena.chicago.il.us>
40 * Xingang Guo <xingang.guo@intel.com>
41 * Jon Grimm <jgrimm@us.ibm.com>
42 * Hui Huang <hui.huang@nokia.com>
43 * Daisy Chang <daisyc@us.ibm.com>
44 * Sridhar Samudrala <sri@us.ibm.com>
45 * Ardelle Fan <ardelle.fan@intel.com>
46 *
47 * Any bugs reported given to us we will try to fix... any fixes shared will
48 * be incorporated into the next SCTP release.
49 */
50
51#include <linux/types.h>
52#include <linux/list.h> /* For struct list_head */
53#include <linux/socket.h>
54#include <linux/ip.h>
55#include <linux/time.h> /* For struct timeval */
56#include <net/ip.h>
57#include <net/icmp.h>
58#include <net/snmp.h>
59#include <net/sock.h>
60#include <net/xfrm.h>
61#include <net/sctp/sctp.h>
62#include <net/sctp/sm.h>
Vlad Yasevich9ad09772007-12-16 14:06:41 -080063#include <net/sctp/checksum.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070064
/* Prototypes for file-local helpers that are referenced before their
 * definitions appear.
 */
static void sctp_add_backlog(struct sock *sk, struct sk_buff *skb);
static int sctp_rcv_ootb(struct sk_buff *skb);
static struct sctp_endpoint *__sctp_rcv_lookup_endpoint(
					const union sctp_addr *laddr);
static struct sctp_association *__sctp_lookup_association(
					const union sctp_addr *local,
					const union sctp_addr *peer,
					struct sctp_transport **pt);
static struct sctp_association *__sctp_rcv_lookup(struct sk_buff *skb,
					const union sctp_addr *laddr,
					const union sctp_addr *paddr,
					struct sctp_transport **transportp);
78
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
80/* Calculate the SCTP checksum of an SCTP packet. */
81static inline int sctp_rcv_checksum(struct sk_buff *skb)
82{
Linus Torvalds1da177e2005-04-16 15:20:36 -070083 struct sk_buff *list = skb_shinfo(skb)->frag_list;
Arnaldo Carvalho de Melo2c0fd382007-03-13 13:59:32 -030084 struct sctphdr *sh = sctp_hdr(skb);
85 __u32 cmp = ntohl(sh->checksum);
86 __u32 val = sctp_start_cksum((__u8 *)sh, skb_headlen(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
88 for (; list; list = list->next)
89 val = sctp_update_cksum((__u8 *)list->data, skb_headlen(list),
90 val);
91
92 val = sctp_end_cksum(val);
93
94 if (val != cmp) {
95 /* CRC failure, dump it. */
96 SCTP_INC_STATS_BH(SCTP_MIB_CHECKSUMERRORS);
97 return -1;
98 }
99 return 0;
100}
101
David S. Miller79af02c2005-07-08 21:47:49 -0700102struct sctp_input_cb {
103 union {
104 struct inet_skb_parm h4;
105#if defined(CONFIG_IPV6) || defined (CONFIG_IPV6_MODULE)
106 struct inet6_skb_parm h6;
107#endif
108 } header;
109 struct sctp_chunk *chunk;
110};
111#define SCTP_INPUT_CB(__skb) ((struct sctp_input_cb *)&((__skb)->cb[0]))
112
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113/*
114 * This is the routine which IP calls when receiving an SCTP packet.
115 */
116int sctp_rcv(struct sk_buff *skb)
117{
118 struct sock *sk;
119 struct sctp_association *asoc;
120 struct sctp_endpoint *ep = NULL;
121 struct sctp_ep_common *rcvr;
122 struct sctp_transport *transport = NULL;
123 struct sctp_chunk *chunk;
124 struct sctphdr *sh;
125 union sctp_addr src;
126 union sctp_addr dest;
127 int family;
128 struct sctp_af *af;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129
130 if (skb->pkt_type!=PACKET_HOST)
131 goto discard_it;
132
133 SCTP_INC_STATS_BH(SCTP_MIB_INSCTPPACKS);
134
Herbert Xu28cd7752006-10-29 23:46:42 -0800135 if (skb_linearize(skb))
136 goto discard_it;
137
Arnaldo Carvalho de Melo2c0fd382007-03-13 13:59:32 -0300138 sh = sctp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139
140 /* Pull up the IP and SCTP headers. */
Arnaldo Carvalho de Meloea2ae172007-04-25 17:55:53 -0700141 __skb_pull(skb, skb_transport_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 if (skb->len < sizeof(struct sctphdr))
143 goto discard_it;
Herbert Xu60476372007-04-09 11:59:39 -0700144 if (!skb_csum_unnecessary(skb) && sctp_rcv_checksum(skb) < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 goto discard_it;
146
147 skb_pull(skb, sizeof(struct sctphdr));
148
149 /* Make sure we at least have chunk headers worth of data left. */
150 if (skb->len < sizeof(struct sctp_chunkhdr))
151 goto discard_it;
152
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700153 family = ipver2af(ip_hdr(skb)->version);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 af = sctp_get_af_specific(family);
155 if (unlikely(!af))
156 goto discard_it;
157
158 /* Initialize local addresses for lookups. */
159 af->from_skb(&src, skb, 1);
160 af->from_skb(&dest, skb, 0);
161
162 /* If the packet is to or from a non-unicast address,
163 * silently discard the packet.
164 *
165 * This is not clearly defined in the RFC except in section
166 * 8.4 - OOTB handling. However, based on the book "Stream Control
167 * Transmission Protocol" 2.1, "It is important to note that the
168 * IP address of an SCTP transport address must be a routable
169 * unicast address. In other words, IP multicast addresses and
170 * IP broadcast addresses cannot be used in an SCTP transport
171 * address."
172 */
Vlad Yasevich5636bef2006-06-17 22:55:35 -0700173 if (!af->addr_valid(&src, NULL, skb) ||
174 !af->addr_valid(&dest, NULL, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175 goto discard_it;
176
Al Virod55c41b2006-11-20 17:09:40 -0800177 asoc = __sctp_rcv_lookup(skb, &src, &dest, &transport);
Al Viro1c7d1fc2006-11-20 17:08:09 -0800178
Neil Horman0fd9a652005-06-13 15:11:24 -0700179 if (!asoc)
Al Virod55c41b2006-11-20 17:09:40 -0800180 ep = __sctp_rcv_lookup_endpoint(&dest);
Neil Horman0fd9a652005-06-13 15:11:24 -0700181
182 /* Retrieve the common input handling substructure. */
183 rcvr = asoc ? &asoc->base : &ep->base;
184 sk = rcvr->sk;
185
186 /*
187 * If a frame arrives on an interface and the receiving socket is
188 * bound to another interface, via SO_BINDTODEVICE, treat it as OOTB
189 */
190 if (sk->sk_bound_dev_if && (sk->sk_bound_dev_if != af->skb_iif(skb)))
191 {
Neil Horman0fd9a652005-06-13 15:11:24 -0700192 if (asoc) {
193 sctp_association_put(asoc);
194 asoc = NULL;
195 } else {
196 sctp_endpoint_put(ep);
197 ep = NULL;
198 }
199 sk = sctp_get_ctl_sock();
200 ep = sctp_sk(sk)->ep;
201 sctp_endpoint_hold(ep);
Neil Horman0fd9a652005-06-13 15:11:24 -0700202 rcvr = &ep->base;
203 }
204
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205 /*
206 * RFC 2960, 8.4 - Handle "Out of the blue" Packets.
207 * An SCTP packet is called an "out of the blue" (OOTB)
208 * packet if it is correctly formed, i.e., passed the
209 * receiver's checksum check, but the receiver is not
210 * able to identify the association to which this
211 * packet belongs.
212 */
213 if (!asoc) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214 if (sctp_rcv_ootb(skb)) {
215 SCTP_INC_STATS_BH(SCTP_MIB_OUTOFBLUES);
216 goto discard_release;
217 }
218 }
219
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 if (!xfrm_policy_check(sk, XFRM_POLICY_IN, skb, family))
221 goto discard_release;
Patrick McHardyb59c2702006-01-06 23:06:10 -0800222 nf_reset(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
Dmitry Mishinfda9ef52006-08-31 15:28:39 -0700224 if (sk_filter(sk, skb))
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900225 goto discard_release;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226
227 /* Create an SCTP packet structure. */
228 chunk = sctp_chunkify(skb, asoc, sk);
Herbert Xu2babf9d2006-03-25 01:25:29 -0800229 if (!chunk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 goto discard_release;
David S. Miller79af02c2005-07-08 21:47:49 -0700231 SCTP_INPUT_CB(skb)->chunk = chunk;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233 /* Remember what endpoint is to handle this packet. */
234 chunk->rcvr = rcvr;
235
236 /* Remember the SCTP header. */
237 chunk->sctp_hdr = sh;
238
239 /* Set the source and destination addresses of the incoming chunk. */
Al Virod55c41b2006-11-20 17:09:40 -0800240 sctp_init_addrs(chunk, &src, &dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241
242 /* Remember where we came from. */
243 chunk->transport = transport;
244
245 /* Acquire access to the sock lock. Note: We are safe from other
246 * bottom halves on this lock, but a user may be in the lock too,
247 * so check if it is busy.
248 */
249 sctp_bh_lock_sock(sk);
250
Sridhar Samudralaac0b0462006-08-22 00:15:33 -0700251 if (sock_owned_by_user(sk)) {
252 SCTP_INC_STATS_BH(SCTP_MIB_IN_PKT_BACKLOG);
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700253 sctp_add_backlog(sk, skb);
Sridhar Samudralaac0b0462006-08-22 00:15:33 -0700254 } else {
255 SCTP_INC_STATS_BH(SCTP_MIB_IN_PKT_SOFTIRQ);
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700256 sctp_inq_push(&chunk->rcvr->inqueue, chunk);
Sridhar Samudralaac0b0462006-08-22 00:15:33 -0700257 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259 sctp_bh_unlock_sock(sk);
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700260
261 /* Release the asoc/ep ref we took in the lookup calls. */
262 if (asoc)
263 sctp_association_put(asoc);
264 else
265 sctp_endpoint_put(ep);
Sridhar Samudrala7a48f922006-01-17 11:51:28 -0800266
Herbert Xu2babf9d2006-03-25 01:25:29 -0800267 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
269discard_it:
Sridhar Samudralaac0b0462006-08-22 00:15:33 -0700270 SCTP_INC_STATS_BH(SCTP_MIB_IN_PKT_DISCARDS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271 kfree_skb(skb);
Herbert Xu2babf9d2006-03-25 01:25:29 -0800272 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273
274discard_release:
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700275 /* Release the asoc/ep ref we took in the lookup calls. */
Neil Horman0fd9a652005-06-13 15:11:24 -0700276 if (asoc)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277 sctp_association_put(asoc);
Neil Horman0fd9a652005-06-13 15:11:24 -0700278 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 sctp_endpoint_put(ep);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280
281 goto discard_it;
282}
283
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700284/* Process the backlog queue of the socket. Every skb on
285 * the backlog holds a ref on an association or endpoint.
286 * We hold this ref throughout the state machine to make
287 * sure that the structure we need is still around.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 */
289int sctp_backlog_rcv(struct sock *sk, struct sk_buff *skb)
290{
David S. Miller79af02c2005-07-08 21:47:49 -0700291 struct sctp_chunk *chunk = SCTP_INPUT_CB(skb)->chunk;
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900292 struct sctp_inq *inqueue = &chunk->rcvr->inqueue;
293 struct sctp_ep_common *rcvr = NULL;
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700294 int backloged = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900296 rcvr = chunk->rcvr;
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800297
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700298 /* If the rcvr is dead then the association or endpoint
299 * has been deleted and we can safely drop the chunk
300 * and refs that we are holding.
301 */
302 if (rcvr->dead) {
303 sctp_chunk_free(chunk);
304 goto done;
305 }
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800306
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700307 if (unlikely(rcvr->sk != sk)) {
308 /* In this case, the association moved from one socket to
309 * another. We are currently sitting on the backlog of the
310 * old socket, so we need to move.
311 * However, since we are here in the process context we
312 * need to take make sure that the user doesn't own
313 * the new socket when we process the packet.
314 * If the new socket is user-owned, queue the chunk to the
315 * backlog of the new socket without dropping any refs.
316 * Otherwise, we can safely push the chunk on the inqueue.
317 */
Sridhar Samudrala7a48f922006-01-17 11:51:28 -0800318
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700319 sk = rcvr->sk;
320 sctp_bh_lock_sock(sk);
321
322 if (sock_owned_by_user(sk)) {
323 sk_add_backlog(sk, skb);
324 backloged = 1;
325 } else
326 sctp_inq_push(inqueue, chunk);
327
328 sctp_bh_unlock_sock(sk);
329
330 /* If the chunk was backloged again, don't drop refs */
331 if (backloged)
332 return 0;
333 } else {
334 sctp_inq_push(inqueue, chunk);
335 }
336
337done:
338 /* Release the refs we took in sctp_add_backlog */
339 if (SCTP_EP_TYPE_ASSOCIATION == rcvr->type)
340 sctp_association_put(sctp_assoc(rcvr));
341 else if (SCTP_EP_TYPE_SOCKET == rcvr->type)
342 sctp_endpoint_put(sctp_ep(rcvr));
343 else
344 BUG();
345
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900346 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347}
348
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700349static void sctp_add_backlog(struct sock *sk, struct sk_buff *skb)
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800350{
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700351 struct sctp_chunk *chunk = SCTP_INPUT_CB(skb)->chunk;
352 struct sctp_ep_common *rcvr = chunk->rcvr;
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800353
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700354 /* Hold the assoc/ep while hanging on the backlog queue.
355 * This way, we know structures we need will not disappear from us
356 */
357 if (SCTP_EP_TYPE_ASSOCIATION == rcvr->type)
358 sctp_association_hold(sctp_assoc(rcvr));
359 else if (SCTP_EP_TYPE_SOCKET == rcvr->type)
360 sctp_endpoint_hold(sctp_ep(rcvr));
361 else
362 BUG();
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800363
Vladislav Yasevich61c9fed2006-05-19 11:01:18 -0700364 sk_add_backlog(sk, skb);
Sridhar Samudralac4d24442006-01-17 11:56:26 -0800365}
366
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367/* Handle icmp frag needed error. */
368void sctp_icmp_frag_needed(struct sock *sk, struct sctp_association *asoc,
369 struct sctp_transport *t, __u32 pmtu)
370{
Vlad Yasevich8a479492007-06-07 14:21:05 -0400371 if (!t || (t->pathmtu == pmtu))
Frank Filz52ccb8e2005-12-22 11:36:46 -0800372 return;
373
Vlad Yasevich8a479492007-06-07 14:21:05 -0400374 if (sock_owned_by_user(sk)) {
375 asoc->pmtu_pending = 1;
376 t->pmtu_pending = 1;
377 return;
378 }
379
Frank Filz52ccb8e2005-12-22 11:36:46 -0800380 if (t->param_flags & SPP_PMTUD_ENABLE) {
Vlad Yasevichc910b472007-06-07 13:47:03 -0400381 /* Update transports view of the MTU */
382 sctp_transport_update_pmtu(t, pmtu);
Frank Filz52ccb8e2005-12-22 11:36:46 -0800383
384 /* Update association pmtu. */
385 sctp_assoc_sync_pmtu(asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 }
387
Frank Filz52ccb8e2005-12-22 11:36:46 -0800388 /* Retransmit with the new pmtu setting.
389 * Normally, if PMTU discovery is disabled, an ICMP Fragmentation
390 * Needed will never be sent, but if a message was sent before
391 * PMTU discovery was disabled that was larger than the PMTU, it
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900392 * would not be fragmented, so it must be re-transmitted fragmented.
Frank Filz52ccb8e2005-12-22 11:36:46 -0800393 */
394 sctp_retransmit(&asoc->outqueue, t, SCTP_RTXR_PMTUD);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395}
396
397/*
398 * SCTP Implementer's Guide, 2.37 ICMP handling procedures
399 *
400 * ICMP8) If the ICMP code is a "Unrecognized next header type encountered"
401 * or a "Protocol Unreachable" treat this message as an abort
402 * with the T bit set.
403 *
404 * This function sends an event to the state machine, which will abort the
405 * association.
406 *
407 */
408void sctp_icmp_proto_unreachable(struct sock *sk,
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900409 struct sctp_association *asoc,
410 struct sctp_transport *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411{
412 SCTP_DEBUG_PRINTK("%s\n", __FUNCTION__);
413
414 sctp_do_sm(SCTP_EVENT_T_OTHER,
415 SCTP_ST_OTHER(SCTP_EVENT_ICMP_PROTO_UNREACH),
Frank Filz3f7a87d2005-06-20 13:14:57 -0700416 asoc->state, asoc->ep, asoc, t,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 GFP_ATOMIC);
418
419}
420
421/* Common lookup code for icmp/icmpv6 error handler. */
422struct sock *sctp_err_lookup(int family, struct sk_buff *skb,
423 struct sctphdr *sctphdr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 struct sctp_association **app,
425 struct sctp_transport **tpp)
426{
427 union sctp_addr saddr;
428 union sctp_addr daddr;
429 struct sctp_af *af;
430 struct sock *sk = NULL;
Sridhar Samudrala8de8c872006-05-19 10:58:12 -0700431 struct sctp_association *asoc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432 struct sctp_transport *transport = NULL;
433
Sridhar Samudralad1ad1ff2005-07-18 13:44:10 -0700434 *app = NULL; *tpp = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435
436 af = sctp_get_af_specific(family);
437 if (unlikely(!af)) {
438 return NULL;
439 }
440
441 /* Initialize local addresses for lookups. */
442 af->from_skb(&saddr, skb, 1);
443 af->from_skb(&daddr, skb, 0);
444
445 /* Look for an association that matches the incoming ICMP error
446 * packet.
447 */
Al Virod55c41b2006-11-20 17:09:40 -0800448 asoc = __sctp_lookup_association(&saddr, &daddr, &transport);
Sridhar Samudralad1ad1ff2005-07-18 13:44:10 -0700449 if (!asoc)
450 return NULL;
451
452 sk = asoc->base.sk;
453
454 if (ntohl(sctphdr->vtag) != asoc->c.peer_vtag) {
455 ICMP_INC_STATS_BH(ICMP_MIB_INERRORS);
456 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 }
458
Linus Torvalds1da177e2005-04-16 15:20:36 -0700459 sctp_bh_lock_sock(sk);
460
461 /* If too many ICMPs get dropped on busy
462 * servers this needs to be solved differently.
463 */
464 if (sock_owned_by_user(sk))
465 NET_INC_STATS_BH(LINUX_MIB_LOCKDROPPEDICMPS);
466
Linus Torvalds1da177e2005-04-16 15:20:36 -0700467 *app = asoc;
468 *tpp = transport;
469 return sk;
470
471out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472 if (asoc)
473 sctp_association_put(asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700474 return NULL;
475}
476
477/* Common cleanup code for icmp/icmpv6 error handler. */
Sridhar Samudralad1ad1ff2005-07-18 13:44:10 -0700478void sctp_err_finish(struct sock *sk, struct sctp_association *asoc)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479{
480 sctp_bh_unlock_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 if (asoc)
482 sctp_association_put(asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483}
484
485/*
486 * This routine is called by the ICMP module when it gets some
487 * sort of error condition. If err < 0 then the socket should
488 * be closed and the error returned to the user. If err > 0
489 * it's just the icmp type << 8 | icmp code. After adjustment
490 * header points to the first 8 bytes of the sctp header. We need
491 * to find the appropriate port.
492 *
493 * The locking strategy used here is very "optimistic". When
494 * someone else accesses the socket the ICMP is just dropped
495 * and for some paths there is no check at all.
496 * A more general error queue to queue errors for later handling
497 * is probably better.
498 *
499 */
500void sctp_v4_err(struct sk_buff *skb, __u32 info)
501{
502 struct iphdr *iph = (struct iphdr *)skb->data;
Arnaldo Carvalho de Meloa27ef742007-03-13 17:17:10 -0300503 const int ihlen = iph->ihl * 4;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300504 const int type = icmp_hdr(skb)->type;
505 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506 struct sock *sk;
Sridhar Samudrala8de8c872006-05-19 10:58:12 -0700507 struct sctp_association *asoc = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 struct sctp_transport *transport;
509 struct inet_sock *inet;
Arnaldo Carvalho de Melo2e07fa92007-04-10 21:22:35 -0700510 sk_buff_data_t saveip, savesctp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 int err;
512
Arnaldo Carvalho de Meloa27ef742007-03-13 17:17:10 -0300513 if (skb->len < ihlen + 8) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700514 ICMP_INC_STATS_BH(ICMP_MIB_INERRORS);
515 return;
516 }
517
518 /* Fix up skb to look at the embedded net header. */
Arnaldo Carvalho de Melob0e380b2007-04-10 21:21:55 -0700519 saveip = skb->network_header;
520 savesctp = skb->transport_header;
Arnaldo Carvalho de Melo31c77112007-03-10 19:04:55 -0300521 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloa27ef742007-03-13 17:17:10 -0300522 skb_set_transport_header(skb, ihlen);
523 sk = sctp_err_lookup(AF_INET, skb, sctp_hdr(skb), &asoc, &transport);
Arnaldo Carvalho de Melo2e07fa92007-04-10 21:22:35 -0700524 /* Put back, the original values. */
Arnaldo Carvalho de Melob0e380b2007-04-10 21:21:55 -0700525 skb->network_header = saveip;
526 skb->transport_header = savesctp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 if (!sk) {
528 ICMP_INC_STATS_BH(ICMP_MIB_INERRORS);
529 return;
530 }
531 /* Warning: The sock lock is held. Remember to call
532 * sctp_err_finish!
533 */
534
535 switch (type) {
536 case ICMP_PARAMETERPROB:
537 err = EPROTO;
538 break;
539 case ICMP_DEST_UNREACH:
540 if (code > NR_ICMP_UNREACH)
541 goto out_unlock;
542
543 /* PMTU discovery (RFC1191) */
544 if (ICMP_FRAG_NEEDED == code) {
545 sctp_icmp_frag_needed(sk, asoc, transport, info);
546 goto out_unlock;
547 }
548 else {
549 if (ICMP_PROT_UNREACH == code) {
Sridhar Samudralad1ad1ff2005-07-18 13:44:10 -0700550 sctp_icmp_proto_unreachable(sk, asoc,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 transport);
552 goto out_unlock;
553 }
554 }
555 err = icmp_err_convert[code].errno;
556 break;
557 case ICMP_TIME_EXCEEDED:
558 /* Ignore any time exceeded errors due to fragment reassembly
559 * timeouts.
560 */
561 if (ICMP_EXC_FRAGTIME == code)
562 goto out_unlock;
563
564 err = EHOSTUNREACH;
565 break;
566 default:
567 goto out_unlock;
568 }
569
570 inet = inet_sk(sk);
571 if (!sock_owned_by_user(sk) && inet->recverr) {
572 sk->sk_err = err;
573 sk->sk_error_report(sk);
574 } else { /* Only an error on timeout */
575 sk->sk_err_soft = err;
576 }
577
578out_unlock:
Sridhar Samudralad1ad1ff2005-07-18 13:44:10 -0700579 sctp_err_finish(sk, asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580}
581
582/*
583 * RFC 2960, 8.4 - Handle "Out of the blue" Packets.
584 *
585 * This function scans all the chunks in the OOTB packet to determine if
586 * the packet should be discarded right away. If a response might be needed
587 * for this packet, or, if further processing is possible, the packet will
588 * be queued to a proper inqueue for the next phase of handling.
589 *
590 * Output:
591 * Return 0 - If further processing is needed.
592 * Return 1 - If the packet can be discarded right away.
593 */
sebastian@breakpoint.cc04675212007-07-26 23:21:31 +0200594static int sctp_rcv_ootb(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595{
596 sctp_chunkhdr_t *ch;
597 __u8 *ch_end;
598 sctp_errhdr_t *err;
599
600 ch = (sctp_chunkhdr_t *) skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601
602 /* Scan through all the chunks in the packet. */
Tsutomu Fujiia7d1f1b2006-01-17 11:57:09 -0800603 do {
604 /* Break out if chunk length is less then minimal. */
605 if (ntohs(ch->length) < sizeof(sctp_chunkhdr_t))
606 break;
607
608 ch_end = ((__u8 *)ch) + WORD_ROUND(ntohs(ch->length));
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700609 if (ch_end > skb_tail_pointer(skb))
Tsutomu Fujiia7d1f1b2006-01-17 11:57:09 -0800610 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700611
612 /* RFC 8.4, 2) If the OOTB packet contains an ABORT chunk, the
613 * receiver MUST silently discard the OOTB packet and take no
614 * further action.
615 */
616 if (SCTP_CID_ABORT == ch->type)
617 goto discard;
618
619 /* RFC 8.4, 6) If the packet contains a SHUTDOWN COMPLETE
620 * chunk, the receiver should silently discard the packet
621 * and take no further action.
622 */
623 if (SCTP_CID_SHUTDOWN_COMPLETE == ch->type)
624 goto discard;
625
Vlad Yasevich3c77f962007-09-17 15:14:28 -0400626 /* RFC 4460, 2.11.2
627 * This will discard packets with INIT chunk bundled as
628 * subsequent chunks in the packet. When INIT is first,
629 * the normal INIT processing will discard the chunk.
630 */
631 if (SCTP_CID_INIT == ch->type && (void *)ch != skb->data)
632 goto discard;
633
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 /* RFC 8.4, 7) If the packet contains a "Stale cookie" ERROR
635 * or a COOKIE ACK the SCTP Packet should be silently
636 * discarded.
637 */
638 if (SCTP_CID_COOKIE_ACK == ch->type)
639 goto discard;
640
641 if (SCTP_CID_ERROR == ch->type) {
642 sctp_walk_errors(err, ch) {
643 if (SCTP_ERROR_STALE_COOKIE == err->cause)
644 goto discard;
645 }
646 }
647
648 ch = (sctp_chunkhdr_t *) ch_end;
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700649 } while (ch_end < skb_tail_pointer(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700650
651 return 0;
652
653discard:
654 return 1;
655}
656
657/* Insert endpoint into the hash table. */
658static void __sctp_hash_endpoint(struct sctp_endpoint *ep)
659{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660 struct sctp_ep_common *epb;
661 struct sctp_hashbucket *head;
662
663 epb = &ep->base;
664
665 epb->hashent = sctp_ep_hashfn(epb->bind_addr.port);
666 head = &sctp_ep_hashtable[epb->hashent];
667
668 sctp_write_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500669 hlist_add_head(&epb->node, &head->chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670 sctp_write_unlock(&head->lock);
671}
672
673/* Add an endpoint to the hash. Local BH-safe. */
674void sctp_hash_endpoint(struct sctp_endpoint *ep)
675{
676 sctp_local_bh_disable();
677 __sctp_hash_endpoint(ep);
678 sctp_local_bh_enable();
679}
680
681/* Remove endpoint from the hash table. */
682static void __sctp_unhash_endpoint(struct sctp_endpoint *ep)
683{
684 struct sctp_hashbucket *head;
685 struct sctp_ep_common *epb;
686
687 epb = &ep->base;
688
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500689 if (hlist_unhashed(&epb->node))
690 return;
691
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692 epb->hashent = sctp_ep_hashfn(epb->bind_addr.port);
693
694 head = &sctp_ep_hashtable[epb->hashent];
695
696 sctp_write_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500697 __hlist_del(&epb->node);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 sctp_write_unlock(&head->lock);
699}
700
701/* Remove endpoint from the hash. Local BH-safe. */
702void sctp_unhash_endpoint(struct sctp_endpoint *ep)
703{
704 sctp_local_bh_disable();
705 __sctp_unhash_endpoint(ep);
706 sctp_local_bh_enable();
707}
708
709/* Look up an endpoint. */
710static struct sctp_endpoint *__sctp_rcv_lookup_endpoint(const union sctp_addr *laddr)
711{
712 struct sctp_hashbucket *head;
713 struct sctp_ep_common *epb;
714 struct sctp_endpoint *ep;
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500715 struct hlist_node *node;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700716 int hash;
717
Al Viro1c7d1fc2006-11-20 17:08:09 -0800718 hash = sctp_ep_hashfn(ntohs(laddr->v4.sin_port));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700719 head = &sctp_ep_hashtable[hash];
720 read_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500721 sctp_for_each_hentry(epb, node, &head->chain) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722 ep = sctp_ep(epb);
723 if (sctp_endpoint_is_match(ep, laddr))
724 goto hit;
725 }
726
727 ep = sctp_sk((sctp_get_ctl_sock()))->ep;
728 epb = &ep->base;
729
730hit:
731 sctp_endpoint_hold(ep);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 read_unlock(&head->lock);
733 return ep;
734}
735
736/* Insert association into the hash table. */
737static void __sctp_hash_established(struct sctp_association *asoc)
738{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739 struct sctp_ep_common *epb;
740 struct sctp_hashbucket *head;
741
742 epb = &asoc->base;
743
744 /* Calculate which chain this entry will belong to. */
745 epb->hashent = sctp_assoc_hashfn(epb->bind_addr.port, asoc->peer.port);
746
747 head = &sctp_assoc_hashtable[epb->hashent];
748
749 sctp_write_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500750 hlist_add_head(&epb->node, &head->chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 sctp_write_unlock(&head->lock);
752}
753
754/* Add an association to the hash. Local BH-safe. */
755void sctp_hash_established(struct sctp_association *asoc)
756{
Vlad Yasevichde76e692006-10-30 18:55:11 -0800757 if (asoc->temp)
758 return;
759
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760 sctp_local_bh_disable();
761 __sctp_hash_established(asoc);
762 sctp_local_bh_enable();
763}
764
765/* Remove association from the hash table. */
766static void __sctp_unhash_established(struct sctp_association *asoc)
767{
768 struct sctp_hashbucket *head;
769 struct sctp_ep_common *epb;
770
771 epb = &asoc->base;
772
773 epb->hashent = sctp_assoc_hashfn(epb->bind_addr.port,
774 asoc->peer.port);
775
776 head = &sctp_assoc_hashtable[epb->hashent];
777
778 sctp_write_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500779 __hlist_del(&epb->node);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 sctp_write_unlock(&head->lock);
781}
782
783/* Remove association from the hash table. Local BH-safe. */
784void sctp_unhash_established(struct sctp_association *asoc)
785{
Vlad Yasevichde76e692006-10-30 18:55:11 -0800786 if (asoc->temp)
787 return;
788
Linus Torvalds1da177e2005-04-16 15:20:36 -0700789 sctp_local_bh_disable();
790 __sctp_unhash_established(asoc);
791 sctp_local_bh_enable();
792}
793
794/* Look up an association. */
795static struct sctp_association *__sctp_lookup_association(
796 const union sctp_addr *local,
797 const union sctp_addr *peer,
798 struct sctp_transport **pt)
799{
800 struct sctp_hashbucket *head;
801 struct sctp_ep_common *epb;
802 struct sctp_association *asoc;
803 struct sctp_transport *transport;
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500804 struct hlist_node *node;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700805 int hash;
806
807 /* Optimize here for direct hit, only listening connections can
808 * have wildcards anyways.
809 */
Al Viroe2fcced2006-11-20 17:08:41 -0800810 hash = sctp_assoc_hashfn(ntohs(local->v4.sin_port), ntohs(peer->v4.sin_port));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700811 head = &sctp_assoc_hashtable[hash];
812 read_lock(&head->lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -0500813 sctp_for_each_hentry(epb, node, &head->chain) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814 asoc = sctp_assoc(epb);
815 transport = sctp_assoc_is_match(asoc, local, peer);
816 if (transport)
817 goto hit;
818 }
819
820 read_unlock(&head->lock);
821
822 return NULL;
823
824hit:
825 *pt = transport;
826 sctp_association_hold(asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700827 read_unlock(&head->lock);
828 return asoc;
829}
830
831/* Look up an association. BH-safe. */
832SCTP_STATIC
833struct sctp_association *sctp_lookup_association(const union sctp_addr *laddr,
834 const union sctp_addr *paddr,
835 struct sctp_transport **transportp)
836{
837 struct sctp_association *asoc;
838
839 sctp_local_bh_disable();
840 asoc = __sctp_lookup_association(laddr, paddr, transportp);
841 sctp_local_bh_enable();
842
843 return asoc;
844}
845
/* Report whether an association exists for the given local and peer
 * addresses.  Returns 1 if one is found, 0 otherwise.
 */
int sctp_has_association(const union sctp_addr *laddr,
			 const union sctp_addr *paddr)
{
	struct sctp_transport *transport;
	struct sctp_association *asoc;

	asoc = sctp_lookup_association(laddr, paddr, &transport);
	if (!asoc)
		return 0;

	/* Only existence matters; drop the reference the lookup took. */
	sctp_association_put(asoc);
	return 1;
}
860
861/*
862 * SCTP Implementors Guide, 2.18 Handling of address
863 * parameters within the INIT or INIT-ACK.
864 *
865 * D) When searching for a matching TCB upon reception of an INIT
866 * or INIT-ACK chunk the receiver SHOULD use not only the
867 * source address of the packet (containing the INIT or
868 * INIT-ACK) but the receiver SHOULD also use all valid
869 * address parameters contained within the chunk.
870 *
871 * 2.18.3 Solution description
872 *
873 * This new text clearly specifies to an implementor the need
874 * to look within the INIT or INIT-ACK. Any implementation that
875 * does not do this, may not be able to establish associations
876 * in certain circumstances.
877 *
878 */
879static struct sctp_association *__sctp_rcv_init_lookup(struct sk_buff *skb,
880 const union sctp_addr *laddr, struct sctp_transport **transportp)
881{
882 struct sctp_association *asoc;
883 union sctp_addr addr;
884 union sctp_addr *paddr = &addr;
Arnaldo Carvalho de Melo2c0fd382007-03-13 13:59:32 -0300885 struct sctphdr *sh = sctp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700886 sctp_chunkhdr_t *ch;
887 union sctp_params params;
888 sctp_init_chunk_t *init;
889 struct sctp_transport *transport;
890 struct sctp_af *af;
891
892 ch = (sctp_chunkhdr_t *) skb->data;
893
Linus Torvalds1da177e2005-04-16 15:20:36 -0700894 /* The code below will attempt to walk the chunk and extract
895 * parameter information. Before we do that, we need to verify
896 * that the chunk length doesn't cause overflow. Otherwise, we'll
897 * walk off the end.
898 */
899 if (WORD_ROUND(ntohs(ch->length)) > skb->len)
900 return NULL;
901
902 /*
903 * This code will NOT touch anything inside the chunk--it is
904 * strictly READ-ONLY.
905 *
906 * RFC 2960 3 SCTP packet Format
907 *
908 * Multiple chunks can be bundled into one SCTP packet up to
909 * the MTU size, except for the INIT, INIT ACK, and SHUTDOWN
910 * COMPLETE chunks. These chunks MUST NOT be bundled with any
911 * other chunk in a packet. See Section 6.10 for more details
912 * on chunk bundling.
913 */
914
915 /* Find the start of the TLVs and the end of the chunk. This is
916 * the region we search for address parameters.
917 */
918 init = (sctp_init_chunk_t *)skb->data;
919
920 /* Walk the parameters looking for embedded addresses. */
921 sctp_walk_params(params, init, init_hdr.params) {
922
923 /* Note: Ignoring hostname addresses. */
924 af = sctp_get_af_specific(param_type2af(params.p->type));
925 if (!af)
926 continue;
927
Al Virodd86d132006-11-20 17:11:13 -0800928 af->from_addr_param(paddr, params.addr, sh->source, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700929
Al Virodd86d132006-11-20 17:11:13 -0800930 asoc = __sctp_lookup_association(laddr, paddr, &transport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931 if (asoc)
932 return asoc;
933 }
934
935 return NULL;
936}
937
Vlad Yasevichbbd0d592007-10-03 17:51:34 -0700938/* SCTP-AUTH, Section 6.3:
939* If the receiver does not find a STCB for a packet containing an AUTH
940* chunk as the first chunk and not a COOKIE-ECHO chunk as the second
941* chunk, it MUST use the chunks after the AUTH chunk to look up an existing
942* association.
943*
944* This means that any chunks that can help us identify the association need
945* to be looked at to find this assocation.
946*
947* TODO: The only chunk currently defined that can do that is ASCONF, but we
948* don't support that functionality yet.
949*/
950static struct sctp_association *__sctp_rcv_auth_lookup(struct sk_buff *skb,
951 const union sctp_addr *paddr,
952 const union sctp_addr *laddr,
953 struct sctp_transport **transportp)
954{
955 /* XXX - walk through the chunks looking for something that can
956 * help us find the association. INIT, and INIT-ACK are not permitted.
957 * That leaves ASCONF, but we don't support that yet.
958 */
959 return NULL;
960}
961
962/*
963 * There are circumstances when we need to look inside the SCTP packet
964 * for information to help us find the association. Examples
965 * include looking inside of INIT/INIT-ACK chunks or after the AUTH
966 * chunks.
967 */
968static struct sctp_association *__sctp_rcv_lookup_harder(struct sk_buff *skb,
969 const union sctp_addr *paddr,
970 const union sctp_addr *laddr,
971 struct sctp_transport **transportp)
972{
973 sctp_chunkhdr_t *ch;
974
975 ch = (sctp_chunkhdr_t *) skb->data;
976
977 /* If this is INIT/INIT-ACK look inside the chunk too. */
978 switch (ch->type) {
979 case SCTP_CID_INIT:
980 case SCTP_CID_INIT_ACK:
981 return __sctp_rcv_init_lookup(skb, laddr, transportp);
982 break;
983
984 case SCTP_CID_AUTH:
985 return __sctp_rcv_auth_lookup(skb, paddr, laddr, transportp);
986 break;
987 }
988
989 return NULL;
990}
991
/* Find the association an inbound skb belongs to.
 *
 * The packet's own local/peer address pair is tried first.  If that
 * misses, fall back to inspecting the packet contents (SCTP Implementors
 * Guide, 2.18 Handling of address parameters within the INIT or
 * INIT-ACK).  Returns the association found, or NULL.
 */
static struct sctp_association *__sctp_rcv_lookup(struct sk_buff *skb,
				      const union sctp_addr *paddr,
				      const union sctp_addr *laddr,
				      struct sctp_transport **transportp)
{
	struct sctp_association *direct;

	direct = __sctp_lookup_association(laddr, paddr, transportp);
	if (direct)
		return direct;

	return __sctp_rcv_lookup_harder(skb, paddr, laddr, transportp);
}