blob: 35928fefae3327f97688f0857de63bc17e3429d6 [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0-or-later
/* SCTP kernel implementation
 * (C) Copyright IBM Corp. 2001, 2004
 * Copyright (c) 1999-2000 Cisco, Inc.
 * Copyright (c) 1999-2001 Motorola, Inc.
 * Copyright (c) 2001 Intel Corp.
 * Copyright (c) 2001 Nokia, Inc.
 * Copyright (c) 2001 La Monte H.P. Yarroll
 *
 * This file is part of the SCTP kernel implementation
 *
 * Initialization/cleanup for SCTP protocol support.
 *
 * Please send any bug reports or fixes you make to the
 * email address(es):
 *    lksctp developers <linux-sctp@vger.kernel.org>
 *
 * Written or modified by:
 *    La Monte H.P. Yarroll <piggy@acm.org>
 *    Karl Knutson          <karl@athena.chicago.il.us>
 *    Jon Grimm             <jgrimm@us.ibm.com>
 *    Sridhar Samudrala     <sri@us.ibm.com>
 *    Daisy Chang           <daisyc@us.ibm.com>
 *    Ardelle Fan           <ardelle.fan@intel.com>
 */
26
Joe Perches145ce502010-08-24 13:21:08 +000027#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
28
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include <linux/module.h>
30#include <linux/init.h>
31#include <linux/netdevice.h>
32#include <linux/inetdevice.h>
33#include <linux/seq_file.h>
Mike Rapoport57c8a662018-10-30 15:09:49 -070034#include <linux/memblock.h>
Vlad Yasevich845525a2008-07-18 23:08:21 -070035#include <linux/highmem.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090036#include <linux/slab.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020037#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070038#include <net/protocol.h>
39#include <net/ip.h>
40#include <net/ipv6.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020041#include <net/route.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <net/sctp/sctp.h>
43#include <net/addrconf.h>
44#include <net/inet_common.h>
45#include <net/inet_ecn.h>
Xin Long965ae442020-10-29 15:04:58 +080046#include <net/udp_tunnel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047
Neil Hormand9749fb2016-02-18 16:10:57 -050048#define MAX_SCTP_PORT_HASH_ENTRIES (64 * 1024)
49
Linus Torvalds1da177e2005-04-16 15:20:36 -070050/* Global data structures. */
Brian Haley4cbf1ca2006-09-18 00:04:22 -070051struct sctp_globals sctp_globals __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070052
53struct idr sctp_assocs_id;
54DEFINE_SPINLOCK(sctp_assocs_id_lock);
55
Linus Torvalds1da177e2005-04-16 15:20:36 -070056static struct sctp_pf *sctp_pf_inet6_specific;
57static struct sctp_pf *sctp_pf_inet_specific;
58static struct sctp_af *sctp_af_v4_specific;
59static struct sctp_af *sctp_af_v6_specific;
60
Christoph Lametere18b8902006-12-06 20:33:20 -080061struct kmem_cache *sctp_chunk_cachep __read_mostly;
62struct kmem_cache *sctp_bucket_cachep __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070063
Eric Dumazet8d987e52010-11-09 23:24:26 +000064long sysctl_sctp_mem[3];
Vlad Yasevich007e3932007-09-16 16:04:37 -070065int sysctl_sctp_rmem[3];
66int sysctl_sctp_wmem[3];
Neil Horman4d93df02007-08-15 16:07:44 -070067
Linus Torvalds1da177e2005-04-16 15:20:36 -070068/* Private helper to extract ipv4 address and stash them in
69 * the protocol structure.
70 */
71static void sctp_v4_copy_addrlist(struct list_head *addrlist,
72 struct net_device *dev)
73{
74 struct in_device *in_dev;
75 struct in_ifaddr *ifa;
76 struct sctp_sockaddr_entry *addr;
77
78 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -070079 if ((in_dev = __in_dev_get_rcu(dev)) == NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 rcu_read_unlock();
81 return;
82 }
83
Florian Westphalcd5a4112019-05-31 18:27:07 +020084 in_dev_for_each_ifa_rcu(ifa, in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070085 /* Add the address to the local list. */
Daniel Borkmann939cfa72013-06-17 11:40:04 +020086 addr = kzalloc(sizeof(*addr), GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -070087 if (addr) {
Al Viro2a6fd782006-11-20 17:04:42 -080088 addr->a.v4.sin_family = AF_INET;
Al Viro2a6fd782006-11-20 17:04:42 -080089 addr->a.v4.sin_addr.s_addr = ifa->ifa_local;
Vlad Yasevich29303542007-09-16 16:02:12 -070090 addr->valid = 1;
91 INIT_LIST_HEAD(&addr->list);
Linus Torvalds1da177e2005-04-16 15:20:36 -070092 list_add_tail(&addr->list, addrlist);
93 }
94 }
95
96 rcu_read_unlock();
97}
98
99/* Extract our IP addresses from the system and stash them in the
100 * protocol structure.
101 */
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000102static void sctp_get_local_addr_list(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103{
104 struct net_device *dev;
105 struct list_head *pos;
106 struct sctp_af *af;
107
Eric Dumazetc6d14c82009-11-04 05:43:23 -0800108 rcu_read_lock();
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000109 for_each_netdev_rcu(net, dev) {
Dave Jones2c0740e2013-06-17 22:26:52 -0400110 list_for_each(pos, &sctp_address_families) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 af = list_entry(pos, struct sctp_af, list);
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000112 af->copy_addrlist(&net->sctp.local_addr_list, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113 }
114 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -0800115 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116}
117
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118/* Free the existing local addresses. */
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000119static void sctp_free_local_addr_list(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120{
121 struct sctp_sockaddr_entry *addr;
122 struct list_head *pos, *temp;
123
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000124 list_for_each_safe(pos, temp, &net->sctp.local_addr_list) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125 addr = list_entry(pos, struct sctp_sockaddr_entry, list);
126 list_del(pos);
127 kfree(addr);
128 }
129}
130
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131/* Copy the local addresses which are valid for 'scope' into 'bp'. */
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000132int sctp_copy_local_addr_list(struct net *net, struct sctp_bind_addr *bp,
Xin Long1c662012017-08-05 19:59:54 +0800133 enum sctp_scope scope, gfp_t gfp, int copy_flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134{
135 struct sctp_sockaddr_entry *addr;
Xin Long2e3ce5b2017-02-24 15:18:46 +0800136 union sctp_addr laddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 int error = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138
Vlad Yasevich29303542007-09-16 16:02:12 -0700139 rcu_read_lock();
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000140 list_for_each_entry_rcu(addr, &net->sctp.local_addr_list, list) {
Vlad Yasevich29303542007-09-16 16:02:12 -0700141 if (!addr->valid)
142 continue;
Xin Long165f2cf2016-12-20 13:49:49 +0800143 if (!sctp_in_scope(net, &addr->a, scope))
144 continue;
145
146 /* Now that the address is in scope, check to see if
147 * the address type is really supported by the local
148 * sock as well as the remote peer.
149 */
150 if (addr->a.sa.sa_family == AF_INET &&
Marcelo Ricardo Leitner471e39d2020-06-24 17:34:18 -0300151 (!(copy_flags & SCTP_ADDR4_ALLOWED) ||
152 !(copy_flags & SCTP_ADDR4_PEERSUPP)))
Xin Long165f2cf2016-12-20 13:49:49 +0800153 continue;
154 if (addr->a.sa.sa_family == AF_INET6 &&
155 (!(copy_flags & SCTP_ADDR6_ALLOWED) ||
156 !(copy_flags & SCTP_ADDR6_PEERSUPP)))
157 continue;
158
Xin Long2e3ce5b2017-02-24 15:18:46 +0800159 laddr = addr->a;
160 /* also works for setting ipv6 address port */
161 laddr.v4.sin_port = htons(bp->port);
162 if (sctp_bind_addr_state(bp, &laddr) != -1)
Xin Longb8607802016-12-20 13:49:50 +0800163 continue;
164
Xin Long165f2cf2016-12-20 13:49:49 +0800165 error = sctp_add_bind_addr(bp, &addr->a, sizeof(addr->a),
166 SCTP_ADDR_SRC, GFP_ATOMIC);
167 if (error)
168 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169 }
170
Vlad Yasevich29303542007-09-16 16:02:12 -0700171 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 return error;
173}
174
Richard Hainesb7e10c22018-02-24 16:18:51 +0000175/* Copy over any ip options */
176static void sctp_v4_copy_ip_options(struct sock *sk, struct sock *newsk)
177{
178 struct inet_sock *newinet, *inet = inet_sk(sk);
179 struct ip_options_rcu *inet_opt, *newopt = NULL;
180
181 newinet = inet_sk(newsk);
182
183 rcu_read_lock();
184 inet_opt = rcu_dereference(inet->inet_opt);
185 if (inet_opt) {
186 newopt = sock_kmalloc(newsk, sizeof(*inet_opt) +
187 inet_opt->opt.optlen, GFP_ATOMIC);
188 if (newopt)
189 memcpy(newopt, inet_opt, sizeof(*inet_opt) +
190 inet_opt->opt.optlen);
191 else
192 pr_err("%s: Failed to copy ip options\n", __func__);
193 }
194 RCU_INIT_POINTER(newinet->inet_opt, newopt);
195 rcu_read_unlock();
196}
197
198/* Account for the IP options */
199static int sctp_v4_ip_options_len(struct sock *sk)
200{
201 struct inet_sock *inet = inet_sk(sk);
202 struct ip_options_rcu *inet_opt;
203 int len = 0;
204
205 rcu_read_lock();
206 inet_opt = rcu_dereference(inet->inet_opt);
207 if (inet_opt)
208 len = inet_opt->opt.optlen;
209
210 rcu_read_unlock();
211 return len;
212}
213
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214/* Initialize a sctp_addr from in incoming skb. */
215static void sctp_v4_from_skb(union sctp_addr *addr, struct sk_buff *skb,
216 int is_saddr)
217{
Marcelo Ricardo Leitner0630c562016-12-28 09:26:33 -0200218 /* Always called on head skb, so this is safe */
219 struct sctphdr *sh = sctp_hdr(skb);
220 struct sockaddr_in *sa = &addr->v4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222 addr->v4.sin_family = AF_INET;
223
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224 if (is_saddr) {
Marcelo Ricardo Leitner0630c562016-12-28 09:26:33 -0200225 sa->sin_port = sh->source;
226 sa->sin_addr.s_addr = ip_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 } else {
Marcelo Ricardo Leitner0630c562016-12-28 09:26:33 -0200228 sa->sin_port = sh->dest;
229 sa->sin_addr.s_addr = ip_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 }
Xin Longb6f33202019-12-09 13:45:54 +0800231 memset(sa->sin_zero, 0, sizeof(sa->sin_zero));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232}
233
234/* Initialize an sctp_addr from a socket. */
235static void sctp_v4_from_sk(union sctp_addr *addr, struct sock *sk)
236{
237 addr->v4.sin_family = AF_INET;
Al Viro7dcdbd92006-11-20 17:24:21 -0800238 addr->v4.sin_port = 0;
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000239 addr->v4.sin_addr.s_addr = inet_sk(sk)->inet_rcv_saddr;
Xin Longb6f33202019-12-09 13:45:54 +0800240 memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241}
242
243/* Initialize sk->sk_rcv_saddr from sctp_addr. */
244static void sctp_v4_to_sk_saddr(union sctp_addr *addr, struct sock *sk)
245{
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000246 inet_sk(sk)->inet_rcv_saddr = addr->v4.sin_addr.s_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247}
248
249/* Initialize sk->sk_daddr from sctp_addr. */
250static void sctp_v4_to_sk_daddr(union sctp_addr *addr, struct sock *sk)
251{
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000252 inet_sk(sk)->inet_daddr = addr->v4.sin_addr.s_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253}
254
255/* Initialize a sctp_addr from an address parameter. */
Marcelo Ricardo Leitner0c5dc072021-06-28 16:13:41 -0300256static bool sctp_v4_from_addr_param(union sctp_addr *addr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257 union sctp_addr_param *param,
Al Virodd86d132006-11-20 17:11:13 -0800258 __be16 port, int iif)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259{
Marcelo Ricardo Leitner0c5dc072021-06-28 16:13:41 -0300260 if (ntohs(param->v4.param_hdr.length) < sizeof(struct sctp_ipv4addr_param))
261 return false;
262
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 addr->v4.sin_family = AF_INET;
264 addr->v4.sin_port = port;
265 addr->v4.sin_addr.s_addr = param->v4.addr.s_addr;
Xin Longb6f33202019-12-09 13:45:54 +0800266 memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero));
Marcelo Ricardo Leitner0c5dc072021-06-28 16:13:41 -0300267
268 return true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269}
270
271/* Initialize an address parameter from a sctp_addr and return the length
272 * of the address parameter.
273 */
274static int sctp_v4_to_addr_param(const union sctp_addr *addr,
275 union sctp_addr_param *param)
276{
Xin Longa38905e2017-07-17 11:29:49 +0800277 int length = sizeof(struct sctp_ipv4addr_param);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278
279 param->v4.param_hdr.type = SCTP_PARAM_IPV4_ADDRESS;
Al Virodbc16db2006-11-20 17:01:42 -0800280 param->v4.param_hdr.length = htons(length);
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900281 param->v4.addr.s_addr = addr->v4.sin_addr.s_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282
283 return length;
284}
285
286/* Initialize a sctp_addr from a dst_entry. */
David S. Miller18a353f42011-05-03 20:55:05 -0700287static void sctp_v4_dst_saddr(union sctp_addr *saddr, struct flowi4 *fl4,
Al Viro854d43a2006-11-20 17:06:24 -0800288 __be16 port)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290 saddr->v4.sin_family = AF_INET;
291 saddr->v4.sin_port = port;
David S. Miller18a353f42011-05-03 20:55:05 -0700292 saddr->v4.sin_addr.s_addr = fl4->saddr;
Xin Longb6f33202019-12-09 13:45:54 +0800293 memset(saddr->v4.sin_zero, 0, sizeof(saddr->v4.sin_zero));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294}
295
296/* Compare two addresses exactly. */
297static int sctp_v4_cmp_addr(const union sctp_addr *addr1,
298 const union sctp_addr *addr2)
299{
300 if (addr1->sa.sa_family != addr2->sa.sa_family)
301 return 0;
302 if (addr1->v4.sin_port != addr2->v4.sin_port)
303 return 0;
304 if (addr1->v4.sin_addr.s_addr != addr2->v4.sin_addr.s_addr)
305 return 0;
306
307 return 1;
308}
309
310/* Initialize addr struct to INADDR_ANY. */
Al Viro6fbfa9f2006-11-20 17:24:53 -0800311static void sctp_v4_inaddr_any(union sctp_addr *addr, __be16 port)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312{
313 addr->v4.sin_family = AF_INET;
Al Viroe6f1ceb2008-03-17 22:44:53 -0700314 addr->v4.sin_addr.s_addr = htonl(INADDR_ANY);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 addr->v4.sin_port = port;
Xin Longb6f33202019-12-09 13:45:54 +0800316 memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317}
318
319/* Is this a wildcard address? */
320static int sctp_v4_is_any(const union sctp_addr *addr)
321{
Al Viroe6f1ceb2008-03-17 22:44:53 -0700322 return htonl(INADDR_ANY) == addr->v4.sin_addr.s_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323}
324
325/* This function checks if the address is a valid address to be used for
326 * SCTP binding.
327 *
328 * Output:
329 * Return 0 - If the address is a non-unicast or an illegal address.
330 * Return 1 - If the address is a unicast.
331 */
Vlad Yasevich5636bef2006-06-17 22:55:35 -0700332static int sctp_v4_addr_valid(union sctp_addr *addr,
333 struct sctp_sock *sp,
334 const struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335{
Vlad Yasevich7dab83d2008-07-18 23:05:40 -0700336 /* IPv4 addresses not allowed */
337 if (sp && ipv6_only_sock(sctp_opt2sk(sp)))
338 return 0;
339
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340 /* Is this a non-unicast address or a unusable SCTP address? */
Joe Perchesb5cb2bb2007-12-16 13:46:59 -0800341 if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 return 0;
343
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900344 /* Is this a broadcast address? */
Eric Dumazet511c3f92009-06-02 05:14:27 +0000345 if (skb && skb_rtable(skb)->rt_flags & RTCF_BROADCAST)
YOSHIFUJI Hideakid808ad92007-02-09 23:25:18 +0900346 return 0;
Vlad Yasevich5636bef2006-06-17 22:55:35 -0700347
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 return 1;
349}
350
351/* Should this be available for binding? */
352static int sctp_v4_available(union sctp_addr *addr, struct sctp_sock *sp)
353{
Eric W. Biedermanbb2db452012-08-06 08:46:26 +0000354 struct net *net = sock_net(&sp->inet.sk);
355 int ret = inet_addr_type(net, addr->v4.sin_addr.s_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357
Al Viroe6f1ceb2008-03-17 22:44:53 -0700358 if (addr->v4.sin_addr.s_addr != htonl(INADDR_ANY) &&
Neil Hormancdac4e02005-06-13 15:12:33 -0700359 ret != RTN_LOCAL &&
360 !sp->inet.freebind &&
Vincent Bernat49a60152014-09-05 15:09:03 +0200361 !net->ipv4.sysctl_ip_nonlocal_bind)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 return 0;
Neil Hormancdac4e02005-06-13 15:12:33 -0700363
Vlad Yasevich7dab83d2008-07-18 23:05:40 -0700364 if (ipv6_only_sock(sctp_opt2sk(sp)))
365 return 0;
366
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367 return 1;
368}
369
370/* Checking the loopback, private and other address scopes as defined in
371 * RFC 1918. The IPv4 scoping is based on the draft for SCTP IPv4
372 * scoping <draft-stewart-tsvwg-sctp-ipv4-00.txt>.
373 *
374 * Level 0 - unusable SCTP addresses
375 * Level 1 - loopback address
376 * Level 2 - link-local addresses
377 * Level 3 - private addresses.
378 * Level 4 - global addresses
379 * For INIT and INIT-ACK address list, let L be the level of
Randy Dunlap93c32162020-08-22 16:15:59 -0700380 * requested destination address, sender and receiver
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 * SHOULD include all of its addresses with level greater
382 * than or equal to L.
Bhaskar Dutta72388432009-09-03 17:25:47 +0530383 *
384 * IPv4 scoping can be controlled through sysctl option
385 * net.sctp.addr_scope_policy
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 */
Xin Long1c662012017-08-05 19:59:54 +0800387static enum sctp_scope sctp_v4_scope(union sctp_addr *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388{
Xin Long1c662012017-08-05 19:59:54 +0800389 enum sctp_scope retval;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391 /* Check for unusable SCTP addresses. */
Joe Perchesb5cb2bb2007-12-16 13:46:59 -0800392 if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393 retval = SCTP_SCOPE_UNUSABLE;
Joe Perchesb5cb2bb2007-12-16 13:46:59 -0800394 } else if (ipv4_is_loopback(addr->v4.sin_addr.s_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 retval = SCTP_SCOPE_LOOPBACK;
Joe Perchesb5cb2bb2007-12-16 13:46:59 -0800396 } else if (ipv4_is_linklocal_169(addr->v4.sin_addr.s_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 retval = SCTP_SCOPE_LINK;
Joe Perchesb5cb2bb2007-12-16 13:46:59 -0800398 } else if (ipv4_is_private_10(addr->v4.sin_addr.s_addr) ||
399 ipv4_is_private_172(addr->v4.sin_addr.s_addr) ||
Xin Long1d11fa22021-06-29 23:34:08 -0400400 ipv4_is_private_192(addr->v4.sin_addr.s_addr) ||
401 ipv4_is_test_198(addr->v4.sin_addr.s_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402 retval = SCTP_SCOPE_PRIVATE;
403 } else {
404 retval = SCTP_SCOPE_GLOBAL;
405 }
406
407 return retval;
408}
409
410/* Returns a valid dst cache entry for the given source and destination ip
411 * addresses. If an association is passed, trys to get a dst entry with a
412 * source address that matches an address in the bind address list.
413 */
Vlad Yasevichda0420b2011-04-26 21:54:17 +0000414static void sctp_v4_get_dst(struct sctp_transport *t, union sctp_addr *saddr,
415 struct flowi *fl, struct sock *sk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416{
Vlad Yasevichda0420b2011-04-26 21:54:17 +0000417 struct sctp_association *asoc = t->asoc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700418 struct rtable *rt;
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300419 struct flowi _fl;
420 struct flowi4 *fl4 = &_fl.u.ip4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 struct sctp_bind_addr *bp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 struct sctp_sockaddr_entry *laddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423 struct dst_entry *dst = NULL;
Vlad Yasevichda0420b2011-04-26 21:54:17 +0000424 union sctp_addr *daddr = &t->ipaddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425 union sctp_addr dst_saddr;
Xin Long8a9c58d2018-07-02 18:21:12 +0800426 __u8 tos = inet_sk(sk)->tos;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700427
Xin Long8a9c58d2018-07-02 18:21:12 +0800428 if (t->dscp & SCTP_DSCP_SET_MASK)
429 tos = t->dscp & SCTP_DSCP_VAL_MASK;
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300430 memset(&_fl, 0x0, sizeof(_fl));
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000431 fl4->daddr = daddr->v4.sin_addr.s_addr;
432 fl4->fl4_dport = daddr->v4.sin_port;
433 fl4->flowi4_proto = IPPROTO_SCTP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700434 if (asoc) {
Xin Long8a9c58d2018-07-02 18:21:12 +0800435 fl4->flowi4_tos = RT_CONN_FLAGS_TOS(asoc->base.sk, tos);
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000436 fl4->flowi4_oif = asoc->base.sk->sk_bound_dev_if;
437 fl4->fl4_sport = htons(asoc->base.bind_addr.port);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700438 }
Wei Yongjun6429d3d2010-04-30 21:42:44 -0400439 if (saddr) {
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000440 fl4->saddr = saddr->v4.sin_addr.s_addr;
Xin Longecf938f2019-01-22 02:42:41 +0800441 if (!fl4->fl4_sport)
442 fl4->fl4_sport = saddr->v4.sin_port;
Wei Yongjun6429d3d2010-04-30 21:42:44 -0400443 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444
Daniel Borkmannbb333812013-06-28 19:49:40 +0200445 pr_debug("%s: dst:%pI4, src:%pI4 - ", __func__, &fl4->daddr,
446 &fl4->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447
Eric W. Biedermanbb2db452012-08-06 08:46:26 +0000448 rt = ip_route_output_key(sock_net(sk), fl4);
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300449 if (!IS_ERR(rt)) {
Changli Gaod8d1f302010-06-10 23:31:35 -0700450 dst = &rt->dst;
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300451 t->dst = dst;
452 memcpy(fl, &_fl, sizeof(_fl));
453 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454
455 /* If there is no association or if a source address is passed, no
456 * more validation is required.
457 */
458 if (!asoc || saddr)
459 goto out;
460
461 bp = &asoc->base.bind_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462
463 if (dst) {
464 /* Walk through the bind address list and look for a bind
465 * address that matches the source address of the returned dst.
466 */
David S. Miller18a353f42011-05-03 20:55:05 -0700467 sctp_v4_dst_saddr(&dst_saddr, fl4, htons(bp->port));
Vlad Yasevich559cf712007-09-16 16:03:28 -0700468 rcu_read_lock();
469 list_for_each_entry_rcu(laddr, &bp->address_list, list) {
Michio Honda8a07eb02011-04-26 20:19:36 +0900470 if (!laddr->valid || (laddr->state == SCTP_ADDR_DEL) ||
471 (laddr->state != SCTP_ADDR_SRC &&
472 !asoc->src_out_of_asoc_ok))
Sridhar Samudraladc022a92006-07-21 14:49:25 -0700473 continue;
Al Viro854d43a2006-11-20 17:06:24 -0800474 if (sctp_v4_cmp_addr(&dst_saddr, &laddr->a))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700475 goto out_unlock;
476 }
Vlad Yasevich559cf712007-09-16 16:03:28 -0700477 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478
479 /* None of the bound addresses match the source address of the
480 * dst. So release it.
481 */
482 dst_release(dst);
483 dst = NULL;
484 }
485
486 /* Walk through the bind address list and try to get a dst that
487 * matches a bind address as the source address.
488 */
Vlad Yasevich559cf712007-09-16 16:03:28 -0700489 rcu_read_lock();
490 list_for_each_entry_rcu(laddr, &bp->address_list, list) {
Marcelo Ricardo Leitner0ca50d12015-07-17 12:34:18 -0300491 struct net_device *odev;
492
Vlad Yasevich559cf712007-09-16 16:03:28 -0700493 if (!laddr->valid)
494 continue;
Marcelo Ricardo Leitner07868282015-07-17 12:34:17 -0300495 if (laddr->state != SCTP_ADDR_SRC ||
496 AF_INET != laddr->a.sa.sa_family)
497 continue;
Xufeng Zhang85350872014-04-25 16:55:41 +0800498
Marcelo Ricardo Leitner07868282015-07-17 12:34:17 -0300499 fl4->fl4_sport = laddr->a.v4.sin_port;
500 flowi4_update_output(fl4,
501 asoc->base.sk->sk_bound_dev_if,
Xin Long8a9c58d2018-07-02 18:21:12 +0800502 RT_CONN_FLAGS_TOS(asoc->base.sk, tos),
Marcelo Ricardo Leitner07868282015-07-17 12:34:17 -0300503 daddr->v4.sin_addr.s_addr,
504 laddr->a.v4.sin_addr.s_addr);
505
506 rt = ip_route_output_key(sock_net(sk), fl4);
507 if (IS_ERR(rt))
508 continue;
509
Marcelo Ricardo Leitner0ca50d12015-07-17 12:34:18 -0300510 /* Ensure the src address belongs to the output
511 * interface.
512 */
513 odev = __ip_dev_find(sock_net(sk), laddr->a.v4.sin_addr.s_addr,
514 false);
Marcelo Ricardo Leitnerd82f0f1f2015-09-02 16:20:21 -0300515 if (!odev || odev->ifindex != fl4->flowi4_oif) {
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300516 if (!dst) {
Tommi Rantala4a31a6b2018-02-05 21:48:14 +0200517 dst = &rt->dst;
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300518 t->dst = dst;
519 memcpy(fl, &_fl, sizeof(_fl));
520 } else {
Marcelo Ricardo Leitner410f0382015-09-02 16:20:22 -0300521 dst_release(&rt->dst);
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300522 }
Marcelo Ricardo Leitner0ca50d12015-07-17 12:34:18 -0300523 continue;
Marcelo Ricardo Leitnerd82f0f1f2015-09-02 16:20:21 -0300524 }
Marcelo Ricardo Leitner0ca50d12015-07-17 12:34:18 -0300525
Tommi Rantala4a31a6b2018-02-05 21:48:14 +0200526 dst_release(dst);
Marcelo Ricardo Leitner07868282015-07-17 12:34:17 -0300527 dst = &rt->dst;
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300528 t->dst = dst;
529 memcpy(fl, &_fl, sizeof(_fl));
Marcelo Ricardo Leitner07868282015-07-17 12:34:17 -0300530 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700531 }
532
533out_unlock:
Vlad Yasevich559cf712007-09-16 16:03:28 -0700534 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535out:
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300536 if (dst) {
Daniel Borkmannbb333812013-06-28 19:49:40 +0200537 pr_debug("rt_dst:%pI4, rt_src:%pI4\n",
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300538 &fl->u.ip4.daddr, &fl->u.ip4.saddr);
539 } else {
540 t->dst = NULL;
Daniel Borkmannbb333812013-06-28 19:49:40 +0200541 pr_debug("no route\n");
Marcelo Ricardo Leitner582eea22020-03-26 20:47:46 -0300542 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700543}
544
545/* For v4, the source address is cached in the route entry(dst). So no need
546 * to cache it separately and hence this is an empty routine.
547 */
YOSHIFUJI Hideakie5117102008-05-29 19:55:05 +0900548static void sctp_v4_get_saddr(struct sctp_sock *sk,
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000549 struct sctp_transport *t,
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000550 struct flowi *fl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551{
Vlad Yasevich9914ae32011-04-26 21:51:31 +0000552 union sctp_addr *saddr = &t->saddr;
553 struct rtable *rt = (struct rtable *)t->dst;
Vladislav Yasevich23ec47a2005-11-11 16:05:55 -0800554
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 if (rt) {
556 saddr->v4.sin_family = AF_INET;
David S. Miller902ebd32011-05-09 14:49:13 -0700557 saddr->v4.sin_addr.s_addr = fl->u.ip4.saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700558 }
559}
560
/* What interface did this skb arrive on?  Returns inet_iif() for 'skb'. */
static int sctp_v4_skb_iif(const struct sk_buff *skb)
{
	int ifindex = inet_iif(skb);

	return ifindex;
}
566
567/* Was this packet marked by Explicit Congestion Notification? */
568static int sctp_v4_is_ce(const struct sk_buff *skb)
569{
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700570 return INET_ECN_is_ce(ip_hdr(skb)->tos);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571}
572
573/* Create and initialize a new sk for the socket returned by accept(). */
574static struct sock *sctp_v4_create_accept_sk(struct sock *sk,
David Howellscdfbabf2017-03-09 08:09:05 +0000575 struct sctp_association *asoc,
576 bool kern)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900578 struct sock *newsk = sk_alloc(sock_net(sk), PF_INET, GFP_KERNEL,
David Howellscdfbabf2017-03-09 08:09:05 +0000579 sk->sk_prot, kern);
Vlad Yasevich914e1c82009-02-13 08:33:44 +0000580 struct inet_sock *newinet;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700581
582 if (!newsk)
583 goto out;
584
585 sock_init_data(NULL, newsk);
586
Vlad Yasevich914e1c82009-02-13 08:33:44 +0000587 sctp_copy_sock(newsk, sk, asoc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 sock_reset_flag(newsk, SOCK_ZAPPED);
589
Richard Hainesb7e10c22018-02-24 16:18:51 +0000590 sctp_v4_copy_ip_options(sk, newsk);
591
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592 newinet = inet_sk(newsk);
593
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000594 newinet->inet_daddr = asoc->peer.primary_addr.v4.sin_addr.s_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -0700596 sk_refcnt_debug_inc(newsk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597
598 if (newsk->sk_prot->init(newsk)) {
599 sk_common_release(newsk);
600 newsk = NULL;
601 }
602
603out:
604 return newsk;
605}
606
Jason Gunthorpe299ee122014-07-30 12:40:53 -0600607static int sctp_v4_addr_to_user(struct sctp_sock *sp, union sctp_addr *addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700608{
Jason Gunthorpe299ee122014-07-30 12:40:53 -0600609 /* No address mapping for V4 sockets */
Xin Long09279e62019-03-31 16:58:15 +0800610 memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero));
Jason Gunthorpe299ee122014-07-30 12:40:53 -0600611 return sizeof(struct sockaddr_in);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700612}
613
614/* Dump the v4 addr to the seq file. */
615static void sctp_v4_seq_dump_addr(struct seq_file *seq, union sctp_addr *addr)
616{
Harvey Harrison21454aa2008-10-31 00:54:56 -0700617 seq_printf(seq, "%pI4 ", &addr->v4.sin_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618}
619
/* IPv4 ecn_capable hook: applies INET_ECN_xmit() to the socket. */
static void sctp_v4_ecn_capable(struct sock *sk)
{
	INET_ECN_xmit(sk);
}
624
Kees Cook9c3b5752017-10-24 01:45:31 -0700625static void sctp_addr_wq_timeout_handler(struct timer_list *t)
Michio Honda9f7d6532011-04-26 19:32:51 +0900626{
Kees Cook9c3b5752017-10-24 01:45:31 -0700627 struct net *net = from_timer(net, t, sctp.addr_wq_timer);
Michio Honda9f7d6532011-04-26 19:32:51 +0900628 struct sctp_sockaddr_entry *addrw, *temp;
629 struct sctp_sock *sp;
630
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000631 spin_lock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900632
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000633 list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) {
Daniel Borkmannbb333812013-06-28 19:49:40 +0200634 pr_debug("%s: the first ent in wq:%p is addr:%pISc for cmd:%d at "
635 "entry:%p\n", __func__, &net->sctp.addr_waitq, &addrw->a.sa,
636 addrw->state, addrw);
Michio Honda9f7d6532011-04-26 19:32:51 +0900637
Eric Dumazetdfd56b82011-12-10 09:48:31 +0000638#if IS_ENABLED(CONFIG_IPV6)
Michio Honda9f7d6532011-04-26 19:32:51 +0900639 /* Now we send an ASCONF for each association */
640 /* Note. we currently don't handle link local IPv6 addressees */
641 if (addrw->a.sa.sa_family == AF_INET6) {
642 struct in6_addr *in6;
643
644 if (ipv6_addr_type(&addrw->a.v6.sin6_addr) &
645 IPV6_ADDR_LINKLOCAL)
646 goto free_next;
647
648 in6 = (struct in6_addr *)&addrw->a.v6.sin6_addr;
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000649 if (ipv6_chk_addr(net, in6, NULL, 0) == 0 &&
Michio Honda9f7d6532011-04-26 19:32:51 +0900650 addrw->state == SCTP_ADDR_NEW) {
651 unsigned long timeo_val;
652
Daniel Borkmannbb333812013-06-28 19:49:40 +0200653 pr_debug("%s: this is on DAD, trying %d sec "
654 "later\n", __func__,
655 SCTP_ADDRESS_TICK_DELAY);
656
Michio Honda9f7d6532011-04-26 19:32:51 +0900657 timeo_val = jiffies;
658 timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY);
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000659 mod_timer(&net->sctp.addr_wq_timer, timeo_val);
Michio Honda9f7d6532011-04-26 19:32:51 +0900660 break;
661 }
662 }
David S. Miller5d0c90c2011-06-06 13:05:55 -0700663#endif
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000664 list_for_each_entry(sp, &net->sctp.auto_asconf_splist, auto_asconf_list) {
Michio Honda9f7d6532011-04-26 19:32:51 +0900665 struct sock *sk;
666
667 sk = sctp_opt2sk(sp);
668 /* ignore bound-specific endpoints */
669 if (!sctp_is_ep_boundall(sk))
670 continue;
wangweidong5bc1d1b2014-01-21 15:44:12 +0800671 bh_lock_sock(sk);
Michio Honda9f7d6532011-04-26 19:32:51 +0900672 if (sctp_asconf_mgmt(sp, addrw) < 0)
Daniel Borkmannbb333812013-06-28 19:49:40 +0200673 pr_debug("%s: sctp_asconf_mgmt failed\n", __func__);
wangweidong5bc1d1b2014-01-21 15:44:12 +0800674 bh_unlock_sock(sk);
Michio Honda9f7d6532011-04-26 19:32:51 +0900675 }
Daniel Halperin39d84a52012-06-18 11:04:55 +0000676#if IS_ENABLED(CONFIG_IPV6)
Michio Honda9f7d6532011-04-26 19:32:51 +0900677free_next:
Daniel Halperin39d84a52012-06-18 11:04:55 +0000678#endif
Michio Honda9f7d6532011-04-26 19:32:51 +0900679 list_del(&addrw->list);
680 kfree(addrw);
681 }
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000682 spin_unlock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900683}
684
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000685static void sctp_free_addr_wq(struct net *net)
Michio Honda9f7d6532011-04-26 19:32:51 +0900686{
687 struct sctp_sockaddr_entry *addrw;
688 struct sctp_sockaddr_entry *temp;
689
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000690 spin_lock_bh(&net->sctp.addr_wq_lock);
691 del_timer(&net->sctp.addr_wq_timer);
692 list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) {
Michio Honda9f7d6532011-04-26 19:32:51 +0900693 list_del(&addrw->list);
694 kfree(addrw);
695 }
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000696 spin_unlock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900697}
698
699/* lookup the entry for the same address in the addr_waitq
700 * sctp_addr_wq MUST be locked
701 */
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000702static struct sctp_sockaddr_entry *sctp_addr_wq_lookup(struct net *net,
703 struct sctp_sockaddr_entry *addr)
Michio Honda9f7d6532011-04-26 19:32:51 +0900704{
705 struct sctp_sockaddr_entry *addrw;
706
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000707 list_for_each_entry(addrw, &net->sctp.addr_waitq, list) {
Michio Honda9f7d6532011-04-26 19:32:51 +0900708 if (addrw->a.sa.sa_family != addr->a.sa.sa_family)
709 continue;
710 if (addrw->a.sa.sa_family == AF_INET) {
711 if (addrw->a.v4.sin_addr.s_addr ==
712 addr->a.v4.sin_addr.s_addr)
713 return addrw;
714 } else if (addrw->a.sa.sa_family == AF_INET6) {
715 if (ipv6_addr_equal(&addrw->a.v6.sin6_addr,
716 &addr->a.v6.sin6_addr))
717 return addrw;
718 }
719 }
720 return NULL;
721}
722
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000723void sctp_addr_wq_mgmt(struct net *net, struct sctp_sockaddr_entry *addr, int cmd)
Michio Honda9f7d6532011-04-26 19:32:51 +0900724{
725 struct sctp_sockaddr_entry *addrw;
726 unsigned long timeo_val;
727
728 /* first, we check if an opposite message already exist in the queue.
729 * If we found such message, it is removed.
730 * This operation is a bit stupid, but the DHCP client attaches the
731 * new address after a couple of addition and deletion of that address
732 */
733
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000734 spin_lock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900735 /* Offsets existing events in addr_wq */
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000736 addrw = sctp_addr_wq_lookup(net, addr);
Michio Honda9f7d6532011-04-26 19:32:51 +0900737 if (addrw) {
738 if (addrw->state != cmd) {
Daniel Borkmannbb333812013-06-28 19:49:40 +0200739 pr_debug("%s: offsets existing entry for %d, addr:%pISc "
740 "in wq:%p\n", __func__, addrw->state, &addrw->a.sa,
741 &net->sctp.addr_waitq);
742
Michio Honda9f7d6532011-04-26 19:32:51 +0900743 list_del(&addrw->list);
744 kfree(addrw);
745 }
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000746 spin_unlock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900747 return;
748 }
749
750 /* OK, we have to add the new address to the wait queue */
751 addrw = kmemdup(addr, sizeof(struct sctp_sockaddr_entry), GFP_ATOMIC);
752 if (addrw == NULL) {
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000753 spin_unlock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900754 return;
755 }
756 addrw->state = cmd;
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000757 list_add_tail(&addrw->list, &net->sctp.addr_waitq);
Daniel Borkmannbb333812013-06-28 19:49:40 +0200758
759 pr_debug("%s: add new entry for cmd:%d, addr:%pISc in wq:%p\n",
760 __func__, addrw->state, &addrw->a.sa, &net->sctp.addr_waitq);
Michio Honda9f7d6532011-04-26 19:32:51 +0900761
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000762 if (!timer_pending(&net->sctp.addr_wq_timer)) {
Michio Honda9f7d6532011-04-26 19:32:51 +0900763 timeo_val = jiffies;
764 timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY);
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000765 mod_timer(&net->sctp.addr_wq_timer, timeo_val);
Michio Honda9f7d6532011-04-26 19:32:51 +0900766 }
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000767 spin_unlock_bh(&net->sctp.addr_wq_lock);
Michio Honda9f7d6532011-04-26 19:32:51 +0900768}
769
Vlad Yasevich29303542007-09-16 16:02:12 -0700770/* Event handler for inet address addition/deletion events.
771 * The sctp_local_addr_list needs to be protocted by a spin lock since
772 * multiple notifiers (say IPv4 and IPv6) may be running at the same
773 * time and thus corrupt the list.
774 * The reader side is protected with RCU.
775 */
Adrian Bunk24123182006-12-20 16:08:22 -0800776static int sctp_inetaddr_event(struct notifier_block *this, unsigned long ev,
777 void *ptr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700778{
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800779 struct in_ifaddr *ifa = (struct in_ifaddr *)ptr;
Vlad Yasevich29303542007-09-16 16:02:12 -0700780 struct sctp_sockaddr_entry *addr = NULL;
781 struct sctp_sockaddr_entry *temp;
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000782 struct net *net = dev_net(ifa->ifa_dev->dev);
Chidambar 'ilLogict' Zinnoury22626212008-03-11 18:05:02 -0700783 int found = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700784
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800785 switch (ev) {
786 case NETDEV_UP:
Xin Long400b8b92019-01-14 18:34:02 +0800787 addr = kzalloc(sizeof(*addr), GFP_ATOMIC);
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800788 if (addr) {
789 addr->a.v4.sin_family = AF_INET;
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800790 addr->a.v4.sin_addr.s_addr = ifa->ifa_local;
Vlad Yasevich29303542007-09-16 16:02:12 -0700791 addr->valid = 1;
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000792 spin_lock_bh(&net->sctp.local_addr_lock);
793 list_add_tail_rcu(&addr->list, &net->sctp.local_addr_list);
794 sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_NEW);
795 spin_unlock_bh(&net->sctp.local_addr_lock);
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800796 }
797 break;
798 case NETDEV_DOWN:
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000799 spin_lock_bh(&net->sctp.local_addr_lock);
Vlad Yasevich29303542007-09-16 16:02:12 -0700800 list_for_each_entry_safe(addr, temp,
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000801 &net->sctp.local_addr_list, list) {
Pavel Emelyanova40a7d12008-04-12 18:40:38 -0700802 if (addr->a.sa.sa_family == AF_INET &&
803 addr->a.v4.sin_addr.s_addr ==
804 ifa->ifa_local) {
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000805 sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_DEL);
Chidambar 'ilLogict' Zinnoury22626212008-03-11 18:05:02 -0700806 found = 1;
Vlad Yasevich29303542007-09-16 16:02:12 -0700807 addr->valid = 0;
808 list_del_rcu(&addr->list);
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800809 break;
810 }
811 }
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000812 spin_unlock_bh(&net->sctp.local_addr_lock);
Chidambar 'ilLogict' Zinnoury22626212008-03-11 18:05:02 -0700813 if (found)
Lai Jiangshan1231f0b2011-03-15 18:05:02 +0800814 kfree_rcu(addr, rcu);
Sridhar Samudrala29c7cf92006-12-13 16:26:26 -0800815 break;
816 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817
818 return NOTIFY_DONE;
819}
820
821/*
822 * Initialize the control inode/socket with a control endpoint data
823 * structure. This endpoint is reserved exclusively for the OOTB processing.
824 */
Eric W. Biederman2ce95502012-08-06 08:43:06 +0000825static int sctp_ctl_sock_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826{
827 int err;
Brian Haleyfb13d9f2009-03-04 03:20:26 -0800828 sa_family_t family = PF_INET;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700829
830 if (sctp_get_pf_specific(PF_INET6))
831 family = PF_INET6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832
Eric W. Biederman2ce95502012-08-06 08:43:06 +0000833 err = inet_ctl_sock_create(&net->sctp.ctl_sock, family,
834 SOCK_SEQPACKET, IPPROTO_SCTP, net);
Brian Haleyfb13d9f2009-03-04 03:20:26 -0800835
836 /* If IPv6 socket could not be created, try the IPv4 socket */
837 if (err < 0 && family == PF_INET6)
Eric W. Biederman2ce95502012-08-06 08:43:06 +0000838 err = inet_ctl_sock_create(&net->sctp.ctl_sock, AF_INET,
Brian Haleyfb13d9f2009-03-04 03:20:26 -0800839 SOCK_SEQPACKET, IPPROTO_SCTP,
Eric W. Biederman2ce95502012-08-06 08:43:06 +0000840 net);
Brian Haleyfb13d9f2009-03-04 03:20:26 -0800841
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842 if (err < 0) {
Joe Perches145ce502010-08-24 13:21:08 +0000843 pr_err("Failed to create the SCTP control socket\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844 return err;
845 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846 return 0;
847}
848
Xin Long965ae442020-10-29 15:04:58 +0800849static int sctp_udp_rcv(struct sock *sk, struct sk_buff *skb)
850{
Xin Longa1dd2cf2020-10-29 15:05:03 +0800851 SCTP_INPUT_CB(skb)->encap_port = udp_hdr(skb)->source;
852
Xin Long965ae442020-10-29 15:04:58 +0800853 skb_set_transport_header(skb, sizeof(struct udphdr));
854 sctp_rcv(skb);
855 return 0;
856}
857
858int sctp_udp_sock_start(struct net *net)
859{
860 struct udp_tunnel_sock_cfg tuncfg = {NULL};
861 struct udp_port_cfg udp_conf = {0};
862 struct socket *sock;
863 int err;
864
865 udp_conf.family = AF_INET;
866 udp_conf.local_ip.s_addr = htonl(INADDR_ANY);
867 udp_conf.local_udp_port = htons(net->sctp.udp_port);
868 err = udp_sock_create(net, &udp_conf, &sock);
869 if (err) {
870 pr_err("Failed to create the SCTP UDP tunneling v4 sock\n");
871 return err;
872 }
873
874 tuncfg.encap_type = 1;
875 tuncfg.encap_rcv = sctp_udp_rcv;
Xin Long9e47df02021-06-22 14:05:00 -0400876 tuncfg.encap_err_lookup = sctp_udp_v4_err;
Xin Long965ae442020-10-29 15:04:58 +0800877 setup_udp_tunnel_sock(net, sock, &tuncfg);
878 net->sctp.udp4_sock = sock->sk;
879
Xin Long9d6ba262020-10-29 15:04:59 +0800880#if IS_ENABLED(CONFIG_IPV6)
881 memset(&udp_conf, 0, sizeof(udp_conf));
882
883 udp_conf.family = AF_INET6;
884 udp_conf.local_ip6 = in6addr_any;
885 udp_conf.local_udp_port = htons(net->sctp.udp_port);
886 udp_conf.use_udp6_rx_checksums = true;
887 udp_conf.ipv6_v6only = true;
888 err = udp_sock_create(net, &udp_conf, &sock);
889 if (err) {
890 pr_err("Failed to create the SCTP UDP tunneling v6 sock\n");
891 udp_tunnel_sock_release(net->sctp.udp4_sock->sk_socket);
892 net->sctp.udp4_sock = NULL;
893 return err;
894 }
895
896 tuncfg.encap_type = 1;
897 tuncfg.encap_rcv = sctp_udp_rcv;
Xin Long9e47df02021-06-22 14:05:00 -0400898 tuncfg.encap_err_lookup = sctp_udp_v6_err;
Xin Long9d6ba262020-10-29 15:04:59 +0800899 setup_udp_tunnel_sock(net, sock, &tuncfg);
900 net->sctp.udp6_sock = sock->sk;
901#endif
902
Xin Long965ae442020-10-29 15:04:58 +0800903 return 0;
904}
905
906void sctp_udp_sock_stop(struct net *net)
907{
908 if (net->sctp.udp4_sock) {
909 udp_tunnel_sock_release(net->sctp.udp4_sock->sk_socket);
910 net->sctp.udp4_sock = NULL;
911 }
Xin Long9d6ba262020-10-29 15:04:59 +0800912 if (net->sctp.udp6_sock) {
913 udp_tunnel_sock_release(net->sctp.udp6_sock->sk_socket);
914 net->sctp.udp6_sock = NULL;
915 }
Xin Long965ae442020-10-29 15:04:58 +0800916}
917
Linus Torvalds1da177e2005-04-16 15:20:36 -0700918/* Register address family specific functions. */
919int sctp_register_af(struct sctp_af *af)
920{
921 switch (af->sa_family) {
922 case AF_INET:
923 if (sctp_af_v4_specific)
924 return 0;
925 sctp_af_v4_specific = af;
926 break;
927 case AF_INET6:
928 if (sctp_af_v6_specific)
929 return 0;
930 sctp_af_v6_specific = af;
931 break;
932 default:
933 return 0;
934 }
935
936 INIT_LIST_HEAD(&af->list);
937 list_add_tail(&af->list, &sctp_address_families);
938 return 1;
939}
940
941/* Get the table of functions for manipulating a particular address
942 * family.
943 */
944struct sctp_af *sctp_get_af_specific(sa_family_t family)
945{
946 switch (family) {
947 case AF_INET:
948 return sctp_af_v4_specific;
949 case AF_INET6:
950 return sctp_af_v6_specific;
951 default:
952 return NULL;
953 }
954}
955
956/* Common code to initialize a AF_INET msg_name. */
957static void sctp_inet_msgname(char *msgname, int *addr_len)
958{
959 struct sockaddr_in *sin;
960
961 sin = (struct sockaddr_in *)msgname;
962 *addr_len = sizeof(struct sockaddr_in);
963 sin->sin_family = AF_INET;
964 memset(sin->sin_zero, 0, sizeof(sin->sin_zero));
965}
966
967/* Copy the primary address of the peer primary address as the msg_name. */
968static void sctp_inet_event_msgname(struct sctp_ulpevent *event, char *msgname,
969 int *addr_len)
970{
971 struct sockaddr_in *sin, *sinfrom;
972
973 if (msgname) {
974 struct sctp_association *asoc;
975
976 asoc = event->asoc;
977 sctp_inet_msgname(msgname, addr_len);
978 sin = (struct sockaddr_in *)msgname;
979 sinfrom = &asoc->peer.primary_addr.v4;
980 sin->sin_port = htons(asoc->peer.port);
981 sin->sin_addr.s_addr = sinfrom->sin_addr.s_addr;
982 }
983}
984
985/* Initialize and copy out a msgname from an inbound skb. */
986static void sctp_inet_skb_msgname(struct sk_buff *skb, char *msgname, int *len)
987{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988 if (msgname) {
Arnaldo Carvalho de Melo2c0fd382007-03-13 13:59:32 -0300989 struct sctphdr *sh = sctp_hdr(skb);
990 struct sockaddr_in *sin = (struct sockaddr_in *)msgname;
991
Linus Torvalds1da177e2005-04-16 15:20:36 -0700992 sctp_inet_msgname(msgname, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 sin->sin_port = sh->source;
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700994 sin->sin_addr.s_addr = ip_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700995 }
996}
997
/* Tell whether address family @family is usable on a PF_INET socket:
 * only AF_INET is.  @sp is unused.  Returns 1 if supported, 0 otherwise.
 */
static int sctp_inet_af_supported(sa_family_t family, struct sctp_sock *sp)
{
	return family == AF_INET;
}
1004
1005/* Address matching with wildcards allowed. */
1006static int sctp_inet_cmp_addr(const union sctp_addr *addr1,
1007 const union sctp_addr *addr2,
1008 struct sctp_sock *opt)
1009{
1010 /* PF_INET only supports AF_INET addresses. */
1011 if (addr1->sa.sa_family != addr2->sa.sa_family)
1012 return 0;
Al Viroe6f1ceb2008-03-17 22:44:53 -07001013 if (htonl(INADDR_ANY) == addr1->v4.sin_addr.s_addr ||
1014 htonl(INADDR_ANY) == addr2->v4.sin_addr.s_addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 return 1;
1016 if (addr1->v4.sin_addr.s_addr == addr2->v4.sin_addr.s_addr)
1017 return 1;
1018
1019 return 0;
1020}
1021
/* Check that @addr looks bindable on this socket; the family-independent
 * checks have already been done by the caller.  Simply defers to
 * sctp_v4_available() and returns its result.
 */
static int sctp_inet_bind_verify(struct sctp_sock *opt, union sctp_addr *addr)
{
	return sctp_v4_available(addr, opt);
}
1029
/* Check that @addr looks sendable.  The family-independent checks have
 * already been done by the caller and PF_INET adds none of its own, so
 * every address is accepted (returns 1).
 */
static int sctp_inet_send_verify(struct sctp_sock *opt, union sctp_addr *addr)
{
	return 1;
}
1037
1038/* Fill in Supported Address Type information for INIT and INIT-ACK
1039 * chunks. Returns number of addresses supported.
1040 */
1041static int sctp_inet_supported_addrs(const struct sctp_sock *opt,
Al Viro3dbe8652006-11-20 17:25:49 -08001042 __be16 *types)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043{
1044 types[0] = SCTP_PARAM_IPV4_ADDRESS;
1045 return 1;
1046}
1047
1048/* Wrapper routine that calls the ip transmit routine. */
Xin Long600af7f2020-10-29 15:05:06 +08001049static inline int sctp_v4_xmit(struct sk_buff *skb, struct sctp_transport *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001050{
Xin Long600af7f2020-10-29 15:05:06 +08001051 struct dst_entry *dst = dst_clone(t->dst);
1052 struct flowi4 *fl4 = &t->fl.u.ip4;
1053 struct sock *sk = skb->sk;
1054 struct inet_sock *inet = inet_sk(sk);
Xin Long8a9c58d2018-07-02 18:21:12 +08001055 __u8 dscp = inet->tos;
Xin Long600af7f2020-10-29 15:05:06 +08001056 __be16 df = 0;
Herbert Xuf8803742008-08-03 21:15:08 -07001057
Daniel Borkmannbb333812013-06-28 19:49:40 +02001058 pr_debug("%s: skb:%p, len:%d, src:%pI4, dst:%pI4\n", __func__, skb,
Xin Long600af7f2020-10-29 15:05:06 +08001059 skb->len, &fl4->saddr, &fl4->daddr);
Xin Long8a9c58d2018-07-02 18:21:12 +08001060
Xin Long600af7f2020-10-29 15:05:06 +08001061 if (t->dscp & SCTP_DSCP_SET_MASK)
1062 dscp = t->dscp & SCTP_DSCP_VAL_MASK;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001063
Xin Long600af7f2020-10-29 15:05:06 +08001064 inet->pmtudisc = t->param_flags & SPP_PMTUD_ENABLE ? IP_PMTUDISC_DO
1065 : IP_PMTUDISC_DONT;
1066 SCTP_INC_STATS(sock_net(sk), SCTP_MIB_OUTSCTPPACKS);
Herbert Xuf8803742008-08-03 21:15:08 -07001067
Xin Long600af7f2020-10-29 15:05:06 +08001068 if (!t->encap_port || !sctp_sk(sk)->udp_port) {
1069 skb_dst_set(skb, dst);
1070 return __ip_queue_xmit(sk, skb, &t->fl, dscp);
1071 }
Daniel Borkmannbb333812013-06-28 19:49:40 +02001072
Xin Long600af7f2020-10-29 15:05:06 +08001073 if (skb_is_gso(skb))
1074 skb_shinfo(skb)->gso_type |= SKB_GSO_UDP_TUNNEL_CSUM;
1075
1076 if (ip_dont_fragment(sk, dst) && !skb->ignore_df)
1077 df = htons(IP_DF);
1078
1079 skb->encapsulation = 1;
1080 skb_reset_inner_mac_header(skb);
1081 skb_reset_inner_transport_header(skb);
1082 skb_set_inner_ipproto(skb, IPPROTO_SCTP);
1083 udp_tunnel_xmit_skb((struct rtable *)dst, sk, skb, fl4->saddr,
1084 fl4->daddr, dscp, ip4_dst_hoplimit(dst), df,
1085 sctp_sk(sk)->udp_port, t->encap_port, false, false);
1086 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001087}
1088
Neil Horman15efbe72008-02-15 09:53:59 -05001089static struct sctp_af sctp_af_inet;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001090
1091static struct sctp_pf sctp_pf_inet = {
1092 .event_msgname = sctp_inet_event_msgname,
1093 .skb_msgname = sctp_inet_skb_msgname,
1094 .af_supported = sctp_inet_af_supported,
1095 .cmp_addr = sctp_inet_cmp_addr,
1096 .bind_verify = sctp_inet_bind_verify,
1097 .send_verify = sctp_inet_send_verify,
1098 .supported_addrs = sctp_inet_supported_addrs,
1099 .create_accept_sk = sctp_v4_create_accept_sk,
Jason Gunthorpe299ee122014-07-30 12:40:53 -06001100 .addr_to_user = sctp_v4_addr_to_user,
1101 .to_sk_saddr = sctp_v4_to_sk_saddr,
1102 .to_sk_daddr = sctp_v4_to_sk_daddr,
Richard Hainesb7e10c22018-02-24 16:18:51 +00001103 .copy_ip_options = sctp_v4_copy_ip_options,
Neil Horman15efbe72008-02-15 09:53:59 -05001104 .af = &sctp_af_inet
Linus Torvalds1da177e2005-04-16 15:20:36 -07001105};
1106
1107/* Notifier for inetaddr addition/deletion events. */
1108static struct notifier_block sctp_inetaddr_notifier = {
1109 .notifier_call = sctp_inetaddr_event,
1110};
1111
1112/* Socket operations. */
Eric Dumazet90ddc4f2005-12-22 12:49:22 -08001113static const struct proto_ops inet_seqpacket_ops = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001114 .family = PF_INET,
1115 .owner = THIS_MODULE,
1116 .release = inet_release, /* Needs to be wrapped... */
1117 .bind = inet_bind,
Xin Long644fbde2018-05-20 16:39:10 +08001118 .connect = sctp_inet_connect,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001119 .socketpair = sock_no_socketpair,
1120 .accept = inet_accept,
1121 .getname = inet_getname, /* Semantics are different. */
Linus Torvaldsa11e1d42018-06-28 09:43:44 -07001122 .poll = sctp_poll,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001123 .ioctl = inet_ioctl,
Arnd Bergmannc7cbdbf2019-04-17 22:51:48 +02001124 .gettstamp = sock_gettstamp,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001125 .listen = sctp_inet_listen,
1126 .shutdown = inet_shutdown, /* Looks harmless. */
1127 .setsockopt = sock_common_setsockopt, /* IP_SOL IP_OPTION is a problem */
1128 .getsockopt = sock_common_getsockopt,
1129 .sendmsg = inet_sendmsg,
Xin Longfd2d1802016-07-22 21:25:42 +08001130 .recvmsg = inet_recvmsg,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001131 .mmap = sock_no_mmap,
1132 .sendpage = sock_no_sendpage,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001133};
1134
1135/* Registration with AF_INET family. */
1136static struct inet_protosw sctp_seqpacket_protosw = {
1137 .type = SOCK_SEQPACKET,
1138 .protocol = IPPROTO_SCTP,
1139 .prot = &sctp_prot,
1140 .ops = &inet_seqpacket_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141 .flags = SCTP_PROTOSW_FLAG
1142};
1143static struct inet_protosw sctp_stream_protosw = {
1144 .type = SOCK_STREAM,
1145 .protocol = IPPROTO_SCTP,
1146 .prot = &sctp_prot,
1147 .ops = &inet_seqpacket_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001148 .flags = SCTP_PROTOSW_FLAG
1149};
1150
Xin Longa1dd2cf2020-10-29 15:05:03 +08001151static int sctp4_rcv(struct sk_buff *skb)
1152{
Xin Long03560102020-11-04 14:55:32 +08001153 SCTP_INPUT_CB(skb)->encap_port = 0;
Xin Longa1dd2cf2020-10-29 15:05:03 +08001154 return sctp_rcv(skb);
1155}
1156
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157/* Register with IP layer. */
Alexey Dobriyan32613092009-09-14 12:21:47 +00001158static const struct net_protocol sctp_protocol = {
Xin Longa1dd2cf2020-10-29 15:05:03 +08001159 .handler = sctp4_rcv,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160 .err_handler = sctp_v4_err,
1161 .no_policy = 1,
Hannes Frederic Sowa8ed1dc42014-01-09 10:01:17 +01001162 .icmp_strict_tag_validation = 1,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163};
1164
1165/* IPv4 address related functions. */
Neil Horman15efbe72008-02-15 09:53:59 -05001166static struct sctp_af sctp_af_inet = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001167 .sa_family = AF_INET,
1168 .sctp_xmit = sctp_v4_xmit,
1169 .setsockopt = ip_setsockopt,
1170 .getsockopt = ip_getsockopt,
1171 .get_dst = sctp_v4_get_dst,
1172 .get_saddr = sctp_v4_get_saddr,
1173 .copy_addrlist = sctp_v4_copy_addrlist,
1174 .from_skb = sctp_v4_from_skb,
1175 .from_sk = sctp_v4_from_sk,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001176 .from_addr_param = sctp_v4_from_addr_param,
1177 .to_addr_param = sctp_v4_to_addr_param,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001178 .cmp_addr = sctp_v4_cmp_addr,
1179 .addr_valid = sctp_v4_addr_valid,
1180 .inaddr_any = sctp_v4_inaddr_any,
1181 .is_any = sctp_v4_is_any,
1182 .available = sctp_v4_available,
1183 .scope = sctp_v4_scope,
1184 .skb_iif = sctp_v4_skb_iif,
1185 .is_ce = sctp_v4_is_ce,
1186 .seq_dump_addr = sctp_v4_seq_dump_addr,
Vlad Yasevichb9031d92008-06-04 12:40:15 -07001187 .ecn_capable = sctp_v4_ecn_capable,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001188 .net_header_len = sizeof(struct iphdr),
1189 .sockaddr_len = sizeof(struct sockaddr_in),
Richard Hainesb7e10c22018-02-24 16:18:51 +00001190 .ip_options_len = sctp_v4_ip_options_len,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191};
1192
wangweidong8d726512013-12-23 12:16:53 +08001193struct sctp_pf *sctp_get_pf_specific(sa_family_t family)
1194{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195 switch (family) {
1196 case PF_INET:
1197 return sctp_pf_inet_specific;
1198 case PF_INET6:
1199 return sctp_pf_inet6_specific;
1200 default:
1201 return NULL;
1202 }
1203}
1204
1205/* Register the PF specific function table. */
1206int sctp_register_pf(struct sctp_pf *pf, sa_family_t family)
1207{
1208 switch (family) {
1209 case PF_INET:
1210 if (sctp_pf_inet_specific)
1211 return 0;
1212 sctp_pf_inet_specific = pf;
1213 break;
1214 case PF_INET6:
1215 if (sctp_pf_inet6_specific)
1216 return 0;
1217 sctp_pf_inet6_specific = pf;
1218 break;
1219 default:
1220 return 0;
1221 }
1222 return 1;
1223}
1224
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001225static inline int init_sctp_mibs(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001226{
WANG Cong698365f2014-05-05 15:55:55 -07001227 net->sctp.sctp_statistics = alloc_percpu(struct sctp_mib);
1228 if (!net->sctp.sctp_statistics)
1229 return -ENOMEM;
1230 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231}
1232
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001233static inline void cleanup_sctp_mibs(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001234{
WANG Cong698365f2014-05-05 15:55:55 -07001235 free_percpu(net->sctp.sctp_statistics);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001236}
1237
Vlad Yasevich270637a2008-03-20 15:17:14 -07001238static void sctp_v4_pf_init(void)
1239{
1240 /* Initialize the SCTP specific PF functions. */
1241 sctp_register_pf(&sctp_pf_inet, PF_INET);
1242 sctp_register_af(&sctp_af_inet);
1243}
1244
1245static void sctp_v4_pf_exit(void)
1246{
1247 list_del(&sctp_af_inet.list);
1248}
1249
1250static int sctp_v4_protosw_init(void)
1251{
1252 int rc;
1253
1254 rc = proto_register(&sctp_prot, 1);
1255 if (rc)
1256 return rc;
1257
1258 /* Register SCTP(UDP and TCP style) with socket layer. */
1259 inet_register_protosw(&sctp_seqpacket_protosw);
1260 inet_register_protosw(&sctp_stream_protosw);
1261
1262 return 0;
1263}
1264
1265static void sctp_v4_protosw_exit(void)
1266{
1267 inet_unregister_protosw(&sctp_stream_protosw);
1268 inet_unregister_protosw(&sctp_seqpacket_protosw);
1269 proto_unregister(&sctp_prot);
1270}
1271
1272static int sctp_v4_add_protocol(void)
1273{
1274 /* Register notifier for inet address additions/deletions. */
1275 register_inetaddr_notifier(&sctp_inetaddr_notifier);
1276
1277 /* Register SCTP with inet layer. */
1278 if (inet_add_protocol(&sctp_protocol, IPPROTO_SCTP) < 0)
1279 return -EAGAIN;
1280
1281 return 0;
1282}
1283
1284static void sctp_v4_del_protocol(void)
1285{
1286 inet_del_protocol(&sctp_protocol, IPPROTO_SCTP);
1287 unregister_inetaddr_notifier(&sctp_inetaddr_notifier);
1288}
1289
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001290static int __net_init sctp_defaults_init(struct net *net)
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001291{
Eric W. Biederman2ce95502012-08-06 08:43:06 +00001292 int status;
1293
Eric W. Biedermane1fc3b12012-08-07 07:29:57 +00001294 /*
1295 * 14. Suggested SCTP Protocol Parameter Values
1296 */
1297 /* The following protocol parameters are RECOMMENDED: */
1298 /* RTO.Initial - 3 seconds */
1299 net->sctp.rto_initial = SCTP_RTO_INITIAL;
1300 /* RTO.Min - 1 second */
1301 net->sctp.rto_min = SCTP_RTO_MIN;
1302 /* RTO.Max - 60 seconds */
1303 net->sctp.rto_max = SCTP_RTO_MAX;
1304 /* RTO.Alpha - 1/8 */
1305 net->sctp.rto_alpha = SCTP_RTO_ALPHA;
1306 /* RTO.Beta - 1/4 */
1307 net->sctp.rto_beta = SCTP_RTO_BETA;
1308
1309 /* Valid.Cookie.Life - 60 seconds */
1310 net->sctp.valid_cookie_life = SCTP_DEFAULT_COOKIE_LIFE;
1311
1312 /* Whether Cookie Preservative is enabled(1) or not(0) */
1313 net->sctp.cookie_preserve_enable = 1;
1314
Neil Horman3c681982012-10-24 09:20:03 +00001315 /* Default sctp sockets to use md5 as their hmac alg */
Neil Horman0d0863b2012-12-14 15:22:01 +00001316#if defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_MD5)
Neil Horman3c681982012-10-24 09:20:03 +00001317 net->sctp.sctp_hmac_alg = "md5";
Neil Horman0d0863b2012-12-14 15:22:01 +00001318#elif defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_SHA1)
Neil Horman3c681982012-10-24 09:20:03 +00001319 net->sctp.sctp_hmac_alg = "sha1";
1320#else
1321 net->sctp.sctp_hmac_alg = NULL;
1322#endif
1323
Eric W. Biedermane1fc3b12012-08-07 07:29:57 +00001324 /* Max.Burst - 4 */
1325 net->sctp.max_burst = SCTP_DEFAULT_MAX_BURST;
1326
Xin Long34515e92019-11-08 13:20:35 +08001327 /* Disable of Primary Path Switchover by default */
1328 net->sctp.ps_retrans = SCTP_PS_RETRANS_MAX;
1329
Zhu Yanjun566178f2015-12-16 13:55:04 +08001330 /* Enable pf state by default */
1331 net->sctp.pf_enable = 1;
1332
Xin Longaef587b2019-11-08 13:20:32 +08001333 /* Ignore pf exposure feature by default */
1334 net->sctp.pf_expose = SCTP_PF_EXPOSE_UNSET;
1335
Eric W. Biedermane1fc3b12012-08-07 07:29:57 +00001336 /* Association.Max.Retrans - 10 attempts
1337 * Path.Max.Retrans - 5 attempts (per destination address)
1338 * Max.Init.Retransmits - 8 attempts
1339 */
1340 net->sctp.max_retrans_association = 10;
1341 net->sctp.max_retrans_path = 5;
1342 net->sctp.max_retrans_init = 8;
1343
1344 /* Sendbuffer growth - do per-socket accounting */
1345 net->sctp.sndbuf_policy = 0;
1346
1347 /* Rcvbuffer growth - do per-socket accounting */
1348 net->sctp.rcvbuf_policy = 0;
1349
1350 /* HB.interval - 30 seconds */
1351 net->sctp.hb_interval = SCTP_DEFAULT_TIMEOUT_HEARTBEAT;
1352
1353 /* delayed SACK timeout */
1354 net->sctp.sack_timeout = SCTP_DEFAULT_TIMEOUT_SACK;
1355
1356 /* Disable ADDIP by default. */
1357 net->sctp.addip_enable = 0;
1358 net->sctp.addip_noauth = 0;
1359 net->sctp.default_auto_asconf = 0;
1360
1361 /* Enable PR-SCTP by default. */
1362 net->sctp.prsctp_enable = 1;
1363
Xin Longc28445c2017-01-18 00:44:45 +08001364 /* Disable RECONF by default. */
1365 net->sctp.reconf_enable = 0;
1366
Eric W. Biedermane1fc3b12012-08-07 07:29:57 +00001367 /* Disable AUTH by default. */
1368 net->sctp.auth_enable = 0;
1369
Xin Long1b0b8112019-08-26 16:30:02 +08001370 /* Enable ECN by default. */
1371 net->sctp.ecn_enable = 1;
1372
Xin Long965ae442020-10-29 15:04:58 +08001373 /* Set UDP tunneling listening port to 0 by default */
1374 net->sctp.udp_port = 0;
1375
Xin Longe8a30012020-10-29 15:05:01 +08001376 /* Set remote encap port to 0 by default */
1377 net->sctp.encap_port = 0;
1378
Eric W. Biedermane1fc3b12012-08-07 07:29:57 +00001379 /* Set SCOPE policy to enabled */
1380 net->sctp.scope_policy = SCTP_SCOPE_POLICY_ENABLE;
1381
1382 /* Set the default rwnd update threshold */
1383 net->sctp.rwnd_upd_shift = SCTP_DEFAULT_RWND_SHIFT;
1384
1385 /* Initialize maximum autoclose timeout. */
1386 net->sctp.max_autoclose = INT_MAX / HZ;
1387
Eric W. Biedermanebb7e952012-08-07 07:23:59 +00001388 status = sctp_sysctl_net_register(net);
1389 if (status)
1390 goto err_sysctl_register;
1391
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001392 /* Allocate and initialise sctp mibs. */
1393 status = init_sctp_mibs(net);
1394 if (status)
1395 goto err_init_mibs;
1396
Al Virod47d08c2018-03-16 23:32:51 +00001397#ifdef CONFIG_PROC_FS
Eric W. Biederman13d782f2012-08-06 08:45:15 +00001398 /* Initialize proc fs directory. */
1399 status = sctp_proc_init(net);
1400 if (status)
1401 goto err_init_proc;
Al Virod47d08c2018-03-16 23:32:51 +00001402#endif
Eric W. Biederman13d782f2012-08-06 08:45:15 +00001403
1404 sctp_dbg_objcnt_init(net);
1405
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001406 /* Initialize the local address list. */
1407 INIT_LIST_HEAD(&net->sctp.local_addr_list);
1408 spin_lock_init(&net->sctp.local_addr_lock);
1409 sctp_get_local_addr_list(net);
1410
1411 /* Initialize the address event list */
1412 INIT_LIST_HEAD(&net->sctp.addr_waitq);
1413 INIT_LIST_HEAD(&net->sctp.auto_asconf_splist);
1414 spin_lock_init(&net->sctp.addr_wq_lock);
1415 net->sctp.addr_wq_timer.expires = 0;
Kees Cook9c3b5752017-10-24 01:45:31 -07001416 timer_setup(&net->sctp.addr_wq_timer, sctp_addr_wq_timeout_handler, 0);
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001417
1418 return 0;
Eric W. Biederman2ce95502012-08-06 08:43:06 +00001419
Arnd Bergmann7ae665f2018-03-28 16:14:56 +02001420#ifdef CONFIG_PROC_FS
Eric W. Biederman13d782f2012-08-06 08:45:15 +00001421err_init_proc:
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001422 cleanup_sctp_mibs(net);
Arnd Bergmann7ae665f2018-03-28 16:14:56 +02001423#endif
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001424err_init_mibs:
Eric W. Biedermanebb7e952012-08-07 07:23:59 +00001425 sctp_sysctl_net_unregister(net);
1426err_sysctl_register:
Eric W. Biederman2ce95502012-08-06 08:43:06 +00001427 return status;
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001428}
1429
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001430static void __net_exit sctp_defaults_exit(struct net *net)
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001431{
1432 /* Free the local address list */
1433 sctp_free_addr_wq(net);
1434 sctp_free_local_addr_list(net);
Eric W. Biederman2ce95502012-08-06 08:43:06 +00001435
Al Virod47d08c2018-03-16 23:32:51 +00001436#ifdef CONFIG_PROC_FS
1437 remove_proc_subtree("sctp", net->proc_net);
1438 net->sctp.proc_net_sctp = NULL;
1439#endif
Eric W. Biedermanb01a2402012-08-06 08:47:55 +00001440 cleanup_sctp_mibs(net);
Eric W. Biedermanebb7e952012-08-07 07:23:59 +00001441 sctp_sysctl_net_unregister(net);
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001442}
1443
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001444static struct pernet_operations sctp_defaults_ops = {
1445 .init = sctp_defaults_init,
1446 .exit = sctp_defaults_exit,
1447};
1448
1449static int __net_init sctp_ctrlsock_init(struct net *net)
1450{
1451 int status;
1452
1453 /* Initialize the control inode/socket for handling OOTB packets. */
1454 status = sctp_ctl_sock_init(net);
1455 if (status)
1456 pr_err("Failed to initialize the SCTP control sock\n");
1457
1458 return status;
1459}
1460
Christophe JAILLETb456d722019-09-11 18:02:39 +02001461static void __net_exit sctp_ctrlsock_exit(struct net *net)
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001462{
1463 /* Free the control endpoint. */
1464 inet_ctl_sock_destroy(net->sctp.ctl_sock);
1465}
1466
1467static struct pernet_operations sctp_ctrlsock_ops = {
1468 .init = sctp_ctrlsock_init,
1469 .exit = sctp_ctrlsock_exit,
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001470};
1471
Linus Torvalds1da177e2005-04-16 15:20:36 -07001472/* Initialize the universe into something sensible. */
Daniel Borkmanndda91922013-06-17 11:40:05 +02001473static __init int sctp_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001474{
Arun KSca79b0c2018-12-28 00:34:29 -08001475 unsigned long nr_pages = totalram_pages();
Colin Ian King623b57be2020-07-24 14:09:19 +01001476 unsigned long limit;
1477 unsigned long goal;
Neil Hormand9749fb2016-02-18 16:10:57 -05001478 int max_entry_order;
Colin Ian King623b57be2020-07-24 14:09:19 +01001479 int num_entries;
1480 int max_share;
1481 int status;
1482 int order;
1483 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001484
Eyal Birgerb4772ef2015-03-01 14:58:29 +02001485 sock_skb_cb_check_size(sizeof(struct sctp_ulpevent));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001486
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001487 /* Allocate bind_bucket and chunk caches. */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001488 status = -ENOBUFS;
1489 sctp_bucket_cachep = kmem_cache_create("sctp_bind_bucket",
1490 sizeof(struct sctp_bind_bucket),
1491 0, SLAB_HWCACHE_ALIGN,
Paul Mundt20c2df82007-07-20 10:11:58 +09001492 NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001493 if (!sctp_bucket_cachep)
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001494 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001495
1496 sctp_chunk_cachep = kmem_cache_create("sctp_chunk",
1497 sizeof(struct sctp_chunk),
1498 0, SLAB_HWCACHE_ALIGN,
Paul Mundt20c2df82007-07-20 10:11:58 +09001499 NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001500 if (!sctp_chunk_cachep)
1501 goto err_chunk_cachep;
1502
Tejun Heo908c7f12014-09-08 09:51:29 +09001503 status = percpu_counter_init(&sctp_sockets_allocated, 0, GFP_KERNEL);
Eric W. Biederman632c9282012-08-06 08:44:24 +00001504 if (status)
1505 goto err_percpu_counter_init;
1506
Linus Torvalds1da177e2005-04-16 15:20:36 -07001507 /* Implementation specific variables. */
1508
1509 /* Initialize default stream count setup information. */
1510 sctp_max_instreams = SCTP_DEFAULT_INSTREAMS;
1511 sctp_max_outstreams = SCTP_DEFAULT_OUTSTREAMS;
1512
1513 /* Initialize handle used for association ids. */
1514 idr_init(&sctp_assocs_id);
1515
Eric Dumazetf03d78d2011-07-07 00:27:05 -07001516 limit = nr_free_buffer_pages() / 8;
Neil Horman4d93df02007-08-15 16:07:44 -07001517 limit = max(limit, 128UL);
1518 sysctl_sctp_mem[0] = limit / 4 * 3;
1519 sysctl_sctp_mem[1] = limit;
1520 sysctl_sctp_mem[2] = sysctl_sctp_mem[0] * 2;
1521
1522 /* Set per-socket limits to no more than 1/128 the pressure threshold*/
1523 limit = (sysctl_sctp_mem[1]) << (PAGE_SHIFT - 7);
1524 max_share = min(4UL*1024*1024, limit);
1525
Vlad Yasevich845525a2008-07-18 23:08:21 -07001526 sysctl_sctp_rmem[0] = SK_MEM_QUANTUM; /* give each asoc 1 page min */
Eric Dumazet87fb4b72011-10-13 07:28:54 +00001527 sysctl_sctp_rmem[1] = 1500 * SKB_TRUESIZE(1);
Neil Horman4d93df02007-08-15 16:07:44 -07001528 sysctl_sctp_rmem[2] = max(sysctl_sctp_rmem[1], max_share);
1529
Hideo Aoki3ab224b2007-12-31 00:11:19 -08001530 sysctl_sctp_wmem[0] = SK_MEM_QUANTUM;
Neil Horman4d93df02007-08-15 16:07:44 -07001531 sysctl_sctp_wmem[1] = 16*1024;
1532 sysctl_sctp_wmem[2] = max(64*1024, max_share);
1533
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534 /* Size and allocate the association hash table.
1535 * The methodology is similar to that of the tcp hash tables.
Neil Hormand9749fb2016-02-18 16:10:57 -05001536 * Though not identical. Start by getting a goal size
Linus Torvalds1da177e2005-04-16 15:20:36 -07001537 */
Arun KS3d6357d2018-12-28 00:34:20 -08001538 if (nr_pages >= (128 * 1024))
1539 goal = nr_pages >> (22 - PAGE_SHIFT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001540 else
Arun KS3d6357d2018-12-28 00:34:20 -08001541 goal = nr_pages >> (24 - PAGE_SHIFT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001542
Neil Hormand9749fb2016-02-18 16:10:57 -05001543 /* Then compute the page order for said goal */
1544 order = get_order(goal);
1545
1546 /* Now compute the required page order for the maximum sized table we
1547 * want to create
1548 */
1549 max_entry_order = get_order(MAX_SCTP_PORT_HASH_ENTRIES *
1550 sizeof(struct sctp_bind_hashbucket));
1551
1552 /* Limit the page order by that maximum hash table size */
1553 order = min(order, max_entry_order);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001554
Linus Torvalds1da177e2005-04-16 15:20:36 -07001555 /* Allocate and initialize the endpoint hash table. */
1556 sctp_ep_hashsize = 64;
Zhang Yanfei3b77d662013-03-12 13:39:47 +08001557 sctp_ep_hashtable =
Kees Cook6da2ec52018-06-12 13:55:00 -07001558 kmalloc_array(64, sizeof(struct sctp_hashbucket), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559 if (!sctp_ep_hashtable) {
Joe Perches145ce502010-08-24 13:21:08 +00001560 pr_err("Failed endpoint_hash alloc\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001561 status = -ENOMEM;
1562 goto err_ehash_alloc;
1563 }
1564 for (i = 0; i < sctp_ep_hashsize; i++) {
1565 rwlock_init(&sctp_ep_hashtable[i].lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -05001566 INIT_HLIST_HEAD(&sctp_ep_hashtable[i].chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001567 }
1568
Neil Hormand9749fb2016-02-18 16:10:57 -05001569 /* Allocate and initialize the SCTP port hash table.
1570 * Note that order is initalized to start at the max sized
1571 * table we want to support. If we can't get that many pages
1572 * reduce the order and try again
1573 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001574 do {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001575 sctp_port_hashtable = (struct sctp_bind_hashbucket *)
Eric Dumazet6857a022015-12-15 15:33:39 -08001576 __get_free_pages(GFP_KERNEL | __GFP_NOWARN, order);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577 } while (!sctp_port_hashtable && --order > 0);
Neil Hormand9749fb2016-02-18 16:10:57 -05001578
Linus Torvalds1da177e2005-04-16 15:20:36 -07001579 if (!sctp_port_hashtable) {
Joe Perches145ce502010-08-24 13:21:08 +00001580 pr_err("Failed bind hash alloc\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001581 status = -ENOMEM;
1582 goto err_bhash_alloc;
1583 }
Neil Hormand9749fb2016-02-18 16:10:57 -05001584
1585 /* Now compute the number of entries that will fit in the
1586 * port hash space we allocated
1587 */
1588 num_entries = (1UL << order) * PAGE_SIZE /
1589 sizeof(struct sctp_bind_hashbucket);
1590
Randy Dunlap93c32162020-08-22 16:15:59 -07001591 /* And finish by rounding it down to the nearest power of two.
1592 * This wastes some memory of course, but it's needed because
Neil Hormand9749fb2016-02-18 16:10:57 -05001593 * the hash function operates based on the assumption that
Randy Dunlap93c32162020-08-22 16:15:59 -07001594 * the number of entries is a power of two.
Neil Hormand9749fb2016-02-18 16:10:57 -05001595 */
1596 sctp_port_hashsize = rounddown_pow_of_two(num_entries);
1597
Linus Torvalds1da177e2005-04-16 15:20:36 -07001598 for (i = 0; i < sctp_port_hashsize; i++) {
1599 spin_lock_init(&sctp_port_hashtable[i].lock);
Vlad Yasevichd970dbf2007-11-09 11:43:40 -05001600 INIT_HLIST_HEAD(&sctp_port_hashtable[i].chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001601 }
1602
Wei Yongjuna5e27d12016-06-13 23:08:26 +08001603 status = sctp_transport_hashtable_init();
1604 if (status)
Xin Long4f008782015-12-30 23:50:47 +08001605 goto err_thash_alloc;
1606
Neil Hormand9749fb2016-02-18 16:10:57 -05001607 pr_info("Hash tables configured (bind %d/%d)\n", sctp_port_hashsize,
1608 num_entries);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001609
Linus Torvalds1da177e2005-04-16 15:20:36 -07001610 sctp_sysctl_register();
1611
1612 INIT_LIST_HEAD(&sctp_address_families);
Vlad Yasevich270637a2008-03-20 15:17:14 -07001613 sctp_v4_pf_init();
1614 sctp_v6_pf_init();
Xin Long1ba896f2017-11-26 20:16:08 +08001615 sctp_sched_ops_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001616
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001617 status = register_pernet_subsys(&sctp_defaults_ops);
1618 if (status)
1619 goto err_register_defaults;
Vlad Yasevich270637a2008-03-20 15:17:14 -07001620
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001621 status = sctp_v4_protosw_init();
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001622 if (status)
Vlad Yasevich270637a2008-03-20 15:17:14 -07001623 goto err_protosw_init;
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001624
Vlad Yasevich270637a2008-03-20 15:17:14 -07001625 status = sctp_v6_protosw_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001626 if (status)
Vlad Yasevich270637a2008-03-20 15:17:14 -07001627 goto err_v6_protosw_init;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001628
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001629 status = register_pernet_subsys(&sctp_ctrlsock_ops);
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001630 if (status)
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001631 goto err_register_ctrlsock;
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001632
Vlad Yasevich270637a2008-03-20 15:17:14 -07001633 status = sctp_v4_add_protocol();
1634 if (status)
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001635 goto err_add_protocol;
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001636
1637 /* Register SCTP with inet6 layer. */
1638 status = sctp_v6_add_protocol();
1639 if (status)
1640 goto err_v6_add_protocol;
1641
Marcelo Ricardo Leitner90017ac2016-06-02 15:05:43 -03001642 if (sctp_offload_init() < 0)
1643 pr_crit("%s: Cannot add SCTP protocol offload\n", __func__);
1644
Linus Torvalds1da177e2005-04-16 15:20:36 -07001645out:
1646 return status;
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001647err_v6_add_protocol:
Vlad Yasevich270637a2008-03-20 15:17:14 -07001648 sctp_v4_del_protocol();
Vlad Yasevichd1dd5242009-03-02 06:46:50 +00001649err_add_protocol:
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001650 unregister_pernet_subsys(&sctp_ctrlsock_ops);
1651err_register_ctrlsock:
Vlad Yasevich270637a2008-03-20 15:17:14 -07001652 sctp_v6_protosw_exit();
1653err_v6_protosw_init:
1654 sctp_v4_protosw_exit();
1655err_protosw_init:
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001656 unregister_pernet_subsys(&sctp_defaults_ops);
1657err_register_defaults:
Vlad Yasevich270637a2008-03-20 15:17:14 -07001658 sctp_v4_pf_exit();
1659 sctp_v6_pf_exit();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001660 sctp_sysctl_unregister();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001661 free_pages((unsigned long)sctp_port_hashtable,
1662 get_order(sctp_port_hashsize *
1663 sizeof(struct sctp_bind_hashbucket)));
1664err_bhash_alloc:
Xin Long4f008782015-12-30 23:50:47 +08001665 sctp_transport_hashtable_destroy();
1666err_thash_alloc:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001667 kfree(sctp_ep_hashtable);
1668err_ehash_alloc:
Eric W. Biederman632c9282012-08-06 08:44:24 +00001669 percpu_counter_destroy(&sctp_sockets_allocated);
1670err_percpu_counter_init:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001671 kmem_cache_destroy(sctp_chunk_cachep);
1672err_chunk_cachep:
1673 kmem_cache_destroy(sctp_bucket_cachep);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001674 goto out;
1675}
1676
1677/* Exit handler for the SCTP protocol. */
Daniel Borkmanndda91922013-06-17 11:40:05 +02001678static __exit void sctp_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001679{
1680 /* BUG. This should probably do something useful like clean
1681 * up all the remaining associations and all that memory.
1682 */
1683
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001684 /* Unregister with inet6/inet layers. */
1685 sctp_v6_del_protocol();
Vlad Yasevich270637a2008-03-20 15:17:14 -07001686 sctp_v4_del_protocol();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001687
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001688 unregister_pernet_subsys(&sctp_ctrlsock_ops);
Eric W. Biederman4db67e82012-08-06 08:42:04 +00001689
Vlad Yasevich270637a2008-03-20 15:17:14 -07001690 /* Free protosw registrations */
1691 sctp_v6_protosw_exit();
1692 sctp_v4_protosw_exit();
1693
Marcelo Ricardo Leitner8e2d61e2015-09-10 17:31:15 -03001694 unregister_pernet_subsys(&sctp_defaults_ops);
1695
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001696 /* Unregister with socket layer. */
Vlad Yasevich270637a2008-03-20 15:17:14 -07001697 sctp_v6_pf_exit();
1698 sctp_v4_pf_exit();
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001699
Linus Torvalds1da177e2005-04-16 15:20:36 -07001700 sctp_sysctl_unregister();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001701
Linus Torvalds1da177e2005-04-16 15:20:36 -07001702 free_pages((unsigned long)sctp_port_hashtable,
1703 get_order(sctp_port_hashsize *
1704 sizeof(struct sctp_bind_hashbucket)));
Xin Longb5eff712015-12-30 23:50:49 +08001705 kfree(sctp_ep_hashtable);
Xin Long4f008782015-12-30 23:50:47 +08001706 sctp_transport_hashtable_destroy();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001707
Eric W. Biederman632c9282012-08-06 08:44:24 +00001708 percpu_counter_destroy(&sctp_sockets_allocated);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001709
Jesper Dangaard Brouereaa184a2009-06-08 03:11:43 +00001710 rcu_barrier(); /* Wait for completion of call_rcu()'s */
1711
Sridhar Samudrala827bf122007-05-04 13:36:30 -07001712 kmem_cache_destroy(sctp_chunk_cachep);
1713 kmem_cache_destroy(sctp_bucket_cachep);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001714}
1715
1716module_init(sctp_init);
1717module_exit(sctp_exit);
1718
Arnaldo Carvalho de Melobb97d312005-08-09 20:19:14 -07001719/*
 * __stringify doesn't like enums, so use the IPPROTO_SCTP value (132) directly.
1721 */
1722MODULE_ALIAS("net-pf-" __stringify(PF_INET) "-proto-132");
Sridhar Samudrala882a3822006-12-13 16:33:35 -08001723MODULE_ALIAS("net-pf-" __stringify(PF_INET6) "-proto-132");
Daniel Borkmann91705c62013-07-23 14:51:47 +02001724MODULE_AUTHOR("Linux Kernel SCTP developers <linux-sctp@vger.kernel.org>");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001725MODULE_DESCRIPTION("Support for the SCTP protocol (RFC2960)");
David S. Miller71acc0d2013-08-09 13:09:41 -07001726module_param_named(no_checksums, sctp_checksum_disable, bool, 0644);
1727MODULE_PARM_DESC(no_checksums, "Disable checksums computing and verification");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001728MODULE_LICENSE("GPL");