blob: 41389bbb08c03a2a52f6dc7919b52e0b65c3eade [file] [log] [blame]
/*
 *	TCP over IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on:
 *	linux/net/ipv4/tcp.c
 *	linux/net/ipv4/tcp_input.c
 *	linux/net/ipv4/tcp_output.c
 *
 *	Fixes:
 *	Hideaki YOSHIFUJI	:	sin6_scope_id support
 *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
 *	Alexey Kuznetsov		allows both IPv4 and IPv6 sockets to bind
 *					a single port at the same time.
 *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
25
Herbert Xueb4dea52008-12-29 23:04:08 -080026#include <linux/bottom_half.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090041#include <linux/slab.h>
Wang Yufen4aa956d2014-03-29 09:27:29 +080042#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
Arnaldo Carvalho de Melo5324a042005-08-12 09:26:18 -030049#include <net/inet6_hashtables.h>
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -080050#include <net/inet6_connection_sock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059#include <net/snmp.h>
60#include <net/dsfield.h>
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -080061#include <net/timewait_sock.h>
Jeff Garzik18134be2007-10-26 22:53:14 -070062#include <net/netdma.h>
Denis V. Lunev3d58b5f2008-04-03 14:22:32 -070063#include <net/inet_common.h>
David S. Miller6e5714e2011-08-03 20:50:44 -070064#include <net/secure_seq.h>
Glauber Costad1a4c0b2011-12-11 21:47:04 +000065#include <net/tcp_memcontrol.h>
Eliezer Tamir076bb0c2013-07-10 17:13:17 +030066#include <net/busy_poll.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
Linus Torvalds1da177e2005-04-16 15:20:36 -070068#include <linux/proc_fs.h>
69#include <linux/seq_file.h>
70
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080071#include <linux/crypto.h>
72#include <linux/scatterlist.h>
73
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080074static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
Gui Jianfeng6edafaa2008-08-06 23:50:04 -070075static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
76 struct request_sock *req);
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Stephen Hemminger3b401a82009-09-01 19:25:04 +000080static const struct inet_connection_sock_af_ops ipv6_mapped;
81static const struct inet_connection_sock_af_ops ipv6_specific;
David S. Millera9286302006-11-14 19:53:22 -080082#ifdef CONFIG_TCP_MD5SIG
Stephen Hemmingerb2e4b3de2009-09-01 19:25:03 +000083static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
84static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090085#else
86static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +000087 const struct in6_addr *addr)
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090088{
89 return NULL;
90}
David S. Millera9286302006-11-14 19:53:22 -080091#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070092
Neal Cardwellfae6ef82012-08-19 03:30:38 +000093static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
94{
95 struct dst_entry *dst = skb_dst(skb);
96 const struct rt6_info *rt = (const struct rt6_info *)dst;
97
98 dst_hold(dst);
99 sk->sk_rx_dst = dst;
100 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
101 if (rt->rt6i_node)
102 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
103}
104
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105static void tcp_v6_hash(struct sock *sk)
106{
107 if (sk->sk_state != TCP_CLOSE) {
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -0800108 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 tcp_prot.hash(sk);
110 return;
111 }
112 local_bh_disable();
Eric Dumazet9327f702009-12-04 03:46:54 +0000113 __inet6_hash(sk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 local_bh_enable();
115 }
116}
117
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400118static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700120 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
121 ipv6_hdr(skb)->saddr.s6_addr32,
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700122 tcp_hdr(skb)->dest,
123 tcp_hdr(skb)->source);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124}
125
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900126static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 int addr_len)
128{
129 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900130 struct inet_sock *inet = inet_sk(sk);
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800131 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 struct ipv6_pinfo *np = inet6_sk(sk);
133 struct tcp_sock *tp = tcp_sk(sk);
Arnaud Ebalard20c59de2010-06-01 21:35:01 +0000134 struct in6_addr *saddr = NULL, *final_p, final;
David S. Miller493f3772010-12-02 12:14:29 -0800135 struct rt6_info *rt;
David S. Miller4c9483b2011-03-12 16:22:43 -0500136 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 struct dst_entry *dst;
138 int addr_type;
139 int err;
140
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900141 if (addr_len < SIN6_LEN_RFC2133)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 return -EINVAL;
143
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900144 if (usin->sin6_family != AF_INET6)
Eric Dumazeta02cec22010-09-22 20:43:57 +0000145 return -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146
David S. Miller4c9483b2011-03-12 16:22:43 -0500147 memset(&fl6, 0, sizeof(fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148
149 if (np->sndflow) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500150 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
151 IP6_ECN_flow_init(fl6.flowlabel);
152 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 struct ip6_flowlabel *flowlabel;
David S. Miller4c9483b2011-03-12 16:22:43 -0500154 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 if (flowlabel == NULL)
156 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 fl6_sock_release(flowlabel);
158 }
159 }
160
161 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900162 * connect() to INADDR_ANY means loopback (BSD'ism).
163 */
164
Weilong Chen4c99aa42013-12-19 18:44:34 +0800165 if (ipv6_addr_any(&usin->sin6_addr))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900166 usin->sin6_addr.s6_addr[15] = 0x1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
168 addr_type = ipv6_addr_type(&usin->sin6_addr);
169
Weilong Chen4c99aa42013-12-19 18:44:34 +0800170 if (addr_type & IPV6_ADDR_MULTICAST)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171 return -ENETUNREACH;
172
173 if (addr_type&IPV6_ADDR_LINKLOCAL) {
174 if (addr_len >= sizeof(struct sockaddr_in6) &&
175 usin->sin6_scope_id) {
176 /* If interface is set while binding, indices
177 * must coincide.
178 */
179 if (sk->sk_bound_dev_if &&
180 sk->sk_bound_dev_if != usin->sin6_scope_id)
181 return -EINVAL;
182
183 sk->sk_bound_dev_if = usin->sin6_scope_id;
184 }
185
186 /* Connect to link-local address requires an interface */
187 if (!sk->sk_bound_dev_if)
188 return -EINVAL;
189 }
190
191 if (tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700192 !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 tp->rx_opt.ts_recent = 0;
194 tp->rx_opt.ts_recent_stamp = 0;
195 tp->write_seq = 0;
196 }
197
Eric Dumazetefe42082013-10-03 15:42:29 -0700198 sk->sk_v6_daddr = usin->sin6_addr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500199 np->flow_label = fl6.flowlabel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
201 /*
202 * TCP over IPv4
203 */
204
205 if (addr_type == IPV6_ADDR_MAPPED) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800206 u32 exthdrlen = icsk->icsk_ext_hdr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207 struct sockaddr_in sin;
208
209 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
210
211 if (__ipv6_only_sock(sk))
212 return -ENETUNREACH;
213
214 sin.sin_family = AF_INET;
215 sin.sin_port = usin->sin6_port;
216 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
217
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800218 icsk->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 sk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800220#ifdef CONFIG_TCP_MD5SIG
221 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
222#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
224 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
225
226 if (err) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800227 icsk->icsk_ext_hdr_len = exthdrlen;
228 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 sk->sk_backlog_rcv = tcp_v6_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800230#ifdef CONFIG_TCP_MD5SIG
231 tp->af_specific = &tcp_sock_ipv6_specific;
232#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233 goto failure;
234 } else {
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000235 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
236 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
Eric Dumazetefe42082013-10-03 15:42:29 -0700237 &sk->sk_v6_rcv_saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238 }
239
240 return err;
241 }
242
Eric Dumazetefe42082013-10-03 15:42:29 -0700243 if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
244 saddr = &sk->sk_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245
David S. Miller4c9483b2011-03-12 16:22:43 -0500246 fl6.flowi6_proto = IPPROTO_TCP;
Eric Dumazetefe42082013-10-03 15:42:29 -0700247 fl6.daddr = sk->sk_v6_daddr;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000248 fl6.saddr = saddr ? *saddr : np->saddr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500249 fl6.flowi6_oif = sk->sk_bound_dev_if;
250 fl6.flowi6_mark = sk->sk_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500251 fl6.fl6_dport = usin->sin6_port;
252 fl6.fl6_sport = inet->inet_sport;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
David S. Miller4c9483b2011-03-12 16:22:43 -0500254 final_p = fl6_update_dst(&fl6, np->opt, &final);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
David S. Miller4c9483b2011-03-12 16:22:43 -0500256 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700257
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200258 dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800259 if (IS_ERR(dst)) {
260 err = PTR_ERR(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 goto failure;
David S. Miller14e50e52007-05-24 18:17:54 -0700262 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263
264 if (saddr == NULL) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500265 saddr = &fl6.saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700266 sk->sk_v6_rcv_saddr = *saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267 }
268
269 /* set the source address */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000270 np->saddr = *saddr;
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000271 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
Herbert Xuf83ef8c2006-06-30 13:37:03 -0700273 sk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -0700274 __ip6_dst_store(sk, dst, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275
David S. Miller493f3772010-12-02 12:14:29 -0800276 rt = (struct rt6_info *) dst;
277 if (tcp_death_row.sysctl_tw_recycle &&
278 !tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700279 ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
David S. Miller81166dd2012-07-10 03:14:24 -0700280 tcp_fetch_timewait_stamp(sk, dst);
David S. Miller493f3772010-12-02 12:14:29 -0800281
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800282 icsk->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283 if (np->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800284 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
285 np->opt->opt_nflen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286
287 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
288
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000289 inet->inet_dport = usin->sin6_port;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290
291 tcp_set_state(sk, TCP_SYN_SENT);
Arnaldo Carvalho de Melod8313f52005-12-13 23:25:44 -0800292 err = inet6_hash_connect(&tcp_death_row, sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 if (err)
294 goto late_failure;
295
Andrey Vagin2b916472012-11-22 01:13:58 +0000296 if (!tp->write_seq && likely(!tp->repair))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
Eric Dumazetefe42082013-10-03 15:42:29 -0700298 sk->sk_v6_daddr.s6_addr32,
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000299 inet->inet_sport,
300 inet->inet_dport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301
302 err = tcp_connect(sk);
303 if (err)
304 goto late_failure;
305
306 return 0;
307
308late_failure:
309 tcp_set_state(sk, TCP_CLOSE);
310 __sk_dst_reset(sk);
311failure:
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000312 inet->inet_dport = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313 sk->sk_route_caps = 0;
314 return err;
315}
316
Eric Dumazet563d34d2012-07-23 09:48:52 +0200317static void tcp_v6_mtu_reduced(struct sock *sk)
318{
319 struct dst_entry *dst;
320
321 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
322 return;
323
324 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
325 if (!dst)
326 return;
327
328 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
329 tcp_sync_mss(sk, dst_mtu(dst));
330 tcp_simple_retransmit(sk);
331 }
332}
333
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
Brian Haleyd5fdd6b2009-06-23 04:31:07 -0700335 u8 type, u8 code, int offset, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336{
Weilong Chen4c99aa42013-12-19 18:44:34 +0800337 const struct ipv6hdr *hdr = (const struct ipv6hdr *)skb->data;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -0300338 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 struct ipv6_pinfo *np;
340 struct sock *sk;
341 int err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900342 struct tcp_sock *tp;
Yuchung Cheng0a672f72014-05-11 20:22:12 -0700343 struct request_sock *fastopen;
344 __u32 seq, snd_una;
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700345 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700347 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800348 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 if (sk == NULL) {
Denis V. Luneve41b5362008-10-08 10:33:26 -0700351 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
352 ICMP6_MIB_INERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353 return;
354 }
355
356 if (sk->sk_state == TCP_TIME_WAIT) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700357 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 return;
359 }
360
361 bh_lock_sock(sk);
Eric Dumazet563d34d2012-07-23 09:48:52 +0200362 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700363 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364
365 if (sk->sk_state == TCP_CLOSE)
366 goto out;
367
Stephen Hemmingere802af92010-04-22 15:24:53 -0700368 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
369 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
370 goto out;
371 }
372
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373 tp = tcp_sk(sk);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900374 seq = ntohl(th->seq);
Yuchung Cheng0a672f72014-05-11 20:22:12 -0700375 /* XXX (TFO) - tp->snd_una should be ISN (tcp_create_openreq_child() */
376 fastopen = tp->fastopen_rsk;
377 snd_una = fastopen ? tcp_rsk(fastopen)->snt_isn : tp->snd_una;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378 if (sk->sk_state != TCP_LISTEN &&
Yuchung Cheng0a672f72014-05-11 20:22:12 -0700379 !between(seq, snd_una, tp->snd_nxt)) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700380 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 goto out;
382 }
383
384 np = inet6_sk(sk);
385
David S. Millerec18d9a2012-07-12 00:25:15 -0700386 if (type == NDISC_REDIRECT) {
387 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
388
David S. Miller1ed5c482012-07-12 00:41:25 -0700389 if (dst)
David S. Miller6700c272012-07-17 03:29:28 -0700390 dst->ops->redirect(dst, sk, skb);
Christoph Paasch50a75a82013-04-07 04:53:15 +0000391 goto out;
David S. Millerec18d9a2012-07-12 00:25:15 -0700392 }
393
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 if (type == ICMPV6_PKT_TOOBIG) {
Eric Dumazet0d4f0602013-03-18 07:01:28 +0000395 /* We are not interested in TCP_LISTEN and open_requests
396 * (SYN-ACKs send out by Linux are always <576bytes so
397 * they should go through unfragmented).
398 */
399 if (sk->sk_state == TCP_LISTEN)
400 goto out;
401
Hannes Frederic Sowa93b36cf2013-12-15 03:41:14 +0100402 if (!ip6_sk_accept_pmtu(sk))
403 goto out;
404
Eric Dumazet563d34d2012-07-23 09:48:52 +0200405 tp->mtu_info = ntohl(info);
406 if (!sock_owned_by_user(sk))
407 tcp_v6_mtu_reduced(sk);
Julian Anastasovd013ef2a2012-09-05 10:53:18 +0000408 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
409 &tp->tsq_flags))
410 sock_hold(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411 goto out;
412 }
413
414 icmpv6_err_convert(type, code, &err);
415
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700416 /* Might be for an request_sock */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 switch (sk->sk_state) {
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700418 struct request_sock *req, **prev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700419 case TCP_LISTEN:
420 if (sock_owned_by_user(sk))
421 goto out;
422
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800423 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
424 &hdr->saddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425 if (!req)
426 goto out;
427
428 /* ICMPs are not backlogged, hence we cannot get
429 * an established socket here.
430 */
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700431 WARN_ON(req->sk != NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700433 if (seq != tcp_rsk(req)->snt_isn) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700434 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 goto out;
436 }
437
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -0700438 inet_csk_reqsk_queue_drop(sk, req, prev);
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000439 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700440 goto out;
441
442 case TCP_SYN_SENT:
Yuchung Cheng0a672f72014-05-11 20:22:12 -0700443 case TCP_SYN_RECV:
444 /* Only in fast or simultaneous open. If a fast open socket is
445 * is already accepted it is treated as a connected one below.
446 */
447 if (fastopen && fastopen->sk == NULL)
448 break;
449
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450 if (!sock_owned_by_user(sk)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700451 sk->sk_err = err;
452 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
453
454 tcp_done(sk);
455 } else
456 sk->sk_err_soft = err;
457 goto out;
458 }
459
460 if (!sock_owned_by_user(sk) && np->recverr) {
461 sk->sk_err = err;
462 sk->sk_error_report(sk);
463 } else
464 sk->sk_err_soft = err;
465
466out:
467 bh_unlock_sock(sk);
468 sock_put(sk);
469}
470
471
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000472static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
Octavian Purdilad6274bd2014-06-25 17:09:58 +0300473 struct flowi *fl,
Neal Cardwell3840a062012-06-28 12:34:19 +0000474 struct request_sock *req,
Daniel Lee3a19ce02014-05-11 20:22:13 -0700475 u16 queue_mapping,
476 struct tcp_fastopen_cookie *foc)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700477{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700478 struct inet_request_sock *ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479 struct ipv6_pinfo *np = inet6_sk(sk);
Octavian Purdilad6274bd2014-06-25 17:09:58 +0300480 struct flowi6 *fl6 = &fl->u.ip6;
Weilong Chen4c99aa42013-12-19 18:44:34 +0800481 struct sk_buff *skb;
Neal Cardwell94942182012-06-28 12:34:20 +0000482 int err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000484 /* First, grab a route. */
485 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800486 goto done;
Neal Cardwell94942182012-06-28 12:34:20 +0000487
Daniel Lee3a19ce02014-05-11 20:22:13 -0700488 skb = tcp_make_synack(sk, dst, req, foc);
Neal Cardwell94942182012-06-28 12:34:20 +0000489
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490 if (skb) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700491 __tcp_v6_send_check(skb, &ireq->ir_v6_loc_addr,
492 &ireq->ir_v6_rmt_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493
Eric Dumazet634fb9792013-10-09 15:21:29 -0700494 fl6->daddr = ireq->ir_v6_rmt_addr;
Florent Fourcotdf3687f2014-01-17 17:15:03 +0100495 if (np->repflow && (ireq->pktopts != NULL))
496 fl6->flowlabel = ip6_flowlabel(ipv6_hdr(ireq->pktopts));
497
Eric Dumazetfff32692012-06-01 01:47:50 +0000498 skb_set_queue_mapping(skb, queue_mapping);
RongQing.Li43264e02012-07-01 17:18:59 +0000499 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
Gerrit Renkerb9df3cb2006-11-14 11:21:36 -0200500 err = net_xmit_eval(err);
Octavian Purdilaaa27fc52014-06-25 17:09:51 +0300501 if (!tcp_rsk(req)->snt_synack && !err)
502 tcp_rsk(req)->snt_synack = tcp_time_stamp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503 }
504
505done:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506 return err;
507}
508
Octavian Purdila72659ec2010-01-17 19:09:39 -0800509
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700510static void tcp_v6_reqsk_destructor(struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700512 kfree_skb(inet_rsk(req)->pktopts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513}
514
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800515#ifdef CONFIG_TCP_MD5SIG
516static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000517 const struct in6_addr *addr)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800518{
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000519 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800520}
521
522static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
523 struct sock *addr_sk)
524{
Eric Dumazetefe42082013-10-03 15:42:29 -0700525 return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800526}
527
528static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
529 struct request_sock *req)
530{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700531 return tcp_v6_md5_do_lookup(sk, &inet_rsk(req)->ir_v6_rmt_addr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800532}
533
Wang Yufen4aa956d2014-03-29 09:27:29 +0800534static int tcp_v6_parse_md5_keys(struct sock *sk, char __user *optval,
535 int optlen)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800536{
537 struct tcp_md5sig cmd;
538 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800539
540 if (optlen < sizeof(cmd))
541 return -EINVAL;
542
543 if (copy_from_user(&cmd, optval, sizeof(cmd)))
544 return -EFAULT;
545
546 if (sin6->sin6_family != AF_INET6)
547 return -EINVAL;
548
549 if (!cmd.tcpm_keylen) {
Brian Haleye773e4f2007-08-24 23:16:08 -0700550 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000551 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
552 AF_INET);
553 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
554 AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800555 }
556
557 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
558 return -EINVAL;
559
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000560 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
561 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
562 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800563
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000564 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
565 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800566}
567
Adam Langley49a72df2008-07-19 00:01:42 -0700568static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000569 const struct in6_addr *daddr,
570 const struct in6_addr *saddr, int nbytes)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800571{
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800572 struct tcp6_pseudohdr *bp;
Adam Langley49a72df2008-07-19 00:01:42 -0700573 struct scatterlist sg;
YOSHIFUJI Hideaki8d26d762008-04-17 13:19:16 +0900574
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800575 bp = &hp->md5_blk.ip6;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800576 /* 1. TCP pseudo-header (RFC2460) */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000577 bp->saddr = *saddr;
578 bp->daddr = *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700579 bp->protocol = cpu_to_be32(IPPROTO_TCP);
Adam Langley00b13042008-07-31 21:36:07 -0700580 bp->len = cpu_to_be32(nbytes);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800581
Adam Langley49a72df2008-07-19 00:01:42 -0700582 sg_init_one(&sg, bp, sizeof(*bp));
583 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
584}
David S. Millerc7da57a2007-10-26 00:41:21 -0700585
Adam Langley49a72df2008-07-19 00:01:42 -0700586static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000587 const struct in6_addr *daddr, struct in6_addr *saddr,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400588 const struct tcphdr *th)
Adam Langley49a72df2008-07-19 00:01:42 -0700589{
590 struct tcp_md5sig_pool *hp;
591 struct hash_desc *desc;
592
593 hp = tcp_get_md5sig_pool();
594 if (!hp)
595 goto clear_hash_noput;
596 desc = &hp->md5_desc;
597
598 if (crypto_hash_init(desc))
599 goto clear_hash;
600 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
601 goto clear_hash;
602 if (tcp_md5_hash_header(hp, th))
603 goto clear_hash;
604 if (tcp_md5_hash_key(hp, key))
605 goto clear_hash;
606 if (crypto_hash_final(desc, md5_hash))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800607 goto clear_hash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800608
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800609 tcp_put_md5sig_pool();
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800610 return 0;
Adam Langley49a72df2008-07-19 00:01:42 -0700611
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800612clear_hash:
613 tcp_put_md5sig_pool();
614clear_hash_noput:
615 memset(md5_hash, 0, 16);
Adam Langley49a72df2008-07-19 00:01:42 -0700616 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800617}
618
Adam Langley49a72df2008-07-19 00:01:42 -0700619static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400620 const struct sock *sk,
621 const struct request_sock *req,
622 const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800623{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000624 const struct in6_addr *saddr, *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700625 struct tcp_md5sig_pool *hp;
626 struct hash_desc *desc;
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400627 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800628
629 if (sk) {
630 saddr = &inet6_sk(sk)->saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700631 daddr = &sk->sk_v6_daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700632 } else if (req) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700633 saddr = &inet_rsk(req)->ir_v6_loc_addr;
634 daddr = &inet_rsk(req)->ir_v6_rmt_addr;
Adam Langley49a72df2008-07-19 00:01:42 -0700635 } else {
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000636 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Adam Langley49a72df2008-07-19 00:01:42 -0700637 saddr = &ip6h->saddr;
638 daddr = &ip6h->daddr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800639 }
Adam Langley49a72df2008-07-19 00:01:42 -0700640
641 hp = tcp_get_md5sig_pool();
642 if (!hp)
643 goto clear_hash_noput;
644 desc = &hp->md5_desc;
645
646 if (crypto_hash_init(desc))
647 goto clear_hash;
648
649 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
650 goto clear_hash;
651 if (tcp_md5_hash_header(hp, th))
652 goto clear_hash;
653 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
654 goto clear_hash;
655 if (tcp_md5_hash_key(hp, key))
656 goto clear_hash;
657 if (crypto_hash_final(desc, md5_hash))
658 goto clear_hash;
659
660 tcp_put_md5sig_pool();
661 return 0;
662
663clear_hash:
664 tcp_put_md5sig_pool();
665clear_hash_noput:
666 memset(md5_hash, 0, 16);
667 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800668}
669
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400670static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800671{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400672 const __u8 *hash_location = NULL;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800673 struct tcp_md5sig_key *hash_expected;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000674 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400675 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800676 int genhash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800677 u8 newhash[16];
678
679 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
YOSHIFUJI Hideaki7d5d5522008-04-17 12:29:53 +0900680 hash_location = tcp_parse_md5sig_option(th);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800681
David S. Miller785957d2008-07-30 03:03:15 -0700682 /* We've parsed the options - do we have a hash? */
683 if (!hash_expected && !hash_location)
684 return 0;
685
686 if (hash_expected && !hash_location) {
687 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800688 return 1;
689 }
690
David S. Miller785957d2008-07-30 03:03:15 -0700691 if (!hash_expected && hash_location) {
692 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800693 return 1;
694 }
695
696 /* check the signature */
Adam Langley49a72df2008-07-19 00:01:42 -0700697 genhash = tcp_v6_md5_hash_skb(newhash,
698 hash_expected,
699 NULL, NULL, skb);
700
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800701 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
Joe Perchese87cc472012-05-13 21:56:26 +0000702 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
703 genhash ? "failed" : "mismatch",
704 &ip6h->saddr, ntohs(th->source),
705 &ip6h->daddr, ntohs(th->dest));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800706 return 1;
707 }
708 return 0;
709}
710#endif
711
Octavian Purdila16bea702014-06-25 17:09:53 +0300712static void tcp_v6_init_req(struct request_sock *req, struct sock *sk,
713 struct sk_buff *skb)
714{
715 struct inet_request_sock *ireq = inet_rsk(req);
716 struct ipv6_pinfo *np = inet6_sk(sk);
717
718 ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
719 ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
720
721 ireq->ir_iif = sk->sk_bound_dev_if;
722
723 /* So that link locals have meaning */
724 if (!sk->sk_bound_dev_if &&
725 ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
726 ireq->ir_iif = inet6_iif(skb);
727
728 if (!TCP_SKB_CB(skb)->when &&
729 (ipv6_opt_accepted(sk, skb) || np->rxopt.bits.rxinfo ||
730 np->rxopt.bits.rxoinfo || np->rxopt.bits.rxhlim ||
731 np->rxopt.bits.rxohlim || np->repflow)) {
732 atomic_inc(&skb->users);
733 ireq->pktopts = skb;
734 }
735}
736
Octavian Purdilad94e0412014-06-25 17:09:55 +0300737static struct dst_entry *tcp_v6_route_req(struct sock *sk, struct flowi *fl,
738 const struct request_sock *req,
739 bool *strict)
740{
741 if (strict)
742 *strict = true;
743 return inet6_csk_route_req(sk, &fl->u.ip6, req);
744}
745
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800746struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747 .family = AF_INET6,
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700748 .obj_size = sizeof(struct tcp6_request_sock),
Octavian Purdila5db92c92014-06-25 17:09:59 +0300749 .rtx_syn_ack = tcp_rtx_synack,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700750 .send_ack = tcp_v6_reqsk_send_ack,
751 .destructor = tcp_v6_reqsk_destructor,
Octavian Purdila72659ec2010-01-17 19:09:39 -0800752 .send_reset = tcp_v6_send_reset,
Wang Yufen4aa956d2014-03-29 09:27:29 +0800753 .syn_ack_timeout = tcp_syn_ack_timeout,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754};
755
Stephen Hemmingerb2e4b3de2009-09-01 19:25:03 +0000756static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
Octavian Purdila16bea702014-06-25 17:09:53 +0300757#ifdef CONFIG_TCP_MD5SIG
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800758 .md5_lookup = tcp_v6_reqsk_md5_lookup,
John Dykstrae3afe7b2009-07-16 05:04:51 +0000759 .calc_md5_hash = tcp_v6_md5_hash_skb,
Andrew Mortonb6332e62006-11-30 19:16:28 -0800760#endif
Octavian Purdila16bea702014-06-25 17:09:53 +0300761 .init_req = tcp_v6_init_req,
Octavian Purdilafb7b37a2014-06-25 17:09:54 +0300762#ifdef CONFIG_SYN_COOKIES
763 .cookie_init_seq = cookie_v6_init_sequence,
764#endif
Octavian Purdilad94e0412014-06-25 17:09:55 +0300765 .route_req = tcp_v6_route_req,
Octavian Purdila936b8bd2014-06-25 17:09:57 +0300766 .init_seq = tcp_v6_init_sequence,
Octavian Purdilad6274bd2014-06-25 17:09:58 +0300767 .send_synack = tcp_v6_send_synack,
Octavian Purdila16bea702014-06-25 17:09:53 +0300768};
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800769
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700770static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
Wang Yufen9c76a112014-03-29 09:27:31 +0800771 u32 tsval, u32 tsecr, int oif,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100772 struct tcp_md5sig_key *key, int rst, u8 tclass,
773 u32 label)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400775 const struct tcphdr *th = tcp_hdr(skb);
776 struct tcphdr *t1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 struct sk_buff *buff;
David S. Miller4c9483b2011-03-12 16:22:43 -0500778 struct flowi6 fl6;
Eric Dumazetadf30902009-06-02 05:19:30 +0000779 struct net *net = dev_net(skb_dst(skb)->dev);
Daniel Lezcanoe5047992008-03-07 11:16:26 -0800780 struct sock *ctl_sk = net->ipv6.tcp_sk;
YOSHIFUJI Hideaki9cb57342008-01-12 02:16:03 -0800781 unsigned int tot_len = sizeof(struct tcphdr);
Eric Dumazetadf30902009-06-02 05:19:30 +0000782 struct dst_entry *dst;
Al Viroe69a4ad2006-11-14 20:56:00 -0800783 __be32 *topt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700784
Andrey Vaginee684b62013-02-11 05:50:19 +0000785 if (tsecr)
YOSHIFUJI Hideaki4244f8a2006-10-10 19:40:50 -0700786 tot_len += TCPOLEN_TSTAMP_ALIGNED;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800787#ifdef CONFIG_TCP_MD5SIG
788 if (key)
789 tot_len += TCPOLEN_MD5SIG_ALIGNED;
790#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700791
792 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
793 GFP_ATOMIC);
794 if (buff == NULL)
795 return;
796
797 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
798
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700799 t1 = (struct tcphdr *) skb_push(buff, tot_len);
Herbert Xu6651ffc2010-04-21 00:47:15 -0700800 skb_reset_transport_header(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700801
802 /* Swap the send and the receive. */
803 memset(t1, 0, sizeof(*t1));
804 t1->dest = th->source;
805 t1->source = th->dest;
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700806 t1->doff = tot_len / 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700807 t1->seq = htonl(seq);
808 t1->ack_seq = htonl(ack);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700809 t1->ack = !rst || !th->ack;
810 t1->rst = rst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700811 t1->window = htons(win);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800812
Al Viroe69a4ad2006-11-14 20:56:00 -0800813 topt = (__be32 *)(t1 + 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900814
Andrey Vaginee684b62013-02-11 05:50:19 +0000815 if (tsecr) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800816 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
817 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
Andrey Vaginee684b62013-02-11 05:50:19 +0000818 *topt++ = htonl(tsval);
819 *topt++ = htonl(tsecr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700820 }
821
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800822#ifdef CONFIG_TCP_MD5SIG
823 if (key) {
824 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
825 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
Adam Langley49a72df2008-07-19 00:01:42 -0700826 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
Adam Langley90b7e112008-07-31 20:49:48 -0700827 &ipv6_hdr(skb)->saddr,
828 &ipv6_hdr(skb)->daddr, t1);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800829 }
830#endif
831
David S. Miller4c9483b2011-03-12 16:22:43 -0500832 memset(&fl6, 0, sizeof(fl6));
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000833 fl6.daddr = ipv6_hdr(skb)->saddr;
834 fl6.saddr = ipv6_hdr(skb)->daddr;
Florent Fourcot1d13a962014-01-16 17:21:22 +0100835 fl6.flowlabel = label;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700836
David S. Millere5700af2010-04-21 14:59:20 -0700837 buff->ip_summed = CHECKSUM_PARTIAL;
838 buff->csum = 0;
839
David S. Miller4c9483b2011-03-12 16:22:43 -0500840 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841
David S. Miller4c9483b2011-03-12 16:22:43 -0500842 fl6.flowi6_proto = IPPROTO_TCP;
Lorenzo Colittia36dbdb2014-04-11 13:19:12 +0900843 if (rt6_need_strict(&fl6.daddr) && !oif)
Alexey Kuznetsov4c675252012-10-12 04:34:17 +0000844 fl6.flowi6_oif = inet6_iif(skb);
Wang Yufen9c76a112014-03-29 09:27:31 +0800845 else
846 fl6.flowi6_oif = oif;
Lorenzo Colittie1108612014-05-13 10:17:33 -0700847 fl6.flowi6_mark = IP6_REPLY_MARK(net, skb->mark);
David S. Miller1958b852011-03-12 16:36:19 -0500848 fl6.fl6_dport = t1->dest;
849 fl6.fl6_sport = t1->source;
David S. Miller4c9483b2011-03-12 16:22:43 -0500850 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700852 /* Pass a socket to ip6_dst_lookup either it is for RST
853 * Underlying function will use this to retrieve the network
854 * namespace
855 */
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200856 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800857 if (!IS_ERR(dst)) {
858 skb_dst_set(buff, dst);
Eric Dumazetb903d322011-10-27 00:44:35 -0400859 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800860 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
861 if (rst)
862 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
863 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864 }
865
866 kfree_skb(buff);
867}
868
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700869static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
870{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400871 const struct tcphdr *th = tcp_hdr(skb);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700872 u32 seq = 0, ack_seq = 0;
Guo-Fu Tsengfa3e5b42008-10-09 21:11:56 -0700873 struct tcp_md5sig_key *key = NULL;
Shawn Lu658ddaa2012-01-31 22:35:48 +0000874#ifdef CONFIG_TCP_MD5SIG
875 const __u8 *hash_location = NULL;
876 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
877 unsigned char newhash[16];
878 int genhash;
879 struct sock *sk1 = NULL;
880#endif
Wang Yufen9c76a112014-03-29 09:27:31 +0800881 int oif;
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700882
883 if (th->rst)
884 return;
885
886 if (!ipv6_unicast_destination(skb))
887 return;
888
889#ifdef CONFIG_TCP_MD5SIG
Shawn Lu658ddaa2012-01-31 22:35:48 +0000890 hash_location = tcp_parse_md5sig_option(th);
891 if (!sk && hash_location) {
892 /*
893 * active side is lost. Try to find listening socket through
894 * source port, and then find md5 key through listening socket.
895 * we are not loose security here:
896 * Incoming packet is checked with md5 hash with finding key,
897 * no RST generated if md5 hash doesn't match.
898 */
899 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
Tom Herbert5ba24952013-01-22 09:50:39 +0000900 &tcp_hashinfo, &ipv6h->saddr,
901 th->source, &ipv6h->daddr,
Shawn Lu658ddaa2012-01-31 22:35:48 +0000902 ntohs(th->source), inet6_iif(skb));
903 if (!sk1)
904 return;
905
906 rcu_read_lock();
907 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
908 if (!key)
909 goto release_sk1;
910
911 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
912 if (genhash || memcmp(hash_location, newhash, 16) != 0)
913 goto release_sk1;
914 } else {
915 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
916 }
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700917#endif
918
919 if (th->ack)
920 seq = ntohl(th->ack_seq);
921 else
922 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
923 (th->doff << 2);
924
Wang Yufen9c76a112014-03-29 09:27:31 +0800925 oif = sk ? sk->sk_bound_dev_if : 0;
926 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, oif, key, 1, 0, 0);
Shawn Lu658ddaa2012-01-31 22:35:48 +0000927
928#ifdef CONFIG_TCP_MD5SIG
929release_sk1:
930 if (sk1) {
931 rcu_read_unlock();
932 sock_put(sk1);
933 }
934#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700935}
936
Andrey Vaginee684b62013-02-11 05:50:19 +0000937static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
Wang Yufen9c76a112014-03-29 09:27:31 +0800938 u32 win, u32 tsval, u32 tsecr, int oif,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100939 struct tcp_md5sig_key *key, u8 tclass,
940 u32 label)
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700941{
Wang Yufen9c76a112014-03-29 09:27:31 +0800942 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, oif, key, 0, tclass,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100943 label);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700944}
945
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
947{
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700948 struct inet_timewait_sock *tw = inet_twsk(sk);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800949 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700950
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +0900951 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700952 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
Andrey Vaginee684b62013-02-11 05:50:19 +0000953 tcp_time_stamp + tcptw->tw_ts_offset,
Wang Yufen9c76a112014-03-29 09:27:31 +0800954 tcptw->tw_ts_recent, tw->tw_bound_dev_if, tcp_twsk_md5_key(tcptw),
Florent Fourcot1d13a962014-01-16 17:21:22 +0100955 tw->tw_tclass, (tw->tw_flowlabel << 12));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700956
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700957 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700958}
959
Gui Jianfeng6edafaa2008-08-06 23:50:04 -0700960static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
961 struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700962{
Daniel Lee3a19ce02014-05-11 20:22:13 -0700963 /* sk->sk_state == TCP_LISTEN -> for regular TCP_SYN_RECV
964 * sk->sk_state == TCP_SYN_RECV -> for Fast Open.
965 */
966 tcp_v6_send_ack(skb, (sk->sk_state == TCP_LISTEN) ?
967 tcp_rsk(req)->snt_isn + 1 : tcp_sk(sk)->snd_nxt,
968 tcp_rsk(req)->rcv_nxt,
Wang Yufen9c76a112014-03-29 09:27:31 +0800969 req->rcv_wnd, tcp_time_stamp, req->ts_recent, sk->sk_bound_dev_if,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100970 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr),
971 0, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700972}
973
974
Weilong Chen4c99aa42013-12-19 18:44:34 +0800975static struct sock *tcp_v6_hnd_req(struct sock *sk, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700976{
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700977 struct request_sock *req, **prev;
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700978 const struct tcphdr *th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700979 struct sock *nsk;
980
981 /* Find possible connection requests. */
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800982 req = inet6_csk_search_req(sk, &prev, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700983 &ipv6_hdr(skb)->saddr,
984 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700985 if (req)
Jerry Chu83368862012-08-31 12:29:12 +0000986 return tcp_check_req(sk, skb, req, prev, false);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700987
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900988 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800989 &ipv6_hdr(skb)->saddr, th->source,
990 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700991
992 if (nsk) {
993 if (nsk->sk_state != TCP_TIME_WAIT) {
994 bh_lock_sock(nsk);
995 return nsk;
996 }
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700997 inet_twsk_put(inet_twsk(nsk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700998 return NULL;
999 }
1000
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001001#ifdef CONFIG_SYN_COOKIES
Florian Westphalaf9b4732010-06-03 00:43:44 +00001002 if (!th->syn)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001003 sk = cookie_v6_check(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001004#endif
1005 return sk;
1006}
1007
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008/* FIXME: this is substantially similar to the ipv4 code.
1009 * Can some kind of merge be done? -- erics
1010 */
1011static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1012{
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001013 struct tcp_options_received tmp_opt;
1014 struct request_sock *req;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001015 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001016 struct tcp_sock *tp = tcp_sk(sk);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001017 __u32 isn = TCP_SKB_CB(skb)->when;
David S. Miller493f3772010-12-02 12:14:29 -08001018 struct dst_entry *dst = NULL;
Daniel Lee3a19ce02014-05-11 20:22:13 -07001019 struct tcp_fastopen_cookie foc = { .len = -1 };
1020 bool want_cookie = false, fastopen;
Neal Cardwell3840a062012-06-28 12:34:19 +00001021 struct flowi6 fl6;
Octavian Purdila16bea702014-06-25 17:09:53 +03001022 const struct tcp_request_sock_ops *af_ops;
Daniel Lee3a19ce02014-05-11 20:22:13 -07001023 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001024
1025 if (skb->protocol == htons(ETH_P_IP))
1026 return tcp_v4_conn_request(sk, skb);
1027
1028 if (!ipv6_unicast_destination(skb))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001029 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001030
Hannes Frederic Sowa5ad37d52013-07-26 17:43:23 +02001031 if ((sysctl_tcp_syncookies == 2 ||
1032 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
Eric Dumazet946cedc2011-08-30 03:21:44 +00001033 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
1034 if (!want_cookie)
1035 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036 }
1037
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001038 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
1039 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001040 goto drop;
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001041 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001042
Octavian Purdila476eab82014-06-25 17:09:52 +03001043 req = inet_reqsk_alloc(&tcp6_request_sock_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001044 if (req == NULL)
1045 goto drop;
1046
Octavian Purdila16bea702014-06-25 17:09:53 +03001047 af_ops = tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001048
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049 tcp_clear_options(&tmp_opt);
1050 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1051 tmp_opt.user_mss = tp->rx_opt.user_mss;
Daniel Lee3a19ce02014-05-11 20:22:13 -07001052 tcp_parse_options(skb, &tmp_opt, 0, want_cookie ? NULL : &foc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053
Florian Westphal4dfc2812008-04-10 03:12:40 -07001054 if (want_cookie && !tmp_opt.saw_tstamp)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001055 tcp_clear_options(&tmp_opt);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001056
Linus Torvalds1da177e2005-04-16 15:20:36 -07001057 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
Octavian Purdilae0f802f2014-06-17 11:25:37 +03001058 tcp_openreq_init(req, &tmp_opt, skb, sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001059
Eric Dumazet634fb9792013-10-09 15:21:29 -07001060 ireq = inet_rsk(req);
Octavian Purdila16bea702014-06-25 17:09:53 +03001061 af_ops->init_req(req, sk, skb);
1062
Octavian Purdila94037152014-06-25 17:09:56 +03001063 if (security_inet_conn_request(sk, skb, req))
1064 goto drop_and_release;
1065
Florian Westphal172d69e2010-06-21 11:48:45 +00001066 if (!want_cookie || tmp_opt.tstamp_ok)
Hannes Frederic Sowa5d134f12013-01-05 16:10:48 +00001067 TCP_ECN_create_request(req, skb, sock_net(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001068
Octavian Purdila94037152014-06-25 17:09:56 +03001069 if (want_cookie) {
1070 isn = cookie_init_sequence(af_ops, sk, skb, &req->mss);
1071 req->cookie_ts = tmp_opt.tstamp_ok;
1072 } else if (!isn) {
David S. Miller493f3772010-12-02 12:14:29 -08001073 /* VJ's idea. We save last timestamp seen
1074 * from the destination in peer table, when entering
1075 * state TIME-WAIT, and check against it before
1076 * accepting new connection request.
1077 *
1078 * If "isn" is not zero, this request hit alive
1079 * timewait bucket, so that all the necessary checks
1080 * are made in the function processing timewait state.
1081 */
Octavian Purdilad94e0412014-06-25 17:09:55 +03001082 if (tmp_opt.saw_tstamp && tcp_death_row.sysctl_tw_recycle) {
1083 dst = af_ops->route_req(sk, (struct flowi *)&fl6, req,
1084 NULL);
1085 if (dst && !tcp_peer_is_proven(req, dst, true)) {
David S. Miller493f3772010-12-02 12:14:29 -08001086 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1087 goto drop_and_release;
1088 }
1089 }
1090 /* Kill the following clause, if you dislike this way. */
1091 else if (!sysctl_tcp_syncookies &&
1092 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1093 (sysctl_max_syn_backlog >> 2)) &&
David S. Miller81166dd2012-07-10 03:14:24 -07001094 !tcp_peer_is_proven(req, dst, false)) {
David S. Miller493f3772010-12-02 12:14:29 -08001095 /* Without syncookies last quarter of
1096 * backlog is filled with destinations,
1097 * proven to be alive.
1098 * It means that we continue to communicate
1099 * to destinations, already remembered
1100 * to the moment of synflood.
1101 */
1102 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
Eric Dumazet634fb9792013-10-09 15:21:29 -07001103 &ireq->ir_v6_rmt_addr, ntohs(tcp_hdr(skb)->source));
David S. Miller493f3772010-12-02 12:14:29 -08001104 goto drop_and_release;
1105 }
1106
Octavian Purdila936b8bd2014-06-25 17:09:57 +03001107 isn = af_ops->init_seq(skb);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001108 }
Venkat Yekkirala4237c752006-07-24 23:32:50 -07001109
Octavian Purdilad94e0412014-06-25 17:09:55 +03001110 if (!dst) {
1111 dst = af_ops->route_req(sk, (struct flowi *)&fl6, req, NULL);
1112 if (!dst)
1113 goto drop_and_free;
1114 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115
Daniel Lee3a19ce02014-05-11 20:22:13 -07001116 tcp_rsk(req)->snt_isn = isn;
Daniel Lee3a19ce02014-05-11 20:22:13 -07001117 tcp_openreq_init_rwin(req, sk, dst);
1118 fastopen = !want_cookie &&
1119 tcp_try_fastopen(sk, skb, req, &foc, dst);
Octavian Purdilad6274bd2014-06-25 17:09:58 +03001120 err = af_ops->send_synack(sk, dst, (struct flowi *)&fl6, req,
1121 skb_get_queue_mapping(skb), &foc);
Daniel Lee3a19ce02014-05-11 20:22:13 -07001122 if (!fastopen) {
1123 if (err || want_cookie)
1124 goto drop_and_free;
1125
1126 tcp_rsk(req)->listener = NULL;
1127 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1128 }
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001129 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001130
David S. Miller493f3772010-12-02 12:14:29 -08001131drop_and_release:
1132 dst_release(dst);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001133drop_and_free:
1134 reqsk_free(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001135drop:
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001136 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137 return 0; /* don't send reset */
1138}
1139
Weilong Chen4c99aa42013-12-19 18:44:34 +08001140static struct sock *tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1141 struct request_sock *req,
1142 struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143{
Eric Dumazet634fb9792013-10-09 15:21:29 -07001144 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1146 struct tcp6_sock *newtcp6sk;
1147 struct inet_sock *newinet;
1148 struct tcp_sock *newtp;
1149 struct sock *newsk;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001150#ifdef CONFIG_TCP_MD5SIG
1151 struct tcp_md5sig_key *key;
1152#endif
Neal Cardwell3840a062012-06-28 12:34:19 +00001153 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154
1155 if (skb->protocol == htons(ETH_P_IP)) {
1156 /*
1157 * v6 mapped
1158 */
1159
1160 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1161
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001162 if (newsk == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163 return NULL;
1164
1165 newtcp6sk = (struct tcp6_sock *)newsk;
1166 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1167
1168 newinet = inet_sk(newsk);
1169 newnp = inet6_sk(newsk);
1170 newtp = tcp_sk(newsk);
1171
1172 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1173
Eric Dumazetefe42082013-10-03 15:42:29 -07001174 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001175
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001176 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177
Eric Dumazetefe42082013-10-03 15:42:29 -07001178 newsk->sk_v6_rcv_saddr = newnp->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001179
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001180 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001181 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001182#ifdef CONFIG_TCP_MD5SIG
1183 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1184#endif
1185
Yan, Zheng676a1182011-09-25 02:21:30 +00001186 newnp->ipv6_ac_list = NULL;
1187 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188 newnp->pktoptions = NULL;
1189 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001190 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001191 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001192 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001193 if (np->repflow)
1194 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001196 /*
1197 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1198 * here, tcp_create_openreq_child now does this for us, see the comment in
1199 * that function for the gory details. -acme
Linus Torvalds1da177e2005-04-16 15:20:36 -07001200 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201
1202 /* It is tricky place. Until this moment IPv4 tcp
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001203 worked with IPv6 icsk.icsk_af_ops.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204 Sync it now.
1205 */
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001206 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207
1208 return newsk;
1209 }
1210
Eric Dumazet634fb9792013-10-09 15:21:29 -07001211 ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001212
1213 if (sk_acceptq_is_full(sk))
1214 goto out_overflow;
1215
David S. Miller493f3772010-12-02 12:14:29 -08001216 if (!dst) {
Neal Cardwell3840a062012-06-28 12:34:19 +00001217 dst = inet6_csk_route_req(sk, &fl6, req);
David S. Miller493f3772010-12-02 12:14:29 -08001218 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001219 goto out;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001220 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001221
1222 newsk = tcp_create_openreq_child(sk, req, skb);
1223 if (newsk == NULL)
Balazs Scheidler093d2822010-10-21 13:06:43 +02001224 goto out_nonewsk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001225
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001226 /*
1227 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1228 * count here, tcp_create_openreq_child now does this for us, see the
1229 * comment in that function for the gory details. -acme
1230 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231
Stephen Hemminger59eed272006-08-25 15:55:43 -07001232 newsk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -07001233 __ip6_dst_store(newsk, dst, NULL, NULL);
Neal Cardwellfae6ef82012-08-19 03:30:38 +00001234 inet6_sk_rx_dst_set(newsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235
1236 newtcp6sk = (struct tcp6_sock *)newsk;
1237 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1238
1239 newtp = tcp_sk(newsk);
1240 newinet = inet_sk(newsk);
1241 newnp = inet6_sk(newsk);
1242
1243 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1244
Eric Dumazet634fb9792013-10-09 15:21:29 -07001245 newsk->sk_v6_daddr = ireq->ir_v6_rmt_addr;
1246 newnp->saddr = ireq->ir_v6_loc_addr;
1247 newsk->sk_v6_rcv_saddr = ireq->ir_v6_loc_addr;
1248 newsk->sk_bound_dev_if = ireq->ir_iif;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001249
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001250 /* Now IPv6 options...
Linus Torvalds1da177e2005-04-16 15:20:36 -07001251
1252 First: no IPv4 options.
1253 */
Eric Dumazetf6d8bd02011-04-21 09:45:37 +00001254 newinet->inet_opt = NULL;
Yan, Zheng676a1182011-09-25 02:21:30 +00001255 newnp->ipv6_ac_list = NULL;
Masayuki Nakagawad35690b2007-03-16 16:14:03 -07001256 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257
1258 /* Clone RX bits */
1259 newnp->rxopt.all = np->rxopt.all;
1260
1261 /* Clone pktoptions received with SYN */
1262 newnp->pktoptions = NULL;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001263 if (ireq->pktopts != NULL) {
1264 newnp->pktoptions = skb_clone(ireq->pktopts,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001265 sk_gfp_atomic(sk, GFP_ATOMIC));
Eric Dumazet634fb9792013-10-09 15:21:29 -07001266 consume_skb(ireq->pktopts);
1267 ireq->pktopts = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268 if (newnp->pktoptions)
1269 skb_set_owner_r(newnp->pktoptions, newsk);
1270 }
1271 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001272 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001273 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001274 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001275 if (np->repflow)
1276 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001277
1278 /* Clone native IPv6 options from listening socket (if any)
1279
1280 Yes, keeping reference count would be much more clever,
1281 but we make one more one thing there: reattach optmem
1282 to newsk.
1283 */
RongQing.Li43264e02012-07-01 17:18:59 +00001284 if (np->opt)
1285 newnp->opt = ipv6_dup_options(newsk, np->opt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001286
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001287 inet_csk(newsk)->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001288 if (newnp->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001289 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1290 newnp->opt->opt_flen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001291
1292 tcp_sync_mss(newsk, dst_mtu(dst));
David S. Miller0dbaee32010-12-13 12:52:14 -08001293 newtp->advmss = dst_metric_advmss(dst);
Neal Cardwelld135c522012-04-22 09:45:47 +00001294 if (tcp_sk(sk)->rx_opt.user_mss &&
1295 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1296 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1297
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298 tcp_initialize_rcv_mss(newsk);
1299
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001300 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1301 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001302
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001303#ifdef CONFIG_TCP_MD5SIG
1304 /* Copy over the MD5 key from the original socket */
Wang Yufen4aa956d2014-03-29 09:27:29 +08001305 key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr);
1306 if (key != NULL) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001307 /* We're using one, so create a matching key
1308 * on the newsk structure. If we fail to get
1309 * memory, then we end up not copying the key
1310 * across. Shucks.
1311 */
Eric Dumazetefe42082013-10-03 15:42:29 -07001312 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001313 AF_INET6, key->key, key->keylen,
1314 sk_gfp_atomic(sk, GFP_ATOMIC));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001315 }
1316#endif
1317
Balazs Scheidler093d2822010-10-21 13:06:43 +02001318 if (__inet_inherit_port(sk, newsk) < 0) {
Christoph Paasche337e242012-12-14 04:07:58 +00001319 inet_csk_prepare_forced_close(newsk);
1320 tcp_done(newsk);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001321 goto out;
1322 }
Eric Dumazet9327f702009-12-04 03:46:54 +00001323 __inet6_hash(newsk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324
1325 return newsk;
1326
1327out_overflow:
Pavel Emelyanovde0744a2008-07-16 20:31:16 -07001328 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001329out_nonewsk:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001330 dst_release(dst);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001331out:
1332 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001333 return NULL;
1334}
1335
Linus Torvalds1da177e2005-04-16 15:20:36 -07001336/* The socket must have its spinlock held when we get
1337 * here.
1338 *
1339 * We have a potential double-lock case here, so even when
1340 * doing backlog processing we use the BH locking scheme.
1341 * This is because we cannot sleep with the original spinlock
1342 * held.
1343 */
/*
 * tcp_v6_do_rcv - process one segment for a TCP socket created via AF_INET6.
 *
 * skbs whose protocol is ETH_P_IP are handed straight to tcp_v4_do_rcv().
 * Everything else goes through the MD5 check (CONFIG_TCP_MD5SIG only) and
 * sk_filter(), and is then dispatched on sk->sk_state:
 *   TCP_ESTABLISHED -> tcp_rcv_established()
 *   TCP_LISTEN      -> tcp_v6_hnd_req(), then tcp_child_process() when a
 *                      socket other than sk is returned
 *   anything else   -> tcp_rcv_state_process()
 *
 * When np->rxopt.all is non-zero a clone of skb is kept in opt_skb so the
 * ipv6_pktoptions tail can latch per-packet values into np and
 * np->pktoptions.
 *
 * Every IPv6 path returns 0; the IPv4 path returns whatever
 * tcp_v4_do_rcv() returns.
 */
1344static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1345{
1346 struct ipv6_pinfo *np = inet6_sk(sk);
1347 struct tcp_sock *tp;
1348 struct sk_buff *opt_skb = NULL;
1349
1350 /* Imagine: socket is IPv6. IPv4 packet arrives,
1351 goes to IPv4 receive handler and backlogged.
1352 From backlog it always goes here. Kerboom...
1353 Fortunately, tcp_rcv_established and rcv_established
1354 handle them correctly, but it is not case with
1355 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1356 */
1357
1358 if (skb->protocol == htons(ETH_P_IP))
1359 return tcp_v4_do_rcv(sk, skb);
1360
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001361#ifdef CONFIG_TCP_MD5SIG
Wang Yufen4aa956d2014-03-29 09:27:29 +08001362 if (tcp_v6_inbound_md5_hash(sk, skb))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001363 goto discard;
1364#endif
1365
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001366 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001367 goto discard;
1368
1369 /*
1370 * socket locking is here for SMP purposes as backlog rcv
1371 * is currently called with bh processing disabled.
1372 */
1373
1374 /* Do Stevens' IPV6_PKTOPTIONS.
1375
1376 Yes, guys, it is the only place in our code, where we
1377 may make it not affecting IPv4.
1378 The rest of code is protocol independent,
1379 and I do not like idea to uglify IPv4.
1380
1381 Actually, all the idea behind IPV6_PKTOPTIONS
1382 looks not very well thought. For now we latch
1383 options, received in the last packet, enqueued
1384 by tcp. Feel free to propose better solution.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001385 --ANK (980728)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001386 */
1387 if (np->rxopt.all)
Mel Gorman99a1dec2012-07-31 16:44:14 -07001388 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001389
1390 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
Eric Dumazet5d299f32012-08-06 05:09:33 +00001391 struct dst_entry *dst = sk->sk_rx_dst;
1392
Tom Herbertbdeab992011-08-14 19:45:55 +00001393 sock_rps_save_rxhash(sk, skb);
/* Drop the cached rx dst when the skb arrived on another interface
 * or the dst's check() callback rejects it for the stored cookie.
 */
Eric Dumazet5d299f32012-08-06 05:09:33 +00001394 if (dst) {
1395 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1396 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1397 dst_release(dst);
1398 sk->sk_rx_dst = NULL;
1399 }
1400 }
1401
Vijay Subramanianc995ae22013-09-03 12:23:22 -07001402 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 if (opt_skb)
1404 goto ipv6_pktoptions;
1405 return 0;
1406 }
1407
/* Slow path: reject short headers and bad checksums first. */
Arnaldo Carvalho de Meloab6a5bb2007-03-18 17:43:48 -07001408 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001409 goto csum_err;
1410
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001411 if (sk->sk_state == TCP_LISTEN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001412 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1413 if (!nsk)
1414 goto discard;
1415
1416 /*
1417 * Queue it on the new socket if the new socket is active,
1418 * otherwise we just shortcircuit this and continue with
1419 * the new socket..
1420 */
Weilong Chen4c99aa42013-12-19 18:44:34 +08001421 if (nsk != sk) {
Tom Herbertbdeab992011-08-14 19:45:55 +00001422 sock_rps_save_rxhash(nsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001423 if (tcp_child_process(sk, nsk, skb))
1424 goto reset;
/* The clone was made for sk, not nsk, so it is simply freed here. */
1425 if (opt_skb)
1426 __kfree_skb(opt_skb);
1427 return 0;
1428 }
Neil Horman47482f132011-04-06 13:07:09 -07001429 } else
Tom Herbertbdeab992011-08-14 19:45:55 +00001430 sock_rps_save_rxhash(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001431
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001432 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001433 goto reset;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001434 if (opt_skb)
1435 goto ipv6_pktoptions;
1436 return 0;
1437
/* reset falls through into discard, so both skbs are freed after the
 * reset has been sent.
 */
1438reset:
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001439 tcp_v6_send_reset(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001440discard:
1441 if (opt_skb)
1442 __kfree_skb(opt_skb);
1443 kfree_skb(skb);
1444 return 0;
1445csum_err:
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001446 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001447 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001448 goto discard;
1449
1450
1451ipv6_pktoptions:
1452 /* Do you ask, what is it?
1453
1454 1. skb was enqueued by tcp.
1455 2. skb is added to tail of read queue, rather than out of order.
1456 3. socket is not in passive state.
1457 4. Finally, it really contains options, which user wants to receive.
1458 */
1459 tp = tcp_sk(sk);
1460 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1461 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001462 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001463 np->mcast_oif = inet6_iif(opt_skb);
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001464 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001465 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
Florent Fourcot82e9f102013-12-08 15:46:59 +01001466 if (np->rxopt.bits.rxflow || np->rxopt.bits.rxtclass)
Florent Fourcot1397ed32013-12-08 15:46:57 +01001467 np->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(opt_skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001468 if (np->repflow)
1469 np->flow_label = ip6_flowlabel(ipv6_hdr(opt_skb));
/* Accepted: install the clone as np->pktoptions; xchg() hands back
 * the previous skb, which is freed below. Not accepted: free the
 * clone and clear np->pktoptions, again freeing the old one below.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470 if (ipv6_opt_accepted(sk, opt_skb)) {
1471 skb_set_owner_r(opt_skb, sk);
1472 opt_skb = xchg(&np->pktoptions, opt_skb);
1473 } else {
1474 __kfree_skb(opt_skb);
1475 opt_skb = xchg(&np->pktoptions, NULL);
1476 }
1477 }
1478
/* opt_skb is now either the untouched clone (condition above failed)
 * or the skb previously stored in np->pktoptions.
 */
Wei Yongjun800d55f2009-02-23 21:45:33 +00001479 kfree_skb(opt_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001480 return 0;
1481}
1482
/*
 * tcp_v6_rcv - entry point for TCP segments received over IPv6.
 *
 * Checks the TCP header (minimum size, doff, checksum init), fills in
 * TCP_SKB_CB(skb) and looks the socket up with __inet6_lookup_skb():
 *   - no socket: after the xfrm policy check, short or bad-checksum
 *     segments are only counted, anything else triggers
 *     tcp_v6_send_reset(NULL, skb);
 *   - TCP_TIME_WAIT socket: handled under do_time_wait;
 *   - otherwise: min_hopcount, xfrm policy and sk_filter() checks are
 *     applied, then the skb is either processed right away
 *     (tcp_prequeue() / tcp_v6_do_rcv()) or, when the socket is owned by
 *     user context, added to the socket backlog.
 *
 * Returns -1 when tcp_v6_do_rcv() returned non-zero, 0 on every other path.
 */
Herbert Xue5bbef22007-10-15 12:50:28 -07001483static int tcp_v6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001484{
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001485 const struct tcphdr *th;
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001486 const struct ipv6hdr *hdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001487 struct sock *sk;
1488 int ret;
Pavel Emelyanova86b1e32008-07-16 20:20:58 -07001489 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490
1491 if (skb->pkt_type != PACKET_HOST)
1492 goto discard_it;
1493
1494 /*
1495 * Count it even if it's bad.
1496 */
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001497 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001498
1499 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1500 goto discard_it;
1501
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001502 th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001503
/* doff is in 32-bit words; anything below the fixed header is bogus. */
1504 if (th->doff < sizeof(struct tcphdr)/4)
1505 goto bad_packet;
1506 if (!pskb_may_pull(skb, th->doff*4))
1507 goto discard_it;
1508
Tom Herberte4f45b72014-05-02 16:29:51 -07001509 if (skb_checksum_init(skb, IPPROTO_TCP, ip6_compute_pseudo))
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001510 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511
/* NOTE(review): th is fetched again here, presumably because the
 * second pskb_may_pull() may move the header - confirm.
 */
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001512 th = tcp_hdr(skb);
Stephen Hemmingere802af92010-04-22 15:24:53 -07001513 hdr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
/* SYN and FIN each add one to the sequence space covered by the skb. */
1515 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1516 skb->len - th->doff*4);
1517 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1518 TCP_SKB_CB(skb)->when = 0;
Eric Dumazetb82d1bb2011-09-27 02:20:08 -04001519 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001520 TCP_SKB_CB(skb)->sacked = 0;
1521
Arnaldo Carvalho de Melo9a1f27c2008-10-07 11:41:57 -07001522 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001523 if (!sk)
1524 goto no_tcp_socket;
1525
/* Also re-entered from do_time_wait once a listener replaced the
 * timewait socket in sk.
 */
1526process:
1527 if (sk->sk_state == TCP_TIME_WAIT)
1528 goto do_time_wait;
1529
Stephen Hemmingere802af92010-04-22 15:24:53 -07001530 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1531 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1532 goto discard_and_relse;
1533 }
1534
Linus Torvalds1da177e2005-04-16 15:20:36 -07001535 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1536 goto discard_and_relse;
1537
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001538 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001539 goto discard_and_relse;
1540
Eliezer Tamir8b80cda2013-07-10 17:13:26 +03001541 sk_mark_napi_id(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001542 skb->dev = NULL;
1543
Fabio Olive Leite293b9c42006-09-25 22:28:47 -07001544 bh_lock_sock_nested(sk);
/* ret stays 0 unless tcp_v6_do_rcv() is actually called below. */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001545 ret = 0;
1546 if (!sock_owned_by_user(sk)) {
Chris Leech1a2449a2006-05-23 18:05:53 -07001547#ifdef CONFIG_NET_DMA
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001548 struct tcp_sock *tp = tcp_sk(sk);
David S. Millerb4caea82007-10-26 04:20:13 -07001549 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
Dave Jianga2bd1142012-04-04 16:10:46 -07001550 tp->ucopy.dma_chan = net_dma_find_channel();
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001551 if (tp->ucopy.dma_chan)
1552 ret = tcp_v6_do_rcv(sk, skb);
1553 else
Chris Leech1a2449a2006-05-23 18:05:53 -07001554#endif
/* With CONFIG_NET_DMA this block is the body of the else above;
 * without it, it runs unconditionally.
 */
1555 {
1556 if (!tcp_prequeue(sk, skb))
1557 ret = tcp_v6_do_rcv(sk, skb);
1558 }
/* Socket owned by user context: queue to the backlog, passing
 * sk_rcvbuf + sk_sndbuf as the third argument; drop on failure.
 */
Eric Dumazetda882c12012-04-22 23:38:54 +00001559 } else if (unlikely(sk_add_backlog(sk, skb,
1560 sk->sk_rcvbuf + sk->sk_sndbuf))) {
Zhu Yi6b03a532010-03-04 18:01:41 +00001561 bh_unlock_sock(sk);
Eric Dumazet6cce09f2010-03-07 23:21:57 +00001562 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
Zhu Yi6b03a532010-03-04 18:01:41 +00001563 goto discard_and_relse;
1564 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001565 bh_unlock_sock(sk);
1566
1567 sock_put(sk);
1568 return ret ? -1 : 0;
1569
1570no_tcp_socket:
1571 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1572 goto discard_it;
1573
/* csum_error and bad_packet are jump targets inside this if body:
 * csum_error bumps both counters, bad_packet only TCP_MIB_INERRS.
 */
1574 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001575csum_error:
1576 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577bad_packet:
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001578 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001579 } else {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001580 tcp_v6_send_reset(NULL, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001581 }
1582
1583discard_it:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001584 kfree_skb(skb);
1585 return 0;
1586
1587discard_and_relse:
1588 sock_put(sk);
1589 goto discard_it;
1590
/* In this section sk is a timewait socket, so it is released with
 * inet_twsk_put() rather than sock_put() on each early exit.
 */
1591do_time_wait:
1592 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001593 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594 goto discard_it;
1595 }
1596
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001597 if (skb->len < (th->doff<<2)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001598 inet_twsk_put(inet_twsk(sk));
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001599 goto bad_packet;
1600 }
1601 if (tcp_checksum_complete(skb)) {
1602 inet_twsk_put(inet_twsk(sk));
1603 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001604 }
1605
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001606 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001607 case TCP_TW_SYN:
1608 {
1609 struct sock *sk2;
1610
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001611 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
Tom Herbert5ba24952013-01-22 09:50:39 +00001612 &ipv6_hdr(skb)->saddr, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001613 &ipv6_hdr(skb)->daddr,
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001614 ntohs(th->dest), inet6_iif(skb));
/* A listener matches this SYN: retire the timewait socket and
 * restart processing against the listener.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001615 if (sk2 != NULL) {
Arnaldo Carvalho de Melo295ff7e2005-08-09 20:44:40 -07001616 struct inet_timewait_sock *tw = inet_twsk(sk);
1617 inet_twsk_deschedule(tw, &tcp_death_row);
1618 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001619 sk = sk2;
1620 goto process;
1621 }
1622 /* Fall through to ACK */
1623 }
1624 case TCP_TW_ACK:
1625 tcp_v6_timewait_ack(sk, skb);
1626 break;
1627 case TCP_TW_RST:
1628 goto no_tcp_socket;
Wang Yufen4aa956d2014-03-29 09:27:29 +08001629 case TCP_TW_SUCCESS:
1630 ;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001631 }
1632 goto discard_it;
1633}
1634
Eric Dumazetc7109982012-07-26 12:18:11 +00001635static void tcp_v6_early_demux(struct sk_buff *skb)
1636{
1637 const struct ipv6hdr *hdr;
1638 const struct tcphdr *th;
1639 struct sock *sk;
1640
1641 if (skb->pkt_type != PACKET_HOST)
1642 return;
1643
1644 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1645 return;
1646
1647 hdr = ipv6_hdr(skb);
1648 th = tcp_hdr(skb);
1649
1650 if (th->doff < sizeof(struct tcphdr) / 4)
1651 return;
1652
1653 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1654 &hdr->saddr, th->source,
1655 &hdr->daddr, ntohs(th->dest),
1656 inet6_iif(skb));
1657 if (sk) {
1658 skb->sk = sk;
1659 skb->destructor = sock_edemux;
1660 if (sk->sk_state != TCP_TIME_WAIT) {
1661 struct dst_entry *dst = sk->sk_rx_dst;
Neal Cardwellf3f12132012-10-22 21:41:48 +00001662
Eric Dumazetc7109982012-07-26 12:18:11 +00001663 if (dst)
Eric Dumazet5d299f32012-08-06 05:09:33 +00001664 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
Eric Dumazetc7109982012-07-26 12:18:11 +00001665 if (dst &&
Neal Cardwellf3f12132012-10-22 21:41:48 +00001666 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
Eric Dumazetc7109982012-07-26 12:18:11 +00001667 skb_dst_set_noref(skb, dst);
1668 }
1669 }
1670}
1671
David S. Millerccb7c412010-12-01 18:09:13 -08001672static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1673 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1674 .twsk_unique = tcp_twsk_unique,
Wang Yufen4aa956d2014-03-29 09:27:29 +08001675 .twsk_destructor = tcp_twsk_destructor,
David S. Millerccb7c412010-12-01 18:09:13 -08001676};
1677
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001678static const struct inet_connection_sock_af_ops ipv6_specific = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001679 .queue_xmit = inet6_csk_xmit,
1680 .send_check = tcp_v6_send_check,
1681 .rebuild_header = inet6_sk_rebuild_header,
Eric Dumazet5d299f32012-08-06 05:09:33 +00001682 .sk_rx_dst_set = inet6_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001683 .conn_request = tcp_v6_conn_request,
1684 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001685 .net_header_len = sizeof(struct ipv6hdr),
Eric Dumazet67469602012-04-24 07:37:38 +00001686 .net_frag_header_len = sizeof(struct frag_hdr),
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001687 .setsockopt = ipv6_setsockopt,
1688 .getsockopt = ipv6_getsockopt,
1689 .addr2sockaddr = inet6_csk_addr2sockaddr,
1690 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001691 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001692#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001693 .compat_setsockopt = compat_ipv6_setsockopt,
1694 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001695#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001696};
1697
#ifdef CONFIG_TCP_MD5SIG
/* TCP-MD5 callbacks for native IPv6 sockets; only built when
 * CONFIG_TCP_MD5SIG is enabled.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_parse	= tcp_v6_parse_md5_keys,
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001705
Linus Torvalds1da177e2005-04-16 15:20:36 -07001706/*
1707 * TCP over IPv4 via INET6 API
1708 */
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001709static const struct inet_connection_sock_af_ops ipv6_mapped = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001710 .queue_xmit = ip_queue_xmit,
1711 .send_check = tcp_v4_send_check,
1712 .rebuild_header = inet_sk_rebuild_header,
Eric Dumazet63d02d12012-08-09 14:11:00 +00001713 .sk_rx_dst_set = inet_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001714 .conn_request = tcp_v6_conn_request,
1715 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001716 .net_header_len = sizeof(struct iphdr),
1717 .setsockopt = ipv6_setsockopt,
1718 .getsockopt = ipv6_getsockopt,
1719 .addr2sockaddr = inet6_csk_addr2sockaddr,
1720 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001721 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001722#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001723 .compat_setsockopt = compat_ipv6_setsockopt,
1724 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001725#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001726};
1727
#ifdef CONFIG_TCP_MD5SIG
/* TCP-MD5 callbacks for the v4-mapped case: lookup and hashing use the
 * IPv4 helpers, while key parsing still goes through the IPv6 parser.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_parse	= tcp_v6_parse_md5_keys,
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001735
Linus Torvalds1da177e2005-04-16 15:20:36 -07001736/* NOTE: A lot of things set to zero explicitly by call to
1737 * sk_alloc() so need not be done here.
1738 */
1739static int tcp_v6_init_sock(struct sock *sk)
1740{
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001741 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001742
Neal Cardwell900f65d2012-04-19 09:55:21 +00001743 tcp_init_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001744
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001745 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001746
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001747#ifdef CONFIG_TCP_MD5SIG
David S. Millerac807fa2012-04-23 03:21:58 -04001748 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001749#endif
1750
Linus Torvalds1da177e2005-04-16 15:20:36 -07001751 return 0;
1752}
1753
/* Tear down a TCPv6 socket: the TCP teardown shared with IPv4 runs
 * first, followed by the IPv6-specific teardown.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);

	inet6_destroy_sock(sk);
}
1759
YOSHIFUJI Hideaki952a10b2007-04-21 20:13:44 +09001760#ifdef CONFIG_PROC_FS
Linus Torvalds1da177e2005-04-16 15:20:36 -07001761/* Proc filesystem TCPv6 sock list dumping. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001762static void get_openreq6(struct seq_file *seq,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001763 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001764{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001765 int ttd = req->expires - jiffies;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001766 const struct in6_addr *src = &inet_rsk(req)->ir_v6_loc_addr;
1767 const struct in6_addr *dest = &inet_rsk(req)->ir_v6_rmt_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001768
1769 if (ttd < 0)
1770 ttd = 0;
1771
Linus Torvalds1da177e2005-04-16 15:20:36 -07001772 seq_printf(seq,
1773 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001774 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001775 i,
1776 src->s6_addr32[0], src->s6_addr32[1],
1777 src->s6_addr32[2], src->s6_addr32[3],
Eric Dumazetb44084c2013-10-10 00:04:37 -07001778 inet_rsk(req)->ir_num,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001779 dest->s6_addr32[0], dest->s6_addr32[1],
1780 dest->s6_addr32[2], dest->s6_addr32[3],
Eric Dumazet634fb9792013-10-09 15:21:29 -07001781 ntohs(inet_rsk(req)->ir_rmt_port),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001782 TCP_SYN_RECV,
Weilong Chen4c99aa42013-12-19 18:44:34 +08001783 0, 0, /* could print option size, but that is af dependent. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001784 1, /* timers active (only the expire timer) */
1785 jiffies_to_clock_t(ttd),
Eric Dumazete6c022a2012-10-27 23:16:46 +00001786 req->num_timeout,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001787 from_kuid_munged(seq_user_ns(seq), uid),
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001788 0, /* non standard timer */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001789 0, /* open_requests have no inode */
1790 0, req);
1791}
1792
1793static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1794{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001795 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001796 __u16 destp, srcp;
1797 int timer_active;
1798 unsigned long timer_expires;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001799 const struct inet_sock *inet = inet_sk(sp);
1800 const struct tcp_sock *tp = tcp_sk(sp);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001801 const struct inet_connection_sock *icsk = inet_csk(sp);
Yuchung Cheng0a672f72014-05-11 20:22:12 -07001802 struct fastopen_queue *fastopenq = icsk->icsk_accept_queue.fastopenq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001803
Eric Dumazetefe42082013-10-03 15:42:29 -07001804 dest = &sp->sk_v6_daddr;
1805 src = &sp->sk_v6_rcv_saddr;
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001806 destp = ntohs(inet->inet_dport);
1807 srcp = ntohs(inet->inet_sport);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001808
1809 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001810 timer_active = 1;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001811 timer_expires = icsk->icsk_timeout;
1812 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001813 timer_active = 4;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001814 timer_expires = icsk->icsk_timeout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001815 } else if (timer_pending(&sp->sk_timer)) {
1816 timer_active = 2;
1817 timer_expires = sp->sk_timer.expires;
1818 } else {
1819 timer_active = 0;
1820 timer_expires = jiffies;
1821 }
1822
1823 seq_printf(seq,
1824 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001825 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001826 i,
1827 src->s6_addr32[0], src->s6_addr32[1],
1828 src->s6_addr32[2], src->s6_addr32[3], srcp,
1829 dest->s6_addr32[0], dest->s6_addr32[1],
1830 dest->s6_addr32[2], dest->s6_addr32[3], destp,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001831 sp->sk_state,
Sridhar Samudrala47da8ee2006-06-27 13:29:00 -07001832 tp->write_seq-tp->snd_una,
1833 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001834 timer_active,
Eric Dumazeta399a802012-08-08 21:13:53 +00001835 jiffies_delta_to_clock_t(timer_expires - jiffies),
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001836 icsk->icsk_retransmits,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001837 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001838 icsk->icsk_probes_out,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001839 sock_i_ino(sp),
1840 atomic_read(&sp->sk_refcnt), sp,
Stephen Hemminger7be87352008-06-27 20:00:19 -07001841 jiffies_to_clock_t(icsk->icsk_rto),
1842 jiffies_to_clock_t(icsk->icsk_ack.ato),
Weilong Chen4c99aa42013-12-19 18:44:34 +08001843 (icsk->icsk_ack.quick << 1) | icsk->icsk_ack.pingpong,
Ilpo Järvinen0b6a05c2009-09-15 01:30:10 -07001844 tp->snd_cwnd,
Yuchung Cheng0a672f72014-05-11 20:22:12 -07001845 sp->sk_state == TCP_LISTEN ?
1846 (fastopenq ? fastopenq->max_qlen : 0) :
1847 (tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001848 );
1849}
1850
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001851static void get_timewait6_sock(struct seq_file *seq,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -07001852 struct inet_timewait_sock *tw, int i)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001853{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001854 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001855 __u16 destp, srcp;
Eric Dumazet96f817f2013-10-03 14:27:25 -07001856 s32 delta = tw->tw_ttd - inet_tw_time_stamp();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001857
Eric Dumazetefe42082013-10-03 15:42:29 -07001858 dest = &tw->tw_v6_daddr;
1859 src = &tw->tw_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001860 destp = ntohs(tw->tw_dport);
1861 srcp = ntohs(tw->tw_sport);
1862
1863 seq_printf(seq,
1864 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00001865 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001866 i,
1867 src->s6_addr32[0], src->s6_addr32[1],
1868 src->s6_addr32[2], src->s6_addr32[3], srcp,
1869 dest->s6_addr32[0], dest->s6_addr32[1],
1870 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1871 tw->tw_substate, 0, 0,
Eric Dumazeta399a802012-08-08 21:13:53 +00001872 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001873 atomic_read(&tw->tw_refcnt), tw);
1874}
1875
Linus Torvalds1da177e2005-04-16 15:20:36 -07001876static int tcp6_seq_show(struct seq_file *seq, void *v)
1877{
1878 struct tcp_iter_state *st;
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001879 struct sock *sk = v;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001880
1881 if (v == SEQ_START_TOKEN) {
1882 seq_puts(seq,
1883 " sl "
1884 "local_address "
1885 "remote_address "
1886 "st tx_queue rx_queue tr tm->when retrnsmt"
1887 " uid timeout inode\n");
1888 goto out;
1889 }
1890 st = seq->private;
1891
1892 switch (st->state) {
1893 case TCP_SEQ_STATE_LISTENING:
1894 case TCP_SEQ_STATE_ESTABLISHED:
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001895 if (sk->sk_state == TCP_TIME_WAIT)
1896 get_timewait6_sock(seq, v, st->num);
1897 else
1898 get_tcp6_sock(seq, v, st->num);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001899 break;
1900 case TCP_SEQ_STATE_OPENREQ:
1901 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1902 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001903 }
1904out:
1905 return 0;
1906}
1907
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001908static const struct file_operations tcp6_afinfo_seq_fops = {
1909 .owner = THIS_MODULE,
1910 .open = tcp_seq_open,
1911 .read = seq_read,
1912 .llseek = seq_lseek,
1913 .release = seq_release_net
1914};
1915
Linus Torvalds1da177e2005-04-16 15:20:36 -07001916static struct tcp_seq_afinfo tcp6_seq_afinfo = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001917 .name = "tcp6",
1918 .family = AF_INET6,
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001919 .seq_fops = &tcp6_afinfo_seq_fops,
Denis V. Lunev9427c4b2008-04-13 22:12:13 -07001920 .seq_ops = {
1921 .show = tcp6_seq_show,
1922 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001923};
1924
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001925int __net_init tcp6_proc_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001926{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001927 return tcp_proc_register(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001928}
1929
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001930void tcp6_proc_exit(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001931{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001932 tcp_proc_unregister(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001933}
1934#endif
1935
Eric Dumazetf77d6022013-05-09 10:28:16 +00001936static void tcp_v6_clear_sk(struct sock *sk, int size)
1937{
1938 struct inet_sock *inet = inet_sk(sk);
1939
1940 /* we do not want to clear pinet6 field, because of RCU lookups */
1941 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1942
1943 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1944 memset(&inet->pinet6 + 1, 0, size);
1945}
1946
Linus Torvalds1da177e2005-04-16 15:20:36 -07001947struct proto tcpv6_prot = {
1948 .name = "TCPv6",
1949 .owner = THIS_MODULE,
1950 .close = tcp_close,
1951 .connect = tcp_v6_connect,
1952 .disconnect = tcp_disconnect,
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001953 .accept = inet_csk_accept,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001954 .ioctl = tcp_ioctl,
1955 .init = tcp_v6_init_sock,
1956 .destroy = tcp_v6_destroy_sock,
1957 .shutdown = tcp_shutdown,
1958 .setsockopt = tcp_setsockopt,
1959 .getsockopt = tcp_getsockopt,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001960 .recvmsg = tcp_recvmsg,
Changli Gao7ba42912010-07-10 20:41:55 +00001961 .sendmsg = tcp_sendmsg,
1962 .sendpage = tcp_sendpage,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001963 .backlog_rcv = tcp_v6_do_rcv,
Eric Dumazet46d3cea2012-07-11 05:50:31 +00001964 .release_cb = tcp_release_cb,
Eric Dumazet563d34d2012-07-23 09:48:52 +02001965 .mtu_reduced = tcp_v6_mtu_reduced,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001966 .hash = tcp_v6_hash,
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001967 .unhash = inet_unhash,
1968 .get_port = inet_csk_get_port,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001969 .enter_memory_pressure = tcp_enter_memory_pressure,
Eric Dumazetc9bee3b72013-07-22 20:27:07 -07001970 .stream_memory_free = tcp_stream_memory_free,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001971 .sockets_allocated = &tcp_sockets_allocated,
1972 .memory_allocated = &tcp_memory_allocated,
1973 .memory_pressure = &tcp_memory_pressure,
Arnaldo Carvalho de Melo0a5578c2005-08-09 20:11:41 -07001974 .orphan_count = &tcp_orphan_count,
Eric W. Biedermana4fe34b2013-10-19 16:25:36 -07001975 .sysctl_mem = sysctl_tcp_mem,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001976 .sysctl_wmem = sysctl_tcp_wmem,
1977 .sysctl_rmem = sysctl_tcp_rmem,
1978 .max_header = MAX_TCP_HEADER,
1979 .obj_size = sizeof(struct tcp6_sock),
Eric Dumazet3ab5aee2008-11-16 19:40:17 -08001980 .slab_flags = SLAB_DESTROY_BY_RCU,
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -08001981 .twsk_prot = &tcp6_timewait_sock_ops,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07001982 .rsk_prot = &tcp6_request_sock_ops,
Pavel Emelyanov39d8cda2008-03-22 16:50:58 -07001983 .h.hashinfo = &tcp_hashinfo,
Changli Gao7ba42912010-07-10 20:41:55 +00001984 .no_autobind = true,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001985#ifdef CONFIG_COMPAT
1986 .compat_setsockopt = compat_tcp_setsockopt,
1987 .compat_getsockopt = compat_tcp_getsockopt,
1988#endif
Andrew Mortonc255a452012-07-31 16:43:02 -07001989#ifdef CONFIG_MEMCG_KMEM
Glauber Costad1a4c0b2011-12-11 21:47:04 +00001990 .proto_cgroup = tcp_proto_cgroup,
1991#endif
Eric Dumazetf77d6022013-05-09 10:28:16 +00001992 .clear_sk = tcp_v6_clear_sk,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001993};
1994
Alexey Dobriyan41135cc2009-09-14 12:22:28 +00001995static const struct inet6_protocol tcpv6_protocol = {
Eric Dumazetc7109982012-07-26 12:18:11 +00001996 .early_demux = tcp_v6_early_demux,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001997 .handler = tcp_v6_rcv,
1998 .err_handler = tcp_v6_err,
1999 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2000};
2001
Linus Torvalds1da177e2005-04-16 15:20:36 -07002002static struct inet_protosw tcpv6_protosw = {
2003 .type = SOCK_STREAM,
2004 .protocol = IPPROTO_TCP,
2005 .prot = &tcpv6_prot,
2006 .ops = &inet6_stream_ops,
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08002007 .flags = INET_PROTOSW_PERMANENT |
2008 INET_PROTOSW_ICSK,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002009};
2010
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002011static int __net_init tcpv6_net_init(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002012{
Denis V. Lunev56772422008-04-03 14:28:30 -07002013 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2014 SOCK_RAW, IPPROTO_TCP, net);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002015}
2016
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002017static void __net_exit tcpv6_net_exit(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002018{
Denis V. Lunev56772422008-04-03 14:28:30 -07002019 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002020}
2021
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002022static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002023{
2024 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002025}
2026
2027static struct pernet_operations tcpv6_net_ops = {
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002028 .init = tcpv6_net_init,
2029 .exit = tcpv6_net_exit,
2030 .exit_batch = tcpv6_net_exit_batch,
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002031};
2032
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002033int __init tcpv6_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002034{
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002035 int ret;
David Woodhouseae0f7d52006-01-11 15:53:04 -08002036
Vlad Yasevich33362882012-11-15 08:49:15 +00002037 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2038 if (ret)
Vlad Yasevichc6b641a2012-11-15 08:49:22 +00002039 goto out;
Vlad Yasevich33362882012-11-15 08:49:15 +00002040
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002041 /* register inet6 protocol */
2042 ret = inet6_register_protosw(&tcpv6_protosw);
2043 if (ret)
2044 goto out_tcpv6_protocol;
2045
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002046 ret = register_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002047 if (ret)
2048 goto out_tcpv6_protosw;
2049out:
2050 return ret;
2051
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002052out_tcpv6_protosw:
2053 inet6_unregister_protosw(&tcpv6_protosw);
Vlad Yasevich33362882012-11-15 08:49:15 +00002054out_tcpv6_protocol:
2055 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002056 goto out;
2057}
2058
Daniel Lezcano09f77092007-12-13 05:34:58 -08002059void tcpv6_exit(void)
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002060{
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002061 unregister_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002062 inet6_unregister_protosw(&tcpv6_protosw);
2063 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002064}