blob: 893f013d536917aa90dc3e1ace614431b0ca5cad [file] [log] [blame]
Pravin B Shelarc5441932013-03-25 14:49:35 +00001/*
2 * Copyright (c) 2013 Nicira, Inc.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of version 2 of the GNU General Public
6 * License as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
16 * 02110-1301, USA
17 */
18
19#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
20
21#include <linux/capability.h>
22#include <linux/module.h>
23#include <linux/types.h>
24#include <linux/kernel.h>
25#include <linux/slab.h>
26#include <linux/uaccess.h>
27#include <linux/skbuff.h>
28#include <linux/netdevice.h>
29#include <linux/in.h>
30#include <linux/tcp.h>
31#include <linux/udp.h>
32#include <linux/if_arp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000033#include <linux/init.h>
34#include <linux/in6.h>
35#include <linux/inetdevice.h>
36#include <linux/igmp.h>
37#include <linux/netfilter_ipv4.h>
38#include <linux/etherdevice.h>
39#include <linux/if_ether.h>
40#include <linux/if_vlan.h>
41#include <linux/rculist.h>
Sachin Kamat27d79f32014-01-27 12:13:57 +053042#include <linux/err.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000043
44#include <net/sock.h>
45#include <net/ip.h>
46#include <net/icmp.h>
47#include <net/protocol.h>
48#include <net/ip_tunnels.h>
49#include <net/arp.h>
50#include <net/checksum.h>
51#include <net/dsfield.h>
52#include <net/inet_ecn.h>
53#include <net/xfrm.h>
54#include <net/net_namespace.h>
55#include <net/netns/generic.h>
56#include <net/rtnetlink.h>
Tom Herbert56328482014-09-17 12:25:58 -070057#include <net/udp.h>
Alexei Starovoitovcfc73812016-09-15 13:00:29 -070058#include <net/dst_metadata.h>
Tom Herbert63487ba2014-11-04 09:06:51 -080059
Pravin B Shelarc5441932013-03-25 14:49:35 +000060#if IS_ENABLED(CONFIG_IPV6)
61#include <net/ipv6.h>
62#include <net/ip6_fib.h>
63#include <net/ip6_route.h>
64#endif
65
Duan Jiong967680e2014-01-19 16:43:42 +080066static unsigned int ip_tunnel_hash(__be32 key, __be32 remote)
Pravin B Shelarc5441932013-03-25 14:49:35 +000067{
68 return hash_32((__force u32)key ^ (__force u32)remote,
69 IP_TNL_HASH_BITS);
70}
71
Pravin B Shelarc5441932013-03-25 14:49:35 +000072static bool ip_tunnel_key_match(const struct ip_tunnel_parm *p,
73 __be16 flags, __be32 key)
74{
75 if (p->i_flags & TUNNEL_KEY) {
76 if (flags & TUNNEL_KEY)
77 return key == p->i_key;
78 else
79 /* key expected, none present */
80 return false;
81 } else
82 return !(flags & TUNNEL_KEY);
83}
84
85/* Fallback tunnel: no source, no destination, no key, no options
86
87 Tunnel hash table:
88 We require exact key match i.e. if a key is present in packet
89 it will match only tunnel with the same key; if it is not present,
90 it will match only keyless tunnel.
91
92 All keysless packets, if not matched configured keyless tunnels
93 will match fallback tunnel.
94 Given src, dst and key, find appropriate for input tunnel.
95*/
96struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
97 int link, __be16 flags,
98 __be32 remote, __be32 local,
99 __be32 key)
100{
101 unsigned int hash;
102 struct ip_tunnel *t, *cand = NULL;
103 struct hlist_head *head;
104
Duan Jiong967680e2014-01-19 16:43:42 +0800105 hash = ip_tunnel_hash(key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000106 head = &itn->tunnels[hash];
107
108 hlist_for_each_entry_rcu(t, head, hash_node) {
109 if (local != t->parms.iph.saddr ||
110 remote != t->parms.iph.daddr ||
111 !(t->dev->flags & IFF_UP))
112 continue;
113
114 if (!ip_tunnel_key_match(&t->parms, flags, key))
115 continue;
116
117 if (t->parms.link == link)
118 return t;
119 else
120 cand = t;
121 }
122
123 hlist_for_each_entry_rcu(t, head, hash_node) {
124 if (remote != t->parms.iph.daddr ||
Dmitry Popove0056592014-07-05 02:26:37 +0400125 t->parms.iph.saddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000126 !(t->dev->flags & IFF_UP))
127 continue;
128
129 if (!ip_tunnel_key_match(&t->parms, flags, key))
130 continue;
131
132 if (t->parms.link == link)
133 return t;
134 else if (!cand)
135 cand = t;
136 }
137
Duan Jiong967680e2014-01-19 16:43:42 +0800138 hash = ip_tunnel_hash(key, 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000139 head = &itn->tunnels[hash];
140
141 hlist_for_each_entry_rcu(t, head, hash_node) {
Dmitry Popove0056592014-07-05 02:26:37 +0400142 if ((local != t->parms.iph.saddr || t->parms.iph.daddr != 0) &&
143 (local != t->parms.iph.daddr || !ipv4_is_multicast(local)))
144 continue;
145
146 if (!(t->dev->flags & IFF_UP))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000147 continue;
148
149 if (!ip_tunnel_key_match(&t->parms, flags, key))
150 continue;
151
152 if (t->parms.link == link)
153 return t;
154 else if (!cand)
155 cand = t;
156 }
157
158 if (flags & TUNNEL_NO_KEY)
159 goto skip_key_lookup;
160
161 hlist_for_each_entry_rcu(t, head, hash_node) {
162 if (t->parms.i_key != key ||
Dmitry Popove0056592014-07-05 02:26:37 +0400163 t->parms.iph.saddr != 0 ||
164 t->parms.iph.daddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000165 !(t->dev->flags & IFF_UP))
166 continue;
167
168 if (t->parms.link == link)
169 return t;
170 else if (!cand)
171 cand = t;
172 }
173
174skip_key_lookup:
175 if (cand)
176 return cand;
177
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700178 t = rcu_dereference(itn->collect_md_tun);
Haishuang Yan833a8b42017-09-12 17:47:56 +0800179 if (t && t->dev->flags & IFF_UP)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700180 return t;
181
Pravin B Shelarc5441932013-03-25 14:49:35 +0000182 if (itn->fb_tunnel_dev && itn->fb_tunnel_dev->flags & IFF_UP)
183 return netdev_priv(itn->fb_tunnel_dev);
184
Pravin B Shelarc5441932013-03-25 14:49:35 +0000185 return NULL;
186}
187EXPORT_SYMBOL_GPL(ip_tunnel_lookup);
188
189static struct hlist_head *ip_bucket(struct ip_tunnel_net *itn,
190 struct ip_tunnel_parm *parms)
191{
192 unsigned int h;
193 __be32 remote;
Steffen Klassert6d608f02014-02-21 08:41:09 +0100194 __be32 i_key = parms->i_key;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000195
196 if (parms->iph.daddr && !ipv4_is_multicast(parms->iph.daddr))
197 remote = parms->iph.daddr;
198 else
199 remote = 0;
200
Steffen Klassert6d608f02014-02-21 08:41:09 +0100201 if (!(parms->i_flags & TUNNEL_KEY) && (parms->i_flags & VTI_ISVTI))
202 i_key = 0;
203
204 h = ip_tunnel_hash(i_key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000205 return &itn->tunnels[h];
206}
207
208static void ip_tunnel_add(struct ip_tunnel_net *itn, struct ip_tunnel *t)
209{
210 struct hlist_head *head = ip_bucket(itn, &t->parms);
211
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700212 if (t->collect_md)
213 rcu_assign_pointer(itn->collect_md_tun, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000214 hlist_add_head_rcu(&t->hash_node, head);
215}
216
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700217static void ip_tunnel_del(struct ip_tunnel_net *itn, struct ip_tunnel *t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000218{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700219 if (t->collect_md)
220 rcu_assign_pointer(itn->collect_md_tun, NULL);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000221 hlist_del_init_rcu(&t->hash_node);
222}
223
224static struct ip_tunnel *ip_tunnel_find(struct ip_tunnel_net *itn,
225 struct ip_tunnel_parm *parms,
226 int type)
227{
228 __be32 remote = parms->iph.daddr;
229 __be32 local = parms->iph.saddr;
230 __be32 key = parms->i_key;
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400231 __be16 flags = parms->i_flags;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000232 int link = parms->link;
233 struct ip_tunnel *t = NULL;
234 struct hlist_head *head = ip_bucket(itn, parms);
235
236 hlist_for_each_entry_rcu(t, head, hash_node) {
237 if (local == t->parms.iph.saddr &&
238 remote == t->parms.iph.daddr &&
Pravin B Shelarc5441932013-03-25 14:49:35 +0000239 link == t->parms.link &&
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400240 type == t->dev->type &&
241 ip_tunnel_key_match(&t->parms, flags, key))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000242 break;
243 }
244 return t;
245}
246
247static struct net_device *__ip_tunnel_create(struct net *net,
248 const struct rtnl_link_ops *ops,
249 struct ip_tunnel_parm *parms)
250{
251 int err;
252 struct ip_tunnel *tunnel;
253 struct net_device *dev;
254 char name[IFNAMSIZ];
255
Eric Dumazet9cb726a2018-04-05 06:39:27 -0700256 err = -E2BIG;
257 if (parms->name[0]) {
258 if (!dev_valid_name(parms->name))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000259 goto failed;
Eric Dumazet9cb726a2018-04-05 06:39:27 -0700260 strlcpy(name, parms->name, IFNAMSIZ);
261 } else {
262 if (strlen(ops->kind) > (IFNAMSIZ - 3))
263 goto failed;
Sultan Alsawaf000ade82018-06-06 15:56:54 -0700264 strcpy(name, ops->kind);
265 strcat(name, "%d");
Pravin B Shelarc5441932013-03-25 14:49:35 +0000266 }
267
268 ASSERT_RTNL();
Tom Gundersenc835a672014-07-14 16:37:24 +0200269 dev = alloc_netdev(ops->priv_size, name, NET_NAME_UNKNOWN, ops->setup);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000270 if (!dev) {
271 err = -ENOMEM;
272 goto failed;
273 }
274 dev_net_set(dev, net);
275
276 dev->rtnl_link_ops = ops;
277
278 tunnel = netdev_priv(dev);
279 tunnel->parms = *parms;
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +0200280 tunnel->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000281
282 err = register_netdevice(dev);
283 if (err)
284 goto failed_free;
285
286 return dev;
287
288failed_free:
289 free_netdev(dev);
290failed:
291 return ERR_PTR(err);
292}
293
Pravin B Shelarc5441932013-03-25 14:49:35 +0000294static int ip_tunnel_bind_dev(struct net_device *dev)
295{
296 struct net_device *tdev = NULL;
297 struct ip_tunnel *tunnel = netdev_priv(dev);
298 const struct iphdr *iph;
299 int hlen = LL_MAX_HEADER;
300 int mtu = ETH_DATA_LEN;
301 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
302
303 iph = &tunnel->parms.iph;
304
305 /* Guess output device to choose reasonable mtu and needed_headroom */
306 if (iph->daddr) {
307 struct flowi4 fl4;
308 struct rtable *rt;
309
Petr Machatab0066da2018-02-27 14:53:38 +0100310 ip_tunnel_init_flow(&fl4, iph->protocol, iph->daddr,
311 iph->saddr, tunnel->parms.o_key,
312 RT_TOS(iph->tos), tunnel->parms.link,
313 tunnel->fwmark);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800314 rt = ip_route_output_key(tunnel->net, &fl4);
315
Pravin B Shelarc5441932013-03-25 14:49:35 +0000316 if (!IS_ERR(rt)) {
317 tdev = rt->dst.dev;
318 ip_rt_put(rt);
319 }
320 if (dev->type != ARPHRD_ETHER)
321 dev->flags |= IFF_POINTOPOINT;
Paolo Abenif27337e2016-04-28 11:04:51 +0200322
323 dst_cache_reset(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000324 }
325
326 if (!tdev && tunnel->parms.link)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200327 tdev = __dev_get_by_index(tunnel->net, tunnel->parms.link);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000328
329 if (tdev) {
330 hlen = tdev->hard_header_len + tdev->needed_headroom;
Nicolas Dichtel82612de2018-05-31 10:59:32 +0200331 mtu = min(tdev->mtu, IP_MAX_MTU);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000332 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000333
334 dev->needed_headroom = t_hlen + hlen;
335 mtu -= (dev->hard_header_len + t_hlen);
336
Eric Dumazetb5476022017-12-11 07:17:39 -0800337 if (mtu < IPV4_MIN_MTU)
338 mtu = IPV4_MIN_MTU;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000339
340 return mtu;
341}
342
343static struct ip_tunnel *ip_tunnel_create(struct net *net,
344 struct ip_tunnel_net *itn,
345 struct ip_tunnel_parm *parms)
346{
Julia Lawall4929fd82014-05-15 05:43:20 +0200347 struct ip_tunnel *nt;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000348 struct net_device *dev;
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400349 int t_hlen;
Petr Machataf6cc9c02018-03-22 19:53:33 +0200350 int mtu;
351 int err;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000352
Eric Dumazet79134e62018-03-08 12:51:41 -0800353 dev = __ip_tunnel_create(net, itn->rtnl_link_ops, parms);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000354 if (IS_ERR(dev))
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100355 return ERR_CAST(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000356
Petr Machataf6cc9c02018-03-22 19:53:33 +0200357 mtu = ip_tunnel_bind_dev(dev);
358 err = dev_set_mtu(dev, mtu);
359 if (err)
360 goto err_dev_set_mtu;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000361
362 nt = netdev_priv(dev);
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400363 t_hlen = nt->hlen + sizeof(struct iphdr);
364 dev->min_mtu = ETH_MIN_MTU;
Nicolas Dichtel82612de2018-05-31 10:59:32 +0200365 dev->max_mtu = IP_MAX_MTU - dev->hard_header_len - t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000366 ip_tunnel_add(itn, nt);
367 return nt;
Petr Machataf6cc9c02018-03-22 19:53:33 +0200368
369err_dev_set_mtu:
370 unregister_netdevice(dev);
371 return ERR_PTR(err);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000372}
373
374int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700375 const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
376 bool log_ecn_error)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000377{
Li RongQing8f849852014-01-04 13:57:59 +0800378 struct pcpu_sw_netstats *tstats;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000379 const struct iphdr *iph = ip_hdr(skb);
380 int err;
381
Pravin B Shelarc5441932013-03-25 14:49:35 +0000382#ifdef CONFIG_NET_IPGRE_BROADCAST
383 if (ipv4_is_multicast(iph->daddr)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000384 tunnel->dev->stats.multicast++;
385 skb->pkt_type = PACKET_BROADCAST;
386 }
387#endif
388
389 if ((!(tpi->flags&TUNNEL_CSUM) && (tunnel->parms.i_flags&TUNNEL_CSUM)) ||
390 ((tpi->flags&TUNNEL_CSUM) && !(tunnel->parms.i_flags&TUNNEL_CSUM))) {
391 tunnel->dev->stats.rx_crc_errors++;
392 tunnel->dev->stats.rx_errors++;
393 goto drop;
394 }
395
396 if (tunnel->parms.i_flags&TUNNEL_SEQ) {
397 if (!(tpi->flags&TUNNEL_SEQ) ||
398 (tunnel->i_seqno && (s32)(ntohl(tpi->seq) - tunnel->i_seqno) < 0)) {
399 tunnel->dev->stats.rx_fifo_errors++;
400 tunnel->dev->stats.rx_errors++;
401 goto drop;
402 }
403 tunnel->i_seqno = ntohl(tpi->seq) + 1;
404 }
405
Ying Caie96f2e72014-05-04 15:20:04 -0700406 skb_reset_network_header(skb);
407
Pravin B Shelarc5441932013-03-25 14:49:35 +0000408 err = IP_ECN_decapsulate(iph, skb);
409 if (unlikely(err)) {
410 if (log_ecn_error)
411 net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
412 &iph->saddr, iph->tos);
413 if (err > 1) {
414 ++tunnel->dev->stats.rx_frame_errors;
415 ++tunnel->dev->stats.rx_errors;
416 goto drop;
417 }
418 }
419
420 tstats = this_cpu_ptr(tunnel->dev->tstats);
421 u64_stats_update_begin(&tstats->syncp);
422 tstats->rx_packets++;
423 tstats->rx_bytes += skb->len;
424 u64_stats_update_end(&tstats->syncp);
425
Alexei Starovoitov81b9eab2013-11-12 14:39:13 -0800426 skb_scrub_packet(skb, !net_eq(tunnel->net, dev_net(tunnel->dev)));
427
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700428 if (tunnel->dev->type == ARPHRD_ETHER) {
429 skb->protocol = eth_type_trans(skb, tunnel->dev);
430 skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
431 } else {
432 skb->dev = tunnel->dev;
433 }
Nicolas Dichtel64261f22013-08-13 17:51:09 +0200434
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700435 if (tun_dst)
436 skb_dst_set(skb, (struct dst_entry *)tun_dst);
437
Pravin B Shelarc5441932013-03-25 14:49:35 +0000438 gro_cells_receive(&tunnel->gro_cells, skb);
439 return 0;
440
441drop:
Haishuang Yan469f87e2017-06-15 10:29:29 +0800442 if (tun_dst)
443 dst_release((struct dst_entry *)tun_dst);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000444 kfree_skb(skb);
445 return 0;
446}
447EXPORT_SYMBOL_GPL(ip_tunnel_rcv);
448
Tom Herberta8c5f902014-11-12 11:54:09 -0800449int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *ops,
450 unsigned int num)
451{
Thomas Grafbb1553c2014-12-16 21:05:20 +0100452 if (num >= MAX_IPTUN_ENCAP_OPS)
453 return -ERANGE;
454
Tom Herberta8c5f902014-11-12 11:54:09 -0800455 return !cmpxchg((const struct ip_tunnel_encap_ops **)
456 &iptun_encaps[num],
457 NULL, ops) ? 0 : -1;
458}
459EXPORT_SYMBOL(ip_tunnel_encap_add_ops);
460
461int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *ops,
462 unsigned int num)
463{
464 int ret;
465
Thomas Grafbb1553c2014-12-16 21:05:20 +0100466 if (num >= MAX_IPTUN_ENCAP_OPS)
467 return -ERANGE;
468
Tom Herberta8c5f902014-11-12 11:54:09 -0800469 ret = (cmpxchg((const struct ip_tunnel_encap_ops **)
470 &iptun_encaps[num],
471 ops, NULL) == ops) ? 0 : -1;
472
473 synchronize_net();
474
475 return ret;
476}
477EXPORT_SYMBOL(ip_tunnel_encap_del_ops);
478
Tom Herbert56328482014-09-17 12:25:58 -0700479int ip_tunnel_encap_setup(struct ip_tunnel *t,
480 struct ip_tunnel_encap *ipencap)
481{
482 int hlen;
483
484 memset(&t->encap, 0, sizeof(t->encap));
485
486 hlen = ip_encap_hlen(ipencap);
487 if (hlen < 0)
488 return hlen;
489
490 t->encap.type = ipencap->type;
491 t->encap.sport = ipencap->sport;
492 t->encap.dport = ipencap->dport;
493 t->encap.flags = ipencap->flags;
494
495 t->encap_hlen = hlen;
496 t->hlen = t->encap_hlen + t->tun_hlen;
497
498 return 0;
499}
500EXPORT_SYMBOL_GPL(ip_tunnel_encap_setup);
501
Pravin B Shelar23a36472013-07-02 10:57:33 -0700502static int tnl_update_pmtu(struct net_device *dev, struct sk_buff *skb,
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300503 struct rtable *rt, __be16 df,
wenxuc8b34e62019-01-22 18:39:50 +0800504 const struct iphdr *inner_iph,
505 int tunnel_hlen, __be32 dst, bool md)
Pravin B Shelar23a36472013-07-02 10:57:33 -0700506{
507 struct ip_tunnel *tunnel = netdev_priv(dev);
wenxuc8b34e62019-01-22 18:39:50 +0800508 int pkt_size;
Pravin B Shelar23a36472013-07-02 10:57:33 -0700509 int mtu;
510
wenxuc8b34e62019-01-22 18:39:50 +0800511 tunnel_hlen = md ? tunnel_hlen : tunnel->hlen;
512 pkt_size = skb->len - tunnel_hlen - dev->hard_header_len;
513
Pravin B Shelar23a36472013-07-02 10:57:33 -0700514 if (df)
515 mtu = dst_mtu(&rt->dst) - dev->hard_header_len
wenxuc8b34e62019-01-22 18:39:50 +0800516 - sizeof(struct iphdr) - tunnel_hlen;
Pravin B Shelar23a36472013-07-02 10:57:33 -0700517 else
518 mtu = skb_dst(skb) ? dst_mtu(skb_dst(skb)) : dev->mtu;
519
Nicolas Dichtelf15ca722018-01-25 19:03:03 +0100520 skb_dst_update_pmtu(skb, mtu);
Pravin B Shelar23a36472013-07-02 10:57:33 -0700521
522 if (skb->protocol == htons(ETH_P_IP)) {
523 if (!skb_is_gso(skb) &&
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300524 (inner_iph->frag_off & htons(IP_DF)) &&
525 mtu < pkt_size) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700526 memset(IPCB(skb), 0, sizeof(*IPCB(skb)));
527 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED, htonl(mtu));
528 return -E2BIG;
529 }
530 }
531#if IS_ENABLED(CONFIG_IPV6)
532 else if (skb->protocol == htons(ETH_P_IPV6)) {
533 struct rt6_info *rt6 = (struct rt6_info *)skb_dst(skb);
wenxuc8b34e62019-01-22 18:39:50 +0800534 __be32 daddr;
535
536 daddr = md ? dst : tunnel->parms.iph.daddr;
Pravin B Shelar23a36472013-07-02 10:57:33 -0700537
538 if (rt6 && mtu < dst_mtu(skb_dst(skb)) &&
539 mtu >= IPV6_MIN_MTU) {
wenxuc8b34e62019-01-22 18:39:50 +0800540 if ((daddr && !ipv4_is_multicast(daddr)) ||
Pravin B Shelar23a36472013-07-02 10:57:33 -0700541 rt6->rt6i_dst.plen == 128) {
542 rt6->rt6i_flags |= RTF_MODIFIED;
543 dst_metric_set(skb_dst(skb), RTAX_MTU, mtu);
544 }
545 }
546
547 if (!skb_is_gso(skb) && mtu >= IPV6_MIN_MTU &&
548 mtu < pkt_size) {
549 icmpv6_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu);
550 return -E2BIG;
551 }
552 }
553#endif
554 return 0;
555}
556
wenxuc8b34e62019-01-22 18:39:50 +0800557void ip_md_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
558 u8 proto, int tunnel_hlen)
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700559{
560 struct ip_tunnel *tunnel = netdev_priv(dev);
561 u32 headroom = sizeof(struct iphdr);
562 struct ip_tunnel_info *tun_info;
563 const struct ip_tunnel_key *key;
564 const struct iphdr *inner_iph;
wenxuf46fe4f2019-01-22 18:39:49 +0800565 struct rtable *rt = NULL;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700566 struct flowi4 fl4;
567 __be16 df = 0;
568 u8 tos, ttl;
wenxuf46fe4f2019-01-22 18:39:49 +0800569 bool use_cache;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700570
571 tun_info = skb_tunnel_info(skb);
572 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
573 ip_tunnel_info_af(tun_info) != AF_INET))
574 goto tx_error;
575 key = &tun_info->key;
576 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
577 inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
578 tos = key->tos;
579 if (tos == 1) {
580 if (skb->protocol == htons(ETH_P_IP))
581 tos = inner_iph->tos;
582 else if (skb->protocol == htons(ETH_P_IPV6))
583 tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
584 }
wenxu6e6b9042019-01-22 18:39:51 +0800585 ip_tunnel_init_flow(&fl4, proto, key->u.ipv4.dst, key->u.ipv4.src,
586 tunnel_id_to_key32(key->tun_id), RT_TOS(tos),
587 0, skb->mark);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700588 if (tunnel->encap.type != TUNNEL_ENCAP_NONE)
589 goto tx_error;
wenxuf46fe4f2019-01-22 18:39:49 +0800590
591 use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
592 if (use_cache)
593 rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl4.saddr);
594 if (!rt) {
595 rt = ip_route_output_key(tunnel->net, &fl4);
596 if (IS_ERR(rt)) {
597 dev->stats.tx_carrier_errors++;
598 goto tx_error;
599 }
600 if (use_cache)
601 dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
602 fl4.saddr);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700603 }
604 if (rt->dst.dev == dev) {
605 ip_rt_put(rt);
606 dev->stats.collisions++;
607 goto tx_error;
608 }
wenxuc8b34e62019-01-22 18:39:50 +0800609
610 if (key->tun_flags & TUNNEL_DONT_FRAGMENT)
611 df = htons(IP_DF);
612 if (tnl_update_pmtu(dev, skb, rt, df, inner_iph, tunnel_hlen,
613 key->u.ipv4.dst, true)) {
614 ip_rt_put(rt);
615 goto tx_error;
616 }
617
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700618 tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
619 ttl = key->ttl;
620 if (ttl == 0) {
621 if (skb->protocol == htons(ETH_P_IP))
622 ttl = inner_iph->ttl;
623 else if (skb->protocol == htons(ETH_P_IPV6))
624 ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
625 else
626 ttl = ip4_dst_hoplimit(&rt->dst);
627 }
wenxuc8b34e62019-01-22 18:39:50 +0800628
629 if (!df && skb->protocol == htons(ETH_P_IP))
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700630 df = inner_iph->frag_off & htons(IP_DF);
wenxuc8b34e62019-01-22 18:39:50 +0800631
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700632 headroom += LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len;
633 if (headroom > dev->needed_headroom)
634 dev->needed_headroom = headroom;
635
636 if (skb_cow_head(skb, dev->needed_headroom)) {
637 ip_rt_put(rt);
638 goto tx_dropped;
639 }
Haishuang Yan0f693f12017-09-07 14:08:34 +0800640 iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, proto, tos, ttl,
641 df, !net_eq(tunnel->net, dev_net(dev)));
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700642 return;
643tx_error:
644 dev->stats.tx_errors++;
645 goto kfree;
646tx_dropped:
647 dev->stats.tx_dropped++;
648kfree:
649 kfree_skb(skb);
650}
651EXPORT_SYMBOL_GPL(ip_md_tunnel_xmit);
652
Pravin B Shelarc5441932013-03-25 14:49:35 +0000653void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
Tom Herbert56328482014-09-17 12:25:58 -0700654 const struct iphdr *tnl_params, u8 protocol)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000655{
656 struct ip_tunnel *tunnel = netdev_priv(dev);
657 const struct iphdr *inner_iph;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000658 struct flowi4 fl4;
659 u8 tos, ttl;
660 __be16 df;
Eric Dumazetb045d372014-02-03 12:52:14 -0800661 struct rtable *rt; /* Route to the other host */
Pravin B Shelarc5441932013-03-25 14:49:35 +0000662 unsigned int max_headroom; /* The extra header space needed */
663 __be32 dst;
Timo Teräs22fb22e2014-05-16 08:34:39 +0300664 bool connected;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000665
666 inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
Timo Teräs22fb22e2014-05-16 08:34:39 +0300667 connected = (tunnel->parms.iph.daddr != 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000668
Bernie Harris5146d1f2016-02-22 12:58:05 +1300669 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
670
Pravin B Shelarc5441932013-03-25 14:49:35 +0000671 dst = tnl_params->daddr;
672 if (dst == 0) {
673 /* NBMA tunnel */
wenxud71b57532019-01-19 13:11:25 +0800674 struct ip_tunnel_info *tun_info;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000675
Ian Morris51456b22015-04-03 09:17:26 +0100676 if (!skb_dst(skb)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000677 dev->stats.tx_fifo_errors++;
678 goto tx_error;
679 }
680
wenxud71b57532019-01-19 13:11:25 +0800681 tun_info = skb_tunnel_info(skb);
682 if (tun_info && (tun_info->mode & IP_TUNNEL_INFO_TX) &&
683 ip_tunnel_info_af(tun_info) == AF_INET &&
684 tun_info->key.u.ipv4.dst)
685 dst = tun_info->key.u.ipv4.dst;
686 else if (skb->protocol == htons(ETH_P_IP)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000687 rt = skb_rtable(skb);
688 dst = rt_nexthop(rt, inner_iph->daddr);
689 }
690#if IS_ENABLED(CONFIG_IPV6)
691 else if (skb->protocol == htons(ETH_P_IPV6)) {
692 const struct in6_addr *addr6;
693 struct neighbour *neigh;
694 bool do_tx_error_icmp;
695 int addr_type;
696
697 neigh = dst_neigh_lookup(skb_dst(skb),
698 &ipv6_hdr(skb)->daddr);
Ian Morris51456b22015-04-03 09:17:26 +0100699 if (!neigh)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000700 goto tx_error;
701
702 addr6 = (const struct in6_addr *)&neigh->primary_key;
703 addr_type = ipv6_addr_type(addr6);
704
705 if (addr_type == IPV6_ADDR_ANY) {
706 addr6 = &ipv6_hdr(skb)->daddr;
707 addr_type = ipv6_addr_type(addr6);
708 }
709
710 if ((addr_type & IPV6_ADDR_COMPATv4) == 0)
711 do_tx_error_icmp = true;
712 else {
713 do_tx_error_icmp = false;
714 dst = addr6->s6_addr32[3];
715 }
716 neigh_release(neigh);
717 if (do_tx_error_icmp)
718 goto tx_error_icmp;
719 }
720#endif
721 else
722 goto tx_error;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800723
724 connected = false;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000725 }
726
727 tos = tnl_params->tos;
728 if (tos & 0x1) {
729 tos &= ~0x1;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800730 if (skb->protocol == htons(ETH_P_IP)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000731 tos = inner_iph->tos;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800732 connected = false;
733 } else if (skb->protocol == htons(ETH_P_IPV6)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000734 tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800735 connected = false;
736 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000737 }
738
David S. Miller0f3e9c92018-03-06 00:53:44 -0500739 ip_tunnel_init_flow(&fl4, protocol, dst, tnl_params->saddr,
740 tunnel->parms.o_key, RT_TOS(tos), tunnel->parms.link,
741 tunnel->fwmark);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800742
Tom Herbert56328482014-09-17 12:25:58 -0700743 if (ip_tunnel_encap(skb, tunnel, &protocol, &fl4) < 0)
744 goto tx_error;
745
Paolo Abenie09acdd2016-02-12 15:43:55 +0100746 rt = connected ? dst_cache_get_ip4(&tunnel->dst_cache, &fl4.saddr) :
747 NULL;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800748
749 if (!rt) {
750 rt = ip_route_output_key(tunnel->net, &fl4);
751
752 if (IS_ERR(rt)) {
753 dev->stats.tx_carrier_errors++;
754 goto tx_error;
755 }
756 if (connected)
Paolo Abenie09acdd2016-02-12 15:43:55 +0100757 dst_cache_set_ip4(&tunnel->dst_cache, &rt->dst,
758 fl4.saddr);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000759 }
Tom Herbert7d442fa2014-01-02 11:48:26 -0800760
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700761 if (rt->dst.dev == dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000762 ip_rt_put(rt);
763 dev->stats.collisions++;
764 goto tx_error;
765 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000766
wenxuc8b34e62019-01-22 18:39:50 +0800767 if (tnl_update_pmtu(dev, skb, rt, tnl_params->frag_off, inner_iph,
768 0, 0, false)) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700769 ip_rt_put(rt);
770 goto tx_error;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000771 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000772
773 if (tunnel->err_count > 0) {
774 if (time_before(jiffies,
775 tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
776 tunnel->err_count--;
777
778 dst_link_failure(skb);
779 } else
780 tunnel->err_count = 0;
781 }
782
Pravin B Shelard4a71b12013-09-25 09:57:47 -0700783 tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000784 ttl = tnl_params->ttl;
785 if (ttl == 0) {
786 if (skb->protocol == htons(ETH_P_IP))
787 ttl = inner_iph->ttl;
788#if IS_ENABLED(CONFIG_IPV6)
789 else if (skb->protocol == htons(ETH_P_IPV6))
790 ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
791#endif
792 else
793 ttl = ip4_dst_hoplimit(&rt->dst);
794 }
795
Pravin B Shelar23a36472013-07-02 10:57:33 -0700796 df = tnl_params->frag_off;
Philip Prindeville22a59be2016-06-14 15:53:02 -0600797 if (skb->protocol == htons(ETH_P_IP) && !tunnel->ignore_df)
Pravin B Shelar23a36472013-07-02 10:57:33 -0700798 df |= (inner_iph->frag_off&htons(IP_DF));
799
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700800 max_headroom = LL_RESERVED_SPACE(rt->dst.dev) + sizeof(struct iphdr)
Tom Herbert7371e022014-10-03 15:48:07 -0700801 + rt->dst.header_len + ip_encap_hlen(&tunnel->encap);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200802 if (max_headroom > dev->needed_headroom)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000803 dev->needed_headroom = max_headroom;
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200804
805 if (skb_cow_head(skb, dev->needed_headroom)) {
Dmitry Popov586d5fc2014-06-06 04:34:37 +0400806 ip_rt_put(rt);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200807 dev->stats.tx_dropped++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800808 kfree_skb(skb);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200809 return;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000810 }
811
Pravin B Shelar039f5062015-12-24 14:34:54 -0800812 iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, protocol, tos, ttl,
813 df, !net_eq(tunnel->net, dev_net(dev)));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000814 return;
815
816#if IS_ENABLED(CONFIG_IPV6)
817tx_error_icmp:
818 dst_link_failure(skb);
819#endif
820tx_error:
821 dev->stats.tx_errors++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800822 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000823}
824EXPORT_SYMBOL_GPL(ip_tunnel_xmit);
825
826static void ip_tunnel_update(struct ip_tunnel_net *itn,
827 struct ip_tunnel *t,
828 struct net_device *dev,
829 struct ip_tunnel_parm *p,
Craig Gallek9830ad42017-04-19 12:30:54 -0400830 bool set_mtu,
831 __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000832{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700833 ip_tunnel_del(itn, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000834 t->parms.iph.saddr = p->iph.saddr;
835 t->parms.iph.daddr = p->iph.daddr;
836 t->parms.i_key = p->i_key;
837 t->parms.o_key = p->o_key;
838 if (dev->type != ARPHRD_ETHER) {
839 memcpy(dev->dev_addr, &p->iph.saddr, 4);
840 memcpy(dev->broadcast, &p->iph.daddr, 4);
841 }
842 ip_tunnel_add(itn, t);
843
844 t->parms.iph.ttl = p->iph.ttl;
845 t->parms.iph.tos = p->iph.tos;
846 t->parms.iph.frag_off = p->iph.frag_off;
847
Craig Gallek9830ad42017-04-19 12:30:54 -0400848 if (t->parms.link != p->link || t->fwmark != fwmark) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000849 int mtu;
850
851 t->parms.link = p->link;
Craig Gallek9830ad42017-04-19 12:30:54 -0400852 t->fwmark = fwmark;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000853 mtu = ip_tunnel_bind_dev(dev);
854 if (set_mtu)
855 dev->mtu = mtu;
856 }
Paolo Abenie09acdd2016-02-12 15:43:55 +0100857 dst_cache_reset(&t->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000858 netdev_state_change(dev);
859}
860
861int ip_tunnel_ioctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd)
862{
863 int err = 0;
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200864 struct ip_tunnel *t = netdev_priv(dev);
865 struct net *net = t->net;
866 struct ip_tunnel_net *itn = net_generic(net, t->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000867
Pravin B Shelarc5441932013-03-25 14:49:35 +0000868 switch (cmd) {
869 case SIOCGETTUNNEL:
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200870 if (dev == itn->fb_tunnel_dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000871 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100872 if (!t)
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200873 t = netdev_priv(dev);
874 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000875 memcpy(p, &t->parms, sizeof(*p));
876 break;
877
878 case SIOCADDTUNNEL:
879 case SIOCCHGTUNNEL:
880 err = -EPERM;
881 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
882 goto done;
883 if (p->iph.ttl)
884 p->iph.frag_off |= htons(IP_DF);
Dmitry Popov7c8e6b92014-06-08 02:06:25 +0400885 if (!(p->i_flags & VTI_ISVTI)) {
886 if (!(p->i_flags & TUNNEL_KEY))
887 p->i_key = 0;
888 if (!(p->o_flags & TUNNEL_KEY))
889 p->o_key = 0;
890 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000891
Eric Dumazet79134e62018-03-08 12:51:41 -0800892 t = ip_tunnel_find(itn, p, itn->type);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000893
Steffen Klassertd61746b2014-09-22 09:11:08 +0200894 if (cmd == SIOCADDTUNNEL) {
895 if (!t) {
896 t = ip_tunnel_create(net, itn, p);
897 err = PTR_ERR_OR_ZERO(t);
898 break;
899 }
900
901 err = -EEXIST;
Duan Jiongee30ef4d2014-05-15 13:07:02 +0800902 break;
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100903 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000904 if (dev != itn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
Ian Morris00db4122015-04-03 09:17:27 +0100905 if (t) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000906 if (t->dev != dev) {
907 err = -EEXIST;
908 break;
909 }
910 } else {
911 unsigned int nflags = 0;
912
913 if (ipv4_is_multicast(p->iph.daddr))
914 nflags = IFF_BROADCAST;
915 else if (p->iph.daddr)
916 nflags = IFF_POINTOPOINT;
917
918 if ((dev->flags^nflags)&(IFF_POINTOPOINT|IFF_BROADCAST)) {
919 err = -EINVAL;
920 break;
921 }
922
923 t = netdev_priv(dev);
924 }
925 }
926
927 if (t) {
928 err = 0;
Craig Gallek9830ad42017-04-19 12:30:54 -0400929 ip_tunnel_update(itn, t, dev, p, true, 0);
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100930 } else {
931 err = -ENOENT;
932 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000933 break;
934
935 case SIOCDELTUNNEL:
936 err = -EPERM;
937 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
938 goto done;
939
940 if (dev == itn->fb_tunnel_dev) {
941 err = -ENOENT;
942 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100943 if (!t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000944 goto done;
945 err = -EPERM;
946 if (t == netdev_priv(itn->fb_tunnel_dev))
947 goto done;
948 dev = t->dev;
949 }
950 unregister_netdevice(dev);
951 err = 0;
952 break;
953
954 default:
955 err = -EINVAL;
956 }
957
958done:
959 return err;
960}
961EXPORT_SYMBOL_GPL(ip_tunnel_ioctl);
962
David Wragg7e059152016-02-10 00:05:58 +0000963int __ip_tunnel_change_mtu(struct net_device *dev, int new_mtu, bool strict)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000964{
965 struct ip_tunnel *tunnel = netdev_priv(dev);
966 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
Nicolas Dichtel82612de2018-05-31 10:59:32 +0200967 int max_mtu = IP_MAX_MTU - dev->hard_header_len - t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000968
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400969 if (new_mtu < ETH_MIN_MTU)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000970 return -EINVAL;
David Wragg7e059152016-02-10 00:05:58 +0000971
972 if (new_mtu > max_mtu) {
973 if (strict)
974 return -EINVAL;
975
976 new_mtu = max_mtu;
977 }
978
Pravin B Shelarc5441932013-03-25 14:49:35 +0000979 dev->mtu = new_mtu;
980 return 0;
981}
David Wragg7e059152016-02-10 00:05:58 +0000982EXPORT_SYMBOL_GPL(__ip_tunnel_change_mtu);
983
984int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
985{
986 return __ip_tunnel_change_mtu(dev, new_mtu, true);
987}
Pravin B Shelarc5441932013-03-25 14:49:35 +0000988EXPORT_SYMBOL_GPL(ip_tunnel_change_mtu);
989
990static void ip_tunnel_dev_free(struct net_device *dev)
991{
992 struct ip_tunnel *tunnel = netdev_priv(dev);
993
994 gro_cells_destroy(&tunnel->gro_cells);
Paolo Abenie09acdd2016-02-12 15:43:55 +0100995 dst_cache_destroy(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000996 free_percpu(dev->tstats);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000997}
998
999void ip_tunnel_dellink(struct net_device *dev, struct list_head *head)
1000{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001001 struct ip_tunnel *tunnel = netdev_priv(dev);
1002 struct ip_tunnel_net *itn;
1003
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001004 itn = net_generic(tunnel->net, tunnel->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001005
1006 if (itn->fb_tunnel_dev != dev) {
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001007 ip_tunnel_del(itn, netdev_priv(dev));
Pravin B Shelarc5441932013-03-25 14:49:35 +00001008 unregister_netdevice_queue(dev, head);
1009 }
1010}
1011EXPORT_SYMBOL_GPL(ip_tunnel_dellink);
1012
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001013struct net *ip_tunnel_get_link_net(const struct net_device *dev)
1014{
1015 struct ip_tunnel *tunnel = netdev_priv(dev);
1016
1017 return tunnel->net;
1018}
1019EXPORT_SYMBOL(ip_tunnel_get_link_net);
1020
Nicolas Dichtel1e995842015-04-02 17:07:02 +02001021int ip_tunnel_get_iflink(const struct net_device *dev)
1022{
1023 struct ip_tunnel *tunnel = netdev_priv(dev);
1024
1025 return tunnel->parms.link;
1026}
1027EXPORT_SYMBOL(ip_tunnel_get_iflink);
1028
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +03001029int ip_tunnel_init_net(struct net *net, unsigned int ip_tnl_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001030 struct rtnl_link_ops *ops, char *devname)
1031{
1032 struct ip_tunnel_net *itn = net_generic(net, ip_tnl_net_id);
1033 struct ip_tunnel_parm parms;
stephen hemminger6261d982013-08-05 22:51:37 -07001034 unsigned int i;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001035
Eric Dumazet79134e62018-03-08 12:51:41 -08001036 itn->rtnl_link_ops = ops;
stephen hemminger6261d982013-08-05 22:51:37 -07001037 for (i = 0; i < IP_TNL_HASH_SIZE; i++)
1038 INIT_HLIST_HEAD(&itn->tunnels[i]);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001039
Eric Dumazet79134e62018-03-08 12:51:41 -08001040 if (!ops || !net_has_fallback_tunnels(net)) {
1041 struct ip_tunnel_net *it_init_net;
1042
1043 it_init_net = net_generic(&init_net, ip_tnl_net_id);
1044 itn->type = it_init_net->type;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001045 itn->fb_tunnel_dev = NULL;
1046 return 0;
1047 }
stephen hemminger6261d982013-08-05 22:51:37 -07001048
Pravin B Shelarc5441932013-03-25 14:49:35 +00001049 memset(&parms, 0, sizeof(parms));
1050 if (devname)
1051 strlcpy(parms.name, devname, IFNAMSIZ);
1052
1053 rtnl_lock();
1054 itn->fb_tunnel_dev = __ip_tunnel_create(net, ops, &parms);
Dan Carpenterea857f22013-08-19 10:05:10 +03001055 /* FB netdevice is special: we have one, and only one per netns.
1056 * Allowing to move it to another netns is clearly unsafe.
1057 */
Steffen Klassert67013282013-10-01 11:34:48 +02001058 if (!IS_ERR(itn->fb_tunnel_dev)) {
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001059 itn->fb_tunnel_dev->features |= NETIF_F_NETNS_LOCAL;
Steffen Klassert78ff4be2014-05-19 11:36:56 +02001060 itn->fb_tunnel_dev->mtu = ip_tunnel_bind_dev(itn->fb_tunnel_dev);
Steffen Klassert67013282013-10-01 11:34:48 +02001061 ip_tunnel_add(itn, netdev_priv(itn->fb_tunnel_dev));
Eric Dumazet79134e62018-03-08 12:51:41 -08001062 itn->type = itn->fb_tunnel_dev->type;
Steffen Klassert67013282013-10-01 11:34:48 +02001063 }
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001064 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001065
Sachin Kamat27d79f32014-01-27 12:13:57 +05301066 return PTR_ERR_OR_ZERO(itn->fb_tunnel_dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001067}
1068EXPORT_SYMBOL_GPL(ip_tunnel_init_net);
1069
Eric Dumazet79134e62018-03-08 12:51:41 -08001070static void ip_tunnel_destroy(struct net *net, struct ip_tunnel_net *itn,
1071 struct list_head *head,
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001072 struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001073{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001074 struct net_device *dev, *aux;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001075 int h;
1076
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001077 for_each_netdev_safe(net, dev, aux)
1078 if (dev->rtnl_link_ops == ops)
1079 unregister_netdevice_queue(dev, head);
1080
Pravin B Shelarc5441932013-03-25 14:49:35 +00001081 for (h = 0; h < IP_TNL_HASH_SIZE; h++) {
1082 struct ip_tunnel *t;
1083 struct hlist_node *n;
1084 struct hlist_head *thead = &itn->tunnels[h];
1085
1086 hlist_for_each_entry_safe(t, n, thead, hash_node)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001087 /* If dev is in the same netns, it has already
1088 * been added to the list by the previous loop.
1089 */
1090 if (!net_eq(dev_net(t->dev), net))
1091 unregister_netdevice_queue(t->dev, head);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001092 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001093}
1094
Eric Dumazet64bc1782017-09-19 16:27:09 -07001095void ip_tunnel_delete_nets(struct list_head *net_list, unsigned int id,
1096 struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001097{
Eric Dumazet64bc1782017-09-19 16:27:09 -07001098 struct ip_tunnel_net *itn;
1099 struct net *net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001100 LIST_HEAD(list);
1101
1102 rtnl_lock();
Eric Dumazet64bc1782017-09-19 16:27:09 -07001103 list_for_each_entry(net, net_list, exit_list) {
1104 itn = net_generic(net, id);
Eric Dumazet79134e62018-03-08 12:51:41 -08001105 ip_tunnel_destroy(net, itn, &list, ops);
Eric Dumazet64bc1782017-09-19 16:27:09 -07001106 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001107 unregister_netdevice_many(&list);
1108 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001109}
Eric Dumazet64bc1782017-09-19 16:27:09 -07001110EXPORT_SYMBOL_GPL(ip_tunnel_delete_nets);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001111
1112int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
Craig Gallek9830ad42017-04-19 12:30:54 -04001113 struct ip_tunnel_parm *p, __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001114{
1115 struct ip_tunnel *nt;
1116 struct net *net = dev_net(dev);
1117 struct ip_tunnel_net *itn;
1118 int mtu;
1119 int err;
1120
1121 nt = netdev_priv(dev);
1122 itn = net_generic(net, nt->ip_tnl_net_id);
1123
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001124 if (nt->collect_md) {
1125 if (rtnl_dereference(itn->collect_md_tun))
1126 return -EEXIST;
1127 } else {
1128 if (ip_tunnel_find(itn, p, dev->type))
1129 return -EEXIST;
1130 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001131
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +02001132 nt->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001133 nt->parms = *p;
Craig Gallek9830ad42017-04-19 12:30:54 -04001134 nt->fwmark = fwmark;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001135 err = register_netdevice(dev);
1136 if (err)
Petr Machataf6cc9c02018-03-22 19:53:33 +02001137 goto err_register_netdevice;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001138
1139 if (dev->type == ARPHRD_ETHER && !tb[IFLA_ADDRESS])
1140 eth_hw_addr_random(dev);
1141
1142 mtu = ip_tunnel_bind_dev(dev);
Stefano Brivio24fc7972018-03-15 17:16:28 +01001143 if (tb[IFLA_MTU]) {
Nicolas Dichtel82612de2018-05-31 10:59:32 +02001144 unsigned int max = IP_MAX_MTU - dev->hard_header_len - nt->hlen;
Stefano Brivio24fc7972018-03-15 17:16:28 +01001145
David S. Miller5568cdc2018-03-29 11:42:14 -04001146 mtu = clamp(dev->mtu, (unsigned int)ETH_MIN_MTU,
1147 (unsigned int)(max - sizeof(struct iphdr)));
Petr Machataf6cc9c02018-03-22 19:53:33 +02001148 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001149
David S. Miller5568cdc2018-03-29 11:42:14 -04001150 err = dev_set_mtu(dev, mtu);
1151 if (err)
1152 goto err_dev_set_mtu;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001153
1154 ip_tunnel_add(itn, nt);
Petr Machataf6cc9c02018-03-22 19:53:33 +02001155 return 0;
1156
1157err_dev_set_mtu:
1158 unregister_netdevice(dev);
1159err_register_netdevice:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001160 return err;
1161}
1162EXPORT_SYMBOL_GPL(ip_tunnel_newlink);
1163
1164int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
Craig Gallek9830ad42017-04-19 12:30:54 -04001165 struct ip_tunnel_parm *p, __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001166{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001167 struct ip_tunnel *t;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001168 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001169 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001170 struct ip_tunnel_net *itn = net_generic(net, tunnel->ip_tnl_net_id);
1171
1172 if (dev == itn->fb_tunnel_dev)
1173 return -EINVAL;
1174
Pravin B Shelarc5441932013-03-25 14:49:35 +00001175 t = ip_tunnel_find(itn, p, dev->type);
1176
1177 if (t) {
1178 if (t->dev != dev)
1179 return -EEXIST;
1180 } else {
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001181 t = tunnel;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001182
1183 if (dev->type != ARPHRD_ETHER) {
1184 unsigned int nflags = 0;
1185
1186 if (ipv4_is_multicast(p->iph.daddr))
1187 nflags = IFF_BROADCAST;
1188 else if (p->iph.daddr)
1189 nflags = IFF_POINTOPOINT;
1190
1191 if ((dev->flags ^ nflags) &
1192 (IFF_POINTOPOINT | IFF_BROADCAST))
1193 return -EINVAL;
1194 }
1195 }
1196
Craig Gallek9830ad42017-04-19 12:30:54 -04001197 ip_tunnel_update(itn, t, dev, p, !tb[IFLA_MTU], fwmark);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001198 return 0;
1199}
1200EXPORT_SYMBOL_GPL(ip_tunnel_changelink);
1201
1202int ip_tunnel_init(struct net_device *dev)
1203{
1204 struct ip_tunnel *tunnel = netdev_priv(dev);
1205 struct iphdr *iph = &tunnel->parms.iph;
WANG Cong1c213bd2014-02-13 11:46:28 -08001206 int err;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001207
David S. Millercf124db2017-05-08 12:52:56 -04001208 dev->needs_free_netdev = true;
1209 dev->priv_destructor = ip_tunnel_dev_free;
WANG Cong1c213bd2014-02-13 11:46:28 -08001210 dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001211 if (!dev->tstats)
1212 return -ENOMEM;
1213
Paolo Abenie09acdd2016-02-12 15:43:55 +01001214 err = dst_cache_init(&tunnel->dst_cache, GFP_KERNEL);
1215 if (err) {
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001216 free_percpu(dev->tstats);
Paolo Abenie09acdd2016-02-12 15:43:55 +01001217 return err;
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001218 }
1219
Pravin B Shelarc5441932013-03-25 14:49:35 +00001220 err = gro_cells_init(&tunnel->gro_cells, dev);
1221 if (err) {
Paolo Abenie09acdd2016-02-12 15:43:55 +01001222 dst_cache_destroy(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001223 free_percpu(dev->tstats);
1224 return err;
1225 }
1226
1227 tunnel->dev = dev;
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001228 tunnel->net = dev_net(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001229 strcpy(tunnel->parms.name, dev->name);
1230 iph->version = 4;
1231 iph->ihl = 5;
1232
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001233 if (tunnel->collect_md) {
1234 dev->features |= NETIF_F_NETNS_LOCAL;
1235 netif_keep_dst(dev);
1236 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001237 return 0;
1238}
1239EXPORT_SYMBOL_GPL(ip_tunnel_init);
1240
1241void ip_tunnel_uninit(struct net_device *dev)
1242{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001243 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001244 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001245 struct ip_tunnel_net *itn;
1246
1247 itn = net_generic(net, tunnel->ip_tnl_net_id);
1248 /* fb_tunnel_dev will be unregisted in net-exit call. */
1249 if (itn->fb_tunnel_dev != dev)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001250 ip_tunnel_del(itn, netdev_priv(dev));
Tom Herbert7d442fa2014-01-02 11:48:26 -08001251
Paolo Abenie09acdd2016-02-12 15:43:55 +01001252 dst_cache_reset(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001253}
1254EXPORT_SYMBOL_GPL(ip_tunnel_uninit);
1255
1256/* Do least required initialization, rest of init is done in tunnel_init call */
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +03001257void ip_tunnel_setup(struct net_device *dev, unsigned int net_id)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001258{
1259 struct ip_tunnel *tunnel = netdev_priv(dev);
1260 tunnel->ip_tnl_net_id = net_id;
1261}
1262EXPORT_SYMBOL_GPL(ip_tunnel_setup);
1263
1264MODULE_LICENSE("GPL");