blob: b2117d89bc83aa92bb18390ebc2edb1da69da042 [file] [log] [blame]
Pravin B Shelarc5441932013-03-25 14:49:35 +00001/*
2 * Copyright (c) 2013 Nicira, Inc.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of version 2 of the GNU General Public
6 * License as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
16 * 02110-1301, USA
17 */
18
19#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
20
21#include <linux/capability.h>
22#include <linux/module.h>
23#include <linux/types.h>
24#include <linux/kernel.h>
25#include <linux/slab.h>
26#include <linux/uaccess.h>
27#include <linux/skbuff.h>
28#include <linux/netdevice.h>
29#include <linux/in.h>
30#include <linux/tcp.h>
31#include <linux/udp.h>
32#include <linux/if_arp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000033#include <linux/init.h>
34#include <linux/in6.h>
35#include <linux/inetdevice.h>
36#include <linux/igmp.h>
37#include <linux/netfilter_ipv4.h>
38#include <linux/etherdevice.h>
39#include <linux/if_ether.h>
40#include <linux/if_vlan.h>
41#include <linux/rculist.h>
Sachin Kamat27d79f32014-01-27 12:13:57 +053042#include <linux/err.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000043
44#include <net/sock.h>
45#include <net/ip.h>
46#include <net/icmp.h>
47#include <net/protocol.h>
48#include <net/ip_tunnels.h>
49#include <net/arp.h>
50#include <net/checksum.h>
51#include <net/dsfield.h>
52#include <net/inet_ecn.h>
53#include <net/xfrm.h>
54#include <net/net_namespace.h>
55#include <net/netns/generic.h>
56#include <net/rtnetlink.h>
Tom Herbert56328482014-09-17 12:25:58 -070057#include <net/udp.h>
Alexei Starovoitovcfc73812016-09-15 13:00:29 -070058#include <net/dst_metadata.h>
Tom Herbert63487ba2014-11-04 09:06:51 -080059
Pravin B Shelarc5441932013-03-25 14:49:35 +000060#if IS_ENABLED(CONFIG_IPV6)
61#include <net/ipv6.h>
62#include <net/ip6_fib.h>
63#include <net/ip6_route.h>
64#endif
65
Duan Jiong967680e2014-01-19 16:43:42 +080066static unsigned int ip_tunnel_hash(__be32 key, __be32 remote)
Pravin B Shelarc5441932013-03-25 14:49:35 +000067{
68 return hash_32((__force u32)key ^ (__force u32)remote,
69 IP_TNL_HASH_BITS);
70}
71
Pravin B Shelarc5441932013-03-25 14:49:35 +000072static bool ip_tunnel_key_match(const struct ip_tunnel_parm *p,
73 __be16 flags, __be32 key)
74{
75 if (p->i_flags & TUNNEL_KEY) {
76 if (flags & TUNNEL_KEY)
77 return key == p->i_key;
78 else
79 /* key expected, none present */
80 return false;
81 } else
82 return !(flags & TUNNEL_KEY);
83}
84
85/* Fallback tunnel: no source, no destination, no key, no options
86
87 Tunnel hash table:
88 We require exact key match i.e. if a key is present in packet
89 it will match only tunnel with the same key; if it is not present,
90 it will match only keyless tunnel.
91
92 All keysless packets, if not matched configured keyless tunnels
93 will match fallback tunnel.
94 Given src, dst and key, find appropriate for input tunnel.
95*/
96struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
97 int link, __be16 flags,
98 __be32 remote, __be32 local,
99 __be32 key)
100{
101 unsigned int hash;
102 struct ip_tunnel *t, *cand = NULL;
103 struct hlist_head *head;
104
Duan Jiong967680e2014-01-19 16:43:42 +0800105 hash = ip_tunnel_hash(key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000106 head = &itn->tunnels[hash];
107
108 hlist_for_each_entry_rcu(t, head, hash_node) {
109 if (local != t->parms.iph.saddr ||
110 remote != t->parms.iph.daddr ||
111 !(t->dev->flags & IFF_UP))
112 continue;
113
114 if (!ip_tunnel_key_match(&t->parms, flags, key))
115 continue;
116
117 if (t->parms.link == link)
118 return t;
119 else
120 cand = t;
121 }
122
123 hlist_for_each_entry_rcu(t, head, hash_node) {
124 if (remote != t->parms.iph.daddr ||
Dmitry Popove0056592014-07-05 02:26:37 +0400125 t->parms.iph.saddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000126 !(t->dev->flags & IFF_UP))
127 continue;
128
129 if (!ip_tunnel_key_match(&t->parms, flags, key))
130 continue;
131
132 if (t->parms.link == link)
133 return t;
134 else if (!cand)
135 cand = t;
136 }
137
Duan Jiong967680e2014-01-19 16:43:42 +0800138 hash = ip_tunnel_hash(key, 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000139 head = &itn->tunnels[hash];
140
141 hlist_for_each_entry_rcu(t, head, hash_node) {
Dmitry Popove0056592014-07-05 02:26:37 +0400142 if ((local != t->parms.iph.saddr || t->parms.iph.daddr != 0) &&
143 (local != t->parms.iph.daddr || !ipv4_is_multicast(local)))
144 continue;
145
146 if (!(t->dev->flags & IFF_UP))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000147 continue;
148
149 if (!ip_tunnel_key_match(&t->parms, flags, key))
150 continue;
151
152 if (t->parms.link == link)
153 return t;
154 else if (!cand)
155 cand = t;
156 }
157
158 if (flags & TUNNEL_NO_KEY)
159 goto skip_key_lookup;
160
161 hlist_for_each_entry_rcu(t, head, hash_node) {
162 if (t->parms.i_key != key ||
Dmitry Popove0056592014-07-05 02:26:37 +0400163 t->parms.iph.saddr != 0 ||
164 t->parms.iph.daddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000165 !(t->dev->flags & IFF_UP))
166 continue;
167
168 if (t->parms.link == link)
169 return t;
170 else if (!cand)
171 cand = t;
172 }
173
174skip_key_lookup:
175 if (cand)
176 return cand;
177
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700178 t = rcu_dereference(itn->collect_md_tun);
Haishuang Yan833a8b42017-09-12 17:47:56 +0800179 if (t && t->dev->flags & IFF_UP)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700180 return t;
181
Pravin B Shelarc5441932013-03-25 14:49:35 +0000182 if (itn->fb_tunnel_dev && itn->fb_tunnel_dev->flags & IFF_UP)
183 return netdev_priv(itn->fb_tunnel_dev);
184
Pravin B Shelarc5441932013-03-25 14:49:35 +0000185 return NULL;
186}
187EXPORT_SYMBOL_GPL(ip_tunnel_lookup);
188
189static struct hlist_head *ip_bucket(struct ip_tunnel_net *itn,
190 struct ip_tunnel_parm *parms)
191{
192 unsigned int h;
193 __be32 remote;
Steffen Klassert6d608f02014-02-21 08:41:09 +0100194 __be32 i_key = parms->i_key;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000195
196 if (parms->iph.daddr && !ipv4_is_multicast(parms->iph.daddr))
197 remote = parms->iph.daddr;
198 else
199 remote = 0;
200
Steffen Klassert6d608f02014-02-21 08:41:09 +0100201 if (!(parms->i_flags & TUNNEL_KEY) && (parms->i_flags & VTI_ISVTI))
202 i_key = 0;
203
204 h = ip_tunnel_hash(i_key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000205 return &itn->tunnels[h];
206}
207
208static void ip_tunnel_add(struct ip_tunnel_net *itn, struct ip_tunnel *t)
209{
210 struct hlist_head *head = ip_bucket(itn, &t->parms);
211
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700212 if (t->collect_md)
213 rcu_assign_pointer(itn->collect_md_tun, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000214 hlist_add_head_rcu(&t->hash_node, head);
215}
216
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700217static void ip_tunnel_del(struct ip_tunnel_net *itn, struct ip_tunnel *t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000218{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700219 if (t->collect_md)
220 rcu_assign_pointer(itn->collect_md_tun, NULL);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000221 hlist_del_init_rcu(&t->hash_node);
222}
223
224static struct ip_tunnel *ip_tunnel_find(struct ip_tunnel_net *itn,
225 struct ip_tunnel_parm *parms,
226 int type)
227{
228 __be32 remote = parms->iph.daddr;
229 __be32 local = parms->iph.saddr;
230 __be32 key = parms->i_key;
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400231 __be16 flags = parms->i_flags;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000232 int link = parms->link;
233 struct ip_tunnel *t = NULL;
234 struct hlist_head *head = ip_bucket(itn, parms);
235
236 hlist_for_each_entry_rcu(t, head, hash_node) {
237 if (local == t->parms.iph.saddr &&
238 remote == t->parms.iph.daddr &&
Pravin B Shelarc5441932013-03-25 14:49:35 +0000239 link == t->parms.link &&
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400240 type == t->dev->type &&
241 ip_tunnel_key_match(&t->parms, flags, key))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000242 break;
243 }
244 return t;
245}
246
247static struct net_device *__ip_tunnel_create(struct net *net,
248 const struct rtnl_link_ops *ops,
249 struct ip_tunnel_parm *parms)
250{
251 int err;
252 struct ip_tunnel *tunnel;
253 struct net_device *dev;
254 char name[IFNAMSIZ];
255
256 if (parms->name[0])
257 strlcpy(name, parms->name, IFNAMSIZ);
258 else {
Pravin B Shelar54a5d382013-03-28 08:21:46 +0000259 if (strlen(ops->kind) > (IFNAMSIZ - 3)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000260 err = -E2BIG;
261 goto failed;
262 }
263 strlcpy(name, ops->kind, IFNAMSIZ);
264 strncat(name, "%d", 2);
265 }
266
267 ASSERT_RTNL();
Tom Gundersenc835a672014-07-14 16:37:24 +0200268 dev = alloc_netdev(ops->priv_size, name, NET_NAME_UNKNOWN, ops->setup);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000269 if (!dev) {
270 err = -ENOMEM;
271 goto failed;
272 }
273 dev_net_set(dev, net);
274
275 dev->rtnl_link_ops = ops;
276
277 tunnel = netdev_priv(dev);
278 tunnel->parms = *parms;
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +0200279 tunnel->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000280
281 err = register_netdevice(dev);
282 if (err)
283 goto failed_free;
284
285 return dev;
286
287failed_free:
288 free_netdev(dev);
289failed:
290 return ERR_PTR(err);
291}
292
Pravin B Shelarc5441932013-03-25 14:49:35 +0000293static int ip_tunnel_bind_dev(struct net_device *dev)
294{
295 struct net_device *tdev = NULL;
296 struct ip_tunnel *tunnel = netdev_priv(dev);
297 const struct iphdr *iph;
298 int hlen = LL_MAX_HEADER;
299 int mtu = ETH_DATA_LEN;
300 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
301
302 iph = &tunnel->parms.iph;
303
304 /* Guess output device to choose reasonable mtu and needed_headroom */
305 if (iph->daddr) {
306 struct flowi4 fl4;
307 struct rtable *rt;
308
Petr Machatab0066da2018-02-27 14:53:38 +0100309 ip_tunnel_init_flow(&fl4, iph->protocol, iph->daddr,
310 iph->saddr, tunnel->parms.o_key,
311 RT_TOS(iph->tos), tunnel->parms.link,
312 tunnel->fwmark);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800313 rt = ip_route_output_key(tunnel->net, &fl4);
314
Pravin B Shelarc5441932013-03-25 14:49:35 +0000315 if (!IS_ERR(rt)) {
316 tdev = rt->dst.dev;
317 ip_rt_put(rt);
318 }
319 if (dev->type != ARPHRD_ETHER)
320 dev->flags |= IFF_POINTOPOINT;
Paolo Abenif27337e2016-04-28 11:04:51 +0200321
322 dst_cache_reset(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000323 }
324
325 if (!tdev && tunnel->parms.link)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200326 tdev = __dev_get_by_index(tunnel->net, tunnel->parms.link);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000327
328 if (tdev) {
329 hlen = tdev->hard_header_len + tdev->needed_headroom;
330 mtu = tdev->mtu;
331 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000332
333 dev->needed_headroom = t_hlen + hlen;
334 mtu -= (dev->hard_header_len + t_hlen);
335
Eric Dumazetb5476022017-12-11 07:17:39 -0800336 if (mtu < IPV4_MIN_MTU)
337 mtu = IPV4_MIN_MTU;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000338
339 return mtu;
340}
341
342static struct ip_tunnel *ip_tunnel_create(struct net *net,
343 struct ip_tunnel_net *itn,
344 struct ip_tunnel_parm *parms)
345{
Julia Lawall4929fd82014-05-15 05:43:20 +0200346 struct ip_tunnel *nt;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000347 struct net_device *dev;
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400348 int t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000349
350 BUG_ON(!itn->fb_tunnel_dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000351 dev = __ip_tunnel_create(net, itn->fb_tunnel_dev->rtnl_link_ops, parms);
352 if (IS_ERR(dev))
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100353 return ERR_CAST(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000354
355 dev->mtu = ip_tunnel_bind_dev(dev);
356
357 nt = netdev_priv(dev);
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400358 t_hlen = nt->hlen + sizeof(struct iphdr);
359 dev->min_mtu = ETH_MIN_MTU;
360 dev->max_mtu = 0xFFF8 - dev->hard_header_len - t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000361 ip_tunnel_add(itn, nt);
362 return nt;
363}
364
365int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700366 const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
367 bool log_ecn_error)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000368{
Li RongQing8f849852014-01-04 13:57:59 +0800369 struct pcpu_sw_netstats *tstats;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000370 const struct iphdr *iph = ip_hdr(skb);
371 int err;
372
Pravin B Shelarc5441932013-03-25 14:49:35 +0000373#ifdef CONFIG_NET_IPGRE_BROADCAST
374 if (ipv4_is_multicast(iph->daddr)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000375 tunnel->dev->stats.multicast++;
376 skb->pkt_type = PACKET_BROADCAST;
377 }
378#endif
379
380 if ((!(tpi->flags&TUNNEL_CSUM) && (tunnel->parms.i_flags&TUNNEL_CSUM)) ||
381 ((tpi->flags&TUNNEL_CSUM) && !(tunnel->parms.i_flags&TUNNEL_CSUM))) {
382 tunnel->dev->stats.rx_crc_errors++;
383 tunnel->dev->stats.rx_errors++;
384 goto drop;
385 }
386
387 if (tunnel->parms.i_flags&TUNNEL_SEQ) {
388 if (!(tpi->flags&TUNNEL_SEQ) ||
389 (tunnel->i_seqno && (s32)(ntohl(tpi->seq) - tunnel->i_seqno) < 0)) {
390 tunnel->dev->stats.rx_fifo_errors++;
391 tunnel->dev->stats.rx_errors++;
392 goto drop;
393 }
394 tunnel->i_seqno = ntohl(tpi->seq) + 1;
395 }
396
Ying Caie96f2e72014-05-04 15:20:04 -0700397 skb_reset_network_header(skb);
398
Pravin B Shelarc5441932013-03-25 14:49:35 +0000399 err = IP_ECN_decapsulate(iph, skb);
400 if (unlikely(err)) {
401 if (log_ecn_error)
402 net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
403 &iph->saddr, iph->tos);
404 if (err > 1) {
405 ++tunnel->dev->stats.rx_frame_errors;
406 ++tunnel->dev->stats.rx_errors;
407 goto drop;
408 }
409 }
410
411 tstats = this_cpu_ptr(tunnel->dev->tstats);
412 u64_stats_update_begin(&tstats->syncp);
413 tstats->rx_packets++;
414 tstats->rx_bytes += skb->len;
415 u64_stats_update_end(&tstats->syncp);
416
Alexei Starovoitov81b9eab2013-11-12 14:39:13 -0800417 skb_scrub_packet(skb, !net_eq(tunnel->net, dev_net(tunnel->dev)));
418
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700419 if (tunnel->dev->type == ARPHRD_ETHER) {
420 skb->protocol = eth_type_trans(skb, tunnel->dev);
421 skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
422 } else {
423 skb->dev = tunnel->dev;
424 }
Nicolas Dichtel64261f22013-08-13 17:51:09 +0200425
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700426 if (tun_dst)
427 skb_dst_set(skb, (struct dst_entry *)tun_dst);
428
Pravin B Shelarc5441932013-03-25 14:49:35 +0000429 gro_cells_receive(&tunnel->gro_cells, skb);
430 return 0;
431
432drop:
Haishuang Yan469f87e2017-06-15 10:29:29 +0800433 if (tun_dst)
434 dst_release((struct dst_entry *)tun_dst);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000435 kfree_skb(skb);
436 return 0;
437}
438EXPORT_SYMBOL_GPL(ip_tunnel_rcv);
439
Tom Herberta8c5f902014-11-12 11:54:09 -0800440int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *ops,
441 unsigned int num)
442{
Thomas Grafbb1553c2014-12-16 21:05:20 +0100443 if (num >= MAX_IPTUN_ENCAP_OPS)
444 return -ERANGE;
445
Tom Herberta8c5f902014-11-12 11:54:09 -0800446 return !cmpxchg((const struct ip_tunnel_encap_ops **)
447 &iptun_encaps[num],
448 NULL, ops) ? 0 : -1;
449}
450EXPORT_SYMBOL(ip_tunnel_encap_add_ops);
451
452int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *ops,
453 unsigned int num)
454{
455 int ret;
456
Thomas Grafbb1553c2014-12-16 21:05:20 +0100457 if (num >= MAX_IPTUN_ENCAP_OPS)
458 return -ERANGE;
459
Tom Herberta8c5f902014-11-12 11:54:09 -0800460 ret = (cmpxchg((const struct ip_tunnel_encap_ops **)
461 &iptun_encaps[num],
462 ops, NULL) == ops) ? 0 : -1;
463
464 synchronize_net();
465
466 return ret;
467}
468EXPORT_SYMBOL(ip_tunnel_encap_del_ops);
469
Tom Herbert56328482014-09-17 12:25:58 -0700470int ip_tunnel_encap_setup(struct ip_tunnel *t,
471 struct ip_tunnel_encap *ipencap)
472{
473 int hlen;
474
475 memset(&t->encap, 0, sizeof(t->encap));
476
477 hlen = ip_encap_hlen(ipencap);
478 if (hlen < 0)
479 return hlen;
480
481 t->encap.type = ipencap->type;
482 t->encap.sport = ipencap->sport;
483 t->encap.dport = ipencap->dport;
484 t->encap.flags = ipencap->flags;
485
486 t->encap_hlen = hlen;
487 t->hlen = t->encap_hlen + t->tun_hlen;
488
489 return 0;
490}
491EXPORT_SYMBOL_GPL(ip_tunnel_encap_setup);
492
Pravin B Shelar23a36472013-07-02 10:57:33 -0700493static int tnl_update_pmtu(struct net_device *dev, struct sk_buff *skb,
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300494 struct rtable *rt, __be16 df,
495 const struct iphdr *inner_iph)
Pravin B Shelar23a36472013-07-02 10:57:33 -0700496{
497 struct ip_tunnel *tunnel = netdev_priv(dev);
Alexander Duyck8c91e162013-07-11 13:12:22 -0700498 int pkt_size = skb->len - tunnel->hlen - dev->hard_header_len;
Pravin B Shelar23a36472013-07-02 10:57:33 -0700499 int mtu;
500
501 if (df)
502 mtu = dst_mtu(&rt->dst) - dev->hard_header_len
503 - sizeof(struct iphdr) - tunnel->hlen;
504 else
505 mtu = skb_dst(skb) ? dst_mtu(skb_dst(skb)) : dev->mtu;
506
Nicolas Dichtelf15ca722018-01-25 19:03:03 +0100507 skb_dst_update_pmtu(skb, mtu);
Pravin B Shelar23a36472013-07-02 10:57:33 -0700508
509 if (skb->protocol == htons(ETH_P_IP)) {
510 if (!skb_is_gso(skb) &&
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300511 (inner_iph->frag_off & htons(IP_DF)) &&
512 mtu < pkt_size) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700513 memset(IPCB(skb), 0, sizeof(*IPCB(skb)));
514 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED, htonl(mtu));
515 return -E2BIG;
516 }
517 }
518#if IS_ENABLED(CONFIG_IPV6)
519 else if (skb->protocol == htons(ETH_P_IPV6)) {
520 struct rt6_info *rt6 = (struct rt6_info *)skb_dst(skb);
521
522 if (rt6 && mtu < dst_mtu(skb_dst(skb)) &&
523 mtu >= IPV6_MIN_MTU) {
524 if ((tunnel->parms.iph.daddr &&
525 !ipv4_is_multicast(tunnel->parms.iph.daddr)) ||
526 rt6->rt6i_dst.plen == 128) {
527 rt6->rt6i_flags |= RTF_MODIFIED;
528 dst_metric_set(skb_dst(skb), RTAX_MTU, mtu);
529 }
530 }
531
532 if (!skb_is_gso(skb) && mtu >= IPV6_MIN_MTU &&
533 mtu < pkt_size) {
534 icmpv6_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu);
535 return -E2BIG;
536 }
537 }
538#endif
539 return 0;
540}
541
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700542void ip_md_tunnel_xmit(struct sk_buff *skb, struct net_device *dev, u8 proto)
543{
544 struct ip_tunnel *tunnel = netdev_priv(dev);
545 u32 headroom = sizeof(struct iphdr);
546 struct ip_tunnel_info *tun_info;
547 const struct ip_tunnel_key *key;
548 const struct iphdr *inner_iph;
549 struct rtable *rt;
550 struct flowi4 fl4;
551 __be16 df = 0;
552 u8 tos, ttl;
553
554 tun_info = skb_tunnel_info(skb);
555 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
556 ip_tunnel_info_af(tun_info) != AF_INET))
557 goto tx_error;
558 key = &tun_info->key;
559 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
560 inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
561 tos = key->tos;
562 if (tos == 1) {
563 if (skb->protocol == htons(ETH_P_IP))
564 tos = inner_iph->tos;
565 else if (skb->protocol == htons(ETH_P_IPV6))
566 tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
567 }
Petr Machatab0066da2018-02-27 14:53:38 +0100568 ip_tunnel_init_flow(&fl4, proto, key->u.ipv4.dst, key->u.ipv4.src, 0,
569 RT_TOS(tos), tunnel->parms.link, tunnel->fwmark);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700570 if (tunnel->encap.type != TUNNEL_ENCAP_NONE)
571 goto tx_error;
572 rt = ip_route_output_key(tunnel->net, &fl4);
573 if (IS_ERR(rt)) {
574 dev->stats.tx_carrier_errors++;
575 goto tx_error;
576 }
577 if (rt->dst.dev == dev) {
578 ip_rt_put(rt);
579 dev->stats.collisions++;
580 goto tx_error;
581 }
582 tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
583 ttl = key->ttl;
584 if (ttl == 0) {
585 if (skb->protocol == htons(ETH_P_IP))
586 ttl = inner_iph->ttl;
587 else if (skb->protocol == htons(ETH_P_IPV6))
588 ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
589 else
590 ttl = ip4_dst_hoplimit(&rt->dst);
591 }
592 if (key->tun_flags & TUNNEL_DONT_FRAGMENT)
593 df = htons(IP_DF);
594 else if (skb->protocol == htons(ETH_P_IP))
595 df = inner_iph->frag_off & htons(IP_DF);
596 headroom += LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len;
597 if (headroom > dev->needed_headroom)
598 dev->needed_headroom = headroom;
599
600 if (skb_cow_head(skb, dev->needed_headroom)) {
601 ip_rt_put(rt);
602 goto tx_dropped;
603 }
Haishuang Yan0f693f12017-09-07 14:08:34 +0800604 iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, proto, tos, ttl,
605 df, !net_eq(tunnel->net, dev_net(dev)));
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700606 return;
607tx_error:
608 dev->stats.tx_errors++;
609 goto kfree;
610tx_dropped:
611 dev->stats.tx_dropped++;
612kfree:
613 kfree_skb(skb);
614}
615EXPORT_SYMBOL_GPL(ip_md_tunnel_xmit);
616
Pravin B Shelarc5441932013-03-25 14:49:35 +0000617void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
Tom Herbert56328482014-09-17 12:25:58 -0700618 const struct iphdr *tnl_params, u8 protocol)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000619{
620 struct ip_tunnel *tunnel = netdev_priv(dev);
621 const struct iphdr *inner_iph;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000622 struct flowi4 fl4;
623 u8 tos, ttl;
624 __be16 df;
Eric Dumazetb045d372014-02-03 12:52:14 -0800625 struct rtable *rt; /* Route to the other host */
Pravin B Shelarc5441932013-03-25 14:49:35 +0000626 unsigned int max_headroom; /* The extra header space needed */
627 __be32 dst;
Timo Teräs22fb22e2014-05-16 08:34:39 +0300628 bool connected;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000629
630 inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
Timo Teräs22fb22e2014-05-16 08:34:39 +0300631 connected = (tunnel->parms.iph.daddr != 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000632
Bernie Harris5146d1f2016-02-22 12:58:05 +1300633 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
634
Pravin B Shelarc5441932013-03-25 14:49:35 +0000635 dst = tnl_params->daddr;
636 if (dst == 0) {
637 /* NBMA tunnel */
638
Ian Morris51456b22015-04-03 09:17:26 +0100639 if (!skb_dst(skb)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000640 dev->stats.tx_fifo_errors++;
641 goto tx_error;
642 }
643
644 if (skb->protocol == htons(ETH_P_IP)) {
645 rt = skb_rtable(skb);
646 dst = rt_nexthop(rt, inner_iph->daddr);
647 }
648#if IS_ENABLED(CONFIG_IPV6)
649 else if (skb->protocol == htons(ETH_P_IPV6)) {
650 const struct in6_addr *addr6;
651 struct neighbour *neigh;
652 bool do_tx_error_icmp;
653 int addr_type;
654
655 neigh = dst_neigh_lookup(skb_dst(skb),
656 &ipv6_hdr(skb)->daddr);
Ian Morris51456b22015-04-03 09:17:26 +0100657 if (!neigh)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000658 goto tx_error;
659
660 addr6 = (const struct in6_addr *)&neigh->primary_key;
661 addr_type = ipv6_addr_type(addr6);
662
663 if (addr_type == IPV6_ADDR_ANY) {
664 addr6 = &ipv6_hdr(skb)->daddr;
665 addr_type = ipv6_addr_type(addr6);
666 }
667
668 if ((addr_type & IPV6_ADDR_COMPATv4) == 0)
669 do_tx_error_icmp = true;
670 else {
671 do_tx_error_icmp = false;
672 dst = addr6->s6_addr32[3];
673 }
674 neigh_release(neigh);
675 if (do_tx_error_icmp)
676 goto tx_error_icmp;
677 }
678#endif
679 else
680 goto tx_error;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800681
682 connected = false;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000683 }
684
685 tos = tnl_params->tos;
686 if (tos & 0x1) {
687 tos &= ~0x1;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800688 if (skb->protocol == htons(ETH_P_IP)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000689 tos = inner_iph->tos;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800690 connected = false;
691 } else if (skb->protocol == htons(ETH_P_IPV6)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000692 tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800693 connected = false;
694 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000695 }
696
Thomas Winter5c38bd12018-01-23 16:46:24 +1300697 if (tunnel->fwmark) {
Petr Machatab0066da2018-02-27 14:53:38 +0100698 ip_tunnel_init_flow(&fl4, protocol, dst, tnl_params->saddr,
699 tunnel->parms.o_key, RT_TOS(tos),
700 tunnel->parms.link, tunnel->fwmark);
Thomas Winter5c38bd12018-01-23 16:46:24 +1300701 }
702 else {
Petr Machatab0066da2018-02-27 14:53:38 +0100703 ip_tunnel_init_flow(&fl4, protocol, dst, tnl_params->saddr,
704 tunnel->parms.o_key, RT_TOS(tos),
705 tunnel->parms.link, skb->mark);
Thomas Winter5c38bd12018-01-23 16:46:24 +1300706 }
Tom Herbert7d442fa2014-01-02 11:48:26 -0800707
Tom Herbert56328482014-09-17 12:25:58 -0700708 if (ip_tunnel_encap(skb, tunnel, &protocol, &fl4) < 0)
709 goto tx_error;
710
Paolo Abenie09acdd2016-02-12 15:43:55 +0100711 rt = connected ? dst_cache_get_ip4(&tunnel->dst_cache, &fl4.saddr) :
712 NULL;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800713
714 if (!rt) {
715 rt = ip_route_output_key(tunnel->net, &fl4);
716
717 if (IS_ERR(rt)) {
718 dev->stats.tx_carrier_errors++;
719 goto tx_error;
720 }
721 if (connected)
Paolo Abenie09acdd2016-02-12 15:43:55 +0100722 dst_cache_set_ip4(&tunnel->dst_cache, &rt->dst,
723 fl4.saddr);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000724 }
Tom Herbert7d442fa2014-01-02 11:48:26 -0800725
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700726 if (rt->dst.dev == dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000727 ip_rt_put(rt);
728 dev->stats.collisions++;
729 goto tx_error;
730 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000731
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300732 if (tnl_update_pmtu(dev, skb, rt, tnl_params->frag_off, inner_iph)) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700733 ip_rt_put(rt);
734 goto tx_error;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000735 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000736
737 if (tunnel->err_count > 0) {
738 if (time_before(jiffies,
739 tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
740 tunnel->err_count--;
741
742 dst_link_failure(skb);
743 } else
744 tunnel->err_count = 0;
745 }
746
Pravin B Shelard4a71b12013-09-25 09:57:47 -0700747 tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000748 ttl = tnl_params->ttl;
749 if (ttl == 0) {
750 if (skb->protocol == htons(ETH_P_IP))
751 ttl = inner_iph->ttl;
752#if IS_ENABLED(CONFIG_IPV6)
753 else if (skb->protocol == htons(ETH_P_IPV6))
754 ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
755#endif
756 else
757 ttl = ip4_dst_hoplimit(&rt->dst);
758 }
759
Pravin B Shelar23a36472013-07-02 10:57:33 -0700760 df = tnl_params->frag_off;
Philip Prindeville22a59be2016-06-14 15:53:02 -0600761 if (skb->protocol == htons(ETH_P_IP) && !tunnel->ignore_df)
Pravin B Shelar23a36472013-07-02 10:57:33 -0700762 df |= (inner_iph->frag_off&htons(IP_DF));
763
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700764 max_headroom = LL_RESERVED_SPACE(rt->dst.dev) + sizeof(struct iphdr)
Tom Herbert7371e022014-10-03 15:48:07 -0700765 + rt->dst.header_len + ip_encap_hlen(&tunnel->encap);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200766 if (max_headroom > dev->needed_headroom)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000767 dev->needed_headroom = max_headroom;
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200768
769 if (skb_cow_head(skb, dev->needed_headroom)) {
Dmitry Popov586d5fc2014-06-06 04:34:37 +0400770 ip_rt_put(rt);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200771 dev->stats.tx_dropped++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800772 kfree_skb(skb);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200773 return;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000774 }
775
Pravin B Shelar039f5062015-12-24 14:34:54 -0800776 iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, protocol, tos, ttl,
777 df, !net_eq(tunnel->net, dev_net(dev)));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000778 return;
779
780#if IS_ENABLED(CONFIG_IPV6)
781tx_error_icmp:
782 dst_link_failure(skb);
783#endif
784tx_error:
785 dev->stats.tx_errors++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800786 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000787}
788EXPORT_SYMBOL_GPL(ip_tunnel_xmit);
789
790static void ip_tunnel_update(struct ip_tunnel_net *itn,
791 struct ip_tunnel *t,
792 struct net_device *dev,
793 struct ip_tunnel_parm *p,
Craig Gallek9830ad42017-04-19 12:30:54 -0400794 bool set_mtu,
795 __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000796{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700797 ip_tunnel_del(itn, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000798 t->parms.iph.saddr = p->iph.saddr;
799 t->parms.iph.daddr = p->iph.daddr;
800 t->parms.i_key = p->i_key;
801 t->parms.o_key = p->o_key;
802 if (dev->type != ARPHRD_ETHER) {
803 memcpy(dev->dev_addr, &p->iph.saddr, 4);
804 memcpy(dev->broadcast, &p->iph.daddr, 4);
805 }
806 ip_tunnel_add(itn, t);
807
808 t->parms.iph.ttl = p->iph.ttl;
809 t->parms.iph.tos = p->iph.tos;
810 t->parms.iph.frag_off = p->iph.frag_off;
811
Craig Gallek9830ad42017-04-19 12:30:54 -0400812 if (t->parms.link != p->link || t->fwmark != fwmark) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000813 int mtu;
814
815 t->parms.link = p->link;
Craig Gallek9830ad42017-04-19 12:30:54 -0400816 t->fwmark = fwmark;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000817 mtu = ip_tunnel_bind_dev(dev);
818 if (set_mtu)
819 dev->mtu = mtu;
820 }
Paolo Abenie09acdd2016-02-12 15:43:55 +0100821 dst_cache_reset(&t->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000822 netdev_state_change(dev);
823}
824
825int ip_tunnel_ioctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd)
826{
827 int err = 0;
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200828 struct ip_tunnel *t = netdev_priv(dev);
829 struct net *net = t->net;
830 struct ip_tunnel_net *itn = net_generic(net, t->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000831
832 BUG_ON(!itn->fb_tunnel_dev);
833 switch (cmd) {
834 case SIOCGETTUNNEL:
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200835 if (dev == itn->fb_tunnel_dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000836 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100837 if (!t)
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200838 t = netdev_priv(dev);
839 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000840 memcpy(p, &t->parms, sizeof(*p));
841 break;
842
843 case SIOCADDTUNNEL:
844 case SIOCCHGTUNNEL:
845 err = -EPERM;
846 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
847 goto done;
848 if (p->iph.ttl)
849 p->iph.frag_off |= htons(IP_DF);
Dmitry Popov7c8e6b92014-06-08 02:06:25 +0400850 if (!(p->i_flags & VTI_ISVTI)) {
851 if (!(p->i_flags & TUNNEL_KEY))
852 p->i_key = 0;
853 if (!(p->o_flags & TUNNEL_KEY))
854 p->o_key = 0;
855 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000856
857 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
858
Steffen Klassertd61746b2014-09-22 09:11:08 +0200859 if (cmd == SIOCADDTUNNEL) {
860 if (!t) {
861 t = ip_tunnel_create(net, itn, p);
862 err = PTR_ERR_OR_ZERO(t);
863 break;
864 }
865
866 err = -EEXIST;
Duan Jiongee30ef4d2014-05-15 13:07:02 +0800867 break;
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100868 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000869 if (dev != itn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
Ian Morris00db4122015-04-03 09:17:27 +0100870 if (t) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000871 if (t->dev != dev) {
872 err = -EEXIST;
873 break;
874 }
875 } else {
876 unsigned int nflags = 0;
877
878 if (ipv4_is_multicast(p->iph.daddr))
879 nflags = IFF_BROADCAST;
880 else if (p->iph.daddr)
881 nflags = IFF_POINTOPOINT;
882
883 if ((dev->flags^nflags)&(IFF_POINTOPOINT|IFF_BROADCAST)) {
884 err = -EINVAL;
885 break;
886 }
887
888 t = netdev_priv(dev);
889 }
890 }
891
892 if (t) {
893 err = 0;
Craig Gallek9830ad42017-04-19 12:30:54 -0400894 ip_tunnel_update(itn, t, dev, p, true, 0);
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100895 } else {
896 err = -ENOENT;
897 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000898 break;
899
900 case SIOCDELTUNNEL:
901 err = -EPERM;
902 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
903 goto done;
904
905 if (dev == itn->fb_tunnel_dev) {
906 err = -ENOENT;
907 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100908 if (!t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000909 goto done;
910 err = -EPERM;
911 if (t == netdev_priv(itn->fb_tunnel_dev))
912 goto done;
913 dev = t->dev;
914 }
915 unregister_netdevice(dev);
916 err = 0;
917 break;
918
919 default:
920 err = -EINVAL;
921 }
922
923done:
924 return err;
925}
926EXPORT_SYMBOL_GPL(ip_tunnel_ioctl);
927
David Wragg7e059152016-02-10 00:05:58 +0000928int __ip_tunnel_change_mtu(struct net_device *dev, int new_mtu, bool strict)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000929{
930 struct ip_tunnel *tunnel = netdev_priv(dev);
931 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
David Wragg7e059152016-02-10 00:05:58 +0000932 int max_mtu = 0xFFF8 - dev->hard_header_len - t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000933
Jarod Wilsonb96f9af2016-10-20 13:55:24 -0400934 if (new_mtu < ETH_MIN_MTU)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000935 return -EINVAL;
David Wragg7e059152016-02-10 00:05:58 +0000936
937 if (new_mtu > max_mtu) {
938 if (strict)
939 return -EINVAL;
940
941 new_mtu = max_mtu;
942 }
943
Pravin B Shelarc5441932013-03-25 14:49:35 +0000944 dev->mtu = new_mtu;
945 return 0;
946}
David Wragg7e059152016-02-10 00:05:58 +0000947EXPORT_SYMBOL_GPL(__ip_tunnel_change_mtu);
948
949int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
950{
951 return __ip_tunnel_change_mtu(dev, new_mtu, true);
952}
Pravin B Shelarc5441932013-03-25 14:49:35 +0000953EXPORT_SYMBOL_GPL(ip_tunnel_change_mtu);
954
955static void ip_tunnel_dev_free(struct net_device *dev)
956{
957 struct ip_tunnel *tunnel = netdev_priv(dev);
958
959 gro_cells_destroy(&tunnel->gro_cells);
Paolo Abenie09acdd2016-02-12 15:43:55 +0100960 dst_cache_destroy(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000961 free_percpu(dev->tstats);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000962}
963
964void ip_tunnel_dellink(struct net_device *dev, struct list_head *head)
965{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000966 struct ip_tunnel *tunnel = netdev_priv(dev);
967 struct ip_tunnel_net *itn;
968
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200969 itn = net_generic(tunnel->net, tunnel->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000970
971 if (itn->fb_tunnel_dev != dev) {
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700972 ip_tunnel_del(itn, netdev_priv(dev));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000973 unregister_netdevice_queue(dev, head);
974 }
975}
976EXPORT_SYMBOL_GPL(ip_tunnel_dellink);
977
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +0100978struct net *ip_tunnel_get_link_net(const struct net_device *dev)
979{
980 struct ip_tunnel *tunnel = netdev_priv(dev);
981
982 return tunnel->net;
983}
984EXPORT_SYMBOL(ip_tunnel_get_link_net);
985
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200986int ip_tunnel_get_iflink(const struct net_device *dev)
987{
988 struct ip_tunnel *tunnel = netdev_priv(dev);
989
990 return tunnel->parms.link;
991}
992EXPORT_SYMBOL(ip_tunnel_get_iflink);
993
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +0300994int ip_tunnel_init_net(struct net *net, unsigned int ip_tnl_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000995 struct rtnl_link_ops *ops, char *devname)
996{
997 struct ip_tunnel_net *itn = net_generic(net, ip_tnl_net_id);
998 struct ip_tunnel_parm parms;
stephen hemminger6261d982013-08-05 22:51:37 -0700999 unsigned int i;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001000
stephen hemminger6261d982013-08-05 22:51:37 -07001001 for (i = 0; i < IP_TNL_HASH_SIZE; i++)
1002 INIT_HLIST_HEAD(&itn->tunnels[i]);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001003
1004 if (!ops) {
1005 itn->fb_tunnel_dev = NULL;
1006 return 0;
1007 }
stephen hemminger6261d982013-08-05 22:51:37 -07001008
Pravin B Shelarc5441932013-03-25 14:49:35 +00001009 memset(&parms, 0, sizeof(parms));
1010 if (devname)
1011 strlcpy(parms.name, devname, IFNAMSIZ);
1012
1013 rtnl_lock();
1014 itn->fb_tunnel_dev = __ip_tunnel_create(net, ops, &parms);
Dan Carpenterea857f22013-08-19 10:05:10 +03001015 /* FB netdevice is special: we have one, and only one per netns.
1016 * Allowing to move it to another netns is clearly unsafe.
1017 */
Steffen Klassert67013282013-10-01 11:34:48 +02001018 if (!IS_ERR(itn->fb_tunnel_dev)) {
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001019 itn->fb_tunnel_dev->features |= NETIF_F_NETNS_LOCAL;
Steffen Klassert78ff4be2014-05-19 11:36:56 +02001020 itn->fb_tunnel_dev->mtu = ip_tunnel_bind_dev(itn->fb_tunnel_dev);
Steffen Klassert67013282013-10-01 11:34:48 +02001021 ip_tunnel_add(itn, netdev_priv(itn->fb_tunnel_dev));
1022 }
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001023 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001024
Sachin Kamat27d79f32014-01-27 12:13:57 +05301025 return PTR_ERR_OR_ZERO(itn->fb_tunnel_dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001026}
1027EXPORT_SYMBOL_GPL(ip_tunnel_init_net);
1028
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001029static void ip_tunnel_destroy(struct ip_tunnel_net *itn, struct list_head *head,
1030 struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001031{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001032 struct net *net = dev_net(itn->fb_tunnel_dev);
1033 struct net_device *dev, *aux;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001034 int h;
1035
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001036 for_each_netdev_safe(net, dev, aux)
1037 if (dev->rtnl_link_ops == ops)
1038 unregister_netdevice_queue(dev, head);
1039
Pravin B Shelarc5441932013-03-25 14:49:35 +00001040 for (h = 0; h < IP_TNL_HASH_SIZE; h++) {
1041 struct ip_tunnel *t;
1042 struct hlist_node *n;
1043 struct hlist_head *thead = &itn->tunnels[h];
1044
1045 hlist_for_each_entry_safe(t, n, thead, hash_node)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001046 /* If dev is in the same netns, it has already
1047 * been added to the list by the previous loop.
1048 */
1049 if (!net_eq(dev_net(t->dev), net))
1050 unregister_netdevice_queue(t->dev, head);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001051 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001052}
1053
Eric Dumazet64bc1782017-09-19 16:27:09 -07001054void ip_tunnel_delete_nets(struct list_head *net_list, unsigned int id,
1055 struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001056{
Eric Dumazet64bc1782017-09-19 16:27:09 -07001057 struct ip_tunnel_net *itn;
1058 struct net *net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001059 LIST_HEAD(list);
1060
1061 rtnl_lock();
Eric Dumazet64bc1782017-09-19 16:27:09 -07001062 list_for_each_entry(net, net_list, exit_list) {
1063 itn = net_generic(net, id);
1064 ip_tunnel_destroy(itn, &list, ops);
1065 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001066 unregister_netdevice_many(&list);
1067 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001068}
Eric Dumazet64bc1782017-09-19 16:27:09 -07001069EXPORT_SYMBOL_GPL(ip_tunnel_delete_nets);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001070
1071int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
Craig Gallek9830ad42017-04-19 12:30:54 -04001072 struct ip_tunnel_parm *p, __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001073{
1074 struct ip_tunnel *nt;
1075 struct net *net = dev_net(dev);
1076 struct ip_tunnel_net *itn;
1077 int mtu;
1078 int err;
1079
1080 nt = netdev_priv(dev);
1081 itn = net_generic(net, nt->ip_tnl_net_id);
1082
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001083 if (nt->collect_md) {
1084 if (rtnl_dereference(itn->collect_md_tun))
1085 return -EEXIST;
1086 } else {
1087 if (ip_tunnel_find(itn, p, dev->type))
1088 return -EEXIST;
1089 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001090
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +02001091 nt->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001092 nt->parms = *p;
Craig Gallek9830ad42017-04-19 12:30:54 -04001093 nt->fwmark = fwmark;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001094 err = register_netdevice(dev);
1095 if (err)
1096 goto out;
1097
1098 if (dev->type == ARPHRD_ETHER && !tb[IFLA_ADDRESS])
1099 eth_hw_addr_random(dev);
1100
1101 mtu = ip_tunnel_bind_dev(dev);
1102 if (!tb[IFLA_MTU])
1103 dev->mtu = mtu;
1104
1105 ip_tunnel_add(itn, nt);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001106out:
1107 return err;
1108}
1109EXPORT_SYMBOL_GPL(ip_tunnel_newlink);
1110
1111int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
Craig Gallek9830ad42017-04-19 12:30:54 -04001112 struct ip_tunnel_parm *p, __u32 fwmark)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001113{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001114 struct ip_tunnel *t;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001115 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001116 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001117 struct ip_tunnel_net *itn = net_generic(net, tunnel->ip_tnl_net_id);
1118
1119 if (dev == itn->fb_tunnel_dev)
1120 return -EINVAL;
1121
Pravin B Shelarc5441932013-03-25 14:49:35 +00001122 t = ip_tunnel_find(itn, p, dev->type);
1123
1124 if (t) {
1125 if (t->dev != dev)
1126 return -EEXIST;
1127 } else {
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001128 t = tunnel;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001129
1130 if (dev->type != ARPHRD_ETHER) {
1131 unsigned int nflags = 0;
1132
1133 if (ipv4_is_multicast(p->iph.daddr))
1134 nflags = IFF_BROADCAST;
1135 else if (p->iph.daddr)
1136 nflags = IFF_POINTOPOINT;
1137
1138 if ((dev->flags ^ nflags) &
1139 (IFF_POINTOPOINT | IFF_BROADCAST))
1140 return -EINVAL;
1141 }
1142 }
1143
Craig Gallek9830ad42017-04-19 12:30:54 -04001144 ip_tunnel_update(itn, t, dev, p, !tb[IFLA_MTU], fwmark);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001145 return 0;
1146}
1147EXPORT_SYMBOL_GPL(ip_tunnel_changelink);
1148
1149int ip_tunnel_init(struct net_device *dev)
1150{
1151 struct ip_tunnel *tunnel = netdev_priv(dev);
1152 struct iphdr *iph = &tunnel->parms.iph;
WANG Cong1c213bd2014-02-13 11:46:28 -08001153 int err;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001154
David S. Millercf124db2017-05-08 12:52:56 -04001155 dev->needs_free_netdev = true;
1156 dev->priv_destructor = ip_tunnel_dev_free;
WANG Cong1c213bd2014-02-13 11:46:28 -08001157 dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001158 if (!dev->tstats)
1159 return -ENOMEM;
1160
Paolo Abenie09acdd2016-02-12 15:43:55 +01001161 err = dst_cache_init(&tunnel->dst_cache, GFP_KERNEL);
1162 if (err) {
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001163 free_percpu(dev->tstats);
Paolo Abenie09acdd2016-02-12 15:43:55 +01001164 return err;
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001165 }
1166
Pravin B Shelarc5441932013-03-25 14:49:35 +00001167 err = gro_cells_init(&tunnel->gro_cells, dev);
1168 if (err) {
Paolo Abenie09acdd2016-02-12 15:43:55 +01001169 dst_cache_destroy(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001170 free_percpu(dev->tstats);
1171 return err;
1172 }
1173
1174 tunnel->dev = dev;
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001175 tunnel->net = dev_net(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001176 strcpy(tunnel->parms.name, dev->name);
1177 iph->version = 4;
1178 iph->ihl = 5;
1179
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001180 if (tunnel->collect_md) {
1181 dev->features |= NETIF_F_NETNS_LOCAL;
1182 netif_keep_dst(dev);
1183 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001184 return 0;
1185}
1186EXPORT_SYMBOL_GPL(ip_tunnel_init);
1187
1188void ip_tunnel_uninit(struct net_device *dev)
1189{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001190 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001191 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001192 struct ip_tunnel_net *itn;
1193
1194 itn = net_generic(net, tunnel->ip_tnl_net_id);
1195 /* fb_tunnel_dev will be unregisted in net-exit call. */
1196 if (itn->fb_tunnel_dev != dev)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001197 ip_tunnel_del(itn, netdev_priv(dev));
Tom Herbert7d442fa2014-01-02 11:48:26 -08001198
Paolo Abenie09acdd2016-02-12 15:43:55 +01001199 dst_cache_reset(&tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001200}
1201EXPORT_SYMBOL_GPL(ip_tunnel_uninit);
1202
1203/* Do least required initialization, rest of init is done in tunnel_init call */
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +03001204void ip_tunnel_setup(struct net_device *dev, unsigned int net_id)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001205{
1206 struct ip_tunnel *tunnel = netdev_priv(dev);
1207 tunnel->ip_tnl_net_id = net_id;
1208}
1209EXPORT_SYMBOL_GPL(ip_tunnel_setup);
1210
1211MODULE_LICENSE("GPL");