blob: c7bd72e9b544848d10a490b010e0a30c4d5e4c21 [file] [log] [blame]
Pravin B Shelarc5441932013-03-25 14:49:35 +00001/*
2 * Copyright (c) 2013 Nicira, Inc.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of version 2 of the GNU General Public
6 * License as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
16 * 02110-1301, USA
17 */
18
19#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
20
21#include <linux/capability.h>
22#include <linux/module.h>
23#include <linux/types.h>
24#include <linux/kernel.h>
25#include <linux/slab.h>
26#include <linux/uaccess.h>
27#include <linux/skbuff.h>
28#include <linux/netdevice.h>
29#include <linux/in.h>
30#include <linux/tcp.h>
31#include <linux/udp.h>
32#include <linux/if_arp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000033#include <linux/init.h>
34#include <linux/in6.h>
35#include <linux/inetdevice.h>
36#include <linux/igmp.h>
37#include <linux/netfilter_ipv4.h>
38#include <linux/etherdevice.h>
39#include <linux/if_ether.h>
40#include <linux/if_vlan.h>
41#include <linux/rculist.h>
Sachin Kamat27d79f32014-01-27 12:13:57 +053042#include <linux/err.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000043
44#include <net/sock.h>
45#include <net/ip.h>
46#include <net/icmp.h>
47#include <net/protocol.h>
48#include <net/ip_tunnels.h>
49#include <net/arp.h>
50#include <net/checksum.h>
51#include <net/dsfield.h>
52#include <net/inet_ecn.h>
53#include <net/xfrm.h>
54#include <net/net_namespace.h>
55#include <net/netns/generic.h>
56#include <net/rtnetlink.h>
Tom Herbert56328482014-09-17 12:25:58 -070057#include <net/udp.h>
Tom Herbert63487ba2014-11-04 09:06:51 -080058
Pravin B Shelarc5441932013-03-25 14:49:35 +000059#if IS_ENABLED(CONFIG_IPV6)
60#include <net/ipv6.h>
61#include <net/ip6_fib.h>
62#include <net/ip6_route.h>
63#endif
64
Duan Jiong967680e2014-01-19 16:43:42 +080065static unsigned int ip_tunnel_hash(__be32 key, __be32 remote)
Pravin B Shelarc5441932013-03-25 14:49:35 +000066{
67 return hash_32((__force u32)key ^ (__force u32)remote,
68 IP_TNL_HASH_BITS);
69}
70
Eric Dumazet6c7e7612014-01-16 16:41:19 -080071static void __tunnel_dst_set(struct ip_tunnel_dst *idst,
Dmitry Popov95cb5742014-07-29 03:07:52 +040072 struct dst_entry *dst, __be32 saddr)
Tom Herbert7d442fa2014-01-02 11:48:26 -080073{
74 struct dst_entry *old_dst;
75
Eric Dumazetf8864972014-06-24 10:05:11 -070076 dst_clone(dst);
Eric Dumazet6c7e7612014-01-16 16:41:19 -080077 old_dst = xchg((__force struct dst_entry **)&idst->dst, dst);
Tom Herbert7d442fa2014-01-02 11:48:26 -080078 dst_release(old_dst);
Dmitry Popov95cb5742014-07-29 03:07:52 +040079 idst->saddr = saddr;
Tom Herbert7d442fa2014-01-02 11:48:26 -080080}
81
Eric Dumazeta35165c2014-09-22 10:38:16 -070082static noinline void tunnel_dst_set(struct ip_tunnel *t,
Dmitry Popov95cb5742014-07-29 03:07:52 +040083 struct dst_entry *dst, __be32 saddr)
Tom Herbert7d442fa2014-01-02 11:48:26 -080084{
Eric Dumazeta35165c2014-09-22 10:38:16 -070085 __tunnel_dst_set(raw_cpu_ptr(t->dst_cache), dst, saddr);
Tom Herbert7d442fa2014-01-02 11:48:26 -080086}
87
Eric Dumazet6c7e7612014-01-16 16:41:19 -080088static void tunnel_dst_reset(struct ip_tunnel *t)
Tom Herbert7d442fa2014-01-02 11:48:26 -080089{
Dmitry Popov95cb5742014-07-29 03:07:52 +040090 tunnel_dst_set(t, NULL, 0);
Tom Herbert7d442fa2014-01-02 11:48:26 -080091}
92
Nicolas Dichtelcf71d2bc2014-02-20 10:19:31 +010093void ip_tunnel_dst_reset_all(struct ip_tunnel *t)
Tom Herbert9a4aa9a2014-01-02 11:48:33 -080094{
95 int i;
96
97 for_each_possible_cpu(i)
Dmitry Popov95cb5742014-07-29 03:07:52 +040098 __tunnel_dst_set(per_cpu_ptr(t->dst_cache, i), NULL, 0);
Tom Herbert9a4aa9a2014-01-02 11:48:33 -080099}
Nicolas Dichtelcf71d2bc2014-02-20 10:19:31 +0100100EXPORT_SYMBOL(ip_tunnel_dst_reset_all);
Tom Herbert9a4aa9a2014-01-02 11:48:33 -0800101
Dmitry Popov95cb5742014-07-29 03:07:52 +0400102static struct rtable *tunnel_rtable_get(struct ip_tunnel *t,
103 u32 cookie, __be32 *saddr)
Tom Herbert7d442fa2014-01-02 11:48:26 -0800104{
Dmitry Popov95cb5742014-07-29 03:07:52 +0400105 struct ip_tunnel_dst *idst;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800106 struct dst_entry *dst;
107
108 rcu_read_lock();
Eric Dumazeta35165c2014-09-22 10:38:16 -0700109 idst = raw_cpu_ptr(t->dst_cache);
Dmitry Popov95cb5742014-07-29 03:07:52 +0400110 dst = rcu_dereference(idst->dst);
Eric Dumazetf8864972014-06-24 10:05:11 -0700111 if (dst && !atomic_inc_not_zero(&dst->__refcnt))
112 dst = NULL;
Eric Dumazetb045d372014-02-03 12:52:14 -0800113 if (dst) {
Dmitry Popov95cb5742014-07-29 03:07:52 +0400114 if (!dst->obsolete || dst->ops->check(dst, cookie)) {
115 *saddr = idst->saddr;
116 } else {
Eric Dumazetb045d372014-02-03 12:52:14 -0800117 tunnel_dst_reset(t);
Eric Dumazetf8864972014-06-24 10:05:11 -0700118 dst_release(dst);
119 dst = NULL;
Eric Dumazetb045d372014-02-03 12:52:14 -0800120 }
Tom Herbert7d442fa2014-01-02 11:48:26 -0800121 }
Eric Dumazetb045d372014-02-03 12:52:14 -0800122 rcu_read_unlock();
123 return (struct rtable *)dst;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800124}
125
Pravin B Shelarc5441932013-03-25 14:49:35 +0000126static bool ip_tunnel_key_match(const struct ip_tunnel_parm *p,
127 __be16 flags, __be32 key)
128{
129 if (p->i_flags & TUNNEL_KEY) {
130 if (flags & TUNNEL_KEY)
131 return key == p->i_key;
132 else
133 /* key expected, none present */
134 return false;
135 } else
136 return !(flags & TUNNEL_KEY);
137}
138
139/* Fallback tunnel: no source, no destination, no key, no options
140
141 Tunnel hash table:
142 We require exact key match i.e. if a key is present in packet
143 it will match only tunnel with the same key; if it is not present,
144 it will match only keyless tunnel.
145
146 All keysless packets, if not matched configured keyless tunnels
147 will match fallback tunnel.
148 Given src, dst and key, find appropriate for input tunnel.
149*/
150struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
151 int link, __be16 flags,
152 __be32 remote, __be32 local,
153 __be32 key)
154{
155 unsigned int hash;
156 struct ip_tunnel *t, *cand = NULL;
157 struct hlist_head *head;
158
Duan Jiong967680e2014-01-19 16:43:42 +0800159 hash = ip_tunnel_hash(key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000160 head = &itn->tunnels[hash];
161
162 hlist_for_each_entry_rcu(t, head, hash_node) {
163 if (local != t->parms.iph.saddr ||
164 remote != t->parms.iph.daddr ||
165 !(t->dev->flags & IFF_UP))
166 continue;
167
168 if (!ip_tunnel_key_match(&t->parms, flags, key))
169 continue;
170
171 if (t->parms.link == link)
172 return t;
173 else
174 cand = t;
175 }
176
177 hlist_for_each_entry_rcu(t, head, hash_node) {
178 if (remote != t->parms.iph.daddr ||
Dmitry Popove0056592014-07-05 02:26:37 +0400179 t->parms.iph.saddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000180 !(t->dev->flags & IFF_UP))
181 continue;
182
183 if (!ip_tunnel_key_match(&t->parms, flags, key))
184 continue;
185
186 if (t->parms.link == link)
187 return t;
188 else if (!cand)
189 cand = t;
190 }
191
Duan Jiong967680e2014-01-19 16:43:42 +0800192 hash = ip_tunnel_hash(key, 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000193 head = &itn->tunnels[hash];
194
195 hlist_for_each_entry_rcu(t, head, hash_node) {
Dmitry Popove0056592014-07-05 02:26:37 +0400196 if ((local != t->parms.iph.saddr || t->parms.iph.daddr != 0) &&
197 (local != t->parms.iph.daddr || !ipv4_is_multicast(local)))
198 continue;
199
200 if (!(t->dev->flags & IFF_UP))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000201 continue;
202
203 if (!ip_tunnel_key_match(&t->parms, flags, key))
204 continue;
205
206 if (t->parms.link == link)
207 return t;
208 else if (!cand)
209 cand = t;
210 }
211
212 if (flags & TUNNEL_NO_KEY)
213 goto skip_key_lookup;
214
215 hlist_for_each_entry_rcu(t, head, hash_node) {
216 if (t->parms.i_key != key ||
Dmitry Popove0056592014-07-05 02:26:37 +0400217 t->parms.iph.saddr != 0 ||
218 t->parms.iph.daddr != 0 ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000219 !(t->dev->flags & IFF_UP))
220 continue;
221
222 if (t->parms.link == link)
223 return t;
224 else if (!cand)
225 cand = t;
226 }
227
228skip_key_lookup:
229 if (cand)
230 return cand;
231
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700232 t = rcu_dereference(itn->collect_md_tun);
233 if (t)
234 return t;
235
Pravin B Shelarc5441932013-03-25 14:49:35 +0000236 if (itn->fb_tunnel_dev && itn->fb_tunnel_dev->flags & IFF_UP)
237 return netdev_priv(itn->fb_tunnel_dev);
238
Pravin B Shelarc5441932013-03-25 14:49:35 +0000239 return NULL;
240}
241EXPORT_SYMBOL_GPL(ip_tunnel_lookup);
242
243static struct hlist_head *ip_bucket(struct ip_tunnel_net *itn,
244 struct ip_tunnel_parm *parms)
245{
246 unsigned int h;
247 __be32 remote;
Steffen Klassert6d608f02014-02-21 08:41:09 +0100248 __be32 i_key = parms->i_key;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000249
250 if (parms->iph.daddr && !ipv4_is_multicast(parms->iph.daddr))
251 remote = parms->iph.daddr;
252 else
253 remote = 0;
254
Steffen Klassert6d608f02014-02-21 08:41:09 +0100255 if (!(parms->i_flags & TUNNEL_KEY) && (parms->i_flags & VTI_ISVTI))
256 i_key = 0;
257
258 h = ip_tunnel_hash(i_key, remote);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000259 return &itn->tunnels[h];
260}
261
262static void ip_tunnel_add(struct ip_tunnel_net *itn, struct ip_tunnel *t)
263{
264 struct hlist_head *head = ip_bucket(itn, &t->parms);
265
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700266 if (t->collect_md)
267 rcu_assign_pointer(itn->collect_md_tun, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000268 hlist_add_head_rcu(&t->hash_node, head);
269}
270
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700271static void ip_tunnel_del(struct ip_tunnel_net *itn, struct ip_tunnel *t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000272{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700273 if (t->collect_md)
274 rcu_assign_pointer(itn->collect_md_tun, NULL);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000275 hlist_del_init_rcu(&t->hash_node);
276}
277
278static struct ip_tunnel *ip_tunnel_find(struct ip_tunnel_net *itn,
279 struct ip_tunnel_parm *parms,
280 int type)
281{
282 __be32 remote = parms->iph.daddr;
283 __be32 local = parms->iph.saddr;
284 __be32 key = parms->i_key;
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400285 __be16 flags = parms->i_flags;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000286 int link = parms->link;
287 struct ip_tunnel *t = NULL;
288 struct hlist_head *head = ip_bucket(itn, parms);
289
290 hlist_for_each_entry_rcu(t, head, hash_node) {
291 if (local == t->parms.iph.saddr &&
292 remote == t->parms.iph.daddr &&
Pravin B Shelarc5441932013-03-25 14:49:35 +0000293 link == t->parms.link &&
Dmitry Popov5ce54af2014-06-08 03:03:08 +0400294 type == t->dev->type &&
295 ip_tunnel_key_match(&t->parms, flags, key))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000296 break;
297 }
298 return t;
299}
300
301static struct net_device *__ip_tunnel_create(struct net *net,
302 const struct rtnl_link_ops *ops,
303 struct ip_tunnel_parm *parms)
304{
305 int err;
306 struct ip_tunnel *tunnel;
307 struct net_device *dev;
308 char name[IFNAMSIZ];
309
310 if (parms->name[0])
311 strlcpy(name, parms->name, IFNAMSIZ);
312 else {
Pravin B Shelar54a5d382013-03-28 08:21:46 +0000313 if (strlen(ops->kind) > (IFNAMSIZ - 3)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000314 err = -E2BIG;
315 goto failed;
316 }
317 strlcpy(name, ops->kind, IFNAMSIZ);
318 strncat(name, "%d", 2);
319 }
320
321 ASSERT_RTNL();
Tom Gundersenc835a672014-07-14 16:37:24 +0200322 dev = alloc_netdev(ops->priv_size, name, NET_NAME_UNKNOWN, ops->setup);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000323 if (!dev) {
324 err = -ENOMEM;
325 goto failed;
326 }
327 dev_net_set(dev, net);
328
329 dev->rtnl_link_ops = ops;
330
331 tunnel = netdev_priv(dev);
332 tunnel->parms = *parms;
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +0200333 tunnel->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000334
335 err = register_netdevice(dev);
336 if (err)
337 goto failed_free;
338
339 return dev;
340
341failed_free:
342 free_netdev(dev);
343failed:
344 return ERR_PTR(err);
345}
346
Tom Herbert7d442fa2014-01-02 11:48:26 -0800347static inline void init_tunnel_flow(struct flowi4 *fl4,
348 int proto,
349 __be32 daddr, __be32 saddr,
350 __be32 key, __u8 tos, int oif)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000351{
352 memset(fl4, 0, sizeof(*fl4));
353 fl4->flowi4_oif = oif;
354 fl4->daddr = daddr;
355 fl4->saddr = saddr;
356 fl4->flowi4_tos = tos;
357 fl4->flowi4_proto = proto;
358 fl4->fl4_gre_key = key;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000359}
360
361static int ip_tunnel_bind_dev(struct net_device *dev)
362{
363 struct net_device *tdev = NULL;
364 struct ip_tunnel *tunnel = netdev_priv(dev);
365 const struct iphdr *iph;
366 int hlen = LL_MAX_HEADER;
367 int mtu = ETH_DATA_LEN;
368 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
369
370 iph = &tunnel->parms.iph;
371
372 /* Guess output device to choose reasonable mtu and needed_headroom */
373 if (iph->daddr) {
374 struct flowi4 fl4;
375 struct rtable *rt;
376
Tom Herbert7d442fa2014-01-02 11:48:26 -0800377 init_tunnel_flow(&fl4, iph->protocol, iph->daddr,
378 iph->saddr, tunnel->parms.o_key,
379 RT_TOS(iph->tos), tunnel->parms.link);
380 rt = ip_route_output_key(tunnel->net, &fl4);
381
Pravin B Shelarc5441932013-03-25 14:49:35 +0000382 if (!IS_ERR(rt)) {
383 tdev = rt->dst.dev;
Dmitry Popov95cb5742014-07-29 03:07:52 +0400384 tunnel_dst_set(tunnel, &rt->dst, fl4.saddr);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000385 ip_rt_put(rt);
386 }
387 if (dev->type != ARPHRD_ETHER)
388 dev->flags |= IFF_POINTOPOINT;
389 }
390
391 if (!tdev && tunnel->parms.link)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200392 tdev = __dev_get_by_index(tunnel->net, tunnel->parms.link);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000393
394 if (tdev) {
395 hlen = tdev->hard_header_len + tdev->needed_headroom;
396 mtu = tdev->mtu;
397 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000398
399 dev->needed_headroom = t_hlen + hlen;
400 mtu -= (dev->hard_header_len + t_hlen);
401
402 if (mtu < 68)
403 mtu = 68;
404
405 return mtu;
406}
407
408static struct ip_tunnel *ip_tunnel_create(struct net *net,
409 struct ip_tunnel_net *itn,
410 struct ip_tunnel_parm *parms)
411{
Julia Lawall4929fd82014-05-15 05:43:20 +0200412 struct ip_tunnel *nt;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000413 struct net_device *dev;
414
415 BUG_ON(!itn->fb_tunnel_dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000416 dev = __ip_tunnel_create(net, itn->fb_tunnel_dev->rtnl_link_ops, parms);
417 if (IS_ERR(dev))
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100418 return ERR_CAST(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000419
420 dev->mtu = ip_tunnel_bind_dev(dev);
421
422 nt = netdev_priv(dev);
423 ip_tunnel_add(itn, nt);
424 return nt;
425}
426
427int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700428 const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
429 bool log_ecn_error)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000430{
Li RongQing8f849852014-01-04 13:57:59 +0800431 struct pcpu_sw_netstats *tstats;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000432 const struct iphdr *iph = ip_hdr(skb);
433 int err;
434
Pravin B Shelarc5441932013-03-25 14:49:35 +0000435#ifdef CONFIG_NET_IPGRE_BROADCAST
436 if (ipv4_is_multicast(iph->daddr)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000437 tunnel->dev->stats.multicast++;
438 skb->pkt_type = PACKET_BROADCAST;
439 }
440#endif
441
442 if ((!(tpi->flags&TUNNEL_CSUM) && (tunnel->parms.i_flags&TUNNEL_CSUM)) ||
443 ((tpi->flags&TUNNEL_CSUM) && !(tunnel->parms.i_flags&TUNNEL_CSUM))) {
444 tunnel->dev->stats.rx_crc_errors++;
445 tunnel->dev->stats.rx_errors++;
446 goto drop;
447 }
448
449 if (tunnel->parms.i_flags&TUNNEL_SEQ) {
450 if (!(tpi->flags&TUNNEL_SEQ) ||
451 (tunnel->i_seqno && (s32)(ntohl(tpi->seq) - tunnel->i_seqno) < 0)) {
452 tunnel->dev->stats.rx_fifo_errors++;
453 tunnel->dev->stats.rx_errors++;
454 goto drop;
455 }
456 tunnel->i_seqno = ntohl(tpi->seq) + 1;
457 }
458
Ying Caie96f2e72014-05-04 15:20:04 -0700459 skb_reset_network_header(skb);
460
Pravin B Shelarc5441932013-03-25 14:49:35 +0000461 err = IP_ECN_decapsulate(iph, skb);
462 if (unlikely(err)) {
463 if (log_ecn_error)
464 net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
465 &iph->saddr, iph->tos);
466 if (err > 1) {
467 ++tunnel->dev->stats.rx_frame_errors;
468 ++tunnel->dev->stats.rx_errors;
469 goto drop;
470 }
471 }
472
473 tstats = this_cpu_ptr(tunnel->dev->tstats);
474 u64_stats_update_begin(&tstats->syncp);
475 tstats->rx_packets++;
476 tstats->rx_bytes += skb->len;
477 u64_stats_update_end(&tstats->syncp);
478
Alexei Starovoitov81b9eab2013-11-12 14:39:13 -0800479 skb_scrub_packet(skb, !net_eq(tunnel->net, dev_net(tunnel->dev)));
480
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700481 if (tunnel->dev->type == ARPHRD_ETHER) {
482 skb->protocol = eth_type_trans(skb, tunnel->dev);
483 skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
484 } else {
485 skb->dev = tunnel->dev;
486 }
Nicolas Dichtel64261f22013-08-13 17:51:09 +0200487
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700488 if (tun_dst)
489 skb_dst_set(skb, (struct dst_entry *)tun_dst);
490
Pravin B Shelarc5441932013-03-25 14:49:35 +0000491 gro_cells_receive(&tunnel->gro_cells, skb);
492 return 0;
493
494drop:
495 kfree_skb(skb);
496 return 0;
497}
498EXPORT_SYMBOL_GPL(ip_tunnel_rcv);
499
Tom Herbert56328482014-09-17 12:25:58 -0700500static int ip_encap_hlen(struct ip_tunnel_encap *e)
501{
Tom Herberta8c5f902014-11-12 11:54:09 -0800502 const struct ip_tunnel_encap_ops *ops;
503 int hlen = -EINVAL;
504
505 if (e->type == TUNNEL_ENCAP_NONE)
Tom Herbert56328482014-09-17 12:25:58 -0700506 return 0;
Tom Herberta8c5f902014-11-12 11:54:09 -0800507
508 if (e->type >= MAX_IPTUN_ENCAP_OPS)
Tom Herbert56328482014-09-17 12:25:58 -0700509 return -EINVAL;
Tom Herberta8c5f902014-11-12 11:54:09 -0800510
511 rcu_read_lock();
512 ops = rcu_dereference(iptun_encaps[e->type]);
513 if (likely(ops && ops->encap_hlen))
514 hlen = ops->encap_hlen(e);
515 rcu_read_unlock();
516
517 return hlen;
Tom Herbert56328482014-09-17 12:25:58 -0700518}
519
Tom Herberta8c5f902014-11-12 11:54:09 -0800520const struct ip_tunnel_encap_ops __rcu *
521 iptun_encaps[MAX_IPTUN_ENCAP_OPS] __read_mostly;
522
523int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *ops,
524 unsigned int num)
525{
Thomas Grafbb1553c2014-12-16 21:05:20 +0100526 if (num >= MAX_IPTUN_ENCAP_OPS)
527 return -ERANGE;
528
Tom Herberta8c5f902014-11-12 11:54:09 -0800529 return !cmpxchg((const struct ip_tunnel_encap_ops **)
530 &iptun_encaps[num],
531 NULL, ops) ? 0 : -1;
532}
533EXPORT_SYMBOL(ip_tunnel_encap_add_ops);
534
535int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *ops,
536 unsigned int num)
537{
538 int ret;
539
Thomas Grafbb1553c2014-12-16 21:05:20 +0100540 if (num >= MAX_IPTUN_ENCAP_OPS)
541 return -ERANGE;
542
Tom Herberta8c5f902014-11-12 11:54:09 -0800543 ret = (cmpxchg((const struct ip_tunnel_encap_ops **)
544 &iptun_encaps[num],
545 ops, NULL) == ops) ? 0 : -1;
546
547 synchronize_net();
548
549 return ret;
550}
551EXPORT_SYMBOL(ip_tunnel_encap_del_ops);
552
Tom Herbert56328482014-09-17 12:25:58 -0700553int ip_tunnel_encap_setup(struct ip_tunnel *t,
554 struct ip_tunnel_encap *ipencap)
555{
556 int hlen;
557
558 memset(&t->encap, 0, sizeof(t->encap));
559
560 hlen = ip_encap_hlen(ipencap);
561 if (hlen < 0)
562 return hlen;
563
564 t->encap.type = ipencap->type;
565 t->encap.sport = ipencap->sport;
566 t->encap.dport = ipencap->dport;
567 t->encap.flags = ipencap->flags;
568
569 t->encap_hlen = hlen;
570 t->hlen = t->encap_hlen + t->tun_hlen;
571
572 return 0;
573}
574EXPORT_SYMBOL_GPL(ip_tunnel_encap_setup);
575
Tom Herbert56328482014-09-17 12:25:58 -0700576int ip_tunnel_encap(struct sk_buff *skb, struct ip_tunnel *t,
577 u8 *protocol, struct flowi4 *fl4)
578{
Tom Herberta8c5f902014-11-12 11:54:09 -0800579 const struct ip_tunnel_encap_ops *ops;
580 int ret = -EINVAL;
581
582 if (t->encap.type == TUNNEL_ENCAP_NONE)
Tom Herbert56328482014-09-17 12:25:58 -0700583 return 0;
Tom Herberta8c5f902014-11-12 11:54:09 -0800584
Thomas Graff1fb5212014-12-16 21:05:21 +0100585 if (t->encap.type >= MAX_IPTUN_ENCAP_OPS)
586 return -EINVAL;
587
Tom Herberta8c5f902014-11-12 11:54:09 -0800588 rcu_read_lock();
589 ops = rcu_dereference(iptun_encaps[t->encap.type]);
590 if (likely(ops && ops->build_header))
591 ret = ops->build_header(skb, &t->encap, protocol, fl4);
592 rcu_read_unlock();
593
594 return ret;
Tom Herbert56328482014-09-17 12:25:58 -0700595}
596EXPORT_SYMBOL(ip_tunnel_encap);
597
Pravin B Shelar23a36472013-07-02 10:57:33 -0700598static int tnl_update_pmtu(struct net_device *dev, struct sk_buff *skb,
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300599 struct rtable *rt, __be16 df,
600 const struct iphdr *inner_iph)
Pravin B Shelar23a36472013-07-02 10:57:33 -0700601{
602 struct ip_tunnel *tunnel = netdev_priv(dev);
Alexander Duyck8c91e162013-07-11 13:12:22 -0700603 int pkt_size = skb->len - tunnel->hlen - dev->hard_header_len;
Pravin B Shelar23a36472013-07-02 10:57:33 -0700604 int mtu;
605
606 if (df)
607 mtu = dst_mtu(&rt->dst) - dev->hard_header_len
608 - sizeof(struct iphdr) - tunnel->hlen;
609 else
610 mtu = skb_dst(skb) ? dst_mtu(skb_dst(skb)) : dev->mtu;
611
612 if (skb_dst(skb))
613 skb_dst(skb)->ops->update_pmtu(skb_dst(skb), NULL, skb, mtu);
614
615 if (skb->protocol == htons(ETH_P_IP)) {
616 if (!skb_is_gso(skb) &&
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300617 (inner_iph->frag_off & htons(IP_DF)) &&
618 mtu < pkt_size) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700619 memset(IPCB(skb), 0, sizeof(*IPCB(skb)));
620 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED, htonl(mtu));
621 return -E2BIG;
622 }
623 }
624#if IS_ENABLED(CONFIG_IPV6)
625 else if (skb->protocol == htons(ETH_P_IPV6)) {
626 struct rt6_info *rt6 = (struct rt6_info *)skb_dst(skb);
627
628 if (rt6 && mtu < dst_mtu(skb_dst(skb)) &&
629 mtu >= IPV6_MIN_MTU) {
630 if ((tunnel->parms.iph.daddr &&
631 !ipv4_is_multicast(tunnel->parms.iph.daddr)) ||
632 rt6->rt6i_dst.plen == 128) {
633 rt6->rt6i_flags |= RTF_MODIFIED;
634 dst_metric_set(skb_dst(skb), RTAX_MTU, mtu);
635 }
636 }
637
638 if (!skb_is_gso(skb) && mtu >= IPV6_MIN_MTU &&
639 mtu < pkt_size) {
640 icmpv6_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu);
641 return -E2BIG;
642 }
643 }
644#endif
645 return 0;
646}
647
Pravin B Shelarc5441932013-03-25 14:49:35 +0000648void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
Tom Herbert56328482014-09-17 12:25:58 -0700649 const struct iphdr *tnl_params, u8 protocol)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000650{
651 struct ip_tunnel *tunnel = netdev_priv(dev);
652 const struct iphdr *inner_iph;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000653 struct flowi4 fl4;
654 u8 tos, ttl;
655 __be16 df;
Eric Dumazetb045d372014-02-03 12:52:14 -0800656 struct rtable *rt; /* Route to the other host */
Pravin B Shelarc5441932013-03-25 14:49:35 +0000657 unsigned int max_headroom; /* The extra header space needed */
658 __be32 dst;
Timo Teräs22fb22e2014-05-16 08:34:39 +0300659 bool connected;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000660
661 inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
Timo Teräs22fb22e2014-05-16 08:34:39 +0300662 connected = (tunnel->parms.iph.daddr != 0);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000663
664 dst = tnl_params->daddr;
665 if (dst == 0) {
666 /* NBMA tunnel */
667
Ian Morris51456b22015-04-03 09:17:26 +0100668 if (!skb_dst(skb)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000669 dev->stats.tx_fifo_errors++;
670 goto tx_error;
671 }
672
673 if (skb->protocol == htons(ETH_P_IP)) {
674 rt = skb_rtable(skb);
675 dst = rt_nexthop(rt, inner_iph->daddr);
676 }
677#if IS_ENABLED(CONFIG_IPV6)
678 else if (skb->protocol == htons(ETH_P_IPV6)) {
679 const struct in6_addr *addr6;
680 struct neighbour *neigh;
681 bool do_tx_error_icmp;
682 int addr_type;
683
684 neigh = dst_neigh_lookup(skb_dst(skb),
685 &ipv6_hdr(skb)->daddr);
Ian Morris51456b22015-04-03 09:17:26 +0100686 if (!neigh)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000687 goto tx_error;
688
689 addr6 = (const struct in6_addr *)&neigh->primary_key;
690 addr_type = ipv6_addr_type(addr6);
691
692 if (addr_type == IPV6_ADDR_ANY) {
693 addr6 = &ipv6_hdr(skb)->daddr;
694 addr_type = ipv6_addr_type(addr6);
695 }
696
697 if ((addr_type & IPV6_ADDR_COMPATv4) == 0)
698 do_tx_error_icmp = true;
699 else {
700 do_tx_error_icmp = false;
701 dst = addr6->s6_addr32[3];
702 }
703 neigh_release(neigh);
704 if (do_tx_error_icmp)
705 goto tx_error_icmp;
706 }
707#endif
708 else
709 goto tx_error;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800710
711 connected = false;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000712 }
713
714 tos = tnl_params->tos;
715 if (tos & 0x1) {
716 tos &= ~0x1;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800717 if (skb->protocol == htons(ETH_P_IP)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000718 tos = inner_iph->tos;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800719 connected = false;
720 } else if (skb->protocol == htons(ETH_P_IPV6)) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000721 tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
Tom Herbert7d442fa2014-01-02 11:48:26 -0800722 connected = false;
723 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000724 }
725
Tom Herbert7d442fa2014-01-02 11:48:26 -0800726 init_tunnel_flow(&fl4, protocol, dst, tnl_params->saddr,
727 tunnel->parms.o_key, RT_TOS(tos), tunnel->parms.link);
728
Tom Herbert56328482014-09-17 12:25:58 -0700729 if (ip_tunnel_encap(skb, tunnel, &protocol, &fl4) < 0)
730 goto tx_error;
731
Dmitry Popov95cb5742014-07-29 03:07:52 +0400732 rt = connected ? tunnel_rtable_get(tunnel, 0, &fl4.saddr) : NULL;
Tom Herbert7d442fa2014-01-02 11:48:26 -0800733
734 if (!rt) {
735 rt = ip_route_output_key(tunnel->net, &fl4);
736
737 if (IS_ERR(rt)) {
738 dev->stats.tx_carrier_errors++;
739 goto tx_error;
740 }
741 if (connected)
Dmitry Popov95cb5742014-07-29 03:07:52 +0400742 tunnel_dst_set(tunnel, &rt->dst, fl4.saddr);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000743 }
Tom Herbert7d442fa2014-01-02 11:48:26 -0800744
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700745 if (rt->dst.dev == dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000746 ip_rt_put(rt);
747 dev->stats.collisions++;
748 goto tx_error;
749 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000750
Timo Teräsfc24f2b22015-07-07 08:34:13 +0300751 if (tnl_update_pmtu(dev, skb, rt, tnl_params->frag_off, inner_iph)) {
Pravin B Shelar23a36472013-07-02 10:57:33 -0700752 ip_rt_put(rt);
753 goto tx_error;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000754 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000755
756 if (tunnel->err_count > 0) {
757 if (time_before(jiffies,
758 tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
759 tunnel->err_count--;
760
Duan Jiong11c21a32014-01-23 14:00:25 +0800761 memset(IPCB(skb), 0, sizeof(*IPCB(skb)));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000762 dst_link_failure(skb);
763 } else
764 tunnel->err_count = 0;
765 }
766
Pravin B Shelard4a71b12013-09-25 09:57:47 -0700767 tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000768 ttl = tnl_params->ttl;
769 if (ttl == 0) {
770 if (skb->protocol == htons(ETH_P_IP))
771 ttl = inner_iph->ttl;
772#if IS_ENABLED(CONFIG_IPV6)
773 else if (skb->protocol == htons(ETH_P_IPV6))
774 ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
775#endif
776 else
777 ttl = ip4_dst_hoplimit(&rt->dst);
778 }
779
Pravin B Shelar23a36472013-07-02 10:57:33 -0700780 df = tnl_params->frag_off;
781 if (skb->protocol == htons(ETH_P_IP))
782 df |= (inner_iph->frag_off&htons(IP_DF));
783
Pravin B Shelar0e6fbc52013-06-17 17:49:56 -0700784 max_headroom = LL_RESERVED_SPACE(rt->dst.dev) + sizeof(struct iphdr)
Tom Herbert7371e022014-10-03 15:48:07 -0700785 + rt->dst.header_len + ip_encap_hlen(&tunnel->encap);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200786 if (max_headroom > dev->needed_headroom)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000787 dev->needed_headroom = max_headroom;
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200788
789 if (skb_cow_head(skb, dev->needed_headroom)) {
Dmitry Popov586d5fc2014-06-06 04:34:37 +0400790 ip_rt_put(rt);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200791 dev->stats.tx_dropped++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800792 kfree_skb(skb);
Steffen Klassert3e08f4a2013-10-01 11:33:59 +0200793 return;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000794 }
795
Pravin B Shelar039f5062015-12-24 14:34:54 -0800796 iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, protocol, tos, ttl,
797 df, !net_eq(tunnel->net, dev_net(dev)));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000798 return;
799
800#if IS_ENABLED(CONFIG_IPV6)
801tx_error_icmp:
802 dst_link_failure(skb);
803#endif
804tx_error:
805 dev->stats.tx_errors++;
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800806 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000807}
808EXPORT_SYMBOL_GPL(ip_tunnel_xmit);
809
810static void ip_tunnel_update(struct ip_tunnel_net *itn,
811 struct ip_tunnel *t,
812 struct net_device *dev,
813 struct ip_tunnel_parm *p,
814 bool set_mtu)
815{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700816 ip_tunnel_del(itn, t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000817 t->parms.iph.saddr = p->iph.saddr;
818 t->parms.iph.daddr = p->iph.daddr;
819 t->parms.i_key = p->i_key;
820 t->parms.o_key = p->o_key;
821 if (dev->type != ARPHRD_ETHER) {
822 memcpy(dev->dev_addr, &p->iph.saddr, 4);
823 memcpy(dev->broadcast, &p->iph.daddr, 4);
824 }
825 ip_tunnel_add(itn, t);
826
827 t->parms.iph.ttl = p->iph.ttl;
828 t->parms.iph.tos = p->iph.tos;
829 t->parms.iph.frag_off = p->iph.frag_off;
830
831 if (t->parms.link != p->link) {
832 int mtu;
833
834 t->parms.link = p->link;
835 mtu = ip_tunnel_bind_dev(dev);
836 if (set_mtu)
837 dev->mtu = mtu;
838 }
Nicolas Dichtelcf71d2bc2014-02-20 10:19:31 +0100839 ip_tunnel_dst_reset_all(t);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000840 netdev_state_change(dev);
841}
842
843int ip_tunnel_ioctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd)
844{
845 int err = 0;
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200846 struct ip_tunnel *t = netdev_priv(dev);
847 struct net *net = t->net;
848 struct ip_tunnel_net *itn = net_generic(net, t->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000849
850 BUG_ON(!itn->fb_tunnel_dev);
851 switch (cmd) {
852 case SIOCGETTUNNEL:
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200853 if (dev == itn->fb_tunnel_dev) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000854 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100855 if (!t)
Nicolas Dichtel8c923ce2014-04-16 11:19:32 +0200856 t = netdev_priv(dev);
857 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000858 memcpy(p, &t->parms, sizeof(*p));
859 break;
860
861 case SIOCADDTUNNEL:
862 case SIOCCHGTUNNEL:
863 err = -EPERM;
864 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
865 goto done;
866 if (p->iph.ttl)
867 p->iph.frag_off |= htons(IP_DF);
Dmitry Popov7c8e6b92014-06-08 02:06:25 +0400868 if (!(p->i_flags & VTI_ISVTI)) {
869 if (!(p->i_flags & TUNNEL_KEY))
870 p->i_key = 0;
871 if (!(p->o_flags & TUNNEL_KEY))
872 p->o_key = 0;
873 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000874
875 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
876
Steffen Klassertd61746b2014-09-22 09:11:08 +0200877 if (cmd == SIOCADDTUNNEL) {
878 if (!t) {
879 t = ip_tunnel_create(net, itn, p);
880 err = PTR_ERR_OR_ZERO(t);
881 break;
882 }
883
884 err = -EEXIST;
Duan Jiongee30ef4d2014-05-15 13:07:02 +0800885 break;
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100886 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000887 if (dev != itn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
Ian Morris00db4122015-04-03 09:17:27 +0100888 if (t) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000889 if (t->dev != dev) {
890 err = -EEXIST;
891 break;
892 }
893 } else {
894 unsigned int nflags = 0;
895
896 if (ipv4_is_multicast(p->iph.daddr))
897 nflags = IFF_BROADCAST;
898 else if (p->iph.daddr)
899 nflags = IFF_POINTOPOINT;
900
901 if ((dev->flags^nflags)&(IFF_POINTOPOINT|IFF_BROADCAST)) {
902 err = -EINVAL;
903 break;
904 }
905
906 t = netdev_priv(dev);
907 }
908 }
909
910 if (t) {
911 err = 0;
912 ip_tunnel_update(itn, t, dev, p, true);
Florian Westphal6dd3c9e2014-02-14 13:14:39 +0100913 } else {
914 err = -ENOENT;
915 }
Pravin B Shelarc5441932013-03-25 14:49:35 +0000916 break;
917
918 case SIOCDELTUNNEL:
919 err = -EPERM;
920 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
921 goto done;
922
923 if (dev == itn->fb_tunnel_dev) {
924 err = -ENOENT;
925 t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
Ian Morris51456b22015-04-03 09:17:26 +0100926 if (!t)
Pravin B Shelarc5441932013-03-25 14:49:35 +0000927 goto done;
928 err = -EPERM;
929 if (t == netdev_priv(itn->fb_tunnel_dev))
930 goto done;
931 dev = t->dev;
932 }
933 unregister_netdevice(dev);
934 err = 0;
935 break;
936
937 default:
938 err = -EINVAL;
939 }
940
941done:
942 return err;
943}
944EXPORT_SYMBOL_GPL(ip_tunnel_ioctl);
945
946int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
947{
948 struct ip_tunnel *tunnel = netdev_priv(dev);
949 int t_hlen = tunnel->hlen + sizeof(struct iphdr);
950
951 if (new_mtu < 68 ||
952 new_mtu > 0xFFF8 - dev->hard_header_len - t_hlen)
953 return -EINVAL;
954 dev->mtu = new_mtu;
955 return 0;
956}
957EXPORT_SYMBOL_GPL(ip_tunnel_change_mtu);
958
959static void ip_tunnel_dev_free(struct net_device *dev)
960{
961 struct ip_tunnel *tunnel = netdev_priv(dev);
962
963 gro_cells_destroy(&tunnel->gro_cells);
Tom Herbert9a4aa9a2014-01-02 11:48:33 -0800964 free_percpu(tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000965 free_percpu(dev->tstats);
966 free_netdev(dev);
967}
968
969void ip_tunnel_dellink(struct net_device *dev, struct list_head *head)
970{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000971 struct ip_tunnel *tunnel = netdev_priv(dev);
972 struct ip_tunnel_net *itn;
973
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200974 itn = net_generic(tunnel->net, tunnel->ip_tnl_net_id);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000975
976 if (itn->fb_tunnel_dev != dev) {
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700977 ip_tunnel_del(itn, netdev_priv(dev));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000978 unregister_netdevice_queue(dev, head);
979 }
980}
981EXPORT_SYMBOL_GPL(ip_tunnel_dellink);
982
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +0100983struct net *ip_tunnel_get_link_net(const struct net_device *dev)
984{
985 struct ip_tunnel *tunnel = netdev_priv(dev);
986
987 return tunnel->net;
988}
989EXPORT_SYMBOL(ip_tunnel_get_link_net);
990
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200991int ip_tunnel_get_iflink(const struct net_device *dev)
992{
993 struct ip_tunnel *tunnel = netdev_priv(dev);
994
995 return tunnel->parms.link;
996}
997EXPORT_SYMBOL(ip_tunnel_get_iflink);
998
Eric Dumazetd3b6f612013-06-07 13:26:05 -0700999int ip_tunnel_init_net(struct net *net, int ip_tnl_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001000 struct rtnl_link_ops *ops, char *devname)
1001{
1002 struct ip_tunnel_net *itn = net_generic(net, ip_tnl_net_id);
1003 struct ip_tunnel_parm parms;
stephen hemminger6261d982013-08-05 22:51:37 -07001004 unsigned int i;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001005
stephen hemminger6261d982013-08-05 22:51:37 -07001006 for (i = 0; i < IP_TNL_HASH_SIZE; i++)
1007 INIT_HLIST_HEAD(&itn->tunnels[i]);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001008
1009 if (!ops) {
1010 itn->fb_tunnel_dev = NULL;
1011 return 0;
1012 }
stephen hemminger6261d982013-08-05 22:51:37 -07001013
Pravin B Shelarc5441932013-03-25 14:49:35 +00001014 memset(&parms, 0, sizeof(parms));
1015 if (devname)
1016 strlcpy(parms.name, devname, IFNAMSIZ);
1017
1018 rtnl_lock();
1019 itn->fb_tunnel_dev = __ip_tunnel_create(net, ops, &parms);
Dan Carpenterea857f22013-08-19 10:05:10 +03001020 /* FB netdevice is special: we have one, and only one per netns.
1021 * Allowing to move it to another netns is clearly unsafe.
1022 */
Steffen Klassert67013282013-10-01 11:34:48 +02001023 if (!IS_ERR(itn->fb_tunnel_dev)) {
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001024 itn->fb_tunnel_dev->features |= NETIF_F_NETNS_LOCAL;
Steffen Klassert78ff4be2014-05-19 11:36:56 +02001025 itn->fb_tunnel_dev->mtu = ip_tunnel_bind_dev(itn->fb_tunnel_dev);
Steffen Klassert67013282013-10-01 11:34:48 +02001026 ip_tunnel_add(itn, netdev_priv(itn->fb_tunnel_dev));
1027 }
Dan Carpenterb4de77a2013-08-23 11:15:37 +03001028 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001029
Sachin Kamat27d79f32014-01-27 12:13:57 +05301030 return PTR_ERR_OR_ZERO(itn->fb_tunnel_dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001031}
1032EXPORT_SYMBOL_GPL(ip_tunnel_init_net);
1033
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001034static void ip_tunnel_destroy(struct ip_tunnel_net *itn, struct list_head *head,
1035 struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001036{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001037 struct net *net = dev_net(itn->fb_tunnel_dev);
1038 struct net_device *dev, *aux;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001039 int h;
1040
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001041 for_each_netdev_safe(net, dev, aux)
1042 if (dev->rtnl_link_ops == ops)
1043 unregister_netdevice_queue(dev, head);
1044
Pravin B Shelarc5441932013-03-25 14:49:35 +00001045 for (h = 0; h < IP_TNL_HASH_SIZE; h++) {
1046 struct ip_tunnel *t;
1047 struct hlist_node *n;
1048 struct hlist_head *thead = &itn->tunnels[h];
1049
1050 hlist_for_each_entry_safe(t, n, thead, hash_node)
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001051 /* If dev is in the same netns, it has already
1052 * been added to the list by the previous loop.
1053 */
1054 if (!net_eq(dev_net(t->dev), net))
1055 unregister_netdevice_queue(t->dev, head);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001056 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001057}
1058
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001059void ip_tunnel_delete_net(struct ip_tunnel_net *itn, struct rtnl_link_ops *ops)
Pravin B Shelarc5441932013-03-25 14:49:35 +00001060{
1061 LIST_HEAD(list);
1062
1063 rtnl_lock();
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001064 ip_tunnel_destroy(itn, &list, ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001065 unregister_netdevice_many(&list);
1066 rtnl_unlock();
Pravin B Shelarc5441932013-03-25 14:49:35 +00001067}
1068EXPORT_SYMBOL_GPL(ip_tunnel_delete_net);
1069
1070int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
1071 struct ip_tunnel_parm *p)
1072{
1073 struct ip_tunnel *nt;
1074 struct net *net = dev_net(dev);
1075 struct ip_tunnel_net *itn;
1076 int mtu;
1077 int err;
1078
1079 nt = netdev_priv(dev);
1080 itn = net_generic(net, nt->ip_tnl_net_id);
1081
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001082 if (nt->collect_md) {
1083 if (rtnl_dereference(itn->collect_md_tun))
1084 return -EEXIST;
1085 } else {
1086 if (ip_tunnel_find(itn, p, dev->type))
1087 return -EEXIST;
1088 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001089
Nicolas Dichtel5e6700b2013-06-26 16:11:28 +02001090 nt->net = net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001091 nt->parms = *p;
1092 err = register_netdevice(dev);
1093 if (err)
1094 goto out;
1095
1096 if (dev->type == ARPHRD_ETHER && !tb[IFLA_ADDRESS])
1097 eth_hw_addr_random(dev);
1098
1099 mtu = ip_tunnel_bind_dev(dev);
1100 if (!tb[IFLA_MTU])
1101 dev->mtu = mtu;
1102
1103 ip_tunnel_add(itn, nt);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001104out:
1105 return err;
1106}
1107EXPORT_SYMBOL_GPL(ip_tunnel_newlink);
1108
1109int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
1110 struct ip_tunnel_parm *p)
1111{
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001112 struct ip_tunnel *t;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001113 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001114 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001115 struct ip_tunnel_net *itn = net_generic(net, tunnel->ip_tnl_net_id);
1116
1117 if (dev == itn->fb_tunnel_dev)
1118 return -EINVAL;
1119
Pravin B Shelarc5441932013-03-25 14:49:35 +00001120 t = ip_tunnel_find(itn, p, dev->type);
1121
1122 if (t) {
1123 if (t->dev != dev)
1124 return -EEXIST;
1125 } else {
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001126 t = tunnel;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001127
1128 if (dev->type != ARPHRD_ETHER) {
1129 unsigned int nflags = 0;
1130
1131 if (ipv4_is_multicast(p->iph.daddr))
1132 nflags = IFF_BROADCAST;
1133 else if (p->iph.daddr)
1134 nflags = IFF_POINTOPOINT;
1135
1136 if ((dev->flags ^ nflags) &
1137 (IFF_POINTOPOINT | IFF_BROADCAST))
1138 return -EINVAL;
1139 }
1140 }
1141
1142 ip_tunnel_update(itn, t, dev, p, !tb[IFLA_MTU]);
1143 return 0;
1144}
1145EXPORT_SYMBOL_GPL(ip_tunnel_changelink);
1146
1147int ip_tunnel_init(struct net_device *dev)
1148{
1149 struct ip_tunnel *tunnel = netdev_priv(dev);
1150 struct iphdr *iph = &tunnel->parms.iph;
WANG Cong1c213bd2014-02-13 11:46:28 -08001151 int err;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001152
1153 dev->destructor = ip_tunnel_dev_free;
WANG Cong1c213bd2014-02-13 11:46:28 -08001154 dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001155 if (!dev->tstats)
1156 return -ENOMEM;
1157
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001158 tunnel->dst_cache = alloc_percpu(struct ip_tunnel_dst);
1159 if (!tunnel->dst_cache) {
1160 free_percpu(dev->tstats);
1161 return -ENOMEM;
1162 }
1163
Pravin B Shelarc5441932013-03-25 14:49:35 +00001164 err = gro_cells_init(&tunnel->gro_cells, dev);
1165 if (err) {
Tom Herbert9a4aa9a2014-01-02 11:48:33 -08001166 free_percpu(tunnel->dst_cache);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001167 free_percpu(dev->tstats);
1168 return err;
1169 }
1170
1171 tunnel->dev = dev;
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001172 tunnel->net = dev_net(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001173 strcpy(tunnel->parms.name, dev->name);
1174 iph->version = 4;
1175 iph->ihl = 5;
1176
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001177 if (tunnel->collect_md) {
1178 dev->features |= NETIF_F_NETNS_LOCAL;
1179 netif_keep_dst(dev);
1180 }
Pravin B Shelarc5441932013-03-25 14:49:35 +00001181 return 0;
1182}
1183EXPORT_SYMBOL_GPL(ip_tunnel_init);
1184
1185void ip_tunnel_uninit(struct net_device *dev)
1186{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001187 struct ip_tunnel *tunnel = netdev_priv(dev);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001188 struct net *net = tunnel->net;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001189 struct ip_tunnel_net *itn;
1190
1191 itn = net_generic(net, tunnel->ip_tnl_net_id);
1192 /* fb_tunnel_dev will be unregisted in net-exit call. */
1193 if (itn->fb_tunnel_dev != dev)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001194 ip_tunnel_del(itn, netdev_priv(dev));
Tom Herbert7d442fa2014-01-02 11:48:26 -08001195
Nicolas Dichtelcf71d2bc2014-02-20 10:19:31 +01001196 ip_tunnel_dst_reset_all(tunnel);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001197}
1198EXPORT_SYMBOL_GPL(ip_tunnel_uninit);
1199
1200/* Do least required initialization, rest of init is done in tunnel_init call */
1201void ip_tunnel_setup(struct net_device *dev, int net_id)
1202{
1203 struct ip_tunnel *tunnel = netdev_priv(dev);
1204 tunnel->ip_tnl_net_id = net_id;
1205}
1206EXPORT_SYMBOL_GPL(ip_tunnel_setup);
1207
1208MODULE_LICENSE("GPL");