blob: 1e441c6f216025339caf5d82a04ea3570566641a [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: IP/IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 * Authors:
5 * Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
6 *
7 * Fixes:
8 * Alan Cox : Merged and made usable non modular (its so tiny its silly as
9 * a module taking up 2 pages).
10 * Alan Cox : Fixed bug with 1.3.18 and IPIP not working (now needs to set skb->h.iph)
11 * to keep ip_forward happy.
12 * Alan Cox : More fixes for 1.3.21, and firewall fix. Maybe this will work soon 8).
13 * Kai Schulte : Fixed #defines for IP_FIREWALL->FIREWALL
14 * David Woodhouse : Perform some basic ICMP handling.
15 * IPIP Routing without decapsulation.
16 * Carlos Picoto : GRE over IP support
17 * Alexey Kuznetsov: Reworked. Really, now it is truncated version of ipv4/ip_gre.c.
18 * I do not want to merge them together.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 *
25 */
26
27/* tunnel.c: an IP tunnel driver
28
29 The purpose of this driver is to provide an IP tunnel through
30 which you can tunnel network traffic transparently across subnets.
31
32 This was written by looking at Nick Holloway's dummy driver
33 Thanks for the great code!
34
35 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090036
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 Minor tweaks:
38 Cleaned up the code a little and added some pre-1.3.0 tweaks.
39 dev->hard_header/hard_header_len changed to use no headers.
40 Comments/bracketing tweaked.
41 Made the tunnels use dev->name not tunnel: when error reporting.
42 Added tx_dropped stat
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090043
Alan Cox113aa832008-10-13 19:01:08 -070044 -Alan Cox (alan@lxorguk.ukuu.org.uk) 21 March 95
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46 Reworked:
47 Changed to tunnel to destination gateway in addition to the
48 tunnel's pointopoint address
49 Almost completely rewritten
50 Note: There is currently no firewall or ICMP handling done.
51
52 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/13/96
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090053
Linus Torvalds1da177e2005-04-16 15:20:36 -070054*/
55
56/* Things I wish I had known when writing the tunnel driver:
57
58 When the tunnel_xmit() function is called, the skb contains the
59 packet to be sent (plus a great deal of extra info), and dev
60 contains the tunnel device that _we_ are.
61
62 When we are passed a packet, we are expected to fill in the
63 source address with our source IP address.
64
65 What is the proper way to allocate, copy and free a buffer?
66 After you allocate it, it is a "0 length" chunk of memory
67 starting at zero. If you want to add headers to the buffer
68 later, you'll have to call "skb_reserve(skb, amount)" with
69 the amount of memory you want reserved. Then, you call
70 "skb_put(skb, amount)" with the amount of space you want in
71 the buffer. skb_put() returns a pointer to the top (#0) of
72 that buffer. skb->len is set to the amount of space you have
73 "allocated" with skb_put(). You can then write up to skb->len
74 bytes to that buffer. If you need more, you can call skb_put()
75 again with the additional amount of space you need. You can
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090076 find out how much more space you can allocate by calling
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 "skb_tailroom(skb)".
78 Now, to add header space, call "skb_push(skb, header_len)".
79 This creates space at the beginning of the buffer and returns
80 a pointer to this new space. If later you need to strip a
81 header from a buffer, call "skb_pull(skb, header_len)".
82 skb_headroom() will return how much space is left at the top
83 of the buffer (before the main data). Remember, this headroom
84 space must be reserved before the skb_put() function is called.
85 */
86
87/*
88 This version of net/ipv4/ipip.c is cloned of net/ipv4/ip_gre.c
89
90 For comments look at net/ipv4/ip_gre.c --ANK
91 */
92
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090093
Randy Dunlap4fc268d2006-01-11 12:17:47 -080094#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070095#include <linux/module.h>
96#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070097#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090098#include <linux/slab.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080099#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100#include <linux/skbuff.h>
101#include <linux/netdevice.h>
102#include <linux/in.h>
103#include <linux/tcp.h>
104#include <linux/udp.h>
105#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106#include <linux/init.h>
107#include <linux/netfilter_ipv4.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800108#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
110#include <net/sock.h>
111#include <net/ip.h>
112#include <net/icmp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +0000113#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114#include <net/inet_ecn.h>
115#include <net/xfrm.h>
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700116#include <net/net_namespace.h>
117#include <net/netns/generic.h>
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700118#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000120static bool log_ecn_error = true;
121module_param(log_ecn_error, bool, 0644);
122MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
123
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +0300124static unsigned int ipip_net_id __read_mostly;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700125
Eric Dumazet3c97af92010-09-27 00:35:50 +0000126static int ipip_tunnel_init(struct net_device *dev);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000127static struct rtnl_link_ops ipip_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
Herbert Xud2acc342006-03-28 01:12:13 -0800129static int ipip_err(struct sk_buff *skb, u32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131
Rami Rosen071f92d2008-05-21 17:47:54 -0700132/* All the routers (except for Linux) return only
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133 8 bytes of packet payload. It means, that precise relaying of
134 ICMP in the real Internet is absolutely infeasible.
135 */
Pravin B Shelarfd581562013-03-25 14:49:41 +0000136 struct net *net = dev_net(skb->dev);
137 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000138 const struct iphdr *iph = (const struct iphdr *)skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 struct ip_tunnel *t;
Herbert Xud2acc342006-03-28 01:12:13 -0800140 int err;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000141 const int type = icmp_hdr(skb)->type;
142 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Herbert Xud2acc342006-03-28 01:12:13 -0800144 err = -ENOENT;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000145 t = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
146 iph->daddr, iph->saddr, 0);
Ian Morris51456b22015-04-03 09:17:26 +0100147 if (!t)
David S. Miller36393392012-06-14 22:21:46 -0700148 goto out;
149
150 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
151 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200152 t->parms.link, 0, iph->protocol, 0);
David S. Miller36393392012-06-14 22:21:46 -0700153 err = 0;
154 goto out;
155 }
156
David S. Miller55be7a92012-07-11 21:27:49 -0700157 if (type == ICMP_REDIRECT) {
Dmitry Popov23468292014-06-06 23:19:21 +0400158 ipv4_redirect(skb, dev_net(skb->dev), t->parms.link, 0,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200159 iph->protocol, 0);
David S. Miller55be7a92012-07-11 21:27:49 -0700160 err = 0;
161 goto out;
162 }
163
David S. Miller36393392012-06-14 22:21:46 -0700164 if (t->parms.iph.daddr == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 goto out;
Herbert Xud2acc342006-03-28 01:12:13 -0800166
167 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
169 goto out;
170
Wei Yongjun26d94b42009-02-24 23:36:47 -0800171 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 t->err_count++;
173 else
174 t->err_count = 1;
175 t->err_time = jiffies;
stephen hemmingerb0558ef2012-09-24 18:12:25 +0000176
Pravin B Shelarfd581562013-03-25 14:49:41 +0000177out:
Herbert Xud2acc342006-03-28 01:12:13 -0800178 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179}
180
Simon Horman1b69e7e2016-07-07 07:56:14 +0200181static const struct tnl_ptk_info ipip_tpi = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000182 /* no tunnel info required for ipip. */
183 .proto = htons(ETH_P_IP),
184};
185
Simon Horman1b69e7e2016-07-07 07:56:14 +0200186#if IS_ENABLED(CONFIG_MPLS)
187static const struct tnl_ptk_info mplsip_tpi = {
188 /* no tunnel info required for mplsip. */
189 .proto = htons(ETH_P_MPLS_UC),
190};
191#endif
192
193static int ipip_tunnel_rcv(struct sk_buff *skb, u8 ipproto)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000195 struct net *net = dev_net(skb->dev);
196 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700197 struct metadata_dst *tun_dst = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 struct ip_tunnel *tunnel;
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700199 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700201 iph = ip_hdr(skb);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000202 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
203 iph->saddr, iph->daddr, 0);
204 if (tunnel) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200205 const struct tnl_ptk_info *tpi;
206
207 if (tunnel->parms.iph.protocol != ipproto &&
208 tunnel->parms.iph.protocol != 0)
209 goto drop;
210
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000211 if (!xfrm4_policy_check(NULL, XFRM_POLICY_IN, skb))
212 goto drop;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200213#if IS_ENABLED(CONFIG_MPLS)
214 if (ipproto == IPPROTO_MPLS)
215 tpi = &mplsip_tpi;
216 else
217#endif
218 tpi = &ipip_tpi;
219 if (iptunnel_pull_header(skb, 0, tpi->proto, false))
Li Hongjun737e8282013-08-28 11:54:50 +0200220 goto drop;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700221 if (tunnel->collect_md) {
222 tun_dst = ip_tun_rx_dst(skb, 0, 0, 0);
223 if (!tun_dst)
224 return 0;
225 }
226 return ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 return -1;
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000230
231drop:
232 kfree_skb(skb);
233 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234}
235
Simon Horman1b69e7e2016-07-07 07:56:14 +0200236static int ipip_rcv(struct sk_buff *skb)
237{
238 return ipip_tunnel_rcv(skb, IPPROTO_IPIP);
239}
240
241#if IS_ENABLED(CONFIG_MPLS)
242static int mplsip_rcv(struct sk_buff *skb)
243{
244 return ipip_tunnel_rcv(skb, IPPROTO_MPLS);
245}
246#endif
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248/*
249 * This function assumes it is being called from dev_queue_xmit()
250 * and that skb is filled properly by that function.
251 */
Simon Horman1b69e7e2016-07-07 07:56:14 +0200252static netdev_tx_t ipip_tunnel_xmit(struct sk_buff *skb,
253 struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254{
Patrick McHardy2941a482006-01-08 22:05:26 -0800255 struct ip_tunnel *tunnel = netdev_priv(dev);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000256 const struct iphdr *tiph = &tunnel->parms.iph;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200257 u8 ipproto;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
Simon Horman1b69e7e2016-07-07 07:56:14 +0200259 switch (skb->protocol) {
260 case htons(ETH_P_IP):
261 ipproto = IPPROTO_IPIP;
262 break;
263#if IS_ENABLED(CONFIG_MPLS)
264 case htons(ETH_P_MPLS_UC):
265 ipproto = IPPROTO_MPLS;
266 break;
267#endif
268 default:
269 goto tx_error;
270 }
271
272 if (tiph->protocol != ipproto && tiph->protocol != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273 goto tx_error;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000274
Tom Herbert7e133182016-05-18 09:06:10 -0700275 if (iptunnel_handle_offloads(skb, SKB_GSO_IPXIP4))
Alexander Duyckaed069d2016-04-14 15:33:37 -0400276 goto tx_error;
Pravin B Shelar4f3ed922013-03-08 15:12:52 +0000277
Simon Horman1b69e7e2016-07-07 07:56:14 +0200278 skb_set_inner_ipproto(skb, ipproto);
Tom Herbert077c5a02014-09-29 20:22:31 -0700279
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700280 if (tunnel->collect_md)
281 ip_md_tunnel_xmit(skb, dev, ipproto);
282 else
283 ip_tunnel_xmit(skb, dev, tiph, ipproto);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000284 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286tx_error:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800287 kfree_skb(skb);
Alexander Duyckaed069d2016-04-14 15:33:37 -0400288
Eric Dumazetcb32f512013-10-19 11:42:57 -0700289 dev->stats.tx_errors++;
Patrick McHardy6ed10652009-06-23 06:03:08 +0000290 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291}
292
Simon Horman1b69e7e2016-07-07 07:56:14 +0200293static bool ipip_tunnel_ioctl_verify_protocol(u8 ipproto)
294{
295 switch (ipproto) {
296 case 0:
297 case IPPROTO_IPIP:
298#if IS_ENABLED(CONFIG_MPLS)
299 case IPPROTO_MPLS:
300#endif
301 return true;
302 }
303
304 return false;
305}
306
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307static int
Pravin B Shelarfd581562013-03-25 14:49:41 +0000308ipip_tunnel_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309{
310 int err = 0;
311 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
Pravin B Shelarfd581562013-03-25 14:49:41 +0000313 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
314 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Cong Wang3b7b5142013-07-02 14:49:34 +0800316 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200317 if (p.iph.version != 4 ||
318 !ipip_tunnel_ioctl_verify_protocol(p.iph.protocol) ||
Cong Wang3b7b5142013-07-02 14:49:34 +0800319 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)))
320 return -EINVAL;
321 }
322
Eric Dumazet252a8fb2015-05-15 08:58:45 -0700323 p.i_key = p.o_key = 0;
324 p.i_flags = p.o_flags = 0;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000325 err = ip_tunnel_ioctl(dev, &p, cmd);
326 if (err)
327 return err;
328
329 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
330 return -EFAULT;
331
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 return 0;
333}
334
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800335static const struct net_device_ops ipip_netdev_ops = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000336 .ndo_init = ipip_tunnel_init,
337 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800338 .ndo_start_xmit = ipip_tunnel_xmit,
339 .ndo_do_ioctl = ipip_tunnel_ioctl,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000340 .ndo_change_mtu = ip_tunnel_change_mtu,
341 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200342 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800343};
344
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000345#define IPIP_FEATURES (NETIF_F_SG | \
346 NETIF_F_FRAGLIST | \
347 NETIF_F_HIGHDMA | \
Eric Dumazetcb32f512013-10-19 11:42:57 -0700348 NETIF_F_GSO_SOFTWARE | \
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000349 NETIF_F_HW_CSUM)
350
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351static void ipip_tunnel_setup(struct net_device *dev)
352{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800353 dev->netdev_ops = &ipip_netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354
355 dev->type = ARPHRD_TUNNEL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 dev->flags = IFF_NOARP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 dev->addr_len = 4;
Eric Dumazet153f0942010-09-28 00:17:17 +0000358 dev->features |= NETIF_F_LLTX;
Eric Dumazet02875872014-10-05 18:38:35 -0700359 netif_keep_dst(dev);
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000360
361 dev->features |= IPIP_FEATURES;
362 dev->hw_features |= IPIP_FEATURES;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000363 ip_tunnel_setup(dev, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364}
365
Eric Dumazet3c97af92010-09-27 00:35:50 +0000366static int ipip_tunnel_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800368 struct ip_tunnel *tunnel = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700369
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370 memcpy(dev->dev_addr, &tunnel->parms.iph.saddr, 4);
371 memcpy(dev->broadcast, &tunnel->parms.iph.daddr, 4);
372
Tom Herbert473ab822014-09-17 12:26:00 -0700373 tunnel->tun_hlen = 0;
374 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000375 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376}
377
Simon Horman1b69e7e2016-07-07 07:56:14 +0200378static int ipip_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
379{
380 u8 proto;
381
382 if (!data || !data[IFLA_IPTUN_PROTO])
383 return 0;
384
385 proto = nla_get_u8(data[IFLA_IPTUN_PROTO]);
386 if (proto != IPPROTO_IPIP && proto != IPPROTO_MPLS && proto != 0)
387 return -EINVAL;
388
389 return 0;
390}
391
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000392static void ipip_netlink_parms(struct nlattr *data[],
Craig Gallek9830ad42017-04-19 12:30:54 -0400393 struct ip_tunnel_parm *parms, bool *collect_md,
394 __u32 *fwmark)
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000395{
396 memset(parms, 0, sizeof(*parms));
397
398 parms->iph.version = 4;
399 parms->iph.protocol = IPPROTO_IPIP;
400 parms->iph.ihl = 5;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700401 *collect_md = false;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000402
403 if (!data)
404 return;
405
406 if (data[IFLA_IPTUN_LINK])
407 parms->link = nla_get_u32(data[IFLA_IPTUN_LINK]);
408
409 if (data[IFLA_IPTUN_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +0200410 parms->iph.saddr = nla_get_in_addr(data[IFLA_IPTUN_LOCAL]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000411
412 if (data[IFLA_IPTUN_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +0200413 parms->iph.daddr = nla_get_in_addr(data[IFLA_IPTUN_REMOTE]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000414
415 if (data[IFLA_IPTUN_TTL]) {
416 parms->iph.ttl = nla_get_u8(data[IFLA_IPTUN_TTL]);
417 if (parms->iph.ttl)
418 parms->iph.frag_off = htons(IP_DF);
419 }
420
421 if (data[IFLA_IPTUN_TOS])
422 parms->iph.tos = nla_get_u8(data[IFLA_IPTUN_TOS]);
423
Simon Horman1b69e7e2016-07-07 07:56:14 +0200424 if (data[IFLA_IPTUN_PROTO])
425 parms->iph.protocol = nla_get_u8(data[IFLA_IPTUN_PROTO]);
426
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000427 if (!data[IFLA_IPTUN_PMTUDISC] || nla_get_u8(data[IFLA_IPTUN_PMTUDISC]))
428 parms->iph.frag_off = htons(IP_DF);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700429
430 if (data[IFLA_IPTUN_COLLECT_METADATA])
431 *collect_md = true;
Craig Gallek9830ad42017-04-19 12:30:54 -0400432
433 if (data[IFLA_IPTUN_FWMARK])
434 *fwmark = nla_get_u32(data[IFLA_IPTUN_FWMARK]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000435}
436
Tom Herbert473ab822014-09-17 12:26:00 -0700437/* This function returns true when ENCAP attributes are present in the nl msg */
438static bool ipip_netlink_encap_parms(struct nlattr *data[],
439 struct ip_tunnel_encap *ipencap)
440{
441 bool ret = false;
442
443 memset(ipencap, 0, sizeof(*ipencap));
444
445 if (!data)
446 return ret;
447
448 if (data[IFLA_IPTUN_ENCAP_TYPE]) {
449 ret = true;
450 ipencap->type = nla_get_u16(data[IFLA_IPTUN_ENCAP_TYPE]);
451 }
452
453 if (data[IFLA_IPTUN_ENCAP_FLAGS]) {
454 ret = true;
455 ipencap->flags = nla_get_u16(data[IFLA_IPTUN_ENCAP_FLAGS]);
456 }
457
458 if (data[IFLA_IPTUN_ENCAP_SPORT]) {
459 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100460 ipencap->sport = nla_get_be16(data[IFLA_IPTUN_ENCAP_SPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700461 }
462
463 if (data[IFLA_IPTUN_ENCAP_DPORT]) {
464 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100465 ipencap->dport = nla_get_be16(data[IFLA_IPTUN_ENCAP_DPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700466 }
467
468 return ret;
469}
470
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000471static int ipip_newlink(struct net *src_net, struct net_device *dev,
472 struct nlattr *tb[], struct nlattr *data[])
473{
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700474 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000475 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700476 struct ip_tunnel_encap ipencap;
Craig Gallek9830ad42017-04-19 12:30:54 -0400477 __u32 fwmark = 0;
Tom Herbert473ab822014-09-17 12:26:00 -0700478
479 if (ipip_netlink_encap_parms(data, &ipencap)) {
Tom Herbert473ab822014-09-17 12:26:00 -0700480 int err = ip_tunnel_encap_setup(t, &ipencap);
481
482 if (err < 0)
483 return err;
484 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000485
Craig Gallek9830ad42017-04-19 12:30:54 -0400486 ipip_netlink_parms(data, &p, &t->collect_md, &fwmark);
487 return ip_tunnel_newlink(dev, tb, &p, fwmark);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000488}
489
490static int ipip_changelink(struct net_device *dev, struct nlattr *tb[],
491 struct nlattr *data[])
492{
Craig Gallek9830ad42017-04-19 12:30:54 -0400493 struct ip_tunnel *t = netdev_priv(dev);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000494 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700495 struct ip_tunnel_encap ipencap;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700496 bool collect_md;
Craig Gallek9830ad42017-04-19 12:30:54 -0400497 __u32 fwmark = t->fwmark;
Tom Herbert473ab822014-09-17 12:26:00 -0700498
499 if (ipip_netlink_encap_parms(data, &ipencap)) {
Tom Herbert473ab822014-09-17 12:26:00 -0700500 int err = ip_tunnel_encap_setup(t, &ipencap);
501
502 if (err < 0)
503 return err;
504 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000505
Craig Gallek9830ad42017-04-19 12:30:54 -0400506 ipip_netlink_parms(data, &p, &collect_md, &fwmark);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700507 if (collect_md)
508 return -EINVAL;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000509
510 if (((dev->flags & IFF_POINTOPOINT) && !p.iph.daddr) ||
511 (!(dev->flags & IFF_POINTOPOINT) && p.iph.daddr))
512 return -EINVAL;
513
Craig Gallek9830ad42017-04-19 12:30:54 -0400514 return ip_tunnel_changelink(dev, tb, &p, fwmark);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000515}
516
Nicolas Dichtel09746582012-11-09 06:09:59 +0000517static size_t ipip_get_size(const struct net_device *dev)
518{
519 return
520 /* IFLA_IPTUN_LINK */
521 nla_total_size(4) +
522 /* IFLA_IPTUN_LOCAL */
523 nla_total_size(4) +
524 /* IFLA_IPTUN_REMOTE */
525 nla_total_size(4) +
526 /* IFLA_IPTUN_TTL */
527 nla_total_size(1) +
528 /* IFLA_IPTUN_TOS */
529 nla_total_size(1) +
Simon Horman1b69e7e2016-07-07 07:56:14 +0200530 /* IFLA_IPTUN_PROTO */
531 nla_total_size(1) +
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000532 /* IFLA_IPTUN_PMTUDISC */
533 nla_total_size(1) +
Tom Herbert473ab822014-09-17 12:26:00 -0700534 /* IFLA_IPTUN_ENCAP_TYPE */
535 nla_total_size(2) +
536 /* IFLA_IPTUN_ENCAP_FLAGS */
537 nla_total_size(2) +
538 /* IFLA_IPTUN_ENCAP_SPORT */
539 nla_total_size(2) +
540 /* IFLA_IPTUN_ENCAP_DPORT */
541 nla_total_size(2) +
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700542 /* IFLA_IPTUN_COLLECT_METADATA */
543 nla_total_size(0) +
Craig Gallek9830ad42017-04-19 12:30:54 -0400544 /* IFLA_IPTUN_FWMARK */
545 nla_total_size(4) +
Nicolas Dichtel09746582012-11-09 06:09:59 +0000546 0;
547}
548
549static int ipip_fill_info(struct sk_buff *skb, const struct net_device *dev)
550{
551 struct ip_tunnel *tunnel = netdev_priv(dev);
552 struct ip_tunnel_parm *parm = &tunnel->parms;
553
554 if (nla_put_u32(skb, IFLA_IPTUN_LINK, parm->link) ||
Jiri Benc930345e2015-03-29 16:59:25 +0200555 nla_put_in_addr(skb, IFLA_IPTUN_LOCAL, parm->iph.saddr) ||
556 nla_put_in_addr(skb, IFLA_IPTUN_REMOTE, parm->iph.daddr) ||
Nicolas Dichtel09746582012-11-09 06:09:59 +0000557 nla_put_u8(skb, IFLA_IPTUN_TTL, parm->iph.ttl) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000558 nla_put_u8(skb, IFLA_IPTUN_TOS, parm->iph.tos) ||
Simon Horman1b69e7e2016-07-07 07:56:14 +0200559 nla_put_u8(skb, IFLA_IPTUN_PROTO, parm->iph.protocol) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000560 nla_put_u8(skb, IFLA_IPTUN_PMTUDISC,
Craig Gallek9830ad42017-04-19 12:30:54 -0400561 !!(parm->iph.frag_off & htons(IP_DF))) ||
562 nla_put_u32(skb, IFLA_IPTUN_FWMARK, tunnel->fwmark))
Nicolas Dichtel09746582012-11-09 06:09:59 +0000563 goto nla_put_failure;
Tom Herbert473ab822014-09-17 12:26:00 -0700564
565 if (nla_put_u16(skb, IFLA_IPTUN_ENCAP_TYPE,
566 tunnel->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100567 nla_put_be16(skb, IFLA_IPTUN_ENCAP_SPORT,
568 tunnel->encap.sport) ||
569 nla_put_be16(skb, IFLA_IPTUN_ENCAP_DPORT,
570 tunnel->encap.dport) ||
Tom Herbert473ab822014-09-17 12:26:00 -0700571 nla_put_u16(skb, IFLA_IPTUN_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -0800572 tunnel->encap.flags))
Tom Herbert473ab822014-09-17 12:26:00 -0700573 goto nla_put_failure;
574
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700575 if (tunnel->collect_md)
576 if (nla_put_flag(skb, IFLA_IPTUN_COLLECT_METADATA))
577 goto nla_put_failure;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000578 return 0;
579
580nla_put_failure:
581 return -EMSGSIZE;
582}
583
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000584static const struct nla_policy ipip_policy[IFLA_IPTUN_MAX + 1] = {
585 [IFLA_IPTUN_LINK] = { .type = NLA_U32 },
586 [IFLA_IPTUN_LOCAL] = { .type = NLA_U32 },
587 [IFLA_IPTUN_REMOTE] = { .type = NLA_U32 },
588 [IFLA_IPTUN_TTL] = { .type = NLA_U8 },
589 [IFLA_IPTUN_TOS] = { .type = NLA_U8 },
Simon Horman1b69e7e2016-07-07 07:56:14 +0200590 [IFLA_IPTUN_PROTO] = { .type = NLA_U8 },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000591 [IFLA_IPTUN_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert473ab822014-09-17 12:26:00 -0700592 [IFLA_IPTUN_ENCAP_TYPE] = { .type = NLA_U16 },
593 [IFLA_IPTUN_ENCAP_FLAGS] = { .type = NLA_U16 },
594 [IFLA_IPTUN_ENCAP_SPORT] = { .type = NLA_U16 },
595 [IFLA_IPTUN_ENCAP_DPORT] = { .type = NLA_U16 },
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700596 [IFLA_IPTUN_COLLECT_METADATA] = { .type = NLA_FLAG },
Craig Gallek9830ad42017-04-19 12:30:54 -0400597 [IFLA_IPTUN_FWMARK] = { .type = NLA_U32 },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000598};
599
Nicolas Dichtel09746582012-11-09 06:09:59 +0000600static struct rtnl_link_ops ipip_link_ops __read_mostly = {
601 .kind = "ipip",
602 .maxtype = IFLA_IPTUN_MAX,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000603 .policy = ipip_policy,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000604 .priv_size = sizeof(struct ip_tunnel),
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000605 .setup = ipip_tunnel_setup,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200606 .validate = ipip_tunnel_validate,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000607 .newlink = ipip_newlink,
608 .changelink = ipip_changelink,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000609 .dellink = ip_tunnel_dellink,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000610 .get_size = ipip_get_size,
611 .fill_info = ipip_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +0100612 .get_link_net = ip_tunnel_get_link_net,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000613};
614
Eric Dumazet6dcd8142010-08-30 07:04:14 +0000615static struct xfrm_tunnel ipip_handler __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616 .handler = ipip_rcv,
617 .err_handler = ipip_err,
Herbert Xud2acc342006-03-28 01:12:13 -0800618 .priority = 1,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619};
620
Simon Horman1b69e7e2016-07-07 07:56:14 +0200621#if IS_ENABLED(CONFIG_MPLS)
622static struct xfrm_tunnel mplsip_handler __read_mostly = {
623 .handler = mplsip_rcv,
624 .err_handler = ipip_err,
625 .priority = 1,
626};
627#endif
628
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000629static int __net_init ipip_init_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700630{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000631 return ip_tunnel_init_net(net, ipip_net_id, &ipip_link_ops, "tunl0");
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700632}
633
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000634static void __net_exit ipip_exit_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700635{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000636 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200637 ip_tunnel_delete_net(itn, &ipip_link_ops);
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700638}
639
640static struct pernet_operations ipip_net_ops = {
641 .init = ipip_init_net,
642 .exit = ipip_exit_net,
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000643 .id = &ipip_net_id,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000644 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700645};
646
Linus Torvalds1da177e2005-04-16 15:20:36 -0700647static int __init ipip_init(void)
648{
649 int err;
650
Simon Horman1b69e7e2016-07-07 07:56:14 +0200651 pr_info("ipip: IPv4 and MPLS over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000653 err = register_pernet_device(&ipip_net_ops);
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000654 if (err < 0)
655 return err;
656 err = xfrm4_tunnel_register(&ipip_handler, AF_INET);
657 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +0000658 pr_info("%s: can't register tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200659 goto xfrm_tunnel_ipip_failed;
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000660 }
Simon Horman1b69e7e2016-07-07 07:56:14 +0200661#if IS_ENABLED(CONFIG_MPLS)
662 err = xfrm4_tunnel_register(&mplsip_handler, AF_MPLS);
663 if (err < 0) {
664 pr_info("%s: can't register tunnel\n", __func__);
665 goto xfrm_tunnel_mplsip_failed;
666 }
667#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000668 err = rtnl_link_register(&ipip_link_ops);
669 if (err < 0)
670 goto rtnl_link_failed;
671
672out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673 return err;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000674
675rtnl_link_failed:
Simon Horman1b69e7e2016-07-07 07:56:14 +0200676#if IS_ENABLED(CONFIG_MPLS)
677 xfrm4_tunnel_deregister(&mplsip_handler, AF_INET);
678xfrm_tunnel_mplsip_failed:
679
680#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000681 xfrm4_tunnel_deregister(&ipip_handler, AF_INET);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200682xfrm_tunnel_ipip_failed:
Nicolas Dichtel09746582012-11-09 06:09:59 +0000683 unregister_pernet_device(&ipip_net_ops);
684 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685}
686
687static void __exit ipip_fini(void)
688{
Nicolas Dichtel09746582012-11-09 06:09:59 +0000689 rtnl_link_unregister(&ipip_link_ops);
Kazunori MIYAZAWAc0d56402007-02-13 12:54:47 -0800690 if (xfrm4_tunnel_deregister(&ipip_handler, AF_INET))
Joe Perches058bd4d2012-03-11 18:36:11 +0000691 pr_info("%s: can't deregister tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200692#if IS_ENABLED(CONFIG_MPLS)
693 if (xfrm4_tunnel_deregister(&mplsip_handler, AF_MPLS))
694 pr_info("%s: can't deregister tunnel\n", __func__);
695#endif
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000696 unregister_pernet_device(&ipip_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700697}
698
699module_init(ipip_init);
700module_exit(ipip_fini);
701MODULE_LICENSE("GPL");
Tom Gundersenf98f89a2014-05-15 23:21:30 +0200702MODULE_ALIAS_RTNL_LINK("ipip");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +0300703MODULE_ALIAS_NETDEV("tunl0");