blob: fb1ad22b5e292d5669c70b5640ad3207c353c6bb [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: IP/IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 * Authors:
5 * Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
6 *
7 * Fixes:
8 * Alan Cox : Merged and made usable non modular (its so tiny its silly as
9 * a module taking up 2 pages).
10 * Alan Cox : Fixed bug with 1.3.18 and IPIP not working (now needs to set skb->h.iph)
11 * to keep ip_forward happy.
12 * Alan Cox : More fixes for 1.3.21, and firewall fix. Maybe this will work soon 8).
13 * Kai Schulte : Fixed #defines for IP_FIREWALL->FIREWALL
14 * David Woodhouse : Perform some basic ICMP handling.
15 * IPIP Routing without decapsulation.
16 * Carlos Picoto : GRE over IP support
17 * Alexey Kuznetsov: Reworked. Really, now it is truncated version of ipv4/ip_gre.c.
18 * I do not want to merge them together.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 *
25 */
26
27/* tunnel.c: an IP tunnel driver
28
29 The purpose of this driver is to provide an IP tunnel through
30 which you can tunnel network traffic transparently across subnets.
31
32 This was written by looking at Nick Holloway's dummy driver
33 Thanks for the great code!
34
35 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090036
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 Minor tweaks:
38 Cleaned up the code a little and added some pre-1.3.0 tweaks.
39 dev->hard_header/hard_header_len changed to use no headers.
40 Comments/bracketing tweaked.
41 Made the tunnels use dev->name not tunnel: when error reporting.
42 Added tx_dropped stat
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090043
Alan Cox113aa832008-10-13 19:01:08 -070044 -Alan Cox (alan@lxorguk.ukuu.org.uk) 21 March 95
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46 Reworked:
47 Changed to tunnel to destination gateway in addition to the
48 tunnel's pointopoint address
49 Almost completely rewritten
50 Note: There is currently no firewall or ICMP handling done.
51
52 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/13/96
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090053
Linus Torvalds1da177e2005-04-16 15:20:36 -070054*/
55
56/* Things I wish I had known when writing the tunnel driver:
57
58 When the tunnel_xmit() function is called, the skb contains the
59 packet to be sent (plus a great deal of extra info), and dev
60 contains the tunnel device that _we_ are.
61
62 When we are passed a packet, we are expected to fill in the
63 source address with our source IP address.
64
65 What is the proper way to allocate, copy and free a buffer?
66 After you allocate it, it is a "0 length" chunk of memory
67 starting at zero. If you want to add headers to the buffer
68 later, you'll have to call "skb_reserve(skb, amount)" with
69 the amount of memory you want reserved. Then, you call
70 "skb_put(skb, amount)" with the amount of space you want in
71 the buffer. skb_put() returns a pointer to the top (#0) of
72 that buffer. skb->len is set to the amount of space you have
73 "allocated" with skb_put(). You can then write up to skb->len
74 bytes to that buffer. If you need more, you can call skb_put()
75 again with the additional amount of space you need. You can
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090076 find out how much more space you can allocate by calling
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 "skb_tailroom(skb)".
78 Now, to add header space, call "skb_push(skb, header_len)".
79 This creates space at the beginning of the buffer and returns
80 a pointer to this new space. If later you need to strip a
81 header from a buffer, call "skb_pull(skb, header_len)".
82 skb_headroom() will return how much space is left at the top
83 of the buffer (before the main data). Remember, this headroom
84 space must be reserved before the skb_put() function is called.
85 */
86
87/*
88 This version of net/ipv4/ipip.c is cloned of net/ipv4/ip_gre.c
89
90 For comments look at net/ipv4/ip_gre.c --ANK
91 */
92
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090093
Randy Dunlap4fc268d2006-01-11 12:17:47 -080094#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070095#include <linux/module.h>
96#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070097#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090098#include <linux/slab.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080099#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100#include <linux/skbuff.h>
101#include <linux/netdevice.h>
102#include <linux/in.h>
103#include <linux/tcp.h>
104#include <linux/udp.h>
105#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106#include <linux/init.h>
107#include <linux/netfilter_ipv4.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800108#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
110#include <net/sock.h>
111#include <net/ip.h>
112#include <net/icmp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +0000113#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114#include <net/inet_ecn.h>
115#include <net/xfrm.h>
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700116#include <net/net_namespace.h>
117#include <net/netns/generic.h>
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700118#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000120static bool log_ecn_error = true;
121module_param(log_ecn_error, bool, 0644);
122MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
123
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +0300124static unsigned int ipip_net_id __read_mostly;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700125
Eric Dumazet3c97af92010-09-27 00:35:50 +0000126static int ipip_tunnel_init(struct net_device *dev);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000127static struct rtnl_link_ops ipip_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
Herbert Xud2acc342006-03-28 01:12:13 -0800129static int ipip_err(struct sk_buff *skb, u32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131
Rami Rosen071f92d2008-05-21 17:47:54 -0700132/* All the routers (except for Linux) return only
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133 8 bytes of packet payload. It means, that precise relaying of
134 ICMP in the real Internet is absolutely infeasible.
135 */
Pravin B Shelarfd581562013-03-25 14:49:41 +0000136 struct net *net = dev_net(skb->dev);
137 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000138 const struct iphdr *iph = (const struct iphdr *)skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 struct ip_tunnel *t;
Herbert Xud2acc342006-03-28 01:12:13 -0800140 int err;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000141 const int type = icmp_hdr(skb)->type;
142 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Herbert Xud2acc342006-03-28 01:12:13 -0800144 err = -ENOENT;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000145 t = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
146 iph->daddr, iph->saddr, 0);
Ian Morris51456b22015-04-03 09:17:26 +0100147 if (!t)
David S. Miller36393392012-06-14 22:21:46 -0700148 goto out;
149
150 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
151 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200152 t->parms.link, 0, iph->protocol, 0);
David S. Miller36393392012-06-14 22:21:46 -0700153 err = 0;
154 goto out;
155 }
156
David S. Miller55be7a92012-07-11 21:27:49 -0700157 if (type == ICMP_REDIRECT) {
Dmitry Popov23468292014-06-06 23:19:21 +0400158 ipv4_redirect(skb, dev_net(skb->dev), t->parms.link, 0,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200159 iph->protocol, 0);
David S. Miller55be7a92012-07-11 21:27:49 -0700160 err = 0;
161 goto out;
162 }
163
David S. Miller36393392012-06-14 22:21:46 -0700164 if (t->parms.iph.daddr == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 goto out;
Herbert Xud2acc342006-03-28 01:12:13 -0800166
167 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
169 goto out;
170
Wei Yongjun26d94b42009-02-24 23:36:47 -0800171 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 t->err_count++;
173 else
174 t->err_count = 1;
175 t->err_time = jiffies;
stephen hemmingerb0558ef2012-09-24 18:12:25 +0000176
Pravin B Shelarfd581562013-03-25 14:49:41 +0000177out:
Herbert Xud2acc342006-03-28 01:12:13 -0800178 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179}
180
Simon Horman1b69e7e2016-07-07 07:56:14 +0200181static const struct tnl_ptk_info ipip_tpi = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000182 /* no tunnel info required for ipip. */
183 .proto = htons(ETH_P_IP),
184};
185
Simon Horman1b69e7e2016-07-07 07:56:14 +0200186#if IS_ENABLED(CONFIG_MPLS)
187static const struct tnl_ptk_info mplsip_tpi = {
188 /* no tunnel info required for mplsip. */
189 .proto = htons(ETH_P_MPLS_UC),
190};
191#endif
192
193static int ipip_tunnel_rcv(struct sk_buff *skb, u8 ipproto)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000195 struct net *net = dev_net(skb->dev);
196 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700197 struct metadata_dst *tun_dst = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 struct ip_tunnel *tunnel;
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700199 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700201 iph = ip_hdr(skb);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000202 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
203 iph->saddr, iph->daddr, 0);
204 if (tunnel) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200205 const struct tnl_ptk_info *tpi;
206
207 if (tunnel->parms.iph.protocol != ipproto &&
208 tunnel->parms.iph.protocol != 0)
209 goto drop;
210
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000211 if (!xfrm4_policy_check(NULL, XFRM_POLICY_IN, skb))
212 goto drop;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200213#if IS_ENABLED(CONFIG_MPLS)
214 if (ipproto == IPPROTO_MPLS)
215 tpi = &mplsip_tpi;
216 else
217#endif
218 tpi = &ipip_tpi;
219 if (iptunnel_pull_header(skb, 0, tpi->proto, false))
Li Hongjun737e8282013-08-28 11:54:50 +0200220 goto drop;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700221 if (tunnel->collect_md) {
222 tun_dst = ip_tun_rx_dst(skb, 0, 0, 0);
223 if (!tun_dst)
224 return 0;
225 }
226 return ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 return -1;
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000230
231drop:
232 kfree_skb(skb);
233 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234}
235
Simon Horman1b69e7e2016-07-07 07:56:14 +0200236static int ipip_rcv(struct sk_buff *skb)
237{
238 return ipip_tunnel_rcv(skb, IPPROTO_IPIP);
239}
240
241#if IS_ENABLED(CONFIG_MPLS)
242static int mplsip_rcv(struct sk_buff *skb)
243{
244 return ipip_tunnel_rcv(skb, IPPROTO_MPLS);
245}
246#endif
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248/*
249 * This function assumes it is being called from dev_queue_xmit()
250 * and that skb is filled properly by that function.
251 */
Simon Horman1b69e7e2016-07-07 07:56:14 +0200252static netdev_tx_t ipip_tunnel_xmit(struct sk_buff *skb,
253 struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254{
Patrick McHardy2941a482006-01-08 22:05:26 -0800255 struct ip_tunnel *tunnel = netdev_priv(dev);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000256 const struct iphdr *tiph = &tunnel->parms.iph;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200257 u8 ipproto;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
Simon Horman1b69e7e2016-07-07 07:56:14 +0200259 switch (skb->protocol) {
260 case htons(ETH_P_IP):
261 ipproto = IPPROTO_IPIP;
262 break;
263#if IS_ENABLED(CONFIG_MPLS)
264 case htons(ETH_P_MPLS_UC):
265 ipproto = IPPROTO_MPLS;
266 break;
267#endif
268 default:
269 goto tx_error;
270 }
271
272 if (tiph->protocol != ipproto && tiph->protocol != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273 goto tx_error;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000274
Tom Herbert7e133182016-05-18 09:06:10 -0700275 if (iptunnel_handle_offloads(skb, SKB_GSO_IPXIP4))
Alexander Duyckaed069d2016-04-14 15:33:37 -0400276 goto tx_error;
Pravin B Shelar4f3ed922013-03-08 15:12:52 +0000277
Simon Horman1b69e7e2016-07-07 07:56:14 +0200278 skb_set_inner_ipproto(skb, ipproto);
Tom Herbert077c5a02014-09-29 20:22:31 -0700279
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700280 if (tunnel->collect_md)
281 ip_md_tunnel_xmit(skb, dev, ipproto);
282 else
283 ip_tunnel_xmit(skb, dev, tiph, ipproto);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000284 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286tx_error:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800287 kfree_skb(skb);
Alexander Duyckaed069d2016-04-14 15:33:37 -0400288
Eric Dumazetcb32f512013-10-19 11:42:57 -0700289 dev->stats.tx_errors++;
Patrick McHardy6ed10652009-06-23 06:03:08 +0000290 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291}
292
Simon Horman1b69e7e2016-07-07 07:56:14 +0200293static bool ipip_tunnel_ioctl_verify_protocol(u8 ipproto)
294{
295 switch (ipproto) {
296 case 0:
297 case IPPROTO_IPIP:
298#if IS_ENABLED(CONFIG_MPLS)
299 case IPPROTO_MPLS:
300#endif
301 return true;
302 }
303
304 return false;
305}
306
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307static int
Pravin B Shelarfd581562013-03-25 14:49:41 +0000308ipip_tunnel_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309{
310 int err = 0;
311 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
Pravin B Shelarfd581562013-03-25 14:49:41 +0000313 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
314 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Cong Wang3b7b5142013-07-02 14:49:34 +0800316 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200317 if (p.iph.version != 4 ||
318 !ipip_tunnel_ioctl_verify_protocol(p.iph.protocol) ||
Cong Wang3b7b5142013-07-02 14:49:34 +0800319 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)))
320 return -EINVAL;
321 }
322
Eric Dumazet252a8fb2015-05-15 08:58:45 -0700323 p.i_key = p.o_key = 0;
324 p.i_flags = p.o_flags = 0;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000325 err = ip_tunnel_ioctl(dev, &p, cmd);
326 if (err)
327 return err;
328
329 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
330 return -EFAULT;
331
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 return 0;
333}
334
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800335static const struct net_device_ops ipip_netdev_ops = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000336 .ndo_init = ipip_tunnel_init,
337 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800338 .ndo_start_xmit = ipip_tunnel_xmit,
339 .ndo_do_ioctl = ipip_tunnel_ioctl,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000340 .ndo_change_mtu = ip_tunnel_change_mtu,
341 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200342 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800343};
344
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000345#define IPIP_FEATURES (NETIF_F_SG | \
346 NETIF_F_FRAGLIST | \
347 NETIF_F_HIGHDMA | \
Eric Dumazetcb32f512013-10-19 11:42:57 -0700348 NETIF_F_GSO_SOFTWARE | \
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000349 NETIF_F_HW_CSUM)
350
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351static void ipip_tunnel_setup(struct net_device *dev)
352{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800353 dev->netdev_ops = &ipip_netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354
355 dev->type = ARPHRD_TUNNEL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 dev->flags = IFF_NOARP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 dev->addr_len = 4;
Eric Dumazet153f0942010-09-28 00:17:17 +0000358 dev->features |= NETIF_F_LLTX;
Eric Dumazet02875872014-10-05 18:38:35 -0700359 netif_keep_dst(dev);
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000360
361 dev->features |= IPIP_FEATURES;
362 dev->hw_features |= IPIP_FEATURES;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000363 ip_tunnel_setup(dev, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364}
365
Eric Dumazet3c97af92010-09-27 00:35:50 +0000366static int ipip_tunnel_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800368 struct ip_tunnel *tunnel = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700369
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370 memcpy(dev->dev_addr, &tunnel->parms.iph.saddr, 4);
371 memcpy(dev->broadcast, &tunnel->parms.iph.daddr, 4);
372
Tom Herbert473ab822014-09-17 12:26:00 -0700373 tunnel->tun_hlen = 0;
374 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000375 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376}
377
Matthias Schiffera8b8a8892017-06-25 23:56:01 +0200378static int ipip_tunnel_validate(struct nlattr *tb[], struct nlattr *data[],
379 struct netlink_ext_ack *extack)
Simon Horman1b69e7e2016-07-07 07:56:14 +0200380{
381 u8 proto;
382
383 if (!data || !data[IFLA_IPTUN_PROTO])
384 return 0;
385
386 proto = nla_get_u8(data[IFLA_IPTUN_PROTO]);
387 if (proto != IPPROTO_IPIP && proto != IPPROTO_MPLS && proto != 0)
388 return -EINVAL;
389
390 return 0;
391}
392
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000393static void ipip_netlink_parms(struct nlattr *data[],
Craig Gallek9830ad42017-04-19 12:30:54 -0400394 struct ip_tunnel_parm *parms, bool *collect_md,
395 __u32 *fwmark)
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000396{
397 memset(parms, 0, sizeof(*parms));
398
399 parms->iph.version = 4;
400 parms->iph.protocol = IPPROTO_IPIP;
401 parms->iph.ihl = 5;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700402 *collect_md = false;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000403
404 if (!data)
405 return;
406
407 if (data[IFLA_IPTUN_LINK])
408 parms->link = nla_get_u32(data[IFLA_IPTUN_LINK]);
409
410 if (data[IFLA_IPTUN_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +0200411 parms->iph.saddr = nla_get_in_addr(data[IFLA_IPTUN_LOCAL]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000412
413 if (data[IFLA_IPTUN_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +0200414 parms->iph.daddr = nla_get_in_addr(data[IFLA_IPTUN_REMOTE]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000415
416 if (data[IFLA_IPTUN_TTL]) {
417 parms->iph.ttl = nla_get_u8(data[IFLA_IPTUN_TTL]);
418 if (parms->iph.ttl)
419 parms->iph.frag_off = htons(IP_DF);
420 }
421
422 if (data[IFLA_IPTUN_TOS])
423 parms->iph.tos = nla_get_u8(data[IFLA_IPTUN_TOS]);
424
Simon Horman1b69e7e2016-07-07 07:56:14 +0200425 if (data[IFLA_IPTUN_PROTO])
426 parms->iph.protocol = nla_get_u8(data[IFLA_IPTUN_PROTO]);
427
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000428 if (!data[IFLA_IPTUN_PMTUDISC] || nla_get_u8(data[IFLA_IPTUN_PMTUDISC]))
429 parms->iph.frag_off = htons(IP_DF);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700430
431 if (data[IFLA_IPTUN_COLLECT_METADATA])
432 *collect_md = true;
Craig Gallek9830ad42017-04-19 12:30:54 -0400433
434 if (data[IFLA_IPTUN_FWMARK])
435 *fwmark = nla_get_u32(data[IFLA_IPTUN_FWMARK]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000436}
437
Tom Herbert473ab822014-09-17 12:26:00 -0700438/* This function returns true when ENCAP attributes are present in the nl msg */
439static bool ipip_netlink_encap_parms(struct nlattr *data[],
440 struct ip_tunnel_encap *ipencap)
441{
442 bool ret = false;
443
444 memset(ipencap, 0, sizeof(*ipencap));
445
446 if (!data)
447 return ret;
448
449 if (data[IFLA_IPTUN_ENCAP_TYPE]) {
450 ret = true;
451 ipencap->type = nla_get_u16(data[IFLA_IPTUN_ENCAP_TYPE]);
452 }
453
454 if (data[IFLA_IPTUN_ENCAP_FLAGS]) {
455 ret = true;
456 ipencap->flags = nla_get_u16(data[IFLA_IPTUN_ENCAP_FLAGS]);
457 }
458
459 if (data[IFLA_IPTUN_ENCAP_SPORT]) {
460 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100461 ipencap->sport = nla_get_be16(data[IFLA_IPTUN_ENCAP_SPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700462 }
463
464 if (data[IFLA_IPTUN_ENCAP_DPORT]) {
465 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100466 ipencap->dport = nla_get_be16(data[IFLA_IPTUN_ENCAP_DPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700467 }
468
469 return ret;
470}
471
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000472static int ipip_newlink(struct net *src_net, struct net_device *dev,
Matthias Schiffer7a3f4a12017-06-25 23:55:59 +0200473 struct nlattr *tb[], struct nlattr *data[],
474 struct netlink_ext_ack *extack)
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000475{
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700476 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000477 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700478 struct ip_tunnel_encap ipencap;
Craig Gallek9830ad42017-04-19 12:30:54 -0400479 __u32 fwmark = 0;
Tom Herbert473ab822014-09-17 12:26:00 -0700480
481 if (ipip_netlink_encap_parms(data, &ipencap)) {
Tom Herbert473ab822014-09-17 12:26:00 -0700482 int err = ip_tunnel_encap_setup(t, &ipencap);
483
484 if (err < 0)
485 return err;
486 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000487
Craig Gallek9830ad42017-04-19 12:30:54 -0400488 ipip_netlink_parms(data, &p, &t->collect_md, &fwmark);
489 return ip_tunnel_newlink(dev, tb, &p, fwmark);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000490}
491
492static int ipip_changelink(struct net_device *dev, struct nlattr *tb[],
Matthias Schifferad744b22017-06-25 23:56:00 +0200493 struct nlattr *data[],
494 struct netlink_ext_ack *extack)
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000495{
Craig Gallek9830ad42017-04-19 12:30:54 -0400496 struct ip_tunnel *t = netdev_priv(dev);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000497 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700498 struct ip_tunnel_encap ipencap;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700499 bool collect_md;
Craig Gallek9830ad42017-04-19 12:30:54 -0400500 __u32 fwmark = t->fwmark;
Tom Herbert473ab822014-09-17 12:26:00 -0700501
502 if (ipip_netlink_encap_parms(data, &ipencap)) {
Tom Herbert473ab822014-09-17 12:26:00 -0700503 int err = ip_tunnel_encap_setup(t, &ipencap);
504
505 if (err < 0)
506 return err;
507 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000508
Craig Gallek9830ad42017-04-19 12:30:54 -0400509 ipip_netlink_parms(data, &p, &collect_md, &fwmark);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700510 if (collect_md)
511 return -EINVAL;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000512
513 if (((dev->flags & IFF_POINTOPOINT) && !p.iph.daddr) ||
514 (!(dev->flags & IFF_POINTOPOINT) && p.iph.daddr))
515 return -EINVAL;
516
Craig Gallek9830ad42017-04-19 12:30:54 -0400517 return ip_tunnel_changelink(dev, tb, &p, fwmark);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000518}
519
Nicolas Dichtel09746582012-11-09 06:09:59 +0000520static size_t ipip_get_size(const struct net_device *dev)
521{
522 return
523 /* IFLA_IPTUN_LINK */
524 nla_total_size(4) +
525 /* IFLA_IPTUN_LOCAL */
526 nla_total_size(4) +
527 /* IFLA_IPTUN_REMOTE */
528 nla_total_size(4) +
529 /* IFLA_IPTUN_TTL */
530 nla_total_size(1) +
531 /* IFLA_IPTUN_TOS */
532 nla_total_size(1) +
Simon Horman1b69e7e2016-07-07 07:56:14 +0200533 /* IFLA_IPTUN_PROTO */
534 nla_total_size(1) +
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000535 /* IFLA_IPTUN_PMTUDISC */
536 nla_total_size(1) +
Tom Herbert473ab822014-09-17 12:26:00 -0700537 /* IFLA_IPTUN_ENCAP_TYPE */
538 nla_total_size(2) +
539 /* IFLA_IPTUN_ENCAP_FLAGS */
540 nla_total_size(2) +
541 /* IFLA_IPTUN_ENCAP_SPORT */
542 nla_total_size(2) +
543 /* IFLA_IPTUN_ENCAP_DPORT */
544 nla_total_size(2) +
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700545 /* IFLA_IPTUN_COLLECT_METADATA */
546 nla_total_size(0) +
Craig Gallek9830ad42017-04-19 12:30:54 -0400547 /* IFLA_IPTUN_FWMARK */
548 nla_total_size(4) +
Nicolas Dichtel09746582012-11-09 06:09:59 +0000549 0;
550}
551
552static int ipip_fill_info(struct sk_buff *skb, const struct net_device *dev)
553{
554 struct ip_tunnel *tunnel = netdev_priv(dev);
555 struct ip_tunnel_parm *parm = &tunnel->parms;
556
557 if (nla_put_u32(skb, IFLA_IPTUN_LINK, parm->link) ||
Jiri Benc930345e2015-03-29 16:59:25 +0200558 nla_put_in_addr(skb, IFLA_IPTUN_LOCAL, parm->iph.saddr) ||
559 nla_put_in_addr(skb, IFLA_IPTUN_REMOTE, parm->iph.daddr) ||
Nicolas Dichtel09746582012-11-09 06:09:59 +0000560 nla_put_u8(skb, IFLA_IPTUN_TTL, parm->iph.ttl) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000561 nla_put_u8(skb, IFLA_IPTUN_TOS, parm->iph.tos) ||
Simon Horman1b69e7e2016-07-07 07:56:14 +0200562 nla_put_u8(skb, IFLA_IPTUN_PROTO, parm->iph.protocol) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000563 nla_put_u8(skb, IFLA_IPTUN_PMTUDISC,
Craig Gallek9830ad42017-04-19 12:30:54 -0400564 !!(parm->iph.frag_off & htons(IP_DF))) ||
565 nla_put_u32(skb, IFLA_IPTUN_FWMARK, tunnel->fwmark))
Nicolas Dichtel09746582012-11-09 06:09:59 +0000566 goto nla_put_failure;
Tom Herbert473ab822014-09-17 12:26:00 -0700567
568 if (nla_put_u16(skb, IFLA_IPTUN_ENCAP_TYPE,
569 tunnel->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100570 nla_put_be16(skb, IFLA_IPTUN_ENCAP_SPORT,
571 tunnel->encap.sport) ||
572 nla_put_be16(skb, IFLA_IPTUN_ENCAP_DPORT,
573 tunnel->encap.dport) ||
Tom Herbert473ab822014-09-17 12:26:00 -0700574 nla_put_u16(skb, IFLA_IPTUN_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -0800575 tunnel->encap.flags))
Tom Herbert473ab822014-09-17 12:26:00 -0700576 goto nla_put_failure;
577
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700578 if (tunnel->collect_md)
579 if (nla_put_flag(skb, IFLA_IPTUN_COLLECT_METADATA))
580 goto nla_put_failure;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000581 return 0;
582
583nla_put_failure:
584 return -EMSGSIZE;
585}
586
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000587static const struct nla_policy ipip_policy[IFLA_IPTUN_MAX + 1] = {
588 [IFLA_IPTUN_LINK] = { .type = NLA_U32 },
589 [IFLA_IPTUN_LOCAL] = { .type = NLA_U32 },
590 [IFLA_IPTUN_REMOTE] = { .type = NLA_U32 },
591 [IFLA_IPTUN_TTL] = { .type = NLA_U8 },
592 [IFLA_IPTUN_TOS] = { .type = NLA_U8 },
Simon Horman1b69e7e2016-07-07 07:56:14 +0200593 [IFLA_IPTUN_PROTO] = { .type = NLA_U8 },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000594 [IFLA_IPTUN_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert473ab822014-09-17 12:26:00 -0700595 [IFLA_IPTUN_ENCAP_TYPE] = { .type = NLA_U16 },
596 [IFLA_IPTUN_ENCAP_FLAGS] = { .type = NLA_U16 },
597 [IFLA_IPTUN_ENCAP_SPORT] = { .type = NLA_U16 },
598 [IFLA_IPTUN_ENCAP_DPORT] = { .type = NLA_U16 },
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700599 [IFLA_IPTUN_COLLECT_METADATA] = { .type = NLA_FLAG },
Craig Gallek9830ad42017-04-19 12:30:54 -0400600 [IFLA_IPTUN_FWMARK] = { .type = NLA_U32 },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000601};
602
Nicolas Dichtel09746582012-11-09 06:09:59 +0000603static struct rtnl_link_ops ipip_link_ops __read_mostly = {
604 .kind = "ipip",
605 .maxtype = IFLA_IPTUN_MAX,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000606 .policy = ipip_policy,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000607 .priv_size = sizeof(struct ip_tunnel),
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000608 .setup = ipip_tunnel_setup,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200609 .validate = ipip_tunnel_validate,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000610 .newlink = ipip_newlink,
611 .changelink = ipip_changelink,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000612 .dellink = ip_tunnel_dellink,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000613 .get_size = ipip_get_size,
614 .fill_info = ipip_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +0100615 .get_link_net = ip_tunnel_get_link_net,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000616};
617
Eric Dumazet6dcd8142010-08-30 07:04:14 +0000618static struct xfrm_tunnel ipip_handler __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 .handler = ipip_rcv,
620 .err_handler = ipip_err,
Herbert Xud2acc342006-03-28 01:12:13 -0800621 .priority = 1,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622};
623
Simon Horman1b69e7e2016-07-07 07:56:14 +0200624#if IS_ENABLED(CONFIG_MPLS)
625static struct xfrm_tunnel mplsip_handler __read_mostly = {
626 .handler = mplsip_rcv,
627 .err_handler = ipip_err,
628 .priority = 1,
629};
630#endif
631
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000632static int __net_init ipip_init_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700633{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000634 return ip_tunnel_init_net(net, ipip_net_id, &ipip_link_ops, "tunl0");
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700635}
636
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000637static void __net_exit ipip_exit_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700638{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000639 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200640 ip_tunnel_delete_net(itn, &ipip_link_ops);
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700641}
642
643static struct pernet_operations ipip_net_ops = {
644 .init = ipip_init_net,
645 .exit = ipip_exit_net,
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000646 .id = &ipip_net_id,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000647 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700648};
649
Linus Torvalds1da177e2005-04-16 15:20:36 -0700650static int __init ipip_init(void)
651{
652 int err;
653
Simon Horman1b69e7e2016-07-07 07:56:14 +0200654 pr_info("ipip: IPv4 and MPLS over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000656 err = register_pernet_device(&ipip_net_ops);
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000657 if (err < 0)
658 return err;
659 err = xfrm4_tunnel_register(&ipip_handler, AF_INET);
660 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +0000661 pr_info("%s: can't register tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200662 goto xfrm_tunnel_ipip_failed;
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000663 }
Simon Horman1b69e7e2016-07-07 07:56:14 +0200664#if IS_ENABLED(CONFIG_MPLS)
665 err = xfrm4_tunnel_register(&mplsip_handler, AF_MPLS);
666 if (err < 0) {
667 pr_info("%s: can't register tunnel\n", __func__);
668 goto xfrm_tunnel_mplsip_failed;
669 }
670#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000671 err = rtnl_link_register(&ipip_link_ops);
672 if (err < 0)
673 goto rtnl_link_failed;
674
675out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700676 return err;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000677
678rtnl_link_failed:
Simon Horman1b69e7e2016-07-07 07:56:14 +0200679#if IS_ENABLED(CONFIG_MPLS)
680 xfrm4_tunnel_deregister(&mplsip_handler, AF_INET);
681xfrm_tunnel_mplsip_failed:
682
683#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000684 xfrm4_tunnel_deregister(&ipip_handler, AF_INET);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200685xfrm_tunnel_ipip_failed:
Nicolas Dichtel09746582012-11-09 06:09:59 +0000686 unregister_pernet_device(&ipip_net_ops);
687 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688}
689
690static void __exit ipip_fini(void)
691{
Nicolas Dichtel09746582012-11-09 06:09:59 +0000692 rtnl_link_unregister(&ipip_link_ops);
Kazunori MIYAZAWAc0d56402007-02-13 12:54:47 -0800693 if (xfrm4_tunnel_deregister(&ipip_handler, AF_INET))
Joe Perches058bd4d2012-03-11 18:36:11 +0000694 pr_info("%s: can't deregister tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200695#if IS_ENABLED(CONFIG_MPLS)
696 if (xfrm4_tunnel_deregister(&mplsip_handler, AF_MPLS))
697 pr_info("%s: can't deregister tunnel\n", __func__);
698#endif
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000699 unregister_pernet_device(&ipip_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700}
701
702module_init(ipip_init);
703module_exit(ipip_fini);
704MODULE_LICENSE("GPL");
Tom Gundersenf98f89a2014-05-15 23:21:30 +0200705MODULE_ALIAS_RTNL_LINK("ipip");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +0300706MODULE_ALIAS_NETDEV("tunl0");