blob: 099fc1c428b419e3344b9f63cb19bacb0b5d0800 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: IP/IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 * Authors:
5 * Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
6 *
7 * Fixes:
8 * Alan Cox : Merged and made usable non modular (its so tiny its silly as
9 * a module taking up 2 pages).
10 * Alan Cox : Fixed bug with 1.3.18 and IPIP not working (now needs to set skb->h.iph)
11 * to keep ip_forward happy.
12 * Alan Cox : More fixes for 1.3.21, and firewall fix. Maybe this will work soon 8).
13 * Kai Schulte : Fixed #defines for IP_FIREWALL->FIREWALL
14 * David Woodhouse : Perform some basic ICMP handling.
15 * IPIP Routing without decapsulation.
16 * Carlos Picoto : GRE over IP support
17 * Alexey Kuznetsov: Reworked. Really, now it is truncated version of ipv4/ip_gre.c.
18 * I do not want to merge them together.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 *
25 */
26
27/* tunnel.c: an IP tunnel driver
28
29 The purpose of this driver is to provide an IP tunnel through
30 which you can tunnel network traffic transparently across subnets.
31
32 This was written by looking at Nick Holloway's dummy driver
33 Thanks for the great code!
34
35 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090036
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 Minor tweaks:
38 Cleaned up the code a little and added some pre-1.3.0 tweaks.
39 dev->hard_header/hard_header_len changed to use no headers.
40 Comments/bracketing tweaked.
41 Made the tunnels use dev->name not tunnel: when error reporting.
42 Added tx_dropped stat
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090043
Alan Cox113aa832008-10-13 19:01:08 -070044 -Alan Cox (alan@lxorguk.ukuu.org.uk) 21 March 95
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46 Reworked:
47 Changed to tunnel to destination gateway in addition to the
48 tunnel's pointopoint address
49 Almost completely rewritten
50 Note: There is currently no firewall or ICMP handling done.
51
52 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/13/96
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090053
Linus Torvalds1da177e2005-04-16 15:20:36 -070054*/
55
56/* Things I wish I had known when writing the tunnel driver:
57
58 When the tunnel_xmit() function is called, the skb contains the
59 packet to be sent (plus a great deal of extra info), and dev
60 contains the tunnel device that _we_ are.
61
62 When we are passed a packet, we are expected to fill in the
63 source address with our source IP address.
64
65 What is the proper way to allocate, copy and free a buffer?
66 After you allocate it, it is a "0 length" chunk of memory
67 starting at zero. If you want to add headers to the buffer
68 later, you'll have to call "skb_reserve(skb, amount)" with
69 the amount of memory you want reserved. Then, you call
70 "skb_put(skb, amount)" with the amount of space you want in
71 the buffer. skb_put() returns a pointer to the top (#0) of
72 that buffer. skb->len is set to the amount of space you have
73 "allocated" with skb_put(). You can then write up to skb->len
74 bytes to that buffer. If you need more, you can call skb_put()
75 again with the additional amount of space you need. You can
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090076 find out how much more space you can allocate by calling
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 "skb_tailroom(skb)".
78 Now, to add header space, call "skb_push(skb, header_len)".
79 This creates space at the beginning of the buffer and returns
80 a pointer to this new space. If later you need to strip a
81 header from a buffer, call "skb_pull(skb, header_len)".
82 skb_headroom() will return how much space is left at the top
83 of the buffer (before the main data). Remember, this headroom
84 space must be reserved before the skb_put() function is called.
85 */
86
/*
   This version of net/ipv4/ipip.c is a clone of net/ipv4/ip_gre.c.

   For comments, look at net/ipv4/ip_gre.c --ANK
 */
92
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090093
Randy Dunlap4fc268d2006-01-11 12:17:47 -080094#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070095#include <linux/module.h>
96#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070097#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090098#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070099#include <asm/uaccess.h>
100#include <linux/skbuff.h>
101#include <linux/netdevice.h>
102#include <linux/in.h>
103#include <linux/tcp.h>
104#include <linux/udp.h>
105#include <linux/if_arp.h>
106#include <linux/mroute.h>
107#include <linux/init.h>
108#include <linux/netfilter_ipv4.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800109#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110
111#include <net/sock.h>
112#include <net/ip.h>
113#include <net/icmp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114#include <net/ipip.h>
115#include <net/inet_ecn.h>
116#include <net/xfrm.h>
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700117#include <net/net_namespace.h>
118#include <net/netns/generic.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
/* Number of buckets in each address-keyed tunnel hash table. */
#define HASH_SIZE  16

/*
 * Fold an IPv4 address into a bucket index in [0, HASH_SIZE).
 *
 * The argument is fully parenthesized so that an expression argument
 * (e.g. HASH(a | b)) is hashed as a whole instead of being split apart
 * by the cast and shift operators.  Note that addr is evaluated twice,
 * so it must not have side effects.
 */
#define HASH(addr) \
	((((__force u32)(addr)) ^ (((__force u32)(addr)) >> 4)) & (HASH_SIZE - 1))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000123static bool log_ecn_error = true;
124module_param(log_ecn_error, bool, 0644);
125MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
126
Eric Dumazetf99189b2009-11-17 10:42:49 +0000127static int ipip_net_id __read_mostly;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700128struct ipip_net {
Eric Dumazetb7285b72010-09-15 11:07:24 +0000129 struct ip_tunnel __rcu *tunnels_r_l[HASH_SIZE];
130 struct ip_tunnel __rcu *tunnels_r[HASH_SIZE];
131 struct ip_tunnel __rcu *tunnels_l[HASH_SIZE];
132 struct ip_tunnel __rcu *tunnels_wc[1];
133 struct ip_tunnel __rcu **tunnels[4];
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700134
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700135 struct net_device *fb_tunnel_dev;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700136};
137
Eric Dumazet3c97af92010-09-27 00:35:50 +0000138static int ipip_tunnel_init(struct net_device *dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139static void ipip_tunnel_setup(struct net_device *dev);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000140static void ipip_dev_free(struct net_device *dev);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000141static struct rtnl_link_ops ipip_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142
stephen hemminger87b6d212012-04-12 06:31:16 +0000143static struct rtnl_link_stats64 *ipip_get_stats64(struct net_device *dev,
144 struct rtnl_link_stats64 *tot)
Eric Dumazet3c97af92010-09-27 00:35:50 +0000145{
Eric Dumazet3c97af92010-09-27 00:35:50 +0000146 int i;
147
148 for_each_possible_cpu(i) {
149 const struct pcpu_tstats *tstats = per_cpu_ptr(dev->tstats, i);
stephen hemminger87b6d212012-04-12 06:31:16 +0000150 u64 rx_packets, rx_bytes, tx_packets, tx_bytes;
151 unsigned int start;
Eric Dumazet3c97af92010-09-27 00:35:50 +0000152
stephen hemminger87b6d212012-04-12 06:31:16 +0000153 do {
154 start = u64_stats_fetch_begin_bh(&tstats->syncp);
155 rx_packets = tstats->rx_packets;
156 tx_packets = tstats->tx_packets;
157 rx_bytes = tstats->rx_bytes;
158 tx_bytes = tstats->tx_bytes;
159 } while (u64_stats_fetch_retry_bh(&tstats->syncp, start));
160
161 tot->rx_packets += rx_packets;
162 tot->tx_packets += tx_packets;
163 tot->rx_bytes += rx_bytes;
164 tot->tx_bytes += tx_bytes;
Eric Dumazet3c97af92010-09-27 00:35:50 +0000165 }
stephen hemminger87b6d212012-04-12 06:31:16 +0000166
167 tot->tx_fifo_errors = dev->stats.tx_fifo_errors;
168 tot->tx_carrier_errors = dev->stats.tx_carrier_errors;
169 tot->tx_dropped = dev->stats.tx_dropped;
170 tot->tx_aborted_errors = dev->stats.tx_aborted_errors;
171 tot->tx_errors = dev->stats.tx_errors;
172 tot->collisions = dev->stats.collisions;
173
174 return tot;
Eric Dumazet3c97af92010-09-27 00:35:50 +0000175}
176
Daniel Baluta5e73ea12012-04-15 01:34:41 +0000177static struct ip_tunnel *ipip_tunnel_lookup(struct net *net,
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700178 __be32 remote, __be32 local)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179{
Eric Dumazetb7285b72010-09-15 11:07:24 +0000180 unsigned int h0 = HASH(remote);
181 unsigned int h1 = HASH(local);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182 struct ip_tunnel *t;
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700183 struct ipip_net *ipn = net_generic(net, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184
Amerigo Wange086cad2012-11-11 21:52:34 +0000185 for_each_ip_tunnel_rcu(t, ipn->tunnels_r_l[h0 ^ h1])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186 if (local == t->parms.iph.saddr &&
187 remote == t->parms.iph.daddr && (t->dev->flags&IFF_UP))
188 return t;
Eric Dumazet8f95dd62009-10-23 05:42:02 +0000189
Amerigo Wange086cad2012-11-11 21:52:34 +0000190 for_each_ip_tunnel_rcu(t, ipn->tunnels_r[h0])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700191 if (remote == t->parms.iph.daddr && (t->dev->flags&IFF_UP))
192 return t;
Eric Dumazet8f95dd62009-10-23 05:42:02 +0000193
Amerigo Wange086cad2012-11-11 21:52:34 +0000194 for_each_ip_tunnel_rcu(t, ipn->tunnels_l[h1])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 if (local == t->parms.iph.saddr && (t->dev->flags&IFF_UP))
196 return t;
Eric Dumazet8f95dd62009-10-23 05:42:02 +0000197
198 t = rcu_dereference(ipn->tunnels_wc[0]);
199 if (t && (t->dev->flags&IFF_UP))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200 return t;
201 return NULL;
202}
203
Eric Dumazetb7285b72010-09-15 11:07:24 +0000204static struct ip_tunnel __rcu **__ipip_bucket(struct ipip_net *ipn,
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700205 struct ip_tunnel_parm *parms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206{
YOSHIFUJI Hideaki87d1a162007-04-24 20:44:47 +0900207 __be32 remote = parms->iph.daddr;
208 __be32 local = parms->iph.saddr;
Eric Dumazetb7285b72010-09-15 11:07:24 +0000209 unsigned int h = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210 int prio = 0;
211
212 if (remote) {
213 prio |= 2;
214 h ^= HASH(remote);
215 }
216 if (local) {
217 prio |= 1;
218 h ^= HASH(local);
219 }
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700220 return &ipn->tunnels[prio][h];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221}
222
Eric Dumazetb7285b72010-09-15 11:07:24 +0000223static inline struct ip_tunnel __rcu **ipip_bucket(struct ipip_net *ipn,
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700224 struct ip_tunnel *t)
YOSHIFUJI Hideaki87d1a162007-04-24 20:44:47 +0900225{
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700226 return __ipip_bucket(ipn, &t->parms);
YOSHIFUJI Hideaki87d1a162007-04-24 20:44:47 +0900227}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700229static void ipip_tunnel_unlink(struct ipip_net *ipn, struct ip_tunnel *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230{
Eric Dumazetb7285b72010-09-15 11:07:24 +0000231 struct ip_tunnel __rcu **tp;
232 struct ip_tunnel *iter;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233
Eric Dumazetb7285b72010-09-15 11:07:24 +0000234 for (tp = ipip_bucket(ipn, t);
235 (iter = rtnl_dereference(*tp)) != NULL;
236 tp = &iter->next) {
237 if (t == iter) {
Eric Dumazetcf778b02012-01-12 04:41:32 +0000238 rcu_assign_pointer(*tp, t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 break;
240 }
241 }
242}
243
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700244static void ipip_tunnel_link(struct ipip_net *ipn, struct ip_tunnel *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245{
Eric Dumazetb7285b72010-09-15 11:07:24 +0000246 struct ip_tunnel __rcu **tp = ipip_bucket(ipn, t);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Eric Dumazetcf778b02012-01-12 04:41:32 +0000248 rcu_assign_pointer(t->next, rtnl_dereference(*tp));
249 rcu_assign_pointer(*tp, t);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250}
251
Daniel Baluta5e73ea12012-04-15 01:34:41 +0000252static struct ip_tunnel *ipip_tunnel_locate(struct net *net,
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700253 struct ip_tunnel_parm *parms, int create)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254{
Al Virod5a0a1e2006-11-08 00:23:14 -0800255 __be32 remote = parms->iph.daddr;
256 __be32 local = parms->iph.saddr;
Eric Dumazetb7285b72010-09-15 11:07:24 +0000257 struct ip_tunnel *t, *nt;
258 struct ip_tunnel __rcu **tp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259 struct net_device *dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260 char name[IFNAMSIZ];
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700261 struct ipip_net *ipn = net_generic(net, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262
Eric Dumazetb7285b72010-09-15 11:07:24 +0000263 for (tp = __ipip_bucket(ipn, parms);
264 (t = rtnl_dereference(*tp)) != NULL;
265 tp = &t->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 if (local == t->parms.iph.saddr && remote == t->parms.iph.daddr)
267 return t;
268 }
269 if (!create)
270 return NULL;
271
272 if (parms->name[0])
273 strlcpy(name, parms->name, IFNAMSIZ);
Pavel Emelyanov34cc7ba2008-02-23 20:19:20 -0800274 else
Eric Dumazet3c97af92010-09-27 00:35:50 +0000275 strcpy(name, "tunl%d");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
277 dev = alloc_netdev(sizeof(*t), name, ipip_tunnel_setup);
278 if (dev == NULL)
279 return NULL;
280
Pavel Emelyanov0a826402008-04-16 01:06:18 -0700281 dev_net_set(dev, net);
282
Patrick McHardy2941a482006-01-08 22:05:26 -0800283 nt = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284 nt->parms = *parms;
285
Eric Dumazet3c97af92010-09-27 00:35:50 +0000286 if (ipip_tunnel_init(dev) < 0)
287 goto failed_free;
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800288
Pavel Emelyanovb37d428b2008-02-26 23:51:04 -0800289 if (register_netdevice(dev) < 0)
290 goto failed_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291
Ted Feng72b36012011-12-08 00:46:21 +0000292 strcpy(nt->parms.name, dev->name);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000293 dev->rtnl_link_ops = &ipip_link_ops;
Ted Feng72b36012011-12-08 00:46:21 +0000294
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 dev_hold(dev);
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700296 ipip_tunnel_link(ipn, nt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 return nt;
298
Pavel Emelyanovb37d428b2008-02-26 23:51:04 -0800299failed_free:
Eric Dumazet3c97af92010-09-27 00:35:50 +0000300 ipip_dev_free(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301 return NULL;
302}
303
Eric Dumazetb7285b72010-09-15 11:07:24 +0000304/* called with RTNL */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305static void ipip_tunnel_uninit(struct net_device *dev)
306{
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700307 struct net *net = dev_net(dev);
308 struct ipip_net *ipn = net_generic(net, ipip_net_id);
309
Eric Dumazetb7285b72010-09-15 11:07:24 +0000310 if (dev == ipn->fb_tunnel_dev)
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +0000311 RCU_INIT_POINTER(ipn->tunnels_wc[0], NULL);
Eric Dumazetb7285b72010-09-15 11:07:24 +0000312 else
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700313 ipip_tunnel_unlink(ipn, netdev_priv(dev));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314 dev_put(dev);
315}
316
Herbert Xud2acc342006-03-28 01:12:13 -0800317static int ipip_err(struct sk_buff *skb, u32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319
Rami Rosen071f92d2008-05-21 17:47:54 -0700320/* All the routers (except for Linux) return only
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321 8 bytes of packet payload. It means, that precise relaying of
322 ICMP in the real Internet is absolutely infeasible.
323 */
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000324 const struct iphdr *iph = (const struct iphdr *)skb->data;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300325 const int type = icmp_hdr(skb)->type;
326 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 struct ip_tunnel *t;
Herbert Xud2acc342006-03-28 01:12:13 -0800328 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329
330 switch (type) {
331 default:
332 case ICMP_PARAMETERPROB:
Herbert Xud2acc342006-03-28 01:12:13 -0800333 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334
335 case ICMP_DEST_UNREACH:
336 switch (code) {
337 case ICMP_SR_FAILED:
338 case ICMP_PORT_UNREACH:
339 /* Impossible event. */
Herbert Xud2acc342006-03-28 01:12:13 -0800340 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 default:
342 /* All others are translated to HOST_UNREACH.
343 rfc2003 contains "deep thoughts" about NET_UNREACH,
344 I believe they are just ether pollution. --ANK
345 */
346 break;
347 }
348 break;
349 case ICMP_TIME_EXCEEDED:
350 if (code != ICMP_EXC_TTL)
Herbert Xud2acc342006-03-28 01:12:13 -0800351 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700353 case ICMP_REDIRECT:
354 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355 }
356
Herbert Xud2acc342006-03-28 01:12:13 -0800357 err = -ENOENT;
Pavel Emelyanovcec3ffa2008-04-16 01:05:03 -0700358 t = ipip_tunnel_lookup(dev_net(skb->dev), iph->daddr, iph->saddr);
David S. Miller36393392012-06-14 22:21:46 -0700359 if (t == NULL)
360 goto out;
361
362 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
363 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
364 t->dev->ifindex, 0, IPPROTO_IPIP, 0);
365 err = 0;
366 goto out;
367 }
368
David S. Miller55be7a92012-07-11 21:27:49 -0700369 if (type == ICMP_REDIRECT) {
370 ipv4_redirect(skb, dev_net(skb->dev), t->dev->ifindex, 0,
371 IPPROTO_IPIP, 0);
372 err = 0;
373 goto out;
374 }
375
David S. Miller36393392012-06-14 22:21:46 -0700376 if (t->parms.iph.daddr == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 goto out;
Herbert Xud2acc342006-03-28 01:12:13 -0800378
379 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
381 goto out;
382
Wei Yongjun26d94b42009-02-24 23:36:47 -0800383 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384 t->err_count++;
385 else
386 t->err_count = 1;
387 t->err_time = jiffies;
388out:
stephen hemmingerb0558ef2012-09-24 18:12:25 +0000389
Herbert Xud2acc342006-03-28 01:12:13 -0800390 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391}
392
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393static int ipip_rcv(struct sk_buff *skb)
394{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 struct ip_tunnel *tunnel;
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700396 const struct iphdr *iph = ip_hdr(skb);
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000397 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
Eric Dumazet3c97af92010-09-27 00:35:50 +0000399 tunnel = ipip_tunnel_lookup(dev_net(skb->dev), iph->saddr, iph->daddr);
400 if (tunnel != NULL) {
401 struct pcpu_tstats *tstats;
402
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000403 if (!xfrm4_policy_check(NULL, XFRM_POLICY_IN, skb))
404 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700405
406 secpath_reset(skb);
407
Arnaldo Carvalho de Melob0e380b2007-04-10 21:21:55 -0700408 skb->mac_header = skb->network_header;
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700409 skb_reset_network_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 skb->protocol = htons(ETH_P_IP);
411 skb->pkt_type = PACKET_HOST;
412
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000413 __skb_tunnel_rx(skb, tunnel->dev);
414
415 err = IP_ECN_decapsulate(iph, skb);
416 if (unlikely(err)) {
417 if (log_ecn_error)
418 net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
419 &iph->saddr, iph->tos);
420 if (err > 1) {
421 ++tunnel->dev->stats.rx_frame_errors;
422 ++tunnel->dev->stats.rx_errors;
423 goto drop;
424 }
425 }
426
Eric Dumazet3c97af92010-09-27 00:35:50 +0000427 tstats = this_cpu_ptr(tunnel->dev->tstats);
stephen hemminger87b6d212012-04-12 06:31:16 +0000428 u64_stats_update_begin(&tstats->syncp);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000429 tstats->rx_packets++;
430 tstats->rx_bytes += skb->len;
stephen hemminger87b6d212012-04-12 06:31:16 +0000431 u64_stats_update_end(&tstats->syncp);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000432
Eric Dumazetcaf586e2010-09-30 21:06:55 +0000433 netif_rx(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700434 return 0;
435 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700436
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437 return -1;
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000438
439drop:
440 kfree_skb(skb);
441 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700442}
443
444/*
445 * This function assumes it is being called from dev_queue_xmit()
446 * and that skb is filled properly by that function.
447 */
448
Stephen Hemminger6fef4c02009-08-31 19:50:41 +0000449static netdev_tx_t ipip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450{
Patrick McHardy2941a482006-01-08 22:05:26 -0800451 struct ip_tunnel *tunnel = netdev_priv(dev);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000452 const struct iphdr *tiph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700453 u8 tos = tunnel->parms.iph.tos;
Al Virod5a0a1e2006-11-08 00:23:14 -0800454 __be16 df = tiph->frag_off;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700455 struct rtable *rt; /* Route to the other host */
Eric Dumazet3c97af92010-09-27 00:35:50 +0000456 struct net_device *tdev; /* Device to other host */
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000457 const struct iphdr *old_iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700458 struct iphdr *iph; /* Our new IP header */
Chuck Leverc2636b42007-10-23 21:07:32 -0700459 unsigned int max_headroom; /* The extra header space needed */
Al Virod5a0a1e2006-11-08 00:23:14 -0800460 __be32 dst = tiph->daddr;
David S. Miller31e45432011-05-03 20:25:42 -0700461 struct flowi4 fl4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462 int mtu;
463
Linus Torvalds1da177e2005-04-16 15:20:36 -0700464 if (skb->protocol != htons(ETH_P_IP))
465 goto tx_error;
466
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000467 if (skb->ip_summed == CHECKSUM_PARTIAL &&
468 skb_checksum_help(skb))
469 goto tx_error;
470
Eric Dumazet3c97af92010-09-27 00:35:50 +0000471 if (tos & 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472 tos = old_iph->tos;
473
474 if (!dst) {
475 /* NBMA tunnel */
Eric Dumazet511c3f92009-06-02 05:14:27 +0000476 if ((rt = skb_rtable(skb)) == NULL) {
Eric Dumazet3c97af92010-09-27 00:35:50 +0000477 dev->stats.tx_fifo_errors++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478 goto tx_error;
479 }
David S. Millerf8126f12012-07-13 05:03:45 -0700480 dst = rt_nexthop(rt, old_iph->daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 }
482
David S. Miller31e45432011-05-03 20:25:42 -0700483 rt = ip_route_output_ports(dev_net(dev), &fl4, NULL,
David S. Miller78fbfd82011-03-12 00:00:52 -0500484 dst, tiph->saddr,
485 0, 0,
486 IPPROTO_IPIP, RT_TOS(tos),
487 tunnel->parms.link);
488 if (IS_ERR(rt)) {
489 dev->stats.tx_carrier_errors++;
490 goto tx_error_icmp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700491 }
Changli Gaod8d1f302010-06-10 23:31:35 -0700492 tdev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493
494 if (tdev == dev) {
495 ip_rt_put(rt);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000496 dev->stats.collisions++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497 goto tx_error;
498 }
499
Herbert Xu23ca0c92009-11-06 10:37:41 +0000500 df |= old_iph->frag_off & htons(IP_DF);
501
502 if (df) {
Changli Gaod8d1f302010-06-10 23:31:35 -0700503 mtu = dst_mtu(&rt->dst) - sizeof(struct iphdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700504
Herbert Xu23ca0c92009-11-06 10:37:41 +0000505 if (mtu < 68) {
Eric Dumazet3c97af92010-09-27 00:35:50 +0000506 dev->stats.collisions++;
Herbert Xu23ca0c92009-11-06 10:37:41 +0000507 ip_rt_put(rt);
508 goto tx_error;
509 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
Herbert Xu23ca0c92009-11-06 10:37:41 +0000511 if (skb_dst(skb))
David S. Miller6700c272012-07-17 03:29:28 -0700512 skb_dst(skb)->ops->update_pmtu(skb_dst(skb), NULL, skb, mtu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513
Herbert Xu23ca0c92009-11-06 10:37:41 +0000514 if ((old_iph->frag_off & htons(IP_DF)) &&
515 mtu < ntohs(old_iph->tot_len)) {
516 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED,
517 htonl(mtu));
518 ip_rt_put(rt);
519 goto tx_error;
520 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 }
522
523 if (tunnel->err_count > 0) {
Wei Yongjun26d94b42009-02-24 23:36:47 -0800524 if (time_before(jiffies,
525 tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700526 tunnel->err_count--;
527 dst_link_failure(skb);
528 } else
529 tunnel->err_count = 0;
530 }
531
532 /*
533 * Okay, now see if we can stuff it in the buffer as-is.
534 */
535 max_headroom = (LL_RESERVED_SPACE(tdev)+sizeof(struct iphdr));
536
Patrick McHardycfbba492007-07-09 15:33:40 -0700537 if (skb_headroom(skb) < max_headroom || skb_shared(skb) ||
538 (skb_cloned(skb) && !skb_clone_writable(skb, 0))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700539 struct sk_buff *new_skb = skb_realloc_headroom(skb, max_headroom);
540 if (!new_skb) {
541 ip_rt_put(rt);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000542 dev->stats.tx_dropped++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700543 dev_kfree_skb(skb);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000544 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545 }
546 if (skb->sk)
547 skb_set_owner_w(new_skb, skb->sk);
548 dev_kfree_skb(skb);
549 skb = new_skb;
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700550 old_iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 }
552
Arnaldo Carvalho de Melob0e380b2007-04-10 21:21:55 -0700553 skb->transport_header = skb->network_header;
Arnaldo Carvalho de Meloe2d1bca2007-04-10 20:46:21 -0700554 skb_push(skb, sizeof(struct iphdr));
555 skb_reset_network_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700556 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
Patrick McHardy48d5cad2006-02-15 15:10:22 -0800557 IPCB(skb)->flags &= ~(IPSKB_XFRM_TUNNEL_SIZE | IPSKB_XFRM_TRANSFORMED |
558 IPSKB_REROUTED);
Eric Dumazetadf30902009-06-02 05:19:30 +0000559 skb_dst_drop(skb);
Changli Gaod8d1f302010-06-10 23:31:35 -0700560 skb_dst_set(skb, &rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561
562 /*
563 * Push down and install the IPIP header.
564 */
565
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700566 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567 iph->version = 4;
568 iph->ihl = sizeof(struct iphdr)>>2;
569 iph->frag_off = df;
570 iph->protocol = IPPROTO_IPIP;
571 iph->tos = INET_ECN_encapsulate(tos, old_iph->tos);
David S. Miller69458cb2011-05-04 11:10:28 -0700572 iph->daddr = fl4.daddr;
573 iph->saddr = fl4.saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574
575 if ((iph->ttl = tiph->ttl) == 0)
576 iph->ttl = old_iph->ttl;
577
Amerigo Wangaa0010f2012-11-11 21:52:33 +0000578 iptunnel_xmit(skb, dev);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000579 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580
581tx_error_icmp:
582 dst_link_failure(skb);
583tx_error:
Eric Dumazet3c97af92010-09-27 00:35:50 +0000584 dev->stats.tx_errors++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 dev_kfree_skb(skb);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000586 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587}
588
Michal Schmidt55339952007-12-12 11:01:43 -0800589static void ipip_tunnel_bind_dev(struct net_device *dev)
590{
591 struct net_device *tdev = NULL;
592 struct ip_tunnel *tunnel;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000593 const struct iphdr *iph;
Michal Schmidt55339952007-12-12 11:01:43 -0800594
595 tunnel = netdev_priv(dev);
596 iph = &tunnel->parms.iph;
597
598 if (iph->daddr) {
David S. Miller31e45432011-05-03 20:25:42 -0700599 struct rtable *rt;
600 struct flowi4 fl4;
Eric Dumazet3c97af92010-09-27 00:35:50 +0000601
David S. Miller31e45432011-05-03 20:25:42 -0700602 rt = ip_route_output_ports(dev_net(dev), &fl4, NULL,
603 iph->daddr, iph->saddr,
604 0, 0,
605 IPPROTO_IPIP,
606 RT_TOS(iph->tos),
607 tunnel->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800608 if (!IS_ERR(rt)) {
Changli Gaod8d1f302010-06-10 23:31:35 -0700609 tdev = rt->dst.dev;
Michal Schmidt55339952007-12-12 11:01:43 -0800610 ip_rt_put(rt);
611 }
612 dev->flags |= IFF_POINTOPOINT;
613 }
614
615 if (!tdev && tunnel->parms.link)
Pavel Emelyanovb99f0152008-04-16 01:05:57 -0700616 tdev = __dev_get_by_index(dev_net(dev), tunnel->parms.link);
Michal Schmidt55339952007-12-12 11:01:43 -0800617
618 if (tdev) {
619 dev->hard_header_len = tdev->hard_header_len + sizeof(struct iphdr);
620 dev->mtu = tdev->mtu - sizeof(struct iphdr);
621 }
622 dev->iflink = tunnel->parms.link;
623}
624
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625static int
626ipip_tunnel_ioctl (struct net_device *dev, struct ifreq *ifr, int cmd)
627{
628 int err = 0;
629 struct ip_tunnel_parm p;
630 struct ip_tunnel *t;
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700631 struct net *net = dev_net(dev);
632 struct ipip_net *ipn = net_generic(net, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700633
634 switch (cmd) {
635 case SIOCGETTUNNEL:
636 t = NULL;
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700637 if (dev == ipn->fb_tunnel_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700638 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p))) {
639 err = -EFAULT;
640 break;
641 }
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700642 t = ipip_tunnel_locate(net, &p, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643 }
644 if (t == NULL)
Patrick McHardy2941a482006-01-08 22:05:26 -0800645 t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700646 memcpy(&p, &t->parms, sizeof(p));
647 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
648 err = -EFAULT;
649 break;
650
651 case SIOCADDTUNNEL:
652 case SIOCCHGTUNNEL:
653 err = -EPERM;
654 if (!capable(CAP_NET_ADMIN))
655 goto done;
656
657 err = -EFAULT;
658 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
659 goto done;
660
661 err = -EINVAL;
662 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_IPIP ||
663 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)))
664 goto done;
665 if (p.iph.ttl)
666 p.iph.frag_off |= htons(IP_DF);
667
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700668 t = ipip_tunnel_locate(net, &p, cmd == SIOCADDTUNNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700670 if (dev != ipn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671 if (t != NULL) {
672 if (t->dev != dev) {
673 err = -EEXIST;
674 break;
675 }
676 } else {
677 if (((dev->flags&IFF_POINTOPOINT) && !p.iph.daddr) ||
678 (!(dev->flags&IFF_POINTOPOINT) && p.iph.daddr)) {
679 err = -EINVAL;
680 break;
681 }
Patrick McHardy2941a482006-01-08 22:05:26 -0800682 t = netdev_priv(dev);
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700683 ipip_tunnel_unlink(ipn, t);
Pavel Emelyanov74b0b852010-10-27 05:43:53 +0000684 synchronize_net();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685 t->parms.iph.saddr = p.iph.saddr;
686 t->parms.iph.daddr = p.iph.daddr;
687 memcpy(dev->dev_addr, &p.iph.saddr, 4);
688 memcpy(dev->broadcast, &p.iph.daddr, 4);
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700689 ipip_tunnel_link(ipn, t);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700690 netdev_state_change(dev);
691 }
692 }
693
694 if (t) {
695 err = 0;
696 if (cmd == SIOCCHGTUNNEL) {
697 t->parms.iph.ttl = p.iph.ttl;
698 t->parms.iph.tos = p.iph.tos;
699 t->parms.iph.frag_off = p.iph.frag_off;
Michal Schmidt55339952007-12-12 11:01:43 -0800700 if (t->parms.link != p.link) {
701 t->parms.link = p.link;
702 ipip_tunnel_bind_dev(dev);
703 netdev_state_change(dev);
704 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705 }
706 if (copy_to_user(ifr->ifr_ifru.ifru_data, &t->parms, sizeof(p)))
707 err = -EFAULT;
708 } else
709 err = (cmd == SIOCADDTUNNEL ? -ENOBUFS : -ENOENT);
710 break;
711
712 case SIOCDELTUNNEL:
713 err = -EPERM;
714 if (!capable(CAP_NET_ADMIN))
715 goto done;
716
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700717 if (dev == ipn->fb_tunnel_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 err = -EFAULT;
719 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
720 goto done;
721 err = -ENOENT;
Pavel Emelyanovb9fae5c2008-04-16 01:04:35 -0700722 if ((t = ipip_tunnel_locate(net, &p, 0)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 goto done;
724 err = -EPERM;
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700725 if (t->dev == ipn->fb_tunnel_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726 goto done;
727 dev = t->dev;
728 }
Stephen Hemminger22f8cde2007-02-07 00:09:58 -0800729 unregister_netdevice(dev);
730 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731 break;
732
733 default:
734 err = -EINVAL;
735 }
736
737done:
738 return err;
739}
740
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741static int ipip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
742{
743 if (new_mtu < 68 || new_mtu > 0xFFF8 - sizeof(struct iphdr))
744 return -EINVAL;
745 dev->mtu = new_mtu;
746 return 0;
747}
748
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800749static const struct net_device_ops ipip_netdev_ops = {
750 .ndo_uninit = ipip_tunnel_uninit,
751 .ndo_start_xmit = ipip_tunnel_xmit,
752 .ndo_do_ioctl = ipip_tunnel_ioctl,
753 .ndo_change_mtu = ipip_tunnel_change_mtu,
stephen hemminger87b6d212012-04-12 06:31:16 +0000754 .ndo_get_stats64 = ipip_get_stats64,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800755};
756
Eric Dumazet3c97af92010-09-27 00:35:50 +0000757static void ipip_dev_free(struct net_device *dev)
758{
759 free_percpu(dev->tstats);
760 free_netdev(dev);
761}
762
/* Feature bits OR-ed into both dev->features and dev->hw_features at setup. */
#define IPIP_FEATURES \
	(NETIF_F_SG | NETIF_F_FRAGLIST | NETIF_F_HIGHDMA | NETIF_F_HW_CSUM)
767
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768static void ipip_tunnel_setup(struct net_device *dev)
769{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800770 dev->netdev_ops = &ipip_netdev_ops;
Eric Dumazet3c97af92010-09-27 00:35:50 +0000771 dev->destructor = ipip_dev_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772
773 dev->type = ARPHRD_TUNNEL;
774 dev->hard_header_len = LL_MAX_HEADER + sizeof(struct iphdr);
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800775 dev->mtu = ETH_DATA_LEN - sizeof(struct iphdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700776 dev->flags = IFF_NOARP;
777 dev->iflink = 0;
778 dev->addr_len = 4;
Pavel Emelyanov0a826402008-04-16 01:06:18 -0700779 dev->features |= NETIF_F_NETNS_LOCAL;
Eric Dumazet153f0942010-09-28 00:17:17 +0000780 dev->features |= NETIF_F_LLTX;
Eric Dumazet28e72212009-05-28 10:44:30 +0000781 dev->priv_flags &= ~IFF_XMIT_DST_RELEASE;
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000782
783 dev->features |= IPIP_FEATURES;
784 dev->hw_features |= IPIP_FEATURES;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700785}
786
Eric Dumazet3c97af92010-09-27 00:35:50 +0000787static int ipip_tunnel_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800789 struct ip_tunnel *tunnel = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790
791 tunnel->dev = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792
793 memcpy(dev->dev_addr, &tunnel->parms.iph.saddr, 4);
794 memcpy(dev->broadcast, &tunnel->parms.iph.daddr, 4);
795
Michal Schmidt55339952007-12-12 11:01:43 -0800796 ipip_tunnel_bind_dev(dev);
Eric Dumazet3c97af92010-09-27 00:35:50 +0000797
798 dev->tstats = alloc_percpu(struct pcpu_tstats);
799 if (!dev->tstats)
800 return -ENOMEM;
801
802 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803}
804
Eric Dumazetfada5632010-09-27 23:56:46 +0000805static int __net_init ipip_fb_tunnel_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700806{
Patrick McHardy2941a482006-01-08 22:05:26 -0800807 struct ip_tunnel *tunnel = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808 struct iphdr *iph = &tunnel->parms.iph;
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700809 struct ipip_net *ipn = net_generic(dev_net(dev), ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700810
811 tunnel->dev = dev;
812 strcpy(tunnel->parms.name, dev->name);
813
814 iph->version = 4;
815 iph->protocol = IPPROTO_IPIP;
816 iph->ihl = 5;
817
Eric Dumazetfada5632010-09-27 23:56:46 +0000818 dev->tstats = alloc_percpu(struct pcpu_tstats);
819 if (!dev->tstats)
820 return -ENOMEM;
821
Linus Torvalds1da177e2005-04-16 15:20:36 -0700822 dev_hold(dev);
Eric Dumazetcf778b02012-01-12 04:41:32 +0000823 rcu_assign_pointer(ipn->tunnels_wc[0], tunnel);
Eric Dumazetfada5632010-09-27 23:56:46 +0000824 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700825}
826
Nicolas Dichtel09746582012-11-09 06:09:59 +0000827static size_t ipip_get_size(const struct net_device *dev)
828{
829 return
830 /* IFLA_IPTUN_LINK */
831 nla_total_size(4) +
832 /* IFLA_IPTUN_LOCAL */
833 nla_total_size(4) +
834 /* IFLA_IPTUN_REMOTE */
835 nla_total_size(4) +
836 /* IFLA_IPTUN_TTL */
837 nla_total_size(1) +
838 /* IFLA_IPTUN_TOS */
839 nla_total_size(1) +
840 0;
841}
842
843static int ipip_fill_info(struct sk_buff *skb, const struct net_device *dev)
844{
845 struct ip_tunnel *tunnel = netdev_priv(dev);
846 struct ip_tunnel_parm *parm = &tunnel->parms;
847
848 if (nla_put_u32(skb, IFLA_IPTUN_LINK, parm->link) ||
849 nla_put_be32(skb, IFLA_IPTUN_LOCAL, parm->iph.saddr) ||
850 nla_put_be32(skb, IFLA_IPTUN_REMOTE, parm->iph.daddr) ||
851 nla_put_u8(skb, IFLA_IPTUN_TTL, parm->iph.ttl) ||
852 nla_put_u8(skb, IFLA_IPTUN_TOS, parm->iph.tos))
853 goto nla_put_failure;
854 return 0;
855
856nla_put_failure:
857 return -EMSGSIZE;
858}
859
860static struct rtnl_link_ops ipip_link_ops __read_mostly = {
861 .kind = "ipip",
862 .maxtype = IFLA_IPTUN_MAX,
863 .priv_size = sizeof(struct ip_tunnel),
864 .get_size = ipip_get_size,
865 .fill_info = ipip_fill_info,
866};
867
Eric Dumazet6dcd8142010-08-30 07:04:14 +0000868static struct xfrm_tunnel ipip_handler __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869 .handler = ipip_rcv,
870 .err_handler = ipip_err,
Herbert Xud2acc342006-03-28 01:12:13 -0800871 .priority = 1,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872};
873
Stephen Hemminger5747a1a2009-02-22 00:02:08 -0800874static const char banner[] __initconst =
Linus Torvalds1da177e2005-04-16 15:20:36 -0700875 KERN_INFO "IPv4 over IPv4 tunneling driver\n";
876
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000877static void ipip_destroy_tunnels(struct ipip_net *ipn, struct list_head *head)
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700878{
879 int prio;
880
881 for (prio = 1; prio < 4; prio++) {
882 int h;
883 for (h = 0; h < HASH_SIZE; h++) {
Eric Dumazetb7285b72010-09-15 11:07:24 +0000884 struct ip_tunnel *t;
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000885
Eric Dumazetb7285b72010-09-15 11:07:24 +0000886 t = rtnl_dereference(ipn->tunnels[prio][h]);
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000887 while (t != NULL) {
888 unregister_netdevice_queue(t->dev, head);
Eric Dumazetb7285b72010-09-15 11:07:24 +0000889 t = rtnl_dereference(t->next);
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000890 }
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700891 }
892 }
893}
894
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000895static int __net_init ipip_init_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700896{
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000897 struct ipip_net *ipn = net_generic(net, ipip_net_id);
Ted Feng72b36012011-12-08 00:46:21 +0000898 struct ip_tunnel *t;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700899 int err;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700900
Pavel Emelyanov44d3c292008-04-16 01:05:32 -0700901 ipn->tunnels[0] = ipn->tunnels_wc;
902 ipn->tunnels[1] = ipn->tunnels_l;
903 ipn->tunnels[2] = ipn->tunnels_r;
904 ipn->tunnels[3] = ipn->tunnels_r_l;
905
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700906 ipn->fb_tunnel_dev = alloc_netdev(sizeof(struct ip_tunnel),
907 "tunl0",
908 ipip_tunnel_setup);
909 if (!ipn->fb_tunnel_dev) {
910 err = -ENOMEM;
911 goto err_alloc_dev;
912 }
Alexey Dobriyanbe77e592008-11-23 17:26:26 -0800913 dev_net_set(ipn->fb_tunnel_dev, net);
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700914
Eric Dumazetfada5632010-09-27 23:56:46 +0000915 err = ipip_fb_tunnel_init(ipn->fb_tunnel_dev);
916 if (err)
917 goto err_reg_dev;
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700918
919 if ((err = register_netdev(ipn->fb_tunnel_dev)))
920 goto err_reg_dev;
921
Ted Feng72b36012011-12-08 00:46:21 +0000922 t = netdev_priv(ipn->fb_tunnel_dev);
923
924 strcpy(t->parms.name, ipn->fb_tunnel_dev->name);
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700925 return 0;
926
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700927err_reg_dev:
Eric Dumazetfada5632010-09-27 23:56:46 +0000928 ipip_dev_free(ipn->fb_tunnel_dev);
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700929err_alloc_dev:
930 /* nothing */
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700931 return err;
932}
933
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000934static void __net_exit ipip_exit_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700935{
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000936 struct ipip_net *ipn = net_generic(net, ipip_net_id);
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000937 LIST_HEAD(list);
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700938
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700939 rtnl_lock();
Eric Dumazet0694c4c2009-10-27 07:06:59 +0000940 ipip_destroy_tunnels(ipn, &list);
941 unregister_netdevice_queue(ipn->fb_tunnel_dev, &list);
942 unregister_netdevice_many(&list);
Pavel Emelyanovb9855c52008-04-16 01:04:13 -0700943 rtnl_unlock();
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700944}
945
946static struct pernet_operations ipip_net_ops = {
947 .init = ipip_init_net,
948 .exit = ipip_exit_net,
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000949 .id = &ipip_net_id,
950 .size = sizeof(struct ipip_net),
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700951};
952
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953static int __init ipip_init(void)
954{
955 int err;
956
957 printk(banner);
958
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000959 err = register_pernet_device(&ipip_net_ops);
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000960 if (err < 0)
961 return err;
962 err = xfrm4_tunnel_register(&ipip_handler, AF_INET);
963 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +0000964 pr_info("%s: can't register tunnel\n", __func__);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000965 goto xfrm_tunnel_failed;
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000966 }
Nicolas Dichtel09746582012-11-09 06:09:59 +0000967 err = rtnl_link_register(&ipip_link_ops);
968 if (err < 0)
969 goto rtnl_link_failed;
970
971out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700972 return err;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000973
974rtnl_link_failed:
975 xfrm4_tunnel_deregister(&ipip_handler, AF_INET);
976xfrm_tunnel_failed:
977 unregister_pernet_device(&ipip_net_ops);
978 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700979}
980
981static void __exit ipip_fini(void)
982{
Nicolas Dichtel09746582012-11-09 06:09:59 +0000983 rtnl_link_unregister(&ipip_link_ops);
Kazunori MIYAZAWAc0d56402007-02-13 12:54:47 -0800984 if (xfrm4_tunnel_deregister(&ipip_handler, AF_INET))
Joe Perches058bd4d2012-03-11 18:36:11 +0000985 pr_info("%s: can't deregister tunnel\n", __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000987 unregister_pernet_device(&ipip_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988}
989
990module_init(ipip_init);
991module_exit(ipip_fini);
992MODULE_LICENSE("GPL");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +0300993MODULE_ALIAS_NETDEV("tunl0");