blob: 5a20ba9b9b50089a72801d73f14a29d873241065 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: GRE over IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Joe Perchesafd465032012-03-12 07:03:32 +000013#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14
Randy Dunlap4fc268d2006-01-11 12:17:47 -080015#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/module.h>
17#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090019#include <linux/slab.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080020#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/skbuff.h>
22#include <linux/netdevice.h>
23#include <linux/in.h>
24#include <linux/tcp.h>
25#include <linux/udp.h>
26#include <linux/if_arp.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070027#include <linux/if_vlan.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/init.h>
29#include <linux/in6.h>
30#include <linux/inetdevice.h>
31#include <linux/igmp.h>
32#include <linux/netfilter_ipv4.h>
Herbert Xue1a80002008-10-09 12:00:17 -070033#include <linux/etherdevice.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080034#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#include <net/sock.h>
37#include <net/ip.h>
38#include <net/icmp.h>
39#include <net/protocol.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000040#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/arp.h>
42#include <net/checksum.h>
43#include <net/dsfield.h>
44#include <net/inet_ecn.h>
45#include <net/xfrm.h>
Pavel Emelyanov59a4c752008-04-16 01:08:53 -070046#include <net/net_namespace.h>
47#include <net/netns/generic.h>
Herbert Xuc19e6542008-10-09 11:59:55 -070048#include <net/rtnetlink.h>
Dmitry Kozlov00959ad2010-08-21 23:05:39 -070049#include <net/gre.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070050#include <net/dst_metadata.h>
William Tu84e54fe2017-08-22 09:40:28 -070051#include <net/erspan.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070052
/*
   Problems & solutions
   --------------------

   1. The most important issue is detecting local dead loops.
   They would cause complete host lockup in transmit, which
   would be "resolved" by stack overflow or, if queueing is enabled,
   with infinite looping in net_bh.

   We cannot track such dead loops during route installation,
   it is an infeasible task. The most general solution would be
   to keep an skb->encapsulation counter (sort of local ttl),
   and silently drop the packet when it expires. It is a good
   solution, but it supposes maintaining a new variable in ALL
   skbs, even if no tunneling is used.

   Current solution: xmit_recursion breaks dead loops. This is a percpu
   counter, since when we enter the first ndo_xmit(), cpu migration is
   forbidden. We force an exit if this counter reaches RECURSION_LIMIT.

   2. Networking dead loops would not kill routers, but would really
   kill the network. IP hop limit plays the role of "t->recursion" in this
   case, if we copy it from the packet being encapsulated to the upper header.
   It is a very good solution, but it introduces two problems:

   - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
     do not work over tunnels.
   - traceroute does not work. I planned to relay ICMP from the tunnel,
     so that this problem would be solved and traceroute output
     would be even more informative. This idea appeared to be wrong:
     only Linux complies to rfc1812 now (yes, guys, Linux is the only
     true router now :-)), all routers (at least, in neighbourhood of mine)
     return only 8 bytes of payload. It is the end.

   Hence, if we want OSPF to work or traceroute to say something reasonable,
   we should search for another solution.

   One of them is to parse the packet trying to detect inner encapsulation
   made by our node. It is difficult or even impossible, especially,
   taking into account fragmentation. To be short, ttl is not a solution at all.

   Current solution: The solution was UNEXPECTEDLY SIMPLE.
   We force the DF flag on tunnels with a preconfigured hop limit,
   that is ALL. :-) Well, it does not remove the problem completely,
   but exponential growth of network traffic is changed to linear
   (branches that exceed pmtu are pruned) and tunnel mtu
   rapidly degrades to a value <68, where looping stops.
   Yes, it is not good if there exists a router in the loop,
   which does not force DF, even when encapsulating packets have DF set.
   But it is not our problem! Nobody could accuse us, we made
   all that we could make. Even if it is your gated who injected
   a fatal route to the network, even if it were you who configured
   a fatal static route: you are innocent. :-)

   Alexey Kuznetsov.
 */
109
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000110static bool log_ecn_error = true;
111module_param(log_ecn_error, bool, 0644);
112MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
113
Herbert Xuc19e6542008-10-09 11:59:55 -0700114static struct rtnl_link_ops ipgre_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115static int ipgre_tunnel_init(struct net_device *dev);
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700116
Alexey Dobriyanc7d03a02016-11-17 04:58:21 +0300117static unsigned int ipgre_net_id __read_mostly;
118static unsigned int gre_tap_net_id __read_mostly;
William Tu84e54fe2017-08-22 09:40:28 -0700119static unsigned int erspan_net_id __read_mostly;
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700120
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700121static void ipgre_err(struct sk_buff *skb, u32 info,
122 const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124
Pravin B Shelarc5441932013-03-25 14:49:35 +0000125 /* All the routers (except for Linux) return only
126 8 bytes of packet payload. It means, that precise relaying of
127 ICMP in the real Internet is absolutely infeasible.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
Pravin B Shelarc5441932013-03-25 14:49:35 +0000129 Moreover, Cisco "wise men" put GRE key to the third word
130 in GRE header. It makes impossible maintaining even soft
131 state for keyed GRE tunnels with enabled checksum. Tell
132 them "thank you".
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133
Pravin B Shelarc5441932013-03-25 14:49:35 +0000134 Well, I wonder, rfc1812 was written by Cisco employee,
135 what the hell these idiots break standards established
136 by themselves???
137 */
138 struct net *net = dev_net(skb->dev);
139 struct ip_tunnel_net *itn;
Eric Dumazet96f5a842013-05-18 08:36:03 +0000140 const struct iphdr *iph;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300141 const int type = icmp_hdr(skb)->type;
142 const int code = icmp_hdr(skb)->code;
Eric Dumazet20e19542016-06-18 21:52:06 -0700143 unsigned int data_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144 struct ip_tunnel *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146 switch (type) {
147 default:
148 case ICMP_PARAMETERPROB:
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700149 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150
151 case ICMP_DEST_UNREACH:
152 switch (code) {
153 case ICMP_SR_FAILED:
154 case ICMP_PORT_UNREACH:
155 /* Impossible event. */
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700156 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 default:
158 /* All others are translated to HOST_UNREACH.
159 rfc2003 contains "deep thoughts" about NET_UNREACH,
160 I believe they are just ether pollution. --ANK
161 */
162 break;
163 }
164 break;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700165
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166 case ICMP_TIME_EXCEEDED:
167 if (code != ICMP_EXC_TTL)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700168 return;
Eric Dumazet20e19542016-06-18 21:52:06 -0700169 data_len = icmp_hdr(skb)->un.reserved[1] * 4; /* RFC 4884 4.1 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700171
172 case ICMP_REDIRECT:
173 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 }
175
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700176 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000177 itn = net_generic(net, gre_tap_net_id);
178 else
179 itn = net_generic(net, ipgre_net_id);
180
Duan Jiongc0c0c502014-01-28 11:49:43 +0800181 iph = (const struct iphdr *)(icmp_hdr(skb) + 1);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700182 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
183 iph->daddr, iph->saddr, tpi->key);
stephen hemmingerd2083282012-09-24 18:12:23 +0000184
Ian Morris51456b22015-04-03 09:17:26 +0100185 if (!t)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700186 return;
David S. Miller36393392012-06-14 22:21:46 -0700187
Eric Dumazet9b8c6d72016-06-18 21:52:05 -0700188#if IS_ENABLED(CONFIG_IPV6)
189 if (tpi->proto == htons(ETH_P_IPV6) &&
Eric Dumazet20e19542016-06-18 21:52:06 -0700190 !ip6_err_gen_icmpv6_unreach(skb, iph->ihl * 4 + tpi->hdr_len,
191 type, data_len))
Eric Dumazet9b8c6d72016-06-18 21:52:05 -0700192 return;
193#endif
194
David S. Miller36393392012-06-14 22:21:46 -0700195 if (t->parms.iph.daddr == 0 ||
Joe Perchesf97c1e02007-12-16 13:45:43 -0800196 ipv4_is_multicast(t->parms.iph.daddr))
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700197 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198
199 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700200 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201
Wei Yongjunda6185d82009-02-24 23:34:48 -0800202 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 t->err_count++;
204 else
205 t->err_count = 1;
206 t->err_time = jiffies;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700207}
208
209static void gre_err(struct sk_buff *skb, u32 info)
210{
211 /* All the routers (except for Linux) return only
212 * 8 bytes of packet payload. It means, that precise relaying of
213 * ICMP in the real Internet is absolutely infeasible.
214 *
215 * Moreover, Cisco "wise men" put GRE key to the third word
216 * in GRE header. It makes impossible maintaining even soft
217 * state for keyed
218 * GRE tunnels with enabled checksum. Tell them "thank you".
219 *
220 * Well, I wonder, rfc1812 was written by Cisco employee,
221 * what the hell these idiots break standards established
222 * by themselves???
223 */
224
Eric Dumazete582615ad2016-06-15 06:24:00 -0700225 const struct iphdr *iph = (struct iphdr *)skb->data;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700226 const int type = icmp_hdr(skb)->type;
227 const int code = icmp_hdr(skb)->code;
228 struct tnl_ptk_info tpi;
229 bool csum_err = false;
230
Eric Dumazete582615ad2016-06-15 06:24:00 -0700231 if (gre_parse_header(skb, &tpi, &csum_err, htons(ETH_P_IP),
232 iph->ihl * 4) < 0) {
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700233 if (!csum_err) /* ignore csum errors. */
234 return;
235 }
236
237 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
238 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
239 skb->dev->ifindex, 0, IPPROTO_GRE, 0);
240 return;
241 }
242 if (type == ICMP_REDIRECT) {
243 ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
244 IPPROTO_GRE, 0);
245 return;
246 }
247
248 ipgre_err(skb, info, &tpi);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249}
250
William Tu84e54fe2017-08-22 09:40:28 -0700251static int erspan_rcv(struct sk_buff *skb, struct tnl_ptk_info *tpi,
252 int gre_hdr_len)
253{
254 struct net *net = dev_net(skb->dev);
255 struct metadata_dst *tun_dst = NULL;
256 struct ip_tunnel_net *itn;
257 struct ip_tunnel *tunnel;
258 struct erspanhdr *ershdr;
259 const struct iphdr *iph;
260 __be32 session_id;
261 __be32 index;
262 int len;
263
264 itn = net_generic(net, erspan_net_id);
265 iph = ip_hdr(skb);
266 len = gre_hdr_len + sizeof(*ershdr);
267
268 if (unlikely(!pskb_may_pull(skb, len)))
269 return -ENOMEM;
270
271 iph = ip_hdr(skb);
272 ershdr = (struct erspanhdr *)(skb->data + gre_hdr_len);
273
274 /* The original GRE header does not have key field,
275 * Use ERSPAN 10-bit session ID as key.
276 */
277 session_id = cpu_to_be32(ntohs(ershdr->session_id));
278 tpi->key = session_id;
279 index = ershdr->md.index;
280 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex,
281 tpi->flags | TUNNEL_KEY,
282 iph->saddr, iph->daddr, tpi->key);
283
284 if (tunnel) {
285 if (__iptunnel_pull_header(skb,
286 gre_hdr_len + sizeof(*ershdr),
287 htons(ETH_P_TEB),
288 false, false) < 0)
289 goto drop;
290
291 tunnel->index = ntohl(index);
292 skb_reset_mac_header(skb);
293 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
294 return PACKET_RCVD;
295 }
296drop:
297 kfree_skb(skb);
298 return PACKET_RCVD;
299}
300
Jiri Benc125372f2016-05-03 17:10:08 +0200301static int __ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
302 struct ip_tunnel_net *itn, int hdr_len, bool raw_proto)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700304 struct metadata_dst *tun_dst = NULL;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000305 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 struct ip_tunnel *tunnel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700308 iph = ip_hdr(skb);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700309 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
310 iph->saddr, iph->daddr, tpi->key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311
stephen hemmingerd2083282012-09-24 18:12:23 +0000312 if (tunnel) {
Jiri Benc125372f2016-05-03 17:10:08 +0200313 if (__iptunnel_pull_header(skb, hdr_len, tpi->proto,
314 raw_proto, false) < 0)
Jiri Benc244a7972016-05-03 17:10:07 +0200315 goto drop;
316
Jiri Bence271c7b2016-05-11 15:53:57 +0200317 if (tunnel->dev->type != ARPHRD_NONE)
318 skb_pop_mac_header(skb);
319 else
320 skb_reset_mac_header(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700321 if (tunnel->collect_md) {
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700322 __be16 flags;
323 __be64 tun_id;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700324
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700325 flags = tpi->flags & (TUNNEL_CSUM | TUNNEL_KEY);
Amir Vadaid817f432016-09-08 16:23:45 +0300326 tun_id = key32_to_tunnel_id(tpi->key);
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700327 tun_dst = ip_tun_rx_dst(skb, flags, tun_id, 0);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700328 if (!tun_dst)
329 return PACKET_REJECT;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700330 }
331
332 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700333 return PACKET_RCVD;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334 }
Jiri Benc125372f2016-05-03 17:10:08 +0200335 return PACKET_NEXT;
Jiri Benc244a7972016-05-03 17:10:07 +0200336
337drop:
338 kfree_skb(skb);
339 return PACKET_RCVD;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340}
341
Jiri Benc125372f2016-05-03 17:10:08 +0200342static int ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
343 int hdr_len)
344{
345 struct net *net = dev_net(skb->dev);
346 struct ip_tunnel_net *itn;
347 int res;
348
349 if (tpi->proto == htons(ETH_P_TEB))
350 itn = net_generic(net, gre_tap_net_id);
351 else
352 itn = net_generic(net, ipgre_net_id);
353
354 res = __ipgre_rcv(skb, tpi, itn, hdr_len, false);
355 if (res == PACKET_NEXT && tpi->proto == htons(ETH_P_TEB)) {
356 /* ipgre tunnels in collect metadata mode should receive
357 * also ETH_P_TEB traffic.
358 */
359 itn = net_generic(net, ipgre_net_id);
360 res = __ipgre_rcv(skb, tpi, itn, hdr_len, true);
361 }
362 return res;
363}
364
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700365static int gre_rcv(struct sk_buff *skb)
366{
367 struct tnl_ptk_info tpi;
368 bool csum_err = false;
Tom Herbert95f5c642016-04-29 17:12:16 -0700369 int hdr_len;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700370
371#ifdef CONFIG_NET_IPGRE_BROADCAST
372 if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
373 /* Looped back packet, drop it! */
374 if (rt_is_output_route(skb_rtable(skb)))
375 goto drop;
376 }
377#endif
378
Eric Dumazete582615ad2016-06-15 06:24:00 -0700379 hdr_len = gre_parse_header(skb, &tpi, &csum_err, htons(ETH_P_IP), 0);
Jiri Bencf132ae72016-05-03 15:00:21 +0200380 if (hdr_len < 0)
Tom Herbert95f5c642016-04-29 17:12:16 -0700381 goto drop;
382
William Tu84e54fe2017-08-22 09:40:28 -0700383 if (unlikely(tpi.proto == htons(ETH_P_ERSPAN))) {
384 if (erspan_rcv(skb, &tpi, hdr_len) == PACKET_RCVD)
385 return 0;
386 }
387
Jiri Benc244a7972016-05-03 17:10:07 +0200388 if (ipgre_rcv(skb, &tpi, hdr_len) == PACKET_RCVD)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700389 return 0;
390
391 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
392drop:
393 kfree_skb(skb);
394 return 0;
395}
396
Pravin B Shelarc5441932013-03-25 14:49:35 +0000397static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
398 const struct iphdr *tnl_params,
399 __be16 proto)
400{
401 struct ip_tunnel *tunnel = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000402
Pravin B Shelarc5441932013-03-25 14:49:35 +0000403 if (tunnel->parms.o_flags & TUNNEL_SEQ)
404 tunnel->o_seqno++;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000405
Pravin B Shelarc5441932013-03-25 14:49:35 +0000406 /* Push GRE header. */
Tom Herbert182a3522016-04-29 17:12:19 -0700407 gre_build_header(skb, tunnel->tun_hlen,
408 tunnel->parms.o_flags, proto, tunnel->parms.o_key,
409 htonl(tunnel->o_seqno));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410
Nicolas Dichtelbf3d6a82013-05-27 23:48:15 +0000411 ip_tunnel_xmit(skb, dev, tnl_params, tnl_params->protocol);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700412}
413
Alexander Duyckaed069d2016-04-14 15:33:37 -0400414static int gre_handle_offloads(struct sk_buff *skb, bool csum)
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700415{
Edward Cree6fa79662016-02-11 21:02:31 +0000416 return iptunnel_handle_offloads(skb, csum ? SKB_GSO_GRE_CSUM : SKB_GSO_GRE);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700417}
418
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700419static struct rtable *gre_get_rt(struct sk_buff *skb,
420 struct net_device *dev,
421 struct flowi4 *fl,
422 const struct ip_tunnel_key *key)
423{
424 struct net *net = dev_net(dev);
425
426 memset(fl, 0, sizeof(*fl));
427 fl->daddr = key->u.ipv4.dst;
428 fl->saddr = key->u.ipv4.src;
429 fl->flowi4_tos = RT_TOS(key->tos);
430 fl->flowi4_mark = skb->mark;
431 fl->flowi4_proto = IPPROTO_GRE;
432
433 return ip_route_output_key(net, fl);
434}
435
Jiri Benc20907142016-04-27 11:29:07 +0200436static void gre_fb_xmit(struct sk_buff *skb, struct net_device *dev,
437 __be16 proto)
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700438{
439 struct ip_tunnel_info *tun_info;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700440 const struct ip_tunnel_key *key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100441 struct rtable *rt = NULL;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700442 struct flowi4 fl;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700443 int min_headroom;
444 int tunnel_hlen;
445 __be16 df, flags;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100446 bool use_cache;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700447 int err;
448
Jiri Benc61adedf2015-08-20 13:56:25 +0200449 tun_info = skb_tunnel_info(skb);
Jiri Benc7f9562a2015-08-28 20:48:20 +0200450 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
451 ip_tunnel_info_af(tun_info) != AF_INET))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700452 goto err_free_skb;
453
454 key = &tun_info->key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100455 use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
456 if (use_cache)
457 rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl.saddr);
Paolo Abeni3c1cb4d22016-02-12 15:43:59 +0100458 if (!rt) {
459 rt = gre_get_rt(skb, dev, &fl, key);
460 if (IS_ERR(rt))
461 goto err_free_skb;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100462 if (use_cache)
Paolo Abeni3c1cb4d22016-02-12 15:43:59 +0100463 dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
464 fl.saddr);
465 }
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700466
Tom Herbert95f5c642016-04-29 17:12:16 -0700467 tunnel_hlen = gre_calc_hlen(key->tun_flags);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700468
469 min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len
470 + tunnel_hlen + sizeof(struct iphdr);
471 if (skb_headroom(skb) < min_headroom || skb_header_cloned(skb)) {
472 int head_delta = SKB_DATA_ALIGN(min_headroom -
473 skb_headroom(skb) +
474 16);
475 err = pskb_expand_head(skb, max_t(int, head_delta, 0),
476 0, GFP_ATOMIC);
477 if (unlikely(err))
478 goto err_free_rt;
479 }
480
481 /* Push Tunnel header. */
Alexander Duyckaed069d2016-04-14 15:33:37 -0400482 if (gre_handle_offloads(skb, !!(tun_info->key.tun_flags & TUNNEL_CSUM)))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700483 goto err_free_rt;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700484
485 flags = tun_info->key.tun_flags & (TUNNEL_CSUM | TUNNEL_KEY);
David S. Millercba653212016-05-04 00:52:29 -0400486 gre_build_header(skb, tunnel_hlen, flags, proto,
Amir Vadaid817f432016-09-08 16:23:45 +0300487 tunnel_id_to_key32(tun_info->key.tun_id), 0);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700488
489 df = key->tun_flags & TUNNEL_DONT_FRAGMENT ? htons(IP_DF) : 0;
Pravin B Shelar039f5062015-12-24 14:34:54 -0800490
491 iptunnel_xmit(skb->sk, rt, skb, fl.saddr, key->u.ipv4.dst, IPPROTO_GRE,
492 key->tos, key->ttl, df, false);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700493 return;
494
495err_free_rt:
496 ip_rt_put(rt);
497err_free_skb:
498 kfree_skb(skb);
499 dev->stats.tx_dropped++;
500}
501
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700502static int gre_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb)
503{
504 struct ip_tunnel_info *info = skb_tunnel_info(skb);
505 struct rtable *rt;
506 struct flowi4 fl4;
507
508 if (ip_tunnel_info_af(info) != AF_INET)
509 return -EINVAL;
510
511 rt = gre_get_rt(skb, dev, &fl4, &info->key);
512 if (IS_ERR(rt))
513 return PTR_ERR(rt);
514
515 ip_rt_put(rt);
516 info->key.u.ipv4.src = fl4.saddr;
517 return 0;
518}
519
Pravin B Shelarc5441932013-03-25 14:49:35 +0000520static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
521 struct net_device *dev)
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800522{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000523 struct ip_tunnel *tunnel = netdev_priv(dev);
524 const struct iphdr *tnl_params;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800525
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700526 if (tunnel->collect_md) {
Jiri Benc20907142016-04-27 11:29:07 +0200527 gre_fb_xmit(skb, dev, skb->protocol);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700528 return NETDEV_TX_OK;
529 }
530
Pravin B Shelarc5441932013-03-25 14:49:35 +0000531 if (dev->header_ops) {
532 /* Need space for new headers */
533 if (skb_cow_head(skb, dev->needed_headroom -
Chen Gang2bac7cb2013-04-22 20:45:42 +0000534 (tunnel->hlen + sizeof(struct iphdr))))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000535 goto free_skb;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800536
Pravin B Shelarc5441932013-03-25 14:49:35 +0000537 tnl_params = (const struct iphdr *)skb->data;
Eric Dumazete985aad2010-09-27 03:57:11 +0000538
Pravin B Shelarc5441932013-03-25 14:49:35 +0000539 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
540 * to gre header.
541 */
542 skb_pull(skb, tunnel->hlen + sizeof(struct iphdr));
Timo Teräs8a0033a2014-12-15 09:24:13 +0200543 skb_reset_mac_header(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000544 } else {
545 if (skb_cow_head(skb, dev->needed_headroom))
546 goto free_skb;
Herbert Xue1a80002008-10-09 12:00:17 -0700547
Pravin B Shelarc5441932013-03-25 14:49:35 +0000548 tnl_params = &tunnel->parms.iph;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800549 }
550
Alexander Duyckaed069d2016-04-14 15:33:37 -0400551 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
552 goto free_skb;
Timo Teräs8a0033a2014-12-15 09:24:13 +0200553
Pravin B Shelarc5441932013-03-25 14:49:35 +0000554 __gre_xmit(skb, dev, tnl_params, skb->protocol);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000555 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800556
Pravin B Shelarc5441932013-03-25 14:49:35 +0000557free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800558 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000559 dev->stats.tx_dropped++;
560 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800561}
562
/* Map an IP TOS byte to a 3-bit class of service: drop the two low
 * bits to get the DSCP, then keep the top three bits of the DSCP,
 * i.e. the top three bits of @tos.
 */
static inline u8 tos_to_cos(u8 tos)
{
	return tos >> 5;
}
571
572static void erspan_build_header(struct sk_buff *skb,
573 __be32 id, u32 index, bool truncate)
574{
575 struct iphdr *iphdr = ip_hdr(skb);
576 struct ethhdr *eth = eth_hdr(skb);
577 enum erspan_encap_type enc_type;
578 struct erspanhdr *ershdr;
579 struct qtag_prefix {
580 __be16 eth_type;
581 __be16 tci;
582 } *qp;
583 u16 vlan_tci = 0;
584
585 enc_type = ERSPAN_ENCAP_NOVLAN;
586
587 /* If mirrored packet has vlan tag, extract tci and
588 * perserve vlan header in the mirrored frame.
589 */
590 if (eth->h_proto == htons(ETH_P_8021Q)) {
591 qp = (struct qtag_prefix *)(skb->data + 2 * ETH_ALEN);
592 vlan_tci = ntohs(qp->tci);
593 enc_type = ERSPAN_ENCAP_INFRAME;
594 }
595
596 skb_push(skb, sizeof(*ershdr));
597 ershdr = (struct erspanhdr *)skb->data;
598 memset(ershdr, 0, sizeof(*ershdr));
599
600 ershdr->ver_vlan = htons((vlan_tci & VLAN_MASK) |
601 (ERSPAN_VERSION << VER_OFFSET));
602 ershdr->session_id = htons((u16)(ntohl(id) & ID_MASK) |
603 ((tos_to_cos(iphdr->tos) << COS_OFFSET) & COS_MASK) |
604 (enc_type << EN_OFFSET & EN_MASK) |
605 ((truncate << T_OFFSET) & T_MASK));
606 ershdr->md.index = htonl(index & INDEX_MASK);
607}
608
609static netdev_tx_t erspan_xmit(struct sk_buff *skb,
610 struct net_device *dev)
611{
612 struct ip_tunnel *tunnel = netdev_priv(dev);
613 bool truncate = false;
614
615 if (gre_handle_offloads(skb, false))
616 goto free_skb;
617
618 if (skb_cow_head(skb, dev->needed_headroom))
619 goto free_skb;
620
621 if (skb->len > dev->mtu) {
622 pskb_trim(skb, dev->mtu);
623 truncate = true;
624 }
625
626 /* Push ERSPAN header */
627 erspan_build_header(skb, tunnel->parms.o_key, tunnel->index, truncate);
628 tunnel->parms.o_flags &= ~TUNNEL_KEY;
629 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_ERSPAN));
630 return NETDEV_TX_OK;
631
632free_skb:
633 kfree_skb(skb);
634 dev->stats.tx_dropped++;
635 return NETDEV_TX_OK;
636}
637
Pravin B Shelarc5441932013-03-25 14:49:35 +0000638static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
639 struct net_device *dev)
640{
641 struct ip_tunnel *tunnel = netdev_priv(dev);
642
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700643 if (tunnel->collect_md) {
Jiri Benc20907142016-04-27 11:29:07 +0200644 gre_fb_xmit(skb, dev, htons(ETH_P_TEB));
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700645 return NETDEV_TX_OK;
646 }
647
Alexander Duyckaed069d2016-04-14 15:33:37 -0400648 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
649 goto free_skb;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000650
651 if (skb_cow_head(skb, dev->needed_headroom))
652 goto free_skb;
653
654 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000655 return NETDEV_TX_OK;
656
657free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800658 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000659 dev->stats.tx_dropped++;
660 return NETDEV_TX_OK;
661}
662
663static int ipgre_tunnel_ioctl(struct net_device *dev,
664 struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665{
Tom Herbert4565e992014-09-17 12:26:01 -0700666 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668
Pravin B Shelarc5441932013-03-25 14:49:35 +0000669 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
670 return -EFAULT;
Cong Wang6c734fb2013-06-29 12:02:59 +0800671 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
672 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_GRE ||
673 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)) ||
674 ((p.i_flags|p.o_flags)&(GRE_VERSION|GRE_ROUTING)))
675 return -EINVAL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000676 }
677 p.i_flags = gre_flags_to_tnl_flags(p.i_flags);
678 p.o_flags = gre_flags_to_tnl_flags(p.o_flags);
679
680 err = ip_tunnel_ioctl(dev, &p, cmd);
681 if (err)
682 return err;
683
Tom Herbert95f5c642016-04-29 17:12:16 -0700684 p.i_flags = gre_tnl_flags_to_gre_flags(p.i_flags);
685 p.o_flags = gre_tnl_flags_to_gre_flags(p.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000686
687 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
688 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689 return 0;
690}
691
/* Nice toy. Unfortunately, useless in real life :-)
   It allows one to construct a virtual multiprotocol broadcast "LAN"
   over the Internet, provided multicast routing is tuned.


   I have no idea whether this bicycle was invented before me,
   so I had to set ARPHRD_IPGRE to a random value.
   I have an impression that Cisco could make something similar,
   but this feature is apparently missing in IOS<=11.2(8).

   I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
   with broadcast 224.66.66.66. If you have access to mbone, play with me :-)

   ping -t 255 224.66.66.66

   If nobody answers, mbone does not work.

   ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
   ip addr add 10.66.66.<somewhat>/24 dev Universe
   ifconfig Universe up
   ifconfig Universe add fe80::<Your_real_addr>/10
   ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
   ftp 10.66.66.66
   ...
   ftp fec0:6666:6666::193.233.7.65
   ...
 */
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700719static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
720 unsigned short type,
Eric Dumazet15078502010-09-15 11:07:53 +0000721 const void *daddr, const void *saddr, unsigned int len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722{
Patrick McHardy2941a482006-01-08 22:05:26 -0800723 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000724 struct iphdr *iph;
725 struct gre_base_hdr *greh;
726
Johannes Bergd58ff352017-06-16 14:29:23 +0200727 iph = skb_push(skb, t->hlen + sizeof(*iph));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000728 greh = (struct gre_base_hdr *)(iph+1);
Tom Herbert95f5c642016-04-29 17:12:16 -0700729 greh->flags = gre_tnl_flags_to_gre_flags(t->parms.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000730 greh->protocol = htons(type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731
732 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733
Pravin B Shelarc5441932013-03-25 14:49:35 +0000734 /* Set the source hardware address. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735 if (saddr)
736 memcpy(&iph->saddr, saddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000737 if (daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738 memcpy(&iph->daddr, daddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000739 if (iph->daddr)
Timo Teräs77a482b2013-08-06 13:45:43 +0300740 return t->hlen + sizeof(*iph);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900741
Pravin B Shelarc5441932013-03-25 14:49:35 +0000742 return -(t->hlen + sizeof(*iph));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743}
744
Timo Teras6a5f44d2007-10-23 20:31:53 -0700745static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
746{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000747 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
Timo Teras6a5f44d2007-10-23 20:31:53 -0700748 memcpy(haddr, &iph->saddr, 4);
749 return 4;
750}
751
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700752static const struct header_ops ipgre_header_ops = {
753 .create = ipgre_header,
Timo Teras6a5f44d2007-10-23 20:31:53 -0700754 .parse = ipgre_header_parse,
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700755};
756
Timo Teras6a5f44d2007-10-23 20:31:53 -0700757#ifdef CONFIG_NET_IPGRE_BROADCAST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758static int ipgre_open(struct net_device *dev)
759{
Patrick McHardy2941a482006-01-08 22:05:26 -0800760 struct ip_tunnel *t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761
Joe Perchesf97c1e02007-12-16 13:45:43 -0800762 if (ipv4_is_multicast(t->parms.iph.daddr)) {
David S. Millercbb1e852011-05-04 12:33:34 -0700763 struct flowi4 fl4;
764 struct rtable *rt;
Eric Dumazete985aad2010-09-27 03:57:11 +0000765
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200766 rt = ip_route_output_gre(t->net, &fl4,
David S. Millercbb1e852011-05-04 12:33:34 -0700767 t->parms.iph.daddr,
768 t->parms.iph.saddr,
769 t->parms.o_key,
770 RT_TOS(t->parms.iph.tos),
771 t->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800772 if (IS_ERR(rt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700773 return -EADDRNOTAVAIL;
Changli Gaod8d1f302010-06-10 23:31:35 -0700774 dev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 ip_rt_put(rt);
Ian Morris51456b22015-04-03 09:17:26 +0100776 if (!__in_dev_get_rtnl(dev))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 return -EADDRNOTAVAIL;
778 t->mlink = dev->ifindex;
Herbert Xue5ed6392005-10-03 14:35:55 -0700779 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 }
781 return 0;
782}
783
784static int ipgre_close(struct net_device *dev)
785{
Patrick McHardy2941a482006-01-08 22:05:26 -0800786 struct ip_tunnel *t = netdev_priv(dev);
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800787
Joe Perchesf97c1e02007-12-16 13:45:43 -0800788 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800789 struct in_device *in_dev;
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200790 in_dev = inetdev_by_index(t->net, t->mlink);
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000791 if (in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700793 }
794 return 0;
795}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796#endif
797
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800798static const struct net_device_ops ipgre_netdev_ops = {
799 .ndo_init = ipgre_tunnel_init,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000800 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800801#ifdef CONFIG_NET_IPGRE_BROADCAST
802 .ndo_open = ipgre_open,
803 .ndo_stop = ipgre_close,
804#endif
Pravin B Shelarc5441932013-03-25 14:49:35 +0000805 .ndo_start_xmit = ipgre_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800806 .ndo_do_ioctl = ipgre_tunnel_ioctl,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000807 .ndo_change_mtu = ip_tunnel_change_mtu,
808 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200809 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800810};
811
/* Feature bits OR-ed into both dev->features and dev->hw_features by the
 * tunnel init routines in this file.
 */
#define GRE_FEATURES \
	(NETIF_F_SG | NETIF_F_FRAGLIST | NETIF_F_HIGHDMA | NETIF_F_HW_CSUM)
816
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817static void ipgre_tunnel_setup(struct net_device *dev)
818{
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800819 dev->netdev_ops = &ipgre_netdev_ops;
Nicolas Dichtel5a455272014-04-11 15:51:18 +0200820 dev->type = ARPHRD_IPGRE;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000821 ip_tunnel_setup(dev, ipgre_net_id);
822}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823
Pravin B Shelarc5441932013-03-25 14:49:35 +0000824static void __gre_tunnel_init(struct net_device *dev)
825{
826 struct ip_tunnel *tunnel;
Tom Herbert4565e992014-09-17 12:26:01 -0700827 int t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000828
829 tunnel = netdev_priv(dev);
Tom Herbert95f5c642016-04-29 17:12:16 -0700830 tunnel->tun_hlen = gre_calc_hlen(tunnel->parms.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000831 tunnel->parms.iph.protocol = IPPROTO_GRE;
832
Tom Herbert4565e992014-09-17 12:26:01 -0700833 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
834
835 t_hlen = tunnel->hlen + sizeof(struct iphdr);
836
837 dev->needed_headroom = LL_MAX_HEADER + t_hlen + 4;
838 dev->mtu = ETH_DATA_LEN - t_hlen - 4;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000839
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200840 dev->features |= GRE_FEATURES;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000841 dev->hw_features |= GRE_FEATURES;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000842
843 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
Alexander Duycka0ca1532016-04-05 09:13:39 -0700844 /* TCP offload with GRE SEQ is not supported, nor
845 * can we support 2 levels of outer headers requiring
846 * an update.
847 */
848 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
849 (tunnel->encap.type == TUNNEL_ENCAP_NONE)) {
850 dev->features |= NETIF_F_GSO_SOFTWARE;
851 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
852 }
853
Pravin B Shelarc5441932013-03-25 14:49:35 +0000854 /* Can use a lockless transmit, unless we generate
855 * output sequences
856 */
857 dev->features |= NETIF_F_LLTX;
858 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700859}
860
861static int ipgre_tunnel_init(struct net_device *dev)
862{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000863 struct ip_tunnel *tunnel = netdev_priv(dev);
864 struct iphdr *iph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700865
Pravin B Shelarc5441932013-03-25 14:49:35 +0000866 __gre_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700867
Pravin B Shelarc5441932013-03-25 14:49:35 +0000868 memcpy(dev->dev_addr, &iph->saddr, 4);
869 memcpy(dev->broadcast, &iph->daddr, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700870
Pravin B Shelarc5441932013-03-25 14:49:35 +0000871 dev->flags = IFF_NOARP;
Eric Dumazet02875872014-10-05 18:38:35 -0700872 netif_keep_dst(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000873 dev->addr_len = 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700874
Jiri Benca64b04d2016-04-27 11:29:06 +0200875 if (iph->daddr && !tunnel->collect_md) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700876#ifdef CONFIG_NET_IPGRE_BROADCAST
Joe Perchesf97c1e02007-12-16 13:45:43 -0800877 if (ipv4_is_multicast(iph->daddr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700878 if (!iph->saddr)
879 return -EINVAL;
880 dev->flags = IFF_BROADCAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700881 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700882 }
883#endif
Jiri Benca64b04d2016-04-27 11:29:06 +0200884 } else if (!tunnel->collect_md) {
Timo Teras6a5f44d2007-10-23 20:31:53 -0700885 dev->header_ops = &ipgre_header_ops;
Jiri Benca64b04d2016-04-27 11:29:06 +0200886 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700887
Pravin B Shelarc5441932013-03-25 14:49:35 +0000888 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700889}
890
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700891static const struct gre_protocol ipgre_protocol = {
892 .handler = gre_rcv,
893 .err_handler = gre_err,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700894};
895
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000896static int __net_init ipgre_init_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700897{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000898 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700899}
900
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000901static void __net_exit ipgre_exit_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700902{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000903 struct ip_tunnel_net *itn = net_generic(net, ipgre_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200904 ip_tunnel_delete_net(itn, &ipgre_link_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700905}
906
907static struct pernet_operations ipgre_net_ops = {
908 .init = ipgre_init_net,
909 .exit = ipgre_exit_net,
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000910 .id = &ipgre_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000911 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700912};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700913
Matthias Schiffera8b8a8892017-06-25 23:56:01 +0200914static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[],
915 struct netlink_ext_ack *extack)
Herbert Xuc19e6542008-10-09 11:59:55 -0700916{
917 __be16 flags;
918
919 if (!data)
920 return 0;
921
922 flags = 0;
923 if (data[IFLA_GRE_IFLAGS])
924 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
925 if (data[IFLA_GRE_OFLAGS])
926 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
927 if (flags & (GRE_VERSION|GRE_ROUTING))
928 return -EINVAL;
929
Jiri Benc946b6362016-04-27 14:08:01 +0200930 if (data[IFLA_GRE_COLLECT_METADATA] &&
931 data[IFLA_GRE_ENCAP_TYPE] &&
932 nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]) != TUNNEL_ENCAP_NONE)
933 return -EINVAL;
934
Herbert Xuc19e6542008-10-09 11:59:55 -0700935 return 0;
936}
937
Matthias Schiffera8b8a8892017-06-25 23:56:01 +0200938static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[],
939 struct netlink_ext_ack *extack)
Herbert Xue1a80002008-10-09 12:00:17 -0700940{
941 __be32 daddr;
942
943 if (tb[IFLA_ADDRESS]) {
944 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
945 return -EINVAL;
946 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
947 return -EADDRNOTAVAIL;
948 }
949
950 if (!data)
951 goto out;
952
953 if (data[IFLA_GRE_REMOTE]) {
954 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
955 if (!daddr)
956 return -EINVAL;
957 }
958
959out:
Matthias Schiffera8b8a8892017-06-25 23:56:01 +0200960 return ipgre_tunnel_validate(tb, data, extack);
Herbert Xue1a80002008-10-09 12:00:17 -0700961}
962
William Tu84e54fe2017-08-22 09:40:28 -0700963static int erspan_validate(struct nlattr *tb[], struct nlattr *data[],
964 struct netlink_ext_ack *extack)
965{
966 __be16 flags = 0;
967 int ret;
968
969 if (!data)
970 return 0;
971
972 ret = ipgre_tap_validate(tb, data, extack);
973 if (ret)
974 return ret;
975
976 /* ERSPAN should only have GRE sequence and key flag */
977 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
978 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
979 if (flags != (GRE_SEQ | GRE_KEY))
980 return -EINVAL;
981
982 /* ERSPAN Session ID only has 10-bit. Since we reuse
983 * 32-bit key field as ID, check it's range.
984 */
985 if (data[IFLA_GRE_IKEY] &&
986 (ntohl(nla_get_be32(data[IFLA_GRE_IKEY])) & ~ID_MASK))
987 return -EINVAL;
988
989 if (data[IFLA_GRE_OKEY] &&
990 (ntohl(nla_get_be32(data[IFLA_GRE_OKEY])) & ~ID_MASK))
991 return -EINVAL;
992
993 return 0;
994}
995
Philip Prindeville22a59be2016-06-14 15:53:02 -0600996static int ipgre_netlink_parms(struct net_device *dev,
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700997 struct nlattr *data[],
998 struct nlattr *tb[],
Craig Gallek9830ad42017-04-19 12:30:54 -0400999 struct ip_tunnel_parm *parms,
1000 __u32 *fwmark)
Herbert Xuc19e6542008-10-09 11:59:55 -07001001{
Philip Prindeville22a59be2016-06-14 15:53:02 -06001002 struct ip_tunnel *t = netdev_priv(dev);
1003
Herbert Xu7bb82d92008-10-11 12:20:15 -07001004 memset(parms, 0, sizeof(*parms));
Herbert Xuc19e6542008-10-09 11:59:55 -07001005
1006 parms->iph.protocol = IPPROTO_GRE;
1007
1008 if (!data)
Philip Prindeville22a59be2016-06-14 15:53:02 -06001009 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001010
1011 if (data[IFLA_GRE_LINK])
1012 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
1013
1014 if (data[IFLA_GRE_IFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +00001015 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -07001016
1017 if (data[IFLA_GRE_OFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +00001018 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -07001019
1020 if (data[IFLA_GRE_IKEY])
1021 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
1022
1023 if (data[IFLA_GRE_OKEY])
1024 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
1025
1026 if (data[IFLA_GRE_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +02001027 parms->iph.saddr = nla_get_in_addr(data[IFLA_GRE_LOCAL]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001028
1029 if (data[IFLA_GRE_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +02001030 parms->iph.daddr = nla_get_in_addr(data[IFLA_GRE_REMOTE]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001031
1032 if (data[IFLA_GRE_TTL])
1033 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
1034
1035 if (data[IFLA_GRE_TOS])
1036 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
1037
Philip Prindeville22a59be2016-06-14 15:53:02 -06001038 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC])) {
1039 if (t->ignore_df)
1040 return -EINVAL;
Herbert Xuc19e6542008-10-09 11:59:55 -07001041 parms->iph.frag_off = htons(IP_DF);
Philip Prindeville22a59be2016-06-14 15:53:02 -06001042 }
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001043
1044 if (data[IFLA_GRE_COLLECT_METADATA]) {
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001045 t->collect_md = true;
Jiri Bence271c7b2016-05-11 15:53:57 +02001046 if (dev->type == ARPHRD_IPGRE)
1047 dev->type = ARPHRD_NONE;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001048 }
Philip Prindeville22a59be2016-06-14 15:53:02 -06001049
1050 if (data[IFLA_GRE_IGNORE_DF]) {
1051 if (nla_get_u8(data[IFLA_GRE_IGNORE_DF])
1052 && (parms->iph.frag_off & htons(IP_DF)))
1053 return -EINVAL;
1054 t->ignore_df = !!nla_get_u8(data[IFLA_GRE_IGNORE_DF]);
1055 }
1056
Craig Gallek9830ad42017-04-19 12:30:54 -04001057 if (data[IFLA_GRE_FWMARK])
1058 *fwmark = nla_get_u32(data[IFLA_GRE_FWMARK]);
1059
William Tu84e54fe2017-08-22 09:40:28 -07001060 if (data[IFLA_GRE_ERSPAN_INDEX]) {
1061 t->index = nla_get_u32(data[IFLA_GRE_ERSPAN_INDEX]);
1062
1063 if (t->index & ~INDEX_MASK)
1064 return -EINVAL;
1065 }
1066
Philip Prindeville22a59be2016-06-14 15:53:02 -06001067 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001068}
1069
Tom Herbert4565e992014-09-17 12:26:01 -07001070/* This function returns true when ENCAP attributes are present in the nl msg */
1071static bool ipgre_netlink_encap_parms(struct nlattr *data[],
1072 struct ip_tunnel_encap *ipencap)
1073{
1074 bool ret = false;
1075
1076 memset(ipencap, 0, sizeof(*ipencap));
1077
1078 if (!data)
1079 return ret;
1080
1081 if (data[IFLA_GRE_ENCAP_TYPE]) {
1082 ret = true;
1083 ipencap->type = nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]);
1084 }
1085
1086 if (data[IFLA_GRE_ENCAP_FLAGS]) {
1087 ret = true;
1088 ipencap->flags = nla_get_u16(data[IFLA_GRE_ENCAP_FLAGS]);
1089 }
1090
1091 if (data[IFLA_GRE_ENCAP_SPORT]) {
1092 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001093 ipencap->sport = nla_get_be16(data[IFLA_GRE_ENCAP_SPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001094 }
1095
1096 if (data[IFLA_GRE_ENCAP_DPORT]) {
1097 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001098 ipencap->dport = nla_get_be16(data[IFLA_GRE_ENCAP_DPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001099 }
1100
1101 return ret;
1102}
1103
Pravin B Shelarc5441932013-03-25 14:49:35 +00001104static int gre_tap_init(struct net_device *dev)
Herbert Xue1a80002008-10-09 12:00:17 -07001105{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001106 __gre_tunnel_init(dev);
stephen hemmingerbec94d4302014-12-27 10:01:42 -08001107 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Herbert Xue1a80002008-10-09 12:00:17 -07001108
Pravin B Shelarc5441932013-03-25 14:49:35 +00001109 return ip_tunnel_init(dev);
Herbert Xue1a80002008-10-09 12:00:17 -07001110}
1111
Pravin B Shelarc5441932013-03-25 14:49:35 +00001112static const struct net_device_ops gre_tap_netdev_ops = {
1113 .ndo_init = gre_tap_init,
1114 .ndo_uninit = ip_tunnel_uninit,
1115 .ndo_start_xmit = gre_tap_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001116 .ndo_set_mac_address = eth_mac_addr,
1117 .ndo_validate_addr = eth_validate_addr,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001118 .ndo_change_mtu = ip_tunnel_change_mtu,
1119 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +02001120 .ndo_get_iflink = ip_tunnel_get_iflink,
Pravin B Shelarfc4099f2015-10-22 18:17:16 -07001121 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001122};
1123
William Tu84e54fe2017-08-22 09:40:28 -07001124static int erspan_tunnel_init(struct net_device *dev)
1125{
1126 struct ip_tunnel *tunnel = netdev_priv(dev);
1127 int t_hlen;
1128
1129 tunnel->tun_hlen = 8;
1130 tunnel->parms.iph.protocol = IPPROTO_GRE;
1131 t_hlen = tunnel->hlen + sizeof(struct iphdr) + sizeof(struct erspanhdr);
1132
1133 dev->needed_headroom = LL_MAX_HEADER + t_hlen + 4;
1134 dev->mtu = ETH_DATA_LEN - t_hlen - 4;
1135 dev->features |= GRE_FEATURES;
1136 dev->hw_features |= GRE_FEATURES;
1137 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
1138
1139 return ip_tunnel_init(dev);
1140}
1141
1142static const struct net_device_ops erspan_netdev_ops = {
1143 .ndo_init = erspan_tunnel_init,
1144 .ndo_uninit = ip_tunnel_uninit,
1145 .ndo_start_xmit = erspan_xmit,
1146 .ndo_set_mac_address = eth_mac_addr,
1147 .ndo_validate_addr = eth_validate_addr,
1148 .ndo_change_mtu = ip_tunnel_change_mtu,
1149 .ndo_get_stats64 = ip_tunnel_get_stats64,
1150 .ndo_get_iflink = ip_tunnel_get_iflink,
1151 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
1152};
1153
Herbert Xue1a80002008-10-09 12:00:17 -07001154static void ipgre_tap_setup(struct net_device *dev)
1155{
Herbert Xue1a80002008-10-09 12:00:17 -07001156 ether_setup(dev);
Jiri Bencd13b1612016-02-17 15:32:53 +01001157 dev->netdev_ops = &gre_tap_netdev_ops;
1158 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1159 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001160 ip_tunnel_setup(dev, gre_tap_net_id);
Herbert Xue1a80002008-10-09 12:00:17 -07001161}
1162
Pravin B Shelarc5441932013-03-25 14:49:35 +00001163static int ipgre_newlink(struct net *src_net, struct net_device *dev,
Matthias Schiffer7a3f4a12017-06-25 23:55:59 +02001164 struct nlattr *tb[], struct nlattr *data[],
1165 struct netlink_ext_ack *extack)
Herbert Xuc19e6542008-10-09 11:59:55 -07001166{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001167 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001168 struct ip_tunnel_encap ipencap;
Craig Gallek9830ad42017-04-19 12:30:54 -04001169 __u32 fwmark = 0;
Philip Prindeville22a59be2016-06-14 15:53:02 -06001170 int err;
Tom Herbert4565e992014-09-17 12:26:01 -07001171
1172 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1173 struct ip_tunnel *t = netdev_priv(dev);
Philip Prindeville22a59be2016-06-14 15:53:02 -06001174 err = ip_tunnel_encap_setup(t, &ipencap);
Tom Herbert4565e992014-09-17 12:26:01 -07001175
1176 if (err < 0)
1177 return err;
1178 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001179
Craig Gallek9830ad42017-04-19 12:30:54 -04001180 err = ipgre_netlink_parms(dev, data, tb, &p, &fwmark);
Philip Prindeville22a59be2016-06-14 15:53:02 -06001181 if (err < 0)
1182 return err;
Craig Gallek9830ad42017-04-19 12:30:54 -04001183 return ip_tunnel_newlink(dev, tb, &p, fwmark);
Herbert Xuc19e6542008-10-09 11:59:55 -07001184}
1185
1186static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
Matthias Schifferad744b22017-06-25 23:56:00 +02001187 struct nlattr *data[],
1188 struct netlink_ext_ack *extack)
Herbert Xuc19e6542008-10-09 11:59:55 -07001189{
Craig Gallek9830ad42017-04-19 12:30:54 -04001190 struct ip_tunnel *t = netdev_priv(dev);
Herbert Xuc19e6542008-10-09 11:59:55 -07001191 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001192 struct ip_tunnel_encap ipencap;
Craig Gallek9830ad42017-04-19 12:30:54 -04001193 __u32 fwmark = t->fwmark;
Philip Prindeville22a59be2016-06-14 15:53:02 -06001194 int err;
Tom Herbert4565e992014-09-17 12:26:01 -07001195
1196 if (ipgre_netlink_encap_parms(data, &ipencap)) {
Philip Prindeville22a59be2016-06-14 15:53:02 -06001197 err = ip_tunnel_encap_setup(t, &ipencap);
Tom Herbert4565e992014-09-17 12:26:01 -07001198
1199 if (err < 0)
1200 return err;
1201 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001202
Craig Gallek9830ad42017-04-19 12:30:54 -04001203 err = ipgre_netlink_parms(dev, data, tb, &p, &fwmark);
Philip Prindeville22a59be2016-06-14 15:53:02 -06001204 if (err < 0)
1205 return err;
Craig Gallek9830ad42017-04-19 12:30:54 -04001206 return ip_tunnel_changelink(dev, tb, &p, fwmark);
Herbert Xuc19e6542008-10-09 11:59:55 -07001207}
1208
1209static size_t ipgre_get_size(const struct net_device *dev)
1210{
1211 return
1212 /* IFLA_GRE_LINK */
1213 nla_total_size(4) +
1214 /* IFLA_GRE_IFLAGS */
1215 nla_total_size(2) +
1216 /* IFLA_GRE_OFLAGS */
1217 nla_total_size(2) +
1218 /* IFLA_GRE_IKEY */
1219 nla_total_size(4) +
1220 /* IFLA_GRE_OKEY */
1221 nla_total_size(4) +
1222 /* IFLA_GRE_LOCAL */
1223 nla_total_size(4) +
1224 /* IFLA_GRE_REMOTE */
1225 nla_total_size(4) +
1226 /* IFLA_GRE_TTL */
1227 nla_total_size(1) +
1228 /* IFLA_GRE_TOS */
1229 nla_total_size(1) +
1230 /* IFLA_GRE_PMTUDISC */
1231 nla_total_size(1) +
Tom Herbert4565e992014-09-17 12:26:01 -07001232 /* IFLA_GRE_ENCAP_TYPE */
1233 nla_total_size(2) +
1234 /* IFLA_GRE_ENCAP_FLAGS */
1235 nla_total_size(2) +
1236 /* IFLA_GRE_ENCAP_SPORT */
1237 nla_total_size(2) +
1238 /* IFLA_GRE_ENCAP_DPORT */
1239 nla_total_size(2) +
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001240 /* IFLA_GRE_COLLECT_METADATA */
1241 nla_total_size(0) +
Philip Prindeville22a59be2016-06-14 15:53:02 -06001242 /* IFLA_GRE_IGNORE_DF */
1243 nla_total_size(1) +
Craig Gallek9830ad42017-04-19 12:30:54 -04001244 /* IFLA_GRE_FWMARK */
1245 nla_total_size(4) +
William Tu84e54fe2017-08-22 09:40:28 -07001246 /* IFLA_GRE_ERSPAN_INDEX */
1247 nla_total_size(4) +
Herbert Xuc19e6542008-10-09 11:59:55 -07001248 0;
1249}
1250
1251static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
1252{
1253 struct ip_tunnel *t = netdev_priv(dev);
1254 struct ip_tunnel_parm *p = &t->parms;
1255
David S. Millerf3756b72012-04-01 20:39:02 -04001256 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
Tom Herbert95f5c642016-04-29 17:12:16 -07001257 nla_put_be16(skb, IFLA_GRE_IFLAGS,
1258 gre_tnl_flags_to_gre_flags(p->i_flags)) ||
1259 nla_put_be16(skb, IFLA_GRE_OFLAGS,
1260 gre_tnl_flags_to_gre_flags(p->o_flags)) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001261 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
1262 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
Jiri Benc930345e2015-03-29 16:59:25 +02001263 nla_put_in_addr(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
1264 nla_put_in_addr(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001265 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
1266 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
1267 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
Craig Gallek9830ad42017-04-19 12:30:54 -04001268 !!(p->iph.frag_off & htons(IP_DF))) ||
1269 nla_put_u32(skb, IFLA_GRE_FWMARK, t->fwmark))
David S. Millerf3756b72012-04-01 20:39:02 -04001270 goto nla_put_failure;
Tom Herbert4565e992014-09-17 12:26:01 -07001271
1272 if (nla_put_u16(skb, IFLA_GRE_ENCAP_TYPE,
1273 t->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001274 nla_put_be16(skb, IFLA_GRE_ENCAP_SPORT,
1275 t->encap.sport) ||
1276 nla_put_be16(skb, IFLA_GRE_ENCAP_DPORT,
1277 t->encap.dport) ||
Tom Herbert4565e992014-09-17 12:26:01 -07001278 nla_put_u16(skb, IFLA_GRE_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -08001279 t->encap.flags))
Tom Herbert4565e992014-09-17 12:26:01 -07001280 goto nla_put_failure;
1281
Philip Prindeville22a59be2016-06-14 15:53:02 -06001282 if (nla_put_u8(skb, IFLA_GRE_IGNORE_DF, t->ignore_df))
1283 goto nla_put_failure;
1284
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001285 if (t->collect_md) {
1286 if (nla_put_flag(skb, IFLA_GRE_COLLECT_METADATA))
1287 goto nla_put_failure;
1288 }
1289
William Tu84e54fe2017-08-22 09:40:28 -07001290 if (t->index)
1291 if (nla_put_u32(skb, IFLA_GRE_ERSPAN_INDEX, t->index))
1292 goto nla_put_failure;
1293
Herbert Xuc19e6542008-10-09 11:59:55 -07001294 return 0;
1295
1296nla_put_failure:
1297 return -EMSGSIZE;
1298}
1299
William Tu84e54fe2017-08-22 09:40:28 -07001300static void erspan_setup(struct net_device *dev)
1301{
1302 ether_setup(dev);
1303 dev->netdev_ops = &erspan_netdev_ops;
1304 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1305 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
1306 ip_tunnel_setup(dev, erspan_net_id);
1307}
1308
Herbert Xuc19e6542008-10-09 11:59:55 -07001309static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
1310 [IFLA_GRE_LINK] = { .type = NLA_U32 },
1311 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
1312 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
1313 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
1314 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001315 [IFLA_GRE_LOCAL] = { .len = FIELD_SIZEOF(struct iphdr, saddr) },
1316 [IFLA_GRE_REMOTE] = { .len = FIELD_SIZEOF(struct iphdr, daddr) },
Herbert Xuc19e6542008-10-09 11:59:55 -07001317 [IFLA_GRE_TTL] = { .type = NLA_U8 },
1318 [IFLA_GRE_TOS] = { .type = NLA_U8 },
1319 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert4565e992014-09-17 12:26:01 -07001320 [IFLA_GRE_ENCAP_TYPE] = { .type = NLA_U16 },
1321 [IFLA_GRE_ENCAP_FLAGS] = { .type = NLA_U16 },
1322 [IFLA_GRE_ENCAP_SPORT] = { .type = NLA_U16 },
1323 [IFLA_GRE_ENCAP_DPORT] = { .type = NLA_U16 },
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001324 [IFLA_GRE_COLLECT_METADATA] = { .type = NLA_FLAG },
Philip Prindeville22a59be2016-06-14 15:53:02 -06001325 [IFLA_GRE_IGNORE_DF] = { .type = NLA_U8 },
Craig Gallek9830ad42017-04-19 12:30:54 -04001326 [IFLA_GRE_FWMARK] = { .type = NLA_U32 },
William Tu84e54fe2017-08-22 09:40:28 -07001327 [IFLA_GRE_ERSPAN_INDEX] = { .type = NLA_U32 },
Herbert Xuc19e6542008-10-09 11:59:55 -07001328};
1329
1330static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
1331 .kind = "gre",
1332 .maxtype = IFLA_GRE_MAX,
1333 .policy = ipgre_policy,
1334 .priv_size = sizeof(struct ip_tunnel),
1335 .setup = ipgre_tunnel_setup,
1336 .validate = ipgre_tunnel_validate,
1337 .newlink = ipgre_newlink,
1338 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001339 .dellink = ip_tunnel_dellink,
Herbert Xuc19e6542008-10-09 11:59:55 -07001340 .get_size = ipgre_get_size,
1341 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001342 .get_link_net = ip_tunnel_get_link_net,
Herbert Xuc19e6542008-10-09 11:59:55 -07001343};
1344
Herbert Xue1a80002008-10-09 12:00:17 -07001345static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
1346 .kind = "gretap",
1347 .maxtype = IFLA_GRE_MAX,
1348 .policy = ipgre_policy,
1349 .priv_size = sizeof(struct ip_tunnel),
1350 .setup = ipgre_tap_setup,
1351 .validate = ipgre_tap_validate,
1352 .newlink = ipgre_newlink,
1353 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001354 .dellink = ip_tunnel_dellink,
Herbert Xue1a80002008-10-09 12:00:17 -07001355 .get_size = ipgre_get_size,
1356 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001357 .get_link_net = ip_tunnel_get_link_net,
Herbert Xue1a80002008-10-09 12:00:17 -07001358};
1359
William Tu84e54fe2017-08-22 09:40:28 -07001360static struct rtnl_link_ops erspan_link_ops __read_mostly = {
1361 .kind = "erspan",
1362 .maxtype = IFLA_GRE_MAX,
1363 .policy = ipgre_policy,
1364 .priv_size = sizeof(struct ip_tunnel),
1365 .setup = erspan_setup,
1366 .validate = erspan_validate,
1367 .newlink = ipgre_newlink,
1368 .changelink = ipgre_changelink,
1369 .dellink = ip_tunnel_dellink,
1370 .get_size = ipgre_get_size,
1371 .fill_info = ipgre_fill_info,
1372 .get_link_net = ip_tunnel_get_link_net,
1373};
1374
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001375struct net_device *gretap_fb_dev_create(struct net *net, const char *name,
1376 u8 name_assign_type)
1377{
1378 struct nlattr *tb[IFLA_MAX + 1];
1379 struct net_device *dev;
Nicolas Dichtel106da662016-06-13 10:31:04 +02001380 LIST_HEAD(list_kill);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001381 struct ip_tunnel *t;
1382 int err;
1383
1384 memset(&tb, 0, sizeof(tb));
1385
1386 dev = rtnl_create_link(net, name, name_assign_type,
1387 &ipgre_tap_ops, tb);
1388 if (IS_ERR(dev))
1389 return dev;
1390
1391 /* Configure flow based GRE device. */
1392 t = netdev_priv(dev);
1393 t->collect_md = true;
1394
Matthias Schiffer7a3f4a12017-06-25 23:55:59 +02001395 err = ipgre_newlink(net, dev, tb, NULL, NULL);
Nicolas Dichtel106da662016-06-13 10:31:04 +02001396 if (err < 0) {
1397 free_netdev(dev);
1398 return ERR_PTR(err);
1399 }
David Wragg7e059152016-02-10 00:05:58 +00001400
1401 /* openvswitch users expect packet sizes to be unrestricted,
1402 * so set the largest MTU we can.
1403 */
1404 err = __ip_tunnel_change_mtu(dev, IP_MAX_MTU, false);
1405 if (err)
1406 goto out;
1407
Nicolas Dichtelda6f1da2016-06-13 10:31:06 +02001408 err = rtnl_configure_link(dev, NULL);
1409 if (err < 0)
1410 goto out;
1411
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001412 return dev;
1413out:
Nicolas Dichtel106da662016-06-13 10:31:04 +02001414 ip_tunnel_dellink(dev, &list_kill);
1415 unregister_netdevice_many(&list_kill);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001416 return ERR_PTR(err);
1417}
1418EXPORT_SYMBOL_GPL(gretap_fb_dev_create);
1419
Pravin B Shelarc5441932013-03-25 14:49:35 +00001420static int __net_init ipgre_tap_init_net(struct net *net)
1421{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001422 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, "gretap0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001423}
1424
1425static void __net_exit ipgre_tap_exit_net(struct net *net)
1426{
1427 struct ip_tunnel_net *itn = net_generic(net, gre_tap_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001428 ip_tunnel_delete_net(itn, &ipgre_tap_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001429}
1430
1431static struct pernet_operations ipgre_tap_net_ops = {
1432 .init = ipgre_tap_init_net,
1433 .exit = ipgre_tap_exit_net,
1434 .id = &gre_tap_net_id,
1435 .size = sizeof(struct ip_tunnel_net),
1436};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001437
William Tu84e54fe2017-08-22 09:40:28 -07001438static int __net_init erspan_init_net(struct net *net)
1439{
1440 return ip_tunnel_init_net(net, erspan_net_id,
1441 &erspan_link_ops, "erspan0");
1442}
1443
1444static void __net_exit erspan_exit_net(struct net *net)
1445{
1446 struct ip_tunnel_net *itn = net_generic(net, erspan_net_id);
1447
1448 ip_tunnel_delete_net(itn, &erspan_link_ops);
1449}
1450
1451static struct pernet_operations erspan_net_ops = {
1452 .init = erspan_init_net,
1453 .exit = erspan_exit_net,
1454 .id = &erspan_net_id,
1455 .size = sizeof(struct ip_tunnel_net),
1456};
1457
Linus Torvalds1da177e2005-04-16 15:20:36 -07001458static int __init ipgre_init(void)
1459{
1460 int err;
1461
Joe Perches058bd4d2012-03-11 18:36:11 +00001462 pr_info("GRE over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001463
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +00001464 err = register_pernet_device(&ipgre_net_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -07001465 if (err < 0)
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001466 return err;
1467
Pravin B Shelarc5441932013-03-25 14:49:35 +00001468 err = register_pernet_device(&ipgre_tap_net_ops);
1469 if (err < 0)
William Tue3d03282017-08-22 17:04:05 -07001470 goto pnet_tap_failed;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001471
William Tu84e54fe2017-08-22 09:40:28 -07001472 err = register_pernet_device(&erspan_net_ops);
1473 if (err < 0)
1474 goto pnet_erspan_failed;
1475
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001476 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001477 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +00001478 pr_info("%s: can't add protocol\n", __func__);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001479 goto add_proto_failed;
1480 }
Pavel Emelyanov7daa0002008-04-16 01:10:05 -07001481
Herbert Xuc19e6542008-10-09 11:59:55 -07001482 err = rtnl_link_register(&ipgre_link_ops);
1483 if (err < 0)
1484 goto rtnl_link_failed;
1485
Herbert Xue1a80002008-10-09 12:00:17 -07001486 err = rtnl_link_register(&ipgre_tap_ops);
1487 if (err < 0)
1488 goto tap_ops_failed;
1489
William Tu84e54fe2017-08-22 09:40:28 -07001490 err = rtnl_link_register(&erspan_link_ops);
1491 if (err < 0)
1492 goto erspan_link_failed;
1493
Pravin B Shelarc5441932013-03-25 14:49:35 +00001494 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001495
William Tu84e54fe2017-08-22 09:40:28 -07001496erspan_link_failed:
1497 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xue1a80002008-10-09 12:00:17 -07001498tap_ops_failed:
1499 rtnl_link_unregister(&ipgre_link_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001500rtnl_link_failed:
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001501 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001502add_proto_failed:
William Tu84e54fe2017-08-22 09:40:28 -07001503 unregister_pernet_device(&erspan_net_ops);
1504pnet_erspan_failed:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001505 unregister_pernet_device(&ipgre_tap_net_ops);
William Tue3d03282017-08-22 17:04:05 -07001506pnet_tap_failed:
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001507 unregister_pernet_device(&ipgre_net_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001508 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001509}
1510
Alexey Kuznetsovdb445752005-07-30 17:46:44 -07001511static void __exit ipgre_fini(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001512{
Herbert Xue1a80002008-10-09 12:00:17 -07001513 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001514 rtnl_link_unregister(&ipgre_link_ops);
William Tu84e54fe2017-08-22 09:40:28 -07001515 rtnl_link_unregister(&erspan_link_ops);
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001516 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001517 unregister_pernet_device(&ipgre_tap_net_ops);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001518 unregister_pernet_device(&ipgre_net_ops);
William Tu84e54fe2017-08-22 09:40:28 -07001519 unregister_pernet_device(&erspan_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001520}
1521
1522module_init(ipgre_init);
1523module_exit(ipgre_fini);
1524MODULE_LICENSE("GPL");
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001525MODULE_ALIAS_RTNL_LINK("gre");
1526MODULE_ALIAS_RTNL_LINK("gretap");
William Tu84e54fe2017-08-22 09:40:28 -07001527MODULE_ALIAS_RTNL_LINK("erspan");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +03001528MODULE_ALIAS_NETDEV("gre0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001529MODULE_ALIAS_NETDEV("gretap0");
William Tu84e54fe2017-08-22 09:40:28 -07001530MODULE_ALIAS_NETDEV("erspan0");