/*
 *	IPV4 GSO/GRO offload support
 *	Linux INET implementation
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 *
 *	GRE GSO support
 */
12
13#include <linux/skbuff.h>
Paul Gortmakercf172282014-01-15 11:19:55 -050014#include <linux/init.h>
Daniel Borkmannc50cd352013-07-01 19:24:00 +020015#include <net/protocol.h>
16#include <net/gre.h>
17
Daniel Borkmannc50cd352013-07-01 19:24:00 +020018static struct sk_buff *gre_gso_segment(struct sk_buff *skb,
19 netdev_features_t features)
20{
Alexander Duyck2e598af2016-02-05 15:28:01 -080021 int tnl_hlen = skb_inner_mac_header(skb) - skb_transport_header(skb);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020022 struct sk_buff *segs = ERR_PTR(-EINVAL);
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080023 u16 mac_offset = skb->mac_header;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020024 __be16 protocol = skb->protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080025 u16 mac_len = skb->mac_len;
26 int gre_offset, outer_hlen;
Alexander Duyck22463872016-02-24 16:46:21 -080027 bool need_csum, ufo;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020028
29 if (unlikely(skb_shinfo(skb)->gso_type &
30 ~(SKB_GSO_TCPV4 |
31 SKB_GSO_TCPV6 |
32 SKB_GSO_UDP |
33 SKB_GSO_DODGY |
34 SKB_GSO_TCP_ECN |
Eric Dumazetcb32f512013-10-19 11:42:57 -070035 SKB_GSO_GRE |
Tom Herbert4749c092014-06-04 17:20:23 -070036 SKB_GSO_GRE_CSUM |
Eric Dumazet7e3b6e72015-10-24 05:47:44 -070037 SKB_GSO_IPIP |
38 SKB_GSO_SIT)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020039 goto out;
40
Tom Herbert53e50392014-09-20 14:52:30 -070041 if (!skb->encapsulation)
42 goto out;
43
Alexander Duyck2e598af2016-02-05 15:28:01 -080044 if (unlikely(tnl_hlen < sizeof(struct gre_base_hdr)))
45 goto out;
46
47 if (unlikely(!pskb_may_pull(skb, tnl_hlen)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020048 goto out;
49
Daniel Borkmannc50cd352013-07-01 19:24:00 +020050 /* setup inner skb. */
Daniel Borkmannc50cd352013-07-01 19:24:00 +020051 skb->encapsulation = 0;
Alexander Duyck2e598af2016-02-05 15:28:01 -080052 __skb_pull(skb, tnl_hlen);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020053 skb_reset_mac_header(skb);
54 skb_set_network_header(skb, skb_inner_network_offset(skb));
55 skb->mac_len = skb_inner_network_offset(skb);
Alexander Duyck38720352016-02-05 15:28:08 -080056 skb->protocol = skb->inner_protocol;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020057
Alexander Duyck2e598af2016-02-05 15:28:01 -080058 need_csum = !!(skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM);
59 skb->encap_hdr_csum = need_csum;
60
Alexander Duyck22463872016-02-24 16:46:21 -080061 ufo = !!(skb_shinfo(skb)->gso_type & SKB_GSO_UDP);
62
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080063 features &= skb->dev->hw_enc_features;
64
Alexander Duyck22463872016-02-24 16:46:21 -080065 /* The only checksum offload we care about from here on out is the
66 * outer one so strip the existing checksum feature flags based
67 * on the fact that we will be computing our checksum in software.
68 */
69 if (ufo) {
70 features &= ~NETIF_F_CSUM_MASK;
71 if (!need_csum)
72 features |= NETIF_F_HW_CSUM;
73 }
74
Daniel Borkmannc50cd352013-07-01 19:24:00 +020075 /* segment inner packet. */
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080076 segs = skb_mac_gso_segment(skb, features);
Himangi Saraogi5a8dbf02014-07-27 12:36:51 +053077 if (IS_ERR_OR_NULL(segs)) {
Alexander Duyck2e598af2016-02-05 15:28:01 -080078 skb_gso_error_unwind(skb, protocol, tnl_hlen, mac_offset,
79 mac_len);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020080 goto out;
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080081 }
Daniel Borkmannc50cd352013-07-01 19:24:00 +020082
Alexander Duyck2e598af2016-02-05 15:28:01 -080083 outer_hlen = skb_tnl_header_len(skb);
84 gre_offset = outer_hlen - tnl_hlen;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020085 skb = segs;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020086 do {
Alexander Duyck38720352016-02-05 15:28:08 -080087 struct gre_base_hdr *greh;
Alexander Duyck2e598af2016-02-05 15:28:01 -080088 __be32 *pcsum;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020089
Alexander Duyck22463872016-02-24 16:46:21 -080090 /* Set up inner headers if we are offloading inner checksum */
91 if (skb->ip_summed == CHECKSUM_PARTIAL) {
92 skb_reset_inner_headers(skb);
93 skb->encapsulation = 1;
94 }
Alexander Duyckcdbaa0b2013-07-10 17:05:06 -070095
Daniel Borkmannc50cd352013-07-01 19:24:00 +020096 skb->mac_len = mac_len;
97 skb->protocol = protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080098
99 __skb_push(skb, outer_hlen);
100 skb_reset_mac_header(skb);
101 skb_set_network_header(skb, mac_len);
102 skb_set_transport_header(skb, gre_offset);
103
104 if (!need_csum)
105 continue;
106
107 greh = (struct gre_base_hdr *)skb_transport_header(skb);
108 pcsum = (__be32 *)(greh + 1);
109
110 *pcsum = 0;
111 *(__sum16 *)pcsum = gso_make_checksum(skb, 0);
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200112 } while ((skb = skb->next));
113out:
114 return segs;
115}
116
Jerry Chubf5a7552014-01-07 10:23:19 -0800117static struct sk_buff **gre_gro_receive(struct sk_buff **head,
118 struct sk_buff *skb)
119{
120 struct sk_buff **pp = NULL;
121 struct sk_buff *p;
122 const struct gre_base_hdr *greh;
123 unsigned int hlen, grehlen;
124 unsigned int off;
125 int flush = 1;
126 struct packet_offload *ptype;
127 __be16 type;
128
Jesse Grossfac8e0f2016-03-19 09:32:01 -0700129 if (NAPI_GRO_CB(skb)->encap_mark)
130 goto out;
131
132 NAPI_GRO_CB(skb)->encap_mark = 1;
133
Jerry Chubf5a7552014-01-07 10:23:19 -0800134 off = skb_gro_offset(skb);
135 hlen = off + sizeof(*greh);
136 greh = skb_gro_header_fast(skb, off);
137 if (skb_gro_header_hard(skb, hlen)) {
138 greh = skb_gro_header_slow(skb, hlen, off);
139 if (unlikely(!greh))
140 goto out;
141 }
142
143 /* Only support version 0 and K (key), C (csum) flags. Note that
144 * although the support for the S (seq#) flag can be added easily
145 * for GRO, this is problematic for GSO hence can not be enabled
146 * here because a GRO pkt may end up in the forwarding path, thus
147 * requiring GSO support to break it up correctly.
148 */
149 if ((greh->flags & ~(GRE_KEY|GRE_CSUM)) != 0)
150 goto out;
151
152 type = greh->protocol;
153
154 rcu_read_lock();
155 ptype = gro_find_receive_by_type(type);
Ian Morris51456b22015-04-03 09:17:26 +0100156 if (!ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800157 goto out_unlock;
158
159 grehlen = GRE_HEADER_SECTION;
160
161 if (greh->flags & GRE_KEY)
162 grehlen += GRE_HEADER_SECTION;
163
164 if (greh->flags & GRE_CSUM)
165 grehlen += GRE_HEADER_SECTION;
166
167 hlen = off + grehlen;
168 if (skb_gro_header_hard(skb, hlen)) {
169 greh = skb_gro_header_slow(skb, hlen, off);
170 if (unlikely(!greh))
171 goto out_unlock;
172 }
Jerry Chubf5a7552014-01-07 10:23:19 -0800173
Tom Herbert758f75d2014-08-22 13:34:22 -0700174 /* Don't bother verifying checksum if we're going to flush anyway. */
Tom Herbert884d3382014-08-31 15:12:44 -0700175 if ((greh->flags & GRE_CSUM) && !NAPI_GRO_CB(skb)->flush) {
176 if (skb_gro_checksum_simple_validate(skb))
Jerry Chubf5a7552014-01-07 10:23:19 -0800177 goto out_unlock;
Tom Herbert758f75d2014-08-22 13:34:22 -0700178
Tom Herbert884d3382014-08-31 15:12:44 -0700179 skb_gro_checksum_try_convert(skb, IPPROTO_GRE, 0,
180 null_compute_pseudo);
181 }
182
Jerry Chubf5a7552014-01-07 10:23:19 -0800183 for (p = *head; p; p = p->next) {
184 const struct gre_base_hdr *greh2;
185
186 if (!NAPI_GRO_CB(p)->same_flow)
187 continue;
188
189 /* The following checks are needed to ensure only pkts
190 * from the same tunnel are considered for aggregation.
191 * The criteria for "the same tunnel" includes:
192 * 1) same version (we only support version 0 here)
193 * 2) same protocol (we only support ETH_P_IP for now)
194 * 3) same set of flags
195 * 4) same key if the key field is present.
196 */
197 greh2 = (struct gre_base_hdr *)(p->data + off);
198
199 if (greh2->flags != greh->flags ||
200 greh2->protocol != greh->protocol) {
201 NAPI_GRO_CB(p)->same_flow = 0;
202 continue;
203 }
204 if (greh->flags & GRE_KEY) {
205 /* compare keys */
206 if (*(__be32 *)(greh2+1) != *(__be32 *)(greh+1)) {
207 NAPI_GRO_CB(p)->same_flow = 0;
208 continue;
209 }
210 }
211 }
212
213 skb_gro_pull(skb, grehlen);
214
215 /* Adjusted NAPI_GRO_CB(skb)->csum after skb_gro_pull()*/
216 skb_gro_postpull_rcsum(skb, greh, grehlen);
217
218 pp = ptype->callbacks.gro_receive(head, skb);
Alexander Duyckc194cf92016-03-09 09:24:23 -0800219 flush = 0;
Jerry Chubf5a7552014-01-07 10:23:19 -0800220
221out_unlock:
222 rcu_read_unlock();
223out:
224 NAPI_GRO_CB(skb)->flush |= flush;
225
226 return pp;
227}
228
Wei Yongjund10dbad2014-01-09 22:22:05 +0800229static int gre_gro_complete(struct sk_buff *skb, int nhoff)
Jerry Chubf5a7552014-01-07 10:23:19 -0800230{
231 struct gre_base_hdr *greh = (struct gre_base_hdr *)(skb->data + nhoff);
232 struct packet_offload *ptype;
233 unsigned int grehlen = sizeof(*greh);
234 int err = -ENOENT;
235 __be16 type;
236
Jerry Chuc3caf112014-07-14 15:54:46 -0700237 skb->encapsulation = 1;
238 skb_shinfo(skb)->gso_type = SKB_GSO_GRE;
239
Jerry Chubf5a7552014-01-07 10:23:19 -0800240 type = greh->protocol;
241 if (greh->flags & GRE_KEY)
242 grehlen += GRE_HEADER_SECTION;
243
244 if (greh->flags & GRE_CSUM)
245 grehlen += GRE_HEADER_SECTION;
246
247 rcu_read_lock();
248 ptype = gro_find_complete_by_type(type);
Ian Morris00db4122015-04-03 09:17:27 +0100249 if (ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800250 err = ptype->callbacks.gro_complete(skb, nhoff + grehlen);
251
252 rcu_read_unlock();
Tom Herbert6fb2a752014-11-29 09:59:45 -0800253
254 skb_set_inner_mac_header(skb, nhoff + grehlen);
255
Jerry Chubf5a7552014-01-07 10:23:19 -0800256 return err;
257}
258
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200259static const struct net_offload gre_offload = {
260 .callbacks = {
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200261 .gso_segment = gre_gso_segment,
Jerry Chubf5a7552014-01-07 10:23:19 -0800262 .gro_receive = gre_gro_receive,
263 .gro_complete = gre_gro_complete,
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200264 },
265};
266
Eric Dumazet438e38f2014-01-06 14:03:07 -0800267static int __init gre_offload_init(void)
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200268{
269 return inet_add_offload(&gre_offload, IPPROTO_GRE);
270}
Paul Gortmakercf172282014-01-15 11:19:55 -0500271device_initcall(gre_offload_init);