blob: 96e0efecefa6aa2f4bc97c098c08ee6c25f2e11c [file] [log] [blame]
Daniel Borkmannc50cd352013-07-01 19:24:00 +02001/*
2 * IPV4 GSO/GRO offload support
3 * Linux INET implementation
4 *
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version
8 * 2 of the License, or (at your option) any later version.
9 *
10 * GRE GSO support
11 */
12
13#include <linux/skbuff.h>
Paul Gortmakercf172282014-01-15 11:19:55 -050014#include <linux/init.h>
Daniel Borkmannc50cd352013-07-01 19:24:00 +020015#include <net/protocol.h>
16#include <net/gre.h>
17
Daniel Borkmannc50cd352013-07-01 19:24:00 +020018static struct sk_buff *gre_gso_segment(struct sk_buff *skb,
19 netdev_features_t features)
20{
Alexander Duyck2e598af2016-02-05 15:28:01 -080021 int tnl_hlen = skb_inner_mac_header(skb) - skb_transport_header(skb);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020022 struct sk_buff *segs = ERR_PTR(-EINVAL);
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080023 u16 mac_offset = skb->mac_header;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020024 __be16 protocol = skb->protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080025 u16 mac_len = skb->mac_len;
26 int gre_offset, outer_hlen;
Steffen Klassert07b26c92016-09-19 12:58:47 +020027 bool need_csum, ufo, gso_partial;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020028
Tom Herbert53e50392014-09-20 14:52:30 -070029 if (!skb->encapsulation)
30 goto out;
31
Alexander Duyck2e598af2016-02-05 15:28:01 -080032 if (unlikely(tnl_hlen < sizeof(struct gre_base_hdr)))
33 goto out;
34
35 if (unlikely(!pskb_may_pull(skb, tnl_hlen)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020036 goto out;
37
Daniel Borkmannc50cd352013-07-01 19:24:00 +020038 /* setup inner skb. */
Daniel Borkmannc50cd352013-07-01 19:24:00 +020039 skb->encapsulation = 0;
Alexander Duyck5197f342016-03-22 16:18:07 -070040 SKB_GSO_CB(skb)->encap_level = 0;
Alexander Duyck2e598af2016-02-05 15:28:01 -080041 __skb_pull(skb, tnl_hlen);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020042 skb_reset_mac_header(skb);
43 skb_set_network_header(skb, skb_inner_network_offset(skb));
44 skb->mac_len = skb_inner_network_offset(skb);
Alexander Duyck38720352016-02-05 15:28:08 -080045 skb->protocol = skb->inner_protocol;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020046
Alexander Duyck2e598af2016-02-05 15:28:01 -080047 need_csum = !!(skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM);
48 skb->encap_hdr_csum = need_csum;
49
Alexander Duyck22463872016-02-24 16:46:21 -080050 ufo = !!(skb_shinfo(skb)->gso_type & SKB_GSO_UDP);
51
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080052 features &= skb->dev->hw_enc_features;
53
Alexander Duyck22463872016-02-24 16:46:21 -080054 /* The only checksum offload we care about from here on out is the
55 * outer one so strip the existing checksum feature flags based
56 * on the fact that we will be computing our checksum in software.
57 */
58 if (ufo) {
59 features &= ~NETIF_F_CSUM_MASK;
60 if (!need_csum)
61 features |= NETIF_F_HW_CSUM;
62 }
63
Daniel Borkmannc50cd352013-07-01 19:24:00 +020064 /* segment inner packet. */
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080065 segs = skb_mac_gso_segment(skb, features);
Himangi Saraogi5a8dbf02014-07-27 12:36:51 +053066 if (IS_ERR_OR_NULL(segs)) {
Alexander Duyck2e598af2016-02-05 15:28:01 -080067 skb_gso_error_unwind(skb, protocol, tnl_hlen, mac_offset,
68 mac_len);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020069 goto out;
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080070 }
Daniel Borkmannc50cd352013-07-01 19:24:00 +020071
Steffen Klassert07b26c92016-09-19 12:58:47 +020072 gso_partial = !!(skb_shinfo(segs)->gso_type & SKB_GSO_PARTIAL);
73
Alexander Duyck2e598af2016-02-05 15:28:01 -080074 outer_hlen = skb_tnl_header_len(skb);
75 gre_offset = outer_hlen - tnl_hlen;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020076 skb = segs;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020077 do {
Alexander Duyck38720352016-02-05 15:28:08 -080078 struct gre_base_hdr *greh;
Alexander Duyck802ab552016-04-10 21:45:03 -040079 __sum16 *pcsum;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020080
Alexander Duyck22463872016-02-24 16:46:21 -080081 /* Set up inner headers if we are offloading inner checksum */
82 if (skb->ip_summed == CHECKSUM_PARTIAL) {
83 skb_reset_inner_headers(skb);
84 skb->encapsulation = 1;
85 }
Alexander Duyckcdbaa0b2013-07-10 17:05:06 -070086
Daniel Borkmannc50cd352013-07-01 19:24:00 +020087 skb->mac_len = mac_len;
88 skb->protocol = protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080089
90 __skb_push(skb, outer_hlen);
91 skb_reset_mac_header(skb);
92 skb_set_network_header(skb, mac_len);
93 skb_set_transport_header(skb, gre_offset);
94
95 if (!need_csum)
96 continue;
97
98 greh = (struct gre_base_hdr *)skb_transport_header(skb);
Alexander Duyck802ab552016-04-10 21:45:03 -040099 pcsum = (__sum16 *)(greh + 1);
Alexander Duyck2e598af2016-02-05 15:28:01 -0800100
Steffen Klassert07b26c92016-09-19 12:58:47 +0200101 if (gso_partial) {
Alexander Duyck802ab552016-04-10 21:45:03 -0400102 unsigned int partial_adj;
103
104 /* Adjust checksum to account for the fact that
105 * the partial checksum is based on actual size
106 * whereas headers should be based on MSS size.
107 */
108 partial_adj = skb->len + skb_headroom(skb) -
109 SKB_GSO_CB(skb)->data_offset -
110 skb_shinfo(skb)->gso_size;
111 *pcsum = ~csum_fold((__force __wsum)htonl(partial_adj));
112 } else {
113 *pcsum = 0;
114 }
115
116 *(pcsum + 1) = 0;
117 *pcsum = gso_make_checksum(skb, 0);
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200118 } while ((skb = skb->next));
119out:
120 return segs;
121}
122
Jerry Chubf5a7552014-01-07 10:23:19 -0800123static struct sk_buff **gre_gro_receive(struct sk_buff **head,
124 struct sk_buff *skb)
125{
126 struct sk_buff **pp = NULL;
127 struct sk_buff *p;
128 const struct gre_base_hdr *greh;
129 unsigned int hlen, grehlen;
130 unsigned int off;
131 int flush = 1;
132 struct packet_offload *ptype;
133 __be16 type;
134
Jesse Grossfac8e0f2016-03-19 09:32:01 -0700135 if (NAPI_GRO_CB(skb)->encap_mark)
136 goto out;
137
138 NAPI_GRO_CB(skb)->encap_mark = 1;
139
Jerry Chubf5a7552014-01-07 10:23:19 -0800140 off = skb_gro_offset(skb);
141 hlen = off + sizeof(*greh);
142 greh = skb_gro_header_fast(skb, off);
143 if (skb_gro_header_hard(skb, hlen)) {
144 greh = skb_gro_header_slow(skb, hlen, off);
145 if (unlikely(!greh))
146 goto out;
147 }
148
149 /* Only support version 0 and K (key), C (csum) flags. Note that
150 * although the support for the S (seq#) flag can be added easily
151 * for GRO, this is problematic for GSO hence can not be enabled
152 * here because a GRO pkt may end up in the forwarding path, thus
153 * requiring GSO support to break it up correctly.
154 */
155 if ((greh->flags & ~(GRE_KEY|GRE_CSUM)) != 0)
156 goto out;
157
Alexander Duycka0ca1532016-04-05 09:13:39 -0700158 /* We can only support GRE_CSUM if we can track the location of
159 * the GRE header. In the case of FOU/GUE we cannot because the
160 * outer UDP header displaces the GRE header leaving us in a state
161 * of limbo.
162 */
163 if ((greh->flags & GRE_CSUM) && NAPI_GRO_CB(skb)->is_fou)
164 goto out;
165
Jerry Chubf5a7552014-01-07 10:23:19 -0800166 type = greh->protocol;
167
168 rcu_read_lock();
169 ptype = gro_find_receive_by_type(type);
Ian Morris51456b22015-04-03 09:17:26 +0100170 if (!ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800171 goto out_unlock;
172
173 grehlen = GRE_HEADER_SECTION;
174
175 if (greh->flags & GRE_KEY)
176 grehlen += GRE_HEADER_SECTION;
177
178 if (greh->flags & GRE_CSUM)
179 grehlen += GRE_HEADER_SECTION;
180
181 hlen = off + grehlen;
182 if (skb_gro_header_hard(skb, hlen)) {
183 greh = skb_gro_header_slow(skb, hlen, off);
184 if (unlikely(!greh))
185 goto out_unlock;
186 }
Jerry Chubf5a7552014-01-07 10:23:19 -0800187
Tom Herbert758f75d2014-08-22 13:34:22 -0700188 /* Don't bother verifying checksum if we're going to flush anyway. */
Tom Herbert884d3382014-08-31 15:12:44 -0700189 if ((greh->flags & GRE_CSUM) && !NAPI_GRO_CB(skb)->flush) {
190 if (skb_gro_checksum_simple_validate(skb))
Jerry Chubf5a7552014-01-07 10:23:19 -0800191 goto out_unlock;
Tom Herbert758f75d2014-08-22 13:34:22 -0700192
Tom Herbert884d3382014-08-31 15:12:44 -0700193 skb_gro_checksum_try_convert(skb, IPPROTO_GRE, 0,
194 null_compute_pseudo);
195 }
196
Jerry Chubf5a7552014-01-07 10:23:19 -0800197 for (p = *head; p; p = p->next) {
198 const struct gre_base_hdr *greh2;
199
200 if (!NAPI_GRO_CB(p)->same_flow)
201 continue;
202
203 /* The following checks are needed to ensure only pkts
204 * from the same tunnel are considered for aggregation.
205 * The criteria for "the same tunnel" includes:
206 * 1) same version (we only support version 0 here)
207 * 2) same protocol (we only support ETH_P_IP for now)
208 * 3) same set of flags
209 * 4) same key if the key field is present.
210 */
211 greh2 = (struct gre_base_hdr *)(p->data + off);
212
213 if (greh2->flags != greh->flags ||
214 greh2->protocol != greh->protocol) {
215 NAPI_GRO_CB(p)->same_flow = 0;
216 continue;
217 }
218 if (greh->flags & GRE_KEY) {
219 /* compare keys */
220 if (*(__be32 *)(greh2+1) != *(__be32 *)(greh+1)) {
221 NAPI_GRO_CB(p)->same_flow = 0;
222 continue;
223 }
224 }
225 }
226
227 skb_gro_pull(skb, grehlen);
228
229 /* Adjusted NAPI_GRO_CB(skb)->csum after skb_gro_pull()*/
230 skb_gro_postpull_rcsum(skb, greh, grehlen);
231
232 pp = ptype->callbacks.gro_receive(head, skb);
Alexander Duyckc194cf92016-03-09 09:24:23 -0800233 flush = 0;
Jerry Chubf5a7552014-01-07 10:23:19 -0800234
235out_unlock:
236 rcu_read_unlock();
237out:
238 NAPI_GRO_CB(skb)->flush |= flush;
239
240 return pp;
241}
242
Wei Yongjund10dbad2014-01-09 22:22:05 +0800243static int gre_gro_complete(struct sk_buff *skb, int nhoff)
Jerry Chubf5a7552014-01-07 10:23:19 -0800244{
245 struct gre_base_hdr *greh = (struct gre_base_hdr *)(skb->data + nhoff);
246 struct packet_offload *ptype;
247 unsigned int grehlen = sizeof(*greh);
248 int err = -ENOENT;
249 __be16 type;
250
Jerry Chuc3caf112014-07-14 15:54:46 -0700251 skb->encapsulation = 1;
252 skb_shinfo(skb)->gso_type = SKB_GSO_GRE;
253
Jerry Chubf5a7552014-01-07 10:23:19 -0800254 type = greh->protocol;
255 if (greh->flags & GRE_KEY)
256 grehlen += GRE_HEADER_SECTION;
257
258 if (greh->flags & GRE_CSUM)
259 grehlen += GRE_HEADER_SECTION;
260
261 rcu_read_lock();
262 ptype = gro_find_complete_by_type(type);
Ian Morris00db4122015-04-03 09:17:27 +0100263 if (ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800264 err = ptype->callbacks.gro_complete(skb, nhoff + grehlen);
265
266 rcu_read_unlock();
Tom Herbert6fb2a752014-11-29 09:59:45 -0800267
268 skb_set_inner_mac_header(skb, nhoff + grehlen);
269
Jerry Chubf5a7552014-01-07 10:23:19 -0800270 return err;
271}
272
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200273static const struct net_offload gre_offload = {
274 .callbacks = {
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200275 .gso_segment = gre_gso_segment,
Jerry Chubf5a7552014-01-07 10:23:19 -0800276 .gro_receive = gre_gro_receive,
277 .gro_complete = gre_gro_complete,
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200278 },
279};
280
Eric Dumazet438e38f2014-01-06 14:03:07 -0800281static int __init gre_offload_init(void)
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200282{
Alexander Duycke0c20962016-04-14 15:33:58 -0400283 int err;
284
285 err = inet_add_offload(&gre_offload, IPPROTO_GRE);
286#if IS_ENABLED(CONFIG_IPV6)
287 if (err)
288 return err;
289
290 err = inet6_add_offload(&gre_offload, IPPROTO_GRE);
291 if (err)
292 inet_del_offload(&gre_offload, IPPROTO_GRE);
293#endif
294
295 return err;
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200296}
Paul Gortmakercf172282014-01-15 11:19:55 -0500297device_initcall(gre_offload_init);