/*
 *	IPV4 GSO/GRO offload support
 *	Linux INET implementation
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 *
 *	GRE GSO support
 */

#include <linux/skbuff.h>
#include <linux/init.h>
#include <net/protocol.h>
#include <net/gre.h>

Daniel Borkmannc50cd352013-07-01 19:24:00 +020018static struct sk_buff *gre_gso_segment(struct sk_buff *skb,
19 netdev_features_t features)
20{
Alexander Duyck2e598af2016-02-05 15:28:01 -080021 int tnl_hlen = skb_inner_mac_header(skb) - skb_transport_header(skb);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020022 struct sk_buff *segs = ERR_PTR(-EINVAL);
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080023 u16 mac_offset = skb->mac_header;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020024 __be16 protocol = skb->protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080025 u16 mac_len = skb->mac_len;
26 int gre_offset, outer_hlen;
Alexander Duyck22463872016-02-24 16:46:21 -080027 bool need_csum, ufo;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020028
29 if (unlikely(skb_shinfo(skb)->gso_type &
30 ~(SKB_GSO_TCPV4 |
31 SKB_GSO_TCPV6 |
32 SKB_GSO_UDP |
33 SKB_GSO_DODGY |
34 SKB_GSO_TCP_ECN |
Alexander Duyckcbc53e02016-04-10 21:44:51 -040035 SKB_GSO_TCP_FIXEDID |
Eric Dumazetcb32f512013-10-19 11:42:57 -070036 SKB_GSO_GRE |
Tom Herbert4749c092014-06-04 17:20:23 -070037 SKB_GSO_GRE_CSUM |
Eric Dumazet7e3b6e72015-10-24 05:47:44 -070038 SKB_GSO_IPIP |
Alexander Duyck802ab552016-04-10 21:45:03 -040039 SKB_GSO_SIT |
40 SKB_GSO_PARTIAL)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020041 goto out;
42
Tom Herbert53e50392014-09-20 14:52:30 -070043 if (!skb->encapsulation)
44 goto out;
45
Alexander Duyck2e598af2016-02-05 15:28:01 -080046 if (unlikely(tnl_hlen < sizeof(struct gre_base_hdr)))
47 goto out;
48
49 if (unlikely(!pskb_may_pull(skb, tnl_hlen)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020050 goto out;
51
Daniel Borkmannc50cd352013-07-01 19:24:00 +020052 /* setup inner skb. */
Daniel Borkmannc50cd352013-07-01 19:24:00 +020053 skb->encapsulation = 0;
Alexander Duyck5197f342016-03-22 16:18:07 -070054 SKB_GSO_CB(skb)->encap_level = 0;
Alexander Duyck2e598af2016-02-05 15:28:01 -080055 __skb_pull(skb, tnl_hlen);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020056 skb_reset_mac_header(skb);
57 skb_set_network_header(skb, skb_inner_network_offset(skb));
58 skb->mac_len = skb_inner_network_offset(skb);
Alexander Duyck38720352016-02-05 15:28:08 -080059 skb->protocol = skb->inner_protocol;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020060
Alexander Duyck2e598af2016-02-05 15:28:01 -080061 need_csum = !!(skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM);
62 skb->encap_hdr_csum = need_csum;
63
Alexander Duyck22463872016-02-24 16:46:21 -080064 ufo = !!(skb_shinfo(skb)->gso_type & SKB_GSO_UDP);
65
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080066 features &= skb->dev->hw_enc_features;
67
Alexander Duyck22463872016-02-24 16:46:21 -080068 /* The only checksum offload we care about from here on out is the
69 * outer one so strip the existing checksum feature flags based
70 * on the fact that we will be computing our checksum in software.
71 */
72 if (ufo) {
73 features &= ~NETIF_F_CSUM_MASK;
74 if (!need_csum)
75 features |= NETIF_F_HW_CSUM;
76 }
77
Daniel Borkmannc50cd352013-07-01 19:24:00 +020078 /* segment inner packet. */
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080079 segs = skb_mac_gso_segment(skb, features);
Himangi Saraogi5a8dbf02014-07-27 12:36:51 +053080 if (IS_ERR_OR_NULL(segs)) {
Alexander Duyck2e598af2016-02-05 15:28:01 -080081 skb_gso_error_unwind(skb, protocol, tnl_hlen, mac_offset,
82 mac_len);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020083 goto out;
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080084 }
Daniel Borkmannc50cd352013-07-01 19:24:00 +020085
Alexander Duyck2e598af2016-02-05 15:28:01 -080086 outer_hlen = skb_tnl_header_len(skb);
87 gre_offset = outer_hlen - tnl_hlen;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020088 skb = segs;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020089 do {
Alexander Duyck38720352016-02-05 15:28:08 -080090 struct gre_base_hdr *greh;
Alexander Duyck802ab552016-04-10 21:45:03 -040091 __sum16 *pcsum;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020092
Alexander Duyck22463872016-02-24 16:46:21 -080093 /* Set up inner headers if we are offloading inner checksum */
94 if (skb->ip_summed == CHECKSUM_PARTIAL) {
95 skb_reset_inner_headers(skb);
96 skb->encapsulation = 1;
97 }
Alexander Duyckcdbaa0b2013-07-10 17:05:06 -070098
Daniel Borkmannc50cd352013-07-01 19:24:00 +020099 skb->mac_len = mac_len;
100 skb->protocol = protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -0800101
102 __skb_push(skb, outer_hlen);
103 skb_reset_mac_header(skb);
104 skb_set_network_header(skb, mac_len);
105 skb_set_transport_header(skb, gre_offset);
106
107 if (!need_csum)
108 continue;
109
110 greh = (struct gre_base_hdr *)skb_transport_header(skb);
Alexander Duyck802ab552016-04-10 21:45:03 -0400111 pcsum = (__sum16 *)(greh + 1);
Alexander Duyck2e598af2016-02-05 15:28:01 -0800112
Alexander Duyck802ab552016-04-10 21:45:03 -0400113 if (skb_is_gso(skb)) {
114 unsigned int partial_adj;
115
116 /* Adjust checksum to account for the fact that
117 * the partial checksum is based on actual size
118 * whereas headers should be based on MSS size.
119 */
120 partial_adj = skb->len + skb_headroom(skb) -
121 SKB_GSO_CB(skb)->data_offset -
122 skb_shinfo(skb)->gso_size;
123 *pcsum = ~csum_fold((__force __wsum)htonl(partial_adj));
124 } else {
125 *pcsum = 0;
126 }
127
128 *(pcsum + 1) = 0;
129 *pcsum = gso_make_checksum(skb, 0);
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200130 } while ((skb = skb->next));
131out:
132 return segs;
133}
134
Jerry Chubf5a7552014-01-07 10:23:19 -0800135static struct sk_buff **gre_gro_receive(struct sk_buff **head,
136 struct sk_buff *skb)
137{
138 struct sk_buff **pp = NULL;
139 struct sk_buff *p;
140 const struct gre_base_hdr *greh;
141 unsigned int hlen, grehlen;
142 unsigned int off;
143 int flush = 1;
144 struct packet_offload *ptype;
145 __be16 type;
146
Jesse Grossfac8e0f2016-03-19 09:32:01 -0700147 if (NAPI_GRO_CB(skb)->encap_mark)
148 goto out;
149
150 NAPI_GRO_CB(skb)->encap_mark = 1;
151
Jerry Chubf5a7552014-01-07 10:23:19 -0800152 off = skb_gro_offset(skb);
153 hlen = off + sizeof(*greh);
154 greh = skb_gro_header_fast(skb, off);
155 if (skb_gro_header_hard(skb, hlen)) {
156 greh = skb_gro_header_slow(skb, hlen, off);
157 if (unlikely(!greh))
158 goto out;
159 }
160
161 /* Only support version 0 and K (key), C (csum) flags. Note that
162 * although the support for the S (seq#) flag can be added easily
163 * for GRO, this is problematic for GSO hence can not be enabled
164 * here because a GRO pkt may end up in the forwarding path, thus
165 * requiring GSO support to break it up correctly.
166 */
167 if ((greh->flags & ~(GRE_KEY|GRE_CSUM)) != 0)
168 goto out;
169
Alexander Duycka0ca1532016-04-05 09:13:39 -0700170 /* We can only support GRE_CSUM if we can track the location of
171 * the GRE header. In the case of FOU/GUE we cannot because the
172 * outer UDP header displaces the GRE header leaving us in a state
173 * of limbo.
174 */
175 if ((greh->flags & GRE_CSUM) && NAPI_GRO_CB(skb)->is_fou)
176 goto out;
177
Jerry Chubf5a7552014-01-07 10:23:19 -0800178 type = greh->protocol;
179
180 rcu_read_lock();
181 ptype = gro_find_receive_by_type(type);
Ian Morris51456b22015-04-03 09:17:26 +0100182 if (!ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800183 goto out_unlock;
184
185 grehlen = GRE_HEADER_SECTION;
186
187 if (greh->flags & GRE_KEY)
188 grehlen += GRE_HEADER_SECTION;
189
190 if (greh->flags & GRE_CSUM)
191 grehlen += GRE_HEADER_SECTION;
192
193 hlen = off + grehlen;
194 if (skb_gro_header_hard(skb, hlen)) {
195 greh = skb_gro_header_slow(skb, hlen, off);
196 if (unlikely(!greh))
197 goto out_unlock;
198 }
Jerry Chubf5a7552014-01-07 10:23:19 -0800199
Tom Herbert758f75d2014-08-22 13:34:22 -0700200 /* Don't bother verifying checksum if we're going to flush anyway. */
Tom Herbert884d3382014-08-31 15:12:44 -0700201 if ((greh->flags & GRE_CSUM) && !NAPI_GRO_CB(skb)->flush) {
202 if (skb_gro_checksum_simple_validate(skb))
Jerry Chubf5a7552014-01-07 10:23:19 -0800203 goto out_unlock;
Tom Herbert758f75d2014-08-22 13:34:22 -0700204
Tom Herbert884d3382014-08-31 15:12:44 -0700205 skb_gro_checksum_try_convert(skb, IPPROTO_GRE, 0,
206 null_compute_pseudo);
207 }
208
Jerry Chubf5a7552014-01-07 10:23:19 -0800209 for (p = *head; p; p = p->next) {
210 const struct gre_base_hdr *greh2;
211
212 if (!NAPI_GRO_CB(p)->same_flow)
213 continue;
214
215 /* The following checks are needed to ensure only pkts
216 * from the same tunnel are considered for aggregation.
217 * The criteria for "the same tunnel" includes:
218 * 1) same version (we only support version 0 here)
219 * 2) same protocol (we only support ETH_P_IP for now)
220 * 3) same set of flags
221 * 4) same key if the key field is present.
222 */
223 greh2 = (struct gre_base_hdr *)(p->data + off);
224
225 if (greh2->flags != greh->flags ||
226 greh2->protocol != greh->protocol) {
227 NAPI_GRO_CB(p)->same_flow = 0;
228 continue;
229 }
230 if (greh->flags & GRE_KEY) {
231 /* compare keys */
232 if (*(__be32 *)(greh2+1) != *(__be32 *)(greh+1)) {
233 NAPI_GRO_CB(p)->same_flow = 0;
234 continue;
235 }
236 }
237 }
238
239 skb_gro_pull(skb, grehlen);
240
241 /* Adjusted NAPI_GRO_CB(skb)->csum after skb_gro_pull()*/
242 skb_gro_postpull_rcsum(skb, greh, grehlen);
243
244 pp = ptype->callbacks.gro_receive(head, skb);
Alexander Duyckc194cf92016-03-09 09:24:23 -0800245 flush = 0;
Jerry Chubf5a7552014-01-07 10:23:19 -0800246
247out_unlock:
248 rcu_read_unlock();
249out:
250 NAPI_GRO_CB(skb)->flush |= flush;
251
252 return pp;
253}
254
Wei Yongjund10dbad2014-01-09 22:22:05 +0800255static int gre_gro_complete(struct sk_buff *skb, int nhoff)
Jerry Chubf5a7552014-01-07 10:23:19 -0800256{
257 struct gre_base_hdr *greh = (struct gre_base_hdr *)(skb->data + nhoff);
258 struct packet_offload *ptype;
259 unsigned int grehlen = sizeof(*greh);
260 int err = -ENOENT;
261 __be16 type;
262
Jerry Chuc3caf112014-07-14 15:54:46 -0700263 skb->encapsulation = 1;
264 skb_shinfo(skb)->gso_type = SKB_GSO_GRE;
265
Jerry Chubf5a7552014-01-07 10:23:19 -0800266 type = greh->protocol;
267 if (greh->flags & GRE_KEY)
268 grehlen += GRE_HEADER_SECTION;
269
270 if (greh->flags & GRE_CSUM)
271 grehlen += GRE_HEADER_SECTION;
272
273 rcu_read_lock();
274 ptype = gro_find_complete_by_type(type);
Ian Morris00db4122015-04-03 09:17:27 +0100275 if (ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800276 err = ptype->callbacks.gro_complete(skb, nhoff + grehlen);
277
278 rcu_read_unlock();
Tom Herbert6fb2a752014-11-29 09:59:45 -0800279
280 skb_set_inner_mac_header(skb, nhoff + grehlen);
281
Jerry Chubf5a7552014-01-07 10:23:19 -0800282 return err;
283}
284
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200285static const struct net_offload gre_offload = {
286 .callbacks = {
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200287 .gso_segment = gre_gso_segment,
Jerry Chubf5a7552014-01-07 10:23:19 -0800288 .gro_receive = gre_gro_receive,
289 .gro_complete = gre_gro_complete,
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200290 },
291};
292
Eric Dumazet438e38f2014-01-06 14:03:07 -0800293static int __init gre_offload_init(void)
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200294{
295 return inet_add_offload(&gre_offload, IPPROTO_GRE);
296}
Paul Gortmakercf172282014-01-15 11:19:55 -0500297device_initcall(gre_offload_init);