blob: ecd1e09dbbf137d44996a4a83aec2c13b48d09f9 [file] [log] [blame]
/*
 *	IPV4 GSO/GRO offload support
 *	Linux INET implementation
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 *
 *	GRE GSO support
 */
12
13#include <linux/skbuff.h>
Paul Gortmakercf172282014-01-15 11:19:55 -050014#include <linux/init.h>
Daniel Borkmannc50cd352013-07-01 19:24:00 +020015#include <net/protocol.h>
16#include <net/gre.h>
17
Daniel Borkmannc50cd352013-07-01 19:24:00 +020018static struct sk_buff *gre_gso_segment(struct sk_buff *skb,
19 netdev_features_t features)
20{
Alexander Duyck2e598af2016-02-05 15:28:01 -080021 int tnl_hlen = skb_inner_mac_header(skb) - skb_transport_header(skb);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020022 struct sk_buff *segs = ERR_PTR(-EINVAL);
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080023 u16 mac_offset = skb->mac_header;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020024 __be16 protocol = skb->protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080025 u16 mac_len = skb->mac_len;
26 int gre_offset, outer_hlen;
Alexander Duyck22463872016-02-24 16:46:21 -080027 bool need_csum, ufo;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020028
Tom Herbert53e50392014-09-20 14:52:30 -070029 if (!skb->encapsulation)
30 goto out;
31
Alexander Duyck2e598af2016-02-05 15:28:01 -080032 if (unlikely(tnl_hlen < sizeof(struct gre_base_hdr)))
33 goto out;
34
35 if (unlikely(!pskb_may_pull(skb, tnl_hlen)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020036 goto out;
37
Daniel Borkmannc50cd352013-07-01 19:24:00 +020038 /* setup inner skb. */
Daniel Borkmannc50cd352013-07-01 19:24:00 +020039 skb->encapsulation = 0;
Alexander Duyck5197f342016-03-22 16:18:07 -070040 SKB_GSO_CB(skb)->encap_level = 0;
Alexander Duyck2e598af2016-02-05 15:28:01 -080041 __skb_pull(skb, tnl_hlen);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020042 skb_reset_mac_header(skb);
43 skb_set_network_header(skb, skb_inner_network_offset(skb));
44 skb->mac_len = skb_inner_network_offset(skb);
Alexander Duyck38720352016-02-05 15:28:08 -080045 skb->protocol = skb->inner_protocol;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020046
Alexander Duyck2e598af2016-02-05 15:28:01 -080047 need_csum = !!(skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM);
48 skb->encap_hdr_csum = need_csum;
49
Alexander Duyck22463872016-02-24 16:46:21 -080050 ufo = !!(skb_shinfo(skb)->gso_type & SKB_GSO_UDP);
51
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080052 features &= skb->dev->hw_enc_features;
53
Alexander Duyck22463872016-02-24 16:46:21 -080054 /* The only checksum offload we care about from here on out is the
55 * outer one so strip the existing checksum feature flags based
56 * on the fact that we will be computing our checksum in software.
57 */
58 if (ufo) {
59 features &= ~NETIF_F_CSUM_MASK;
60 if (!need_csum)
61 features |= NETIF_F_HW_CSUM;
62 }
63
Daniel Borkmannc50cd352013-07-01 19:24:00 +020064 /* segment inner packet. */
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080065 segs = skb_mac_gso_segment(skb, features);
Himangi Saraogi5a8dbf02014-07-27 12:36:51 +053066 if (IS_ERR_OR_NULL(segs)) {
Alexander Duyck2e598af2016-02-05 15:28:01 -080067 skb_gso_error_unwind(skb, protocol, tnl_hlen, mac_offset,
68 mac_len);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020069 goto out;
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080070 }
Daniel Borkmannc50cd352013-07-01 19:24:00 +020071
Alexander Duyck2e598af2016-02-05 15:28:01 -080072 outer_hlen = skb_tnl_header_len(skb);
73 gre_offset = outer_hlen - tnl_hlen;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020074 skb = segs;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020075 do {
Alexander Duyck38720352016-02-05 15:28:08 -080076 struct gre_base_hdr *greh;
Alexander Duyck802ab552016-04-10 21:45:03 -040077 __sum16 *pcsum;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020078
Alexander Duyck22463872016-02-24 16:46:21 -080079 /* Set up inner headers if we are offloading inner checksum */
80 if (skb->ip_summed == CHECKSUM_PARTIAL) {
81 skb_reset_inner_headers(skb);
82 skb->encapsulation = 1;
83 }
Alexander Duyckcdbaa0b2013-07-10 17:05:06 -070084
Daniel Borkmannc50cd352013-07-01 19:24:00 +020085 skb->mac_len = mac_len;
86 skb->protocol = protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080087
88 __skb_push(skb, outer_hlen);
89 skb_reset_mac_header(skb);
90 skb_set_network_header(skb, mac_len);
91 skb_set_transport_header(skb, gre_offset);
92
93 if (!need_csum)
94 continue;
95
96 greh = (struct gre_base_hdr *)skb_transport_header(skb);
Alexander Duyck802ab552016-04-10 21:45:03 -040097 pcsum = (__sum16 *)(greh + 1);
Alexander Duyck2e598af2016-02-05 15:28:01 -080098
Alexander Duyck802ab552016-04-10 21:45:03 -040099 if (skb_is_gso(skb)) {
100 unsigned int partial_adj;
101
102 /* Adjust checksum to account for the fact that
103 * the partial checksum is based on actual size
104 * whereas headers should be based on MSS size.
105 */
106 partial_adj = skb->len + skb_headroom(skb) -
107 SKB_GSO_CB(skb)->data_offset -
108 skb_shinfo(skb)->gso_size;
109 *pcsum = ~csum_fold((__force __wsum)htonl(partial_adj));
110 } else {
111 *pcsum = 0;
112 }
113
114 *(pcsum + 1) = 0;
115 *pcsum = gso_make_checksum(skb, 0);
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200116 } while ((skb = skb->next));
117out:
118 return segs;
119}
120
Jerry Chubf5a7552014-01-07 10:23:19 -0800121static struct sk_buff **gre_gro_receive(struct sk_buff **head,
122 struct sk_buff *skb)
123{
124 struct sk_buff **pp = NULL;
125 struct sk_buff *p;
126 const struct gre_base_hdr *greh;
127 unsigned int hlen, grehlen;
128 unsigned int off;
129 int flush = 1;
130 struct packet_offload *ptype;
131 __be16 type;
132
Jesse Grossfac8e0f2016-03-19 09:32:01 -0700133 if (NAPI_GRO_CB(skb)->encap_mark)
134 goto out;
135
136 NAPI_GRO_CB(skb)->encap_mark = 1;
137
Jerry Chubf5a7552014-01-07 10:23:19 -0800138 off = skb_gro_offset(skb);
139 hlen = off + sizeof(*greh);
140 greh = skb_gro_header_fast(skb, off);
141 if (skb_gro_header_hard(skb, hlen)) {
142 greh = skb_gro_header_slow(skb, hlen, off);
143 if (unlikely(!greh))
144 goto out;
145 }
146
147 /* Only support version 0 and K (key), C (csum) flags. Note that
148 * although the support for the S (seq#) flag can be added easily
149 * for GRO, this is problematic for GSO hence can not be enabled
150 * here because a GRO pkt may end up in the forwarding path, thus
151 * requiring GSO support to break it up correctly.
152 */
153 if ((greh->flags & ~(GRE_KEY|GRE_CSUM)) != 0)
154 goto out;
155
Alexander Duycka0ca1532016-04-05 09:13:39 -0700156 /* We can only support GRE_CSUM if we can track the location of
157 * the GRE header. In the case of FOU/GUE we cannot because the
158 * outer UDP header displaces the GRE header leaving us in a state
159 * of limbo.
160 */
161 if ((greh->flags & GRE_CSUM) && NAPI_GRO_CB(skb)->is_fou)
162 goto out;
163
Jerry Chubf5a7552014-01-07 10:23:19 -0800164 type = greh->protocol;
165
166 rcu_read_lock();
167 ptype = gro_find_receive_by_type(type);
Ian Morris51456b22015-04-03 09:17:26 +0100168 if (!ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800169 goto out_unlock;
170
171 grehlen = GRE_HEADER_SECTION;
172
173 if (greh->flags & GRE_KEY)
174 grehlen += GRE_HEADER_SECTION;
175
176 if (greh->flags & GRE_CSUM)
177 grehlen += GRE_HEADER_SECTION;
178
179 hlen = off + grehlen;
180 if (skb_gro_header_hard(skb, hlen)) {
181 greh = skb_gro_header_slow(skb, hlen, off);
182 if (unlikely(!greh))
183 goto out_unlock;
184 }
Jerry Chubf5a7552014-01-07 10:23:19 -0800185
Tom Herbert758f75d2014-08-22 13:34:22 -0700186 /* Don't bother verifying checksum if we're going to flush anyway. */
Tom Herbert884d3382014-08-31 15:12:44 -0700187 if ((greh->flags & GRE_CSUM) && !NAPI_GRO_CB(skb)->flush) {
188 if (skb_gro_checksum_simple_validate(skb))
Jerry Chubf5a7552014-01-07 10:23:19 -0800189 goto out_unlock;
Tom Herbert758f75d2014-08-22 13:34:22 -0700190
Tom Herbert884d3382014-08-31 15:12:44 -0700191 skb_gro_checksum_try_convert(skb, IPPROTO_GRE, 0,
192 null_compute_pseudo);
193 }
194
Jerry Chubf5a7552014-01-07 10:23:19 -0800195 for (p = *head; p; p = p->next) {
196 const struct gre_base_hdr *greh2;
197
198 if (!NAPI_GRO_CB(p)->same_flow)
199 continue;
200
201 /* The following checks are needed to ensure only pkts
202 * from the same tunnel are considered for aggregation.
203 * The criteria for "the same tunnel" includes:
204 * 1) same version (we only support version 0 here)
205 * 2) same protocol (we only support ETH_P_IP for now)
206 * 3) same set of flags
207 * 4) same key if the key field is present.
208 */
209 greh2 = (struct gre_base_hdr *)(p->data + off);
210
211 if (greh2->flags != greh->flags ||
212 greh2->protocol != greh->protocol) {
213 NAPI_GRO_CB(p)->same_flow = 0;
214 continue;
215 }
216 if (greh->flags & GRE_KEY) {
217 /* compare keys */
218 if (*(__be32 *)(greh2+1) != *(__be32 *)(greh+1)) {
219 NAPI_GRO_CB(p)->same_flow = 0;
220 continue;
221 }
222 }
223 }
224
225 skb_gro_pull(skb, grehlen);
226
227 /* Adjusted NAPI_GRO_CB(skb)->csum after skb_gro_pull()*/
228 skb_gro_postpull_rcsum(skb, greh, grehlen);
229
230 pp = ptype->callbacks.gro_receive(head, skb);
Alexander Duyckc194cf92016-03-09 09:24:23 -0800231 flush = 0;
Jerry Chubf5a7552014-01-07 10:23:19 -0800232
233out_unlock:
234 rcu_read_unlock();
235out:
236 NAPI_GRO_CB(skb)->flush |= flush;
237
238 return pp;
239}
240
Wei Yongjund10dbad2014-01-09 22:22:05 +0800241static int gre_gro_complete(struct sk_buff *skb, int nhoff)
Jerry Chubf5a7552014-01-07 10:23:19 -0800242{
243 struct gre_base_hdr *greh = (struct gre_base_hdr *)(skb->data + nhoff);
244 struct packet_offload *ptype;
245 unsigned int grehlen = sizeof(*greh);
246 int err = -ENOENT;
247 __be16 type;
248
Jerry Chuc3caf112014-07-14 15:54:46 -0700249 skb->encapsulation = 1;
250 skb_shinfo(skb)->gso_type = SKB_GSO_GRE;
251
Jerry Chubf5a7552014-01-07 10:23:19 -0800252 type = greh->protocol;
253 if (greh->flags & GRE_KEY)
254 grehlen += GRE_HEADER_SECTION;
255
256 if (greh->flags & GRE_CSUM)
257 grehlen += GRE_HEADER_SECTION;
258
259 rcu_read_lock();
260 ptype = gro_find_complete_by_type(type);
Ian Morris00db4122015-04-03 09:17:27 +0100261 if (ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800262 err = ptype->callbacks.gro_complete(skb, nhoff + grehlen);
263
264 rcu_read_unlock();
Tom Herbert6fb2a752014-11-29 09:59:45 -0800265
266 skb_set_inner_mac_header(skb, nhoff + grehlen);
267
Jerry Chubf5a7552014-01-07 10:23:19 -0800268 return err;
269}
270
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200271static const struct net_offload gre_offload = {
272 .callbacks = {
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200273 .gso_segment = gre_gso_segment,
Jerry Chubf5a7552014-01-07 10:23:19 -0800274 .gro_receive = gre_gro_receive,
275 .gro_complete = gre_gro_complete,
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200276 },
277};
278
Eric Dumazet438e38f2014-01-06 14:03:07 -0800279static int __init gre_offload_init(void)
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200280{
Alexander Duycke0c20962016-04-14 15:33:58 -0400281 int err;
282
283 err = inet_add_offload(&gre_offload, IPPROTO_GRE);
284#if IS_ENABLED(CONFIG_IPV6)
285 if (err)
286 return err;
287
288 err = inet6_add_offload(&gre_offload, IPPROTO_GRE);
289 if (err)
290 inet_del_offload(&gre_offload, IPPROTO_GRE);
291#endif
292
293 return err;
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200294}
Paul Gortmakercf172282014-01-15 11:19:55 -0500295device_initcall(gre_offload_init);