blob: 6a5bd43178666eed954c4ee6f22837059fad470d [file] [log] [blame]
/*
 * IPV4 GSO/GRO offload support
 * Linux INET implementation
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * GRE GSO support
 */
12
13#include <linux/skbuff.h>
Paul Gortmakercf172282014-01-15 11:19:55 -050014#include <linux/init.h>
Daniel Borkmannc50cd352013-07-01 19:24:00 +020015#include <net/protocol.h>
16#include <net/gre.h>
17
Daniel Borkmannc50cd352013-07-01 19:24:00 +020018static struct sk_buff *gre_gso_segment(struct sk_buff *skb,
19 netdev_features_t features)
20{
Alexander Duyck2e598af2016-02-05 15:28:01 -080021 int tnl_hlen = skb_inner_mac_header(skb) - skb_transport_header(skb);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020022 struct sk_buff *segs = ERR_PTR(-EINVAL);
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080023 u16 mac_offset = skb->mac_header;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020024 __be16 protocol = skb->protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080025 u16 mac_len = skb->mac_len;
26 int gre_offset, outer_hlen;
Alexander Duyck22463872016-02-24 16:46:21 -080027 bool need_csum, ufo;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020028
29 if (unlikely(skb_shinfo(skb)->gso_type &
30 ~(SKB_GSO_TCPV4 |
31 SKB_GSO_TCPV6 |
32 SKB_GSO_UDP |
33 SKB_GSO_DODGY |
34 SKB_GSO_TCP_ECN |
Eric Dumazetcb32f512013-10-19 11:42:57 -070035 SKB_GSO_GRE |
Tom Herbert4749c092014-06-04 17:20:23 -070036 SKB_GSO_GRE_CSUM |
Eric Dumazet7e3b6e72015-10-24 05:47:44 -070037 SKB_GSO_IPIP |
38 SKB_GSO_SIT)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020039 goto out;
40
Tom Herbert53e50392014-09-20 14:52:30 -070041 if (!skb->encapsulation)
42 goto out;
43
Alexander Duyck2e598af2016-02-05 15:28:01 -080044 if (unlikely(tnl_hlen < sizeof(struct gre_base_hdr)))
45 goto out;
46
47 if (unlikely(!pskb_may_pull(skb, tnl_hlen)))
Daniel Borkmannc50cd352013-07-01 19:24:00 +020048 goto out;
49
Daniel Borkmannc50cd352013-07-01 19:24:00 +020050 /* setup inner skb. */
Daniel Borkmannc50cd352013-07-01 19:24:00 +020051 skb->encapsulation = 0;
Alexander Duyck5197f342016-03-22 16:18:07 -070052 SKB_GSO_CB(skb)->encap_level = 0;
Alexander Duyck2e598af2016-02-05 15:28:01 -080053 __skb_pull(skb, tnl_hlen);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020054 skb_reset_mac_header(skb);
55 skb_set_network_header(skb, skb_inner_network_offset(skb));
56 skb->mac_len = skb_inner_network_offset(skb);
Alexander Duyck38720352016-02-05 15:28:08 -080057 skb->protocol = skb->inner_protocol;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020058
Alexander Duyck2e598af2016-02-05 15:28:01 -080059 need_csum = !!(skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM);
60 skb->encap_hdr_csum = need_csum;
61
Alexander Duyck22463872016-02-24 16:46:21 -080062 ufo = !!(skb_shinfo(skb)->gso_type & SKB_GSO_UDP);
63
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080064 features &= skb->dev->hw_enc_features;
65
Alexander Duyck22463872016-02-24 16:46:21 -080066 /* The only checksum offload we care about from here on out is the
67 * outer one so strip the existing checksum feature flags based
68 * on the fact that we will be computing our checksum in software.
69 */
70 if (ufo) {
71 features &= ~NETIF_F_CSUM_MASK;
72 if (!need_csum)
73 features |= NETIF_F_HW_CSUM;
74 }
75
Daniel Borkmannc50cd352013-07-01 19:24:00 +020076 /* segment inner packet. */
Alexander Duyckbef3c6c2016-02-05 15:27:31 -080077 segs = skb_mac_gso_segment(skb, features);
Himangi Saraogi5a8dbf02014-07-27 12:36:51 +053078 if (IS_ERR_OR_NULL(segs)) {
Alexander Duyck2e598af2016-02-05 15:28:01 -080079 skb_gso_error_unwind(skb, protocol, tnl_hlen, mac_offset,
80 mac_len);
Daniel Borkmannc50cd352013-07-01 19:24:00 +020081 goto out;
Wei-Chun Chao7a7ffba2013-12-26 13:10:22 -080082 }
Daniel Borkmannc50cd352013-07-01 19:24:00 +020083
Alexander Duyck2e598af2016-02-05 15:28:01 -080084 outer_hlen = skb_tnl_header_len(skb);
85 gre_offset = outer_hlen - tnl_hlen;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020086 skb = segs;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020087 do {
Alexander Duyck38720352016-02-05 15:28:08 -080088 struct gre_base_hdr *greh;
Alexander Duyck2e598af2016-02-05 15:28:01 -080089 __be32 *pcsum;
Daniel Borkmannc50cd352013-07-01 19:24:00 +020090
Alexander Duyck22463872016-02-24 16:46:21 -080091 /* Set up inner headers if we are offloading inner checksum */
92 if (skb->ip_summed == CHECKSUM_PARTIAL) {
93 skb_reset_inner_headers(skb);
94 skb->encapsulation = 1;
95 }
Alexander Duyckcdbaa0b2013-07-10 17:05:06 -070096
Daniel Borkmannc50cd352013-07-01 19:24:00 +020097 skb->mac_len = mac_len;
98 skb->protocol = protocol;
Alexander Duyck2e598af2016-02-05 15:28:01 -080099
100 __skb_push(skb, outer_hlen);
101 skb_reset_mac_header(skb);
102 skb_set_network_header(skb, mac_len);
103 skb_set_transport_header(skb, gre_offset);
104
105 if (!need_csum)
106 continue;
107
108 greh = (struct gre_base_hdr *)skb_transport_header(skb);
109 pcsum = (__be32 *)(greh + 1);
110
111 *pcsum = 0;
112 *(__sum16 *)pcsum = gso_make_checksum(skb, 0);
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200113 } while ((skb = skb->next));
114out:
115 return segs;
116}
117
Jerry Chubf5a7552014-01-07 10:23:19 -0800118static struct sk_buff **gre_gro_receive(struct sk_buff **head,
119 struct sk_buff *skb)
120{
121 struct sk_buff **pp = NULL;
122 struct sk_buff *p;
123 const struct gre_base_hdr *greh;
124 unsigned int hlen, grehlen;
125 unsigned int off;
126 int flush = 1;
127 struct packet_offload *ptype;
128 __be16 type;
129
Jesse Grossfac8e0f2016-03-19 09:32:01 -0700130 if (NAPI_GRO_CB(skb)->encap_mark)
131 goto out;
132
133 NAPI_GRO_CB(skb)->encap_mark = 1;
134
Jerry Chubf5a7552014-01-07 10:23:19 -0800135 off = skb_gro_offset(skb);
136 hlen = off + sizeof(*greh);
137 greh = skb_gro_header_fast(skb, off);
138 if (skb_gro_header_hard(skb, hlen)) {
139 greh = skb_gro_header_slow(skb, hlen, off);
140 if (unlikely(!greh))
141 goto out;
142 }
143
144 /* Only support version 0 and K (key), C (csum) flags. Note that
145 * although the support for the S (seq#) flag can be added easily
146 * for GRO, this is problematic for GSO hence can not be enabled
147 * here because a GRO pkt may end up in the forwarding path, thus
148 * requiring GSO support to break it up correctly.
149 */
150 if ((greh->flags & ~(GRE_KEY|GRE_CSUM)) != 0)
151 goto out;
152
Alexander Duycka0ca1532016-04-05 09:13:39 -0700153 /* We can only support GRE_CSUM if we can track the location of
154 * the GRE header. In the case of FOU/GUE we cannot because the
155 * outer UDP header displaces the GRE header leaving us in a state
156 * of limbo.
157 */
158 if ((greh->flags & GRE_CSUM) && NAPI_GRO_CB(skb)->is_fou)
159 goto out;
160
Jerry Chubf5a7552014-01-07 10:23:19 -0800161 type = greh->protocol;
162
163 rcu_read_lock();
164 ptype = gro_find_receive_by_type(type);
Ian Morris51456b22015-04-03 09:17:26 +0100165 if (!ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800166 goto out_unlock;
167
168 grehlen = GRE_HEADER_SECTION;
169
170 if (greh->flags & GRE_KEY)
171 grehlen += GRE_HEADER_SECTION;
172
173 if (greh->flags & GRE_CSUM)
174 grehlen += GRE_HEADER_SECTION;
175
176 hlen = off + grehlen;
177 if (skb_gro_header_hard(skb, hlen)) {
178 greh = skb_gro_header_slow(skb, hlen, off);
179 if (unlikely(!greh))
180 goto out_unlock;
181 }
Jerry Chubf5a7552014-01-07 10:23:19 -0800182
Tom Herbert758f75d2014-08-22 13:34:22 -0700183 /* Don't bother verifying checksum if we're going to flush anyway. */
Tom Herbert884d3382014-08-31 15:12:44 -0700184 if ((greh->flags & GRE_CSUM) && !NAPI_GRO_CB(skb)->flush) {
185 if (skb_gro_checksum_simple_validate(skb))
Jerry Chubf5a7552014-01-07 10:23:19 -0800186 goto out_unlock;
Tom Herbert758f75d2014-08-22 13:34:22 -0700187
Tom Herbert884d3382014-08-31 15:12:44 -0700188 skb_gro_checksum_try_convert(skb, IPPROTO_GRE, 0,
189 null_compute_pseudo);
190 }
191
Jerry Chubf5a7552014-01-07 10:23:19 -0800192 for (p = *head; p; p = p->next) {
193 const struct gre_base_hdr *greh2;
194
195 if (!NAPI_GRO_CB(p)->same_flow)
196 continue;
197
198 /* The following checks are needed to ensure only pkts
199 * from the same tunnel are considered for aggregation.
200 * The criteria for "the same tunnel" includes:
201 * 1) same version (we only support version 0 here)
202 * 2) same protocol (we only support ETH_P_IP for now)
203 * 3) same set of flags
204 * 4) same key if the key field is present.
205 */
206 greh2 = (struct gre_base_hdr *)(p->data + off);
207
208 if (greh2->flags != greh->flags ||
209 greh2->protocol != greh->protocol) {
210 NAPI_GRO_CB(p)->same_flow = 0;
211 continue;
212 }
213 if (greh->flags & GRE_KEY) {
214 /* compare keys */
215 if (*(__be32 *)(greh2+1) != *(__be32 *)(greh+1)) {
216 NAPI_GRO_CB(p)->same_flow = 0;
217 continue;
218 }
219 }
220 }
221
222 skb_gro_pull(skb, grehlen);
223
224 /* Adjusted NAPI_GRO_CB(skb)->csum after skb_gro_pull()*/
225 skb_gro_postpull_rcsum(skb, greh, grehlen);
226
227 pp = ptype->callbacks.gro_receive(head, skb);
Alexander Duyckc194cf92016-03-09 09:24:23 -0800228 flush = 0;
Jerry Chubf5a7552014-01-07 10:23:19 -0800229
230out_unlock:
231 rcu_read_unlock();
232out:
233 NAPI_GRO_CB(skb)->flush |= flush;
234
235 return pp;
236}
237
Wei Yongjund10dbad2014-01-09 22:22:05 +0800238static int gre_gro_complete(struct sk_buff *skb, int nhoff)
Jerry Chubf5a7552014-01-07 10:23:19 -0800239{
240 struct gre_base_hdr *greh = (struct gre_base_hdr *)(skb->data + nhoff);
241 struct packet_offload *ptype;
242 unsigned int grehlen = sizeof(*greh);
243 int err = -ENOENT;
244 __be16 type;
245
Jerry Chuc3caf112014-07-14 15:54:46 -0700246 skb->encapsulation = 1;
247 skb_shinfo(skb)->gso_type = SKB_GSO_GRE;
248
Jerry Chubf5a7552014-01-07 10:23:19 -0800249 type = greh->protocol;
250 if (greh->flags & GRE_KEY)
251 grehlen += GRE_HEADER_SECTION;
252
253 if (greh->flags & GRE_CSUM)
254 grehlen += GRE_HEADER_SECTION;
255
256 rcu_read_lock();
257 ptype = gro_find_complete_by_type(type);
Ian Morris00db4122015-04-03 09:17:27 +0100258 if (ptype)
Jerry Chubf5a7552014-01-07 10:23:19 -0800259 err = ptype->callbacks.gro_complete(skb, nhoff + grehlen);
260
261 rcu_read_unlock();
Tom Herbert6fb2a752014-11-29 09:59:45 -0800262
263 skb_set_inner_mac_header(skb, nhoff + grehlen);
264
Jerry Chubf5a7552014-01-07 10:23:19 -0800265 return err;
266}
267
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200268static const struct net_offload gre_offload = {
269 .callbacks = {
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200270 .gso_segment = gre_gso_segment,
Jerry Chubf5a7552014-01-07 10:23:19 -0800271 .gro_receive = gre_gro_receive,
272 .gro_complete = gre_gro_complete,
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200273 },
274};
275
Eric Dumazet438e38f2014-01-06 14:03:07 -0800276static int __init gre_offload_init(void)
Daniel Borkmannc50cd352013-07-01 19:24:00 +0200277{
278 return inet_add_offload(&gre_offload, IPPROTO_GRE);
279}
Paul Gortmakercf172282014-01-15 11:19:55 -0500280device_initcall(gre_offload_init);