blob: eedd829a2f8777343d73b983b4900a9ba32f6fb4 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: GRE over IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Joe Perchesafd465032012-03-12 07:03:32 +000013#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14
Randy Dunlap4fc268d2006-01-11 12:17:47 -080015#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/module.h>
17#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090019#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <asm/uaccess.h>
21#include <linux/skbuff.h>
22#include <linux/netdevice.h>
23#include <linux/in.h>
24#include <linux/tcp.h>
25#include <linux/udp.h>
26#include <linux/if_arp.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070027#include <linux/if_vlan.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/init.h>
29#include <linux/in6.h>
30#include <linux/inetdevice.h>
31#include <linux/igmp.h>
32#include <linux/netfilter_ipv4.h>
Herbert Xue1a80002008-10-09 12:00:17 -070033#include <linux/etherdevice.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080034#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#include <net/sock.h>
37#include <net/ip.h>
38#include <net/icmp.h>
39#include <net/protocol.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000040#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/arp.h>
42#include <net/checksum.h>
43#include <net/dsfield.h>
44#include <net/inet_ecn.h>
45#include <net/xfrm.h>
Pavel Emelyanov59a4c752008-04-16 01:08:53 -070046#include <net/net_namespace.h>
47#include <net/netns/generic.h>
Herbert Xuc19e6542008-10-09 11:59:55 -070048#include <net/rtnetlink.h>
Dmitry Kozlov00959ad2010-08-21 23:05:39 -070049#include <net/gre.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070050#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
Eric Dumazetdfd56b82011-12-10 09:48:31 +000052#if IS_ENABLED(CONFIG_IPV6)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053#include <net/ipv6.h>
54#include <net/ip6_fib.h>
55#include <net/ip6_route.h>
56#endif
57
58/*
59 Problems & solutions
60 --------------------
61
62 1. The most important issue is detecting local dead loops.
63 They would cause complete host lockup in transmit, which
64 would be "resolved" by stack overflow or, if queueing is enabled,
65 with infinite looping in net_bh.
66
67 We cannot track such dead loops during route installation,
68 it is infeasible task. The most general solutions would be
69 to keep skb->encapsulation counter (sort of local ttl),
Eric Dumazet6d0722a2010-09-29 23:35:10 -070070 and silently drop packet when it expires. It is a good
stephen hemmingerbff52852012-02-24 08:08:20 +000071 solution, but it supposes maintaining new variable in ALL
Linus Torvalds1da177e2005-04-16 15:20:36 -070072 skb, even if no tunneling is used.
73
Eric Dumazet6d0722a2010-09-29 23:35:10 -070074 Current solution: xmit_recursion breaks dead loops. This is a percpu
75 counter, since when we enter the first ndo_xmit(), cpu migration is
76 forbidden. We force an exit if this counter reaches RECURSION_LIMIT
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78 2. Networking dead loops would not kill routers, but would really
79 kill network. IP hop limit plays role of "t->recursion" in this case,
80 if we copy it from packet being encapsulated to upper header.
81 It is very good solution, but it introduces two problems:
82
83 - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
84 do not work over tunnels.
85 - traceroute does not work. I planned to relay ICMP from tunnel,
86 so that this problem would be solved and traceroute output
      would be even more informative. This idea appeared to be wrong:
88 only Linux complies to rfc1812 now (yes, guys, Linux is the only
89 true router now :-)), all routers (at least, in neighbourhood of mine)
90 return only 8 bytes of payload. It is the end.
91
92 Hence, if we want that OSPF worked or traceroute said something reasonable,
93 we should search for another solution.
94
95 One of them is to parse packet trying to detect inner encapsulation
96 made by our node. It is difficult or even impossible, especially,
   taking into account fragmentation. To be short, ttl is not a solution at all.
Linus Torvalds1da177e2005-04-16 15:20:36 -070098
99 Current solution: The solution was UNEXPECTEDLY SIMPLE.
100 We force DF flag on tunnels with preconfigured hop limit,
101 that is ALL. :-) Well, it does not remove the problem completely,
102 but exponential growth of network traffic is changed to linear
103 (branches, that exceed pmtu are pruned) and tunnel mtu
stephen hemmingerbff52852012-02-24 08:08:20 +0000104 rapidly degrades to value <68, where looping stops.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 Yes, it is not good if there exists a router in the loop,
106 which does not force DF, even when encapsulating packets have DF set.
107 But it is not our problem! Nobody could accuse us, we made
108 all that we could make. Even if it is your gated who injected
109 fatal route to network, even if it were you who configured
110 fatal static route: you are innocent. :-)
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 Alexey Kuznetsov.
113 */
114
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000115static bool log_ecn_error = true;
116module_param(log_ecn_error, bool, 0644);
117MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
118
Herbert Xuc19e6542008-10-09 11:59:55 -0700119static struct rtnl_link_ops ipgre_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120static int ipgre_tunnel_init(struct net_device *dev);
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700121
Eric Dumazetf99189b2009-11-17 10:42:49 +0000122static int ipgre_net_id __read_mostly;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000123static int gre_tap_net_id __read_mostly;
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700124
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700125static int ip_gre_calc_hlen(__be16 o_flags)
126{
127 int addend = 4;
128
129 if (o_flags & TUNNEL_CSUM)
130 addend += 4;
131 if (o_flags & TUNNEL_KEY)
132 addend += 4;
133 if (o_flags & TUNNEL_SEQ)
134 addend += 4;
135 return addend;
136}
137
138static __be16 gre_flags_to_tnl_flags(__be16 flags)
139{
140 __be16 tflags = 0;
141
142 if (flags & GRE_CSUM)
143 tflags |= TUNNEL_CSUM;
144 if (flags & GRE_ROUTING)
145 tflags |= TUNNEL_ROUTING;
146 if (flags & GRE_KEY)
147 tflags |= TUNNEL_KEY;
148 if (flags & GRE_SEQ)
149 tflags |= TUNNEL_SEQ;
150 if (flags & GRE_STRICT)
151 tflags |= TUNNEL_STRICT;
152 if (flags & GRE_REC)
153 tflags |= TUNNEL_REC;
154 if (flags & GRE_VERSION)
155 tflags |= TUNNEL_VERSION;
156
157 return tflags;
158}
159
160static __be16 tnl_flags_to_gre_flags(__be16 tflags)
161{
162 __be16 flags = 0;
163
164 if (tflags & TUNNEL_CSUM)
165 flags |= GRE_CSUM;
166 if (tflags & TUNNEL_ROUTING)
167 flags |= GRE_ROUTING;
168 if (tflags & TUNNEL_KEY)
169 flags |= GRE_KEY;
170 if (tflags & TUNNEL_SEQ)
171 flags |= GRE_SEQ;
172 if (tflags & TUNNEL_STRICT)
173 flags |= GRE_STRICT;
174 if (tflags & TUNNEL_REC)
175 flags |= GRE_REC;
176 if (tflags & TUNNEL_VERSION)
177 flags |= GRE_VERSION;
178
179 return flags;
180}
181
182static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
183 bool *csum_err)
184{
185 const struct gre_base_hdr *greh;
186 __be32 *options;
187 int hdr_len;
188
189 if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
190 return -EINVAL;
191
192 greh = (struct gre_base_hdr *)skb_transport_header(skb);
193 if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
194 return -EINVAL;
195
196 tpi->flags = gre_flags_to_tnl_flags(greh->flags);
197 hdr_len = ip_gre_calc_hlen(tpi->flags);
198
199 if (!pskb_may_pull(skb, hdr_len))
200 return -EINVAL;
201
202 greh = (struct gre_base_hdr *)skb_transport_header(skb);
203 tpi->proto = greh->protocol;
204
205 options = (__be32 *)(greh + 1);
206 if (greh->flags & GRE_CSUM) {
207 if (skb_checksum_simple_validate(skb)) {
208 *csum_err = true;
209 return -EINVAL;
210 }
211
212 skb_checksum_try_convert(skb, IPPROTO_GRE, 0,
213 null_compute_pseudo);
214 options++;
215 }
216
217 if (greh->flags & GRE_KEY) {
218 tpi->key = *options;
219 options++;
220 } else {
221 tpi->key = 0;
222 }
223 if (unlikely(greh->flags & GRE_SEQ)) {
224 tpi->seq = *options;
225 options++;
226 } else {
227 tpi->seq = 0;
228 }
229 /* WCCP version 1 and 2 protocol decoding.
230 * - Change protocol to IP
231 * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
232 */
233 if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
234 tpi->proto = htons(ETH_P_IP);
235 if ((*(u8 *)options & 0xF0) != 0x40) {
236 hdr_len += 4;
237 if (!pskb_may_pull(skb, hdr_len))
238 return -EINVAL;
239 }
240 }
Jiri Benc7f290c92016-02-18 11:22:52 +0100241 return iptunnel_pull_header(skb, hdr_len, tpi->proto, false);
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700242}
243
244static void ipgre_err(struct sk_buff *skb, u32 info,
245 const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Pravin B Shelarc5441932013-03-25 14:49:35 +0000248 /* All the routers (except for Linux) return only
249 8 bytes of packet payload. It means, that precise relaying of
250 ICMP in the real Internet is absolutely infeasible.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Pravin B Shelarc5441932013-03-25 14:49:35 +0000252 Moreover, Cisco "wise men" put GRE key to the third word
253 in GRE header. It makes impossible maintaining even soft
254 state for keyed GRE tunnels with enabled checksum. Tell
255 them "thank you".
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256
Pravin B Shelarc5441932013-03-25 14:49:35 +0000257 Well, I wonder, rfc1812 was written by Cisco employee,
258 what the hell these idiots break standards established
259 by themselves???
260 */
261 struct net *net = dev_net(skb->dev);
262 struct ip_tunnel_net *itn;
Eric Dumazet96f5a842013-05-18 08:36:03 +0000263 const struct iphdr *iph;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300264 const int type = icmp_hdr(skb)->type;
265 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 struct ip_tunnel *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268 switch (type) {
269 default:
270 case ICMP_PARAMETERPROB:
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700271 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
273 case ICMP_DEST_UNREACH:
274 switch (code) {
275 case ICMP_SR_FAILED:
276 case ICMP_PORT_UNREACH:
277 /* Impossible event. */
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700278 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 default:
280 /* All others are translated to HOST_UNREACH.
281 rfc2003 contains "deep thoughts" about NET_UNREACH,
282 I believe they are just ether pollution. --ANK
283 */
284 break;
285 }
286 break;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 case ICMP_TIME_EXCEEDED:
289 if (code != ICMP_EXC_TTL)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700290 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700292
293 case ICMP_REDIRECT:
294 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 }
296
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700297 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000298 itn = net_generic(net, gre_tap_net_id);
299 else
300 itn = net_generic(net, ipgre_net_id);
301
Duan Jiongc0c0c502014-01-28 11:49:43 +0800302 iph = (const struct iphdr *)(icmp_hdr(skb) + 1);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700303 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
304 iph->daddr, iph->saddr, tpi->key);
stephen hemmingerd2083282012-09-24 18:12:23 +0000305
Ian Morris51456b22015-04-03 09:17:26 +0100306 if (!t)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700307 return;
David S. Miller36393392012-06-14 22:21:46 -0700308
David S. Miller36393392012-06-14 22:21:46 -0700309 if (t->parms.iph.daddr == 0 ||
Joe Perchesf97c1e02007-12-16 13:45:43 -0800310 ipv4_is_multicast(t->parms.iph.daddr))
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700311 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
313 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700314 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Wei Yongjunda6185d82009-02-24 23:34:48 -0800316 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317 t->err_count++;
318 else
319 t->err_count = 1;
320 t->err_time = jiffies;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700321}
322
323static void gre_err(struct sk_buff *skb, u32 info)
324{
325 /* All the routers (except for Linux) return only
326 * 8 bytes of packet payload. It means, that precise relaying of
327 * ICMP in the real Internet is absolutely infeasible.
328 *
329 * Moreover, Cisco "wise men" put GRE key to the third word
330 * in GRE header. It makes impossible maintaining even soft
331 * state for keyed
332 * GRE tunnels with enabled checksum. Tell them "thank you".
333 *
334 * Well, I wonder, rfc1812 was written by Cisco employee,
335 * what the hell these idiots break standards established
336 * by themselves???
337 */
338
339 const int type = icmp_hdr(skb)->type;
340 const int code = icmp_hdr(skb)->code;
341 struct tnl_ptk_info tpi;
342 bool csum_err = false;
343
344 if (parse_gre_header(skb, &tpi, &csum_err)) {
345 if (!csum_err) /* ignore csum errors. */
346 return;
347 }
348
349 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
350 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
351 skb->dev->ifindex, 0, IPPROTO_GRE, 0);
352 return;
353 }
354 if (type == ICMP_REDIRECT) {
355 ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
356 IPPROTO_GRE, 0);
357 return;
358 }
359
360 ipgre_err(skb, info, &tpi);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361}
362
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700363static __be64 key_to_tunnel_id(__be32 key)
364{
365#ifdef __BIG_ENDIAN
366 return (__force __be64)((__force u32)key);
367#else
368 return (__force __be64)((__force u64)key << 32);
369#endif
370}
371
372/* Returns the least-significant 32 bits of a __be64. */
373static __be32 tunnel_id_to_key(__be64 x)
374{
375#ifdef __BIG_ENDIAN
376 return (__force __be32)x;
377#else
378 return (__force __be32)((__force u64)x >> 32);
379#endif
380}
381
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700382static int ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000384 struct net *net = dev_net(skb->dev);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700385 struct metadata_dst *tun_dst = NULL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000386 struct ip_tunnel_net *itn;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000387 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388 struct ip_tunnel *tunnel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700390 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000391 itn = net_generic(net, gre_tap_net_id);
392 else
393 itn = net_generic(net, ipgre_net_id);
394
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700395 iph = ip_hdr(skb);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700396 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
397 iph->saddr, iph->daddr, tpi->key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
stephen hemmingerd2083282012-09-24 18:12:23 +0000399 if (tunnel) {
Timo Teräs0e3da5b2013-12-16 11:02:09 +0200400 skb_pop_mac_header(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700401 if (tunnel->collect_md) {
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700402 __be16 flags;
403 __be64 tun_id;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700404
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700405 flags = tpi->flags & (TUNNEL_CSUM | TUNNEL_KEY);
406 tun_id = key_to_tunnel_id(tpi->key);
407 tun_dst = ip_tun_rx_dst(skb, flags, tun_id, 0);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700408 if (!tun_dst)
409 return PACKET_REJECT;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700410 }
411
412 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700413 return PACKET_RCVD;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 }
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700415 return PACKET_REJECT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416}
417
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700418static int gre_rcv(struct sk_buff *skb)
419{
420 struct tnl_ptk_info tpi;
421 bool csum_err = false;
422
423#ifdef CONFIG_NET_IPGRE_BROADCAST
424 if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
425 /* Looped back packet, drop it! */
426 if (rt_is_output_route(skb_rtable(skb)))
427 goto drop;
428 }
429#endif
430
431 if (parse_gre_header(skb, &tpi, &csum_err) < 0)
432 goto drop;
433
434 if (ipgre_rcv(skb, &tpi) == PACKET_RCVD)
435 return 0;
436
437 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
438drop:
439 kfree_skb(skb);
440 return 0;
441}
442
Edward Cree53936102016-02-11 21:01:07 +0000443static __sum16 gre_checksum(struct sk_buff *skb)
444{
445 __wsum csum;
446
447 if (skb->ip_summed == CHECKSUM_PARTIAL)
448 csum = lco_csum(skb);
449 else
450 csum = skb_checksum(skb, 0, skb->len, 0);
451 return csum_fold(csum);
452}
453
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700454static void build_header(struct sk_buff *skb, int hdr_len, __be16 flags,
455 __be16 proto, __be32 key, __be32 seq)
456{
457 struct gre_base_hdr *greh;
458
459 skb_push(skb, hdr_len);
460
461 skb_reset_transport_header(skb);
462 greh = (struct gre_base_hdr *)skb->data;
463 greh->flags = tnl_flags_to_gre_flags(flags);
464 greh->protocol = proto;
465
466 if (flags & (TUNNEL_KEY | TUNNEL_CSUM | TUNNEL_SEQ)) {
467 __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
468
469 if (flags & TUNNEL_SEQ) {
470 *ptr = seq;
471 ptr--;
472 }
473 if (flags & TUNNEL_KEY) {
474 *ptr = key;
475 ptr--;
476 }
477 if (flags & TUNNEL_CSUM &&
478 !(skb_shinfo(skb)->gso_type &
479 (SKB_GSO_GRE | SKB_GSO_GRE_CSUM))) {
480 *ptr = 0;
Edward Cree53936102016-02-11 21:01:07 +0000481 *(__sum16 *)ptr = gre_checksum(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700482 }
483 }
484}
485
Pravin B Shelarc5441932013-03-25 14:49:35 +0000486static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
487 const struct iphdr *tnl_params,
488 __be16 proto)
489{
490 struct ip_tunnel *tunnel = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000491
Pravin B Shelarc5441932013-03-25 14:49:35 +0000492 if (tunnel->parms.o_flags & TUNNEL_SEQ)
493 tunnel->o_seqno++;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000494
Pravin B Shelarc5441932013-03-25 14:49:35 +0000495 /* Push GRE header. */
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700496 build_header(skb, tunnel->tun_hlen, tunnel->parms.o_flags,
497 proto, tunnel->parms.o_key, htonl(tunnel->o_seqno));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700499 skb_set_inner_protocol(skb, proto);
Nicolas Dichtelbf3d6a82013-05-27 23:48:15 +0000500 ip_tunnel_xmit(skb, dev, tnl_params, tnl_params->protocol);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501}
502
Alexander Duyckaed069d2016-04-14 15:33:37 -0400503static int gre_handle_offloads(struct sk_buff *skb, bool csum)
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700504{
Edward Cree6fa79662016-02-11 21:02:31 +0000505 return iptunnel_handle_offloads(skb, csum ? SKB_GSO_GRE_CSUM : SKB_GSO_GRE);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700506}
507
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700508static struct rtable *gre_get_rt(struct sk_buff *skb,
509 struct net_device *dev,
510 struct flowi4 *fl,
511 const struct ip_tunnel_key *key)
512{
513 struct net *net = dev_net(dev);
514
515 memset(fl, 0, sizeof(*fl));
516 fl->daddr = key->u.ipv4.dst;
517 fl->saddr = key->u.ipv4.src;
518 fl->flowi4_tos = RT_TOS(key->tos);
519 fl->flowi4_mark = skb->mark;
520 fl->flowi4_proto = IPPROTO_GRE;
521
522 return ip_route_output_key(net, fl);
523}
524
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700525static void gre_fb_xmit(struct sk_buff *skb, struct net_device *dev)
526{
527 struct ip_tunnel_info *tun_info;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700528 const struct ip_tunnel_key *key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100529 struct rtable *rt = NULL;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700530 struct flowi4 fl;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700531 int min_headroom;
532 int tunnel_hlen;
533 __be16 df, flags;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100534 bool use_cache;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700535 int err;
536
Jiri Benc61adedf2015-08-20 13:56:25 +0200537 tun_info = skb_tunnel_info(skb);
Jiri Benc7f9562a2015-08-28 20:48:20 +0200538 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
539 ip_tunnel_info_af(tun_info) != AF_INET))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700540 goto err_free_skb;
541
542 key = &tun_info->key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100543 use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
544 if (use_cache)
545 rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl.saddr);
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100546 if (!rt) {
547 rt = gre_get_rt(skb, dev, &fl, key);
548 if (IS_ERR(rt))
549 goto err_free_skb;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100550 if (use_cache)
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100551 dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
552 fl.saddr);
553 }
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700554
555 tunnel_hlen = ip_gre_calc_hlen(key->tun_flags);
556
557 min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len
558 + tunnel_hlen + sizeof(struct iphdr);
559 if (skb_headroom(skb) < min_headroom || skb_header_cloned(skb)) {
560 int head_delta = SKB_DATA_ALIGN(min_headroom -
561 skb_headroom(skb) +
562 16);
563 err = pskb_expand_head(skb, max_t(int, head_delta, 0),
564 0, GFP_ATOMIC);
565 if (unlikely(err))
566 goto err_free_rt;
567 }
568
569 /* Push Tunnel header. */
Alexander Duyckaed069d2016-04-14 15:33:37 -0400570 if (gre_handle_offloads(skb, !!(tun_info->key.tun_flags & TUNNEL_CSUM)))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700571 goto err_free_rt;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700572
573 flags = tun_info->key.tun_flags & (TUNNEL_CSUM | TUNNEL_KEY);
574 build_header(skb, tunnel_hlen, flags, htons(ETH_P_TEB),
575 tunnel_id_to_key(tun_info->key.tun_id), 0);
576
577 df = key->tun_flags & TUNNEL_DONT_FRAGMENT ? htons(IP_DF) : 0;
Pravin B Shelar039f5062015-12-24 14:34:54 -0800578
579 iptunnel_xmit(skb->sk, rt, skb, fl.saddr, key->u.ipv4.dst, IPPROTO_GRE,
580 key->tos, key->ttl, df, false);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700581 return;
582
583err_free_rt:
584 ip_rt_put(rt);
585err_free_skb:
586 kfree_skb(skb);
587 dev->stats.tx_dropped++;
588}
589
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700590static int gre_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb)
591{
592 struct ip_tunnel_info *info = skb_tunnel_info(skb);
593 struct rtable *rt;
594 struct flowi4 fl4;
595
596 if (ip_tunnel_info_af(info) != AF_INET)
597 return -EINVAL;
598
599 rt = gre_get_rt(skb, dev, &fl4, &info->key);
600 if (IS_ERR(rt))
601 return PTR_ERR(rt);
602
603 ip_rt_put(rt);
604 info->key.u.ipv4.src = fl4.saddr;
605 return 0;
606}
607
Pravin B Shelarc5441932013-03-25 14:49:35 +0000608static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
609 struct net_device *dev)
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800610{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000611 struct ip_tunnel *tunnel = netdev_priv(dev);
612 const struct iphdr *tnl_params;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800613
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700614 if (tunnel->collect_md) {
615 gre_fb_xmit(skb, dev);
616 return NETDEV_TX_OK;
617 }
618
Pravin B Shelarc5441932013-03-25 14:49:35 +0000619 if (dev->header_ops) {
620 /* Need space for new headers */
621 if (skb_cow_head(skb, dev->needed_headroom -
Chen Gang2bac7cb2013-04-22 20:45:42 +0000622 (tunnel->hlen + sizeof(struct iphdr))))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000623 goto free_skb;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800624
Pravin B Shelarc5441932013-03-25 14:49:35 +0000625 tnl_params = (const struct iphdr *)skb->data;
Eric Dumazete985aad2010-09-27 03:57:11 +0000626
Pravin B Shelarc5441932013-03-25 14:49:35 +0000627 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
628 * to gre header.
629 */
630 skb_pull(skb, tunnel->hlen + sizeof(struct iphdr));
Timo Teräs8a0033a2014-12-15 09:24:13 +0200631 skb_reset_mac_header(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000632 } else {
633 if (skb_cow_head(skb, dev->needed_headroom))
634 goto free_skb;
Herbert Xue1a80002008-10-09 12:00:17 -0700635
Pravin B Shelarc5441932013-03-25 14:49:35 +0000636 tnl_params = &tunnel->parms.iph;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800637 }
638
Alexander Duyckaed069d2016-04-14 15:33:37 -0400639 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
640 goto free_skb;
Timo Teräs8a0033a2014-12-15 09:24:13 +0200641
Pravin B Shelarc5441932013-03-25 14:49:35 +0000642 __gre_xmit(skb, dev, tnl_params, skb->protocol);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000643 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800644
Pravin B Shelarc5441932013-03-25 14:49:35 +0000645free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800646 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000647 dev->stats.tx_dropped++;
648 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800649}
650
Pravin B Shelarc5441932013-03-25 14:49:35 +0000651static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
652 struct net_device *dev)
653{
654 struct ip_tunnel *tunnel = netdev_priv(dev);
655
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700656 if (tunnel->collect_md) {
657 gre_fb_xmit(skb, dev);
658 return NETDEV_TX_OK;
659 }
660
Alexander Duyckaed069d2016-04-14 15:33:37 -0400661 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
662 goto free_skb;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000663
664 if (skb_cow_head(skb, dev->needed_headroom))
665 goto free_skb;
666
667 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000668 return NETDEV_TX_OK;
669
670free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800671 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000672 dev->stats.tx_dropped++;
673 return NETDEV_TX_OK;
674}
675
676static int ipgre_tunnel_ioctl(struct net_device *dev,
677 struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700678{
Tom Herbert4565e992014-09-17 12:26:01 -0700679 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700680 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700681
Pravin B Shelarc5441932013-03-25 14:49:35 +0000682 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
683 return -EFAULT;
Cong Wang6c734fb2013-06-29 12:02:59 +0800684 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
685 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_GRE ||
686 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)) ||
687 ((p.i_flags|p.o_flags)&(GRE_VERSION|GRE_ROUTING)))
688 return -EINVAL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000689 }
690 p.i_flags = gre_flags_to_tnl_flags(p.i_flags);
691 p.o_flags = gre_flags_to_tnl_flags(p.o_flags);
692
693 err = ip_tunnel_ioctl(dev, &p, cmd);
694 if (err)
695 return err;
696
697 p.i_flags = tnl_flags_to_gre_flags(p.i_flags);
698 p.o_flags = tnl_flags_to_gre_flags(p.o_flags);
699
700 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
701 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700702 return 0;
703}
704
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705/* Nice toy. Unfortunately, useless in real life :-)
706 It allows to construct virtual multiprotocol broadcast "LAN"
707 over the Internet, provided multicast routing is tuned.
708
709
   I have no idea whether this bicycle was invented before me,
   so I had to set ARPHRD_IPGRE to a random value.
   I have the impression that Cisco could do something similar,
   but this feature is apparently missing in IOS<=11.2(8).
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900714
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715 I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
716 with broadcast 224.66.66.66. If you have access to mbone, play with me :-)
717
718 ping -t 255 224.66.66.66
719
720 If nobody answers, mbone does not work.
721
722 ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
723 ip addr add 10.66.66.<somewhat>/24 dev Universe
724 ifconfig Universe up
725 ifconfig Universe add fe80::<Your_real_addr>/10
726 ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
727 ftp 10.66.66.66
728 ...
729 ftp fec0:6666:6666::193.233.7.65
730 ...
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731 */
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700732static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
733 unsigned short type,
Eric Dumazet15078502010-09-15 11:07:53 +0000734 const void *daddr, const void *saddr, unsigned int len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735{
Patrick McHardy2941a482006-01-08 22:05:26 -0800736 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000737 struct iphdr *iph;
738 struct gre_base_hdr *greh;
739
740 iph = (struct iphdr *)skb_push(skb, t->hlen + sizeof(*iph));
741 greh = (struct gre_base_hdr *)(iph+1);
742 greh->flags = tnl_flags_to_gre_flags(t->parms.o_flags);
743 greh->protocol = htons(type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744
745 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700746
Pravin B Shelarc5441932013-03-25 14:49:35 +0000747 /* Set the source hardware address. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748 if (saddr)
749 memcpy(&iph->saddr, saddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000750 if (daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 memcpy(&iph->daddr, daddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000752 if (iph->daddr)
Timo Teräs77a482b2013-08-06 13:45:43 +0300753 return t->hlen + sizeof(*iph);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900754
Pravin B Shelarc5441932013-03-25 14:49:35 +0000755 return -(t->hlen + sizeof(*iph));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756}
757
Timo Teras6a5f44d2007-10-23 20:31:53 -0700758static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
759{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000760 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
Timo Teras6a5f44d2007-10-23 20:31:53 -0700761 memcpy(haddr, &iph->saddr, 4);
762 return 4;
763}
764
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700765static const struct header_ops ipgre_header_ops = {
766 .create = ipgre_header,
Timo Teras6a5f44d2007-10-23 20:31:53 -0700767 .parse = ipgre_header_parse,
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700768};
769
Timo Teras6a5f44d2007-10-23 20:31:53 -0700770#ifdef CONFIG_NET_IPGRE_BROADCAST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771static int ipgre_open(struct net_device *dev)
772{
Patrick McHardy2941a482006-01-08 22:05:26 -0800773 struct ip_tunnel *t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774
Joe Perchesf97c1e02007-12-16 13:45:43 -0800775 if (ipv4_is_multicast(t->parms.iph.daddr)) {
David S. Millercbb1e852011-05-04 12:33:34 -0700776 struct flowi4 fl4;
777 struct rtable *rt;
Eric Dumazete985aad2010-09-27 03:57:11 +0000778
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200779 rt = ip_route_output_gre(t->net, &fl4,
David S. Millercbb1e852011-05-04 12:33:34 -0700780 t->parms.iph.daddr,
781 t->parms.iph.saddr,
782 t->parms.o_key,
783 RT_TOS(t->parms.iph.tos),
784 t->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800785 if (IS_ERR(rt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786 return -EADDRNOTAVAIL;
Changli Gaod8d1f302010-06-10 23:31:35 -0700787 dev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788 ip_rt_put(rt);
Ian Morris51456b22015-04-03 09:17:26 +0100789 if (!__in_dev_get_rtnl(dev))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790 return -EADDRNOTAVAIL;
791 t->mlink = dev->ifindex;
Herbert Xue5ed6392005-10-03 14:35:55 -0700792 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700793 }
794 return 0;
795}
796
797static int ipgre_close(struct net_device *dev)
798{
Patrick McHardy2941a482006-01-08 22:05:26 -0800799 struct ip_tunnel *t = netdev_priv(dev);
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800800
Joe Perchesf97c1e02007-12-16 13:45:43 -0800801 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800802 struct in_device *in_dev;
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200803 in_dev = inetdev_by_index(t->net, t->mlink);
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000804 if (in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700805 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700806 }
807 return 0;
808}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700809#endif
810
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800811static const struct net_device_ops ipgre_netdev_ops = {
812 .ndo_init = ipgre_tunnel_init,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000813 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800814#ifdef CONFIG_NET_IPGRE_BROADCAST
815 .ndo_open = ipgre_open,
816 .ndo_stop = ipgre_close,
817#endif
Pravin B Shelarc5441932013-03-25 14:49:35 +0000818 .ndo_start_xmit = ipgre_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800819 .ndo_do_ioctl = ipgre_tunnel_ioctl,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000820 .ndo_change_mtu = ip_tunnel_change_mtu,
821 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200822 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800823};
824
/* Feature bits that __gre_tunnel_init() sets on every GRE device. */
#define GRE_FEATURES	(NETIF_F_SG | NETIF_F_FRAGLIST | \
			 NETIF_F_HIGHDMA | NETIF_F_HW_CSUM)
829
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830static void ipgre_tunnel_setup(struct net_device *dev)
831{
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800832 dev->netdev_ops = &ipgre_netdev_ops;
Nicolas Dichtel5a455272014-04-11 15:51:18 +0200833 dev->type = ARPHRD_IPGRE;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000834 ip_tunnel_setup(dev, ipgre_net_id);
835}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700836
Pravin B Shelarc5441932013-03-25 14:49:35 +0000837static void __gre_tunnel_init(struct net_device *dev)
838{
839 struct ip_tunnel *tunnel;
Tom Herbert4565e992014-09-17 12:26:01 -0700840 int t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000841
842 tunnel = netdev_priv(dev);
Tom Herbert4565e992014-09-17 12:26:01 -0700843 tunnel->tun_hlen = ip_gre_calc_hlen(tunnel->parms.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000844 tunnel->parms.iph.protocol = IPPROTO_GRE;
845
Tom Herbert4565e992014-09-17 12:26:01 -0700846 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
847
848 t_hlen = tunnel->hlen + sizeof(struct iphdr);
849
850 dev->needed_headroom = LL_MAX_HEADER + t_hlen + 4;
851 dev->mtu = ETH_DATA_LEN - t_hlen - 4;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000852
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200853 dev->features |= GRE_FEATURES;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000854 dev->hw_features |= GRE_FEATURES;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000855
856 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
Alexander Duycka0ca1532016-04-05 09:13:39 -0700857 /* TCP offload with GRE SEQ is not supported, nor
858 * can we support 2 levels of outer headers requiring
859 * an update.
860 */
861 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
862 (tunnel->encap.type == TUNNEL_ENCAP_NONE)) {
863 dev->features |= NETIF_F_GSO_SOFTWARE;
864 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
865 }
866
Pravin B Shelarc5441932013-03-25 14:49:35 +0000867 /* Can use a lockless transmit, unless we generate
868 * output sequences
869 */
870 dev->features |= NETIF_F_LLTX;
871 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872}
873
874static int ipgre_tunnel_init(struct net_device *dev)
875{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000876 struct ip_tunnel *tunnel = netdev_priv(dev);
877 struct iphdr *iph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700878
Pravin B Shelarc5441932013-03-25 14:49:35 +0000879 __gre_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880
Pravin B Shelarc5441932013-03-25 14:49:35 +0000881 memcpy(dev->dev_addr, &iph->saddr, 4);
882 memcpy(dev->broadcast, &iph->daddr, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700883
Pravin B Shelarc5441932013-03-25 14:49:35 +0000884 dev->flags = IFF_NOARP;
Eric Dumazet02875872014-10-05 18:38:35 -0700885 netif_keep_dst(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000886 dev->addr_len = 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700887
Linus Torvalds1da177e2005-04-16 15:20:36 -0700888 if (iph->daddr) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700889#ifdef CONFIG_NET_IPGRE_BROADCAST
Joe Perchesf97c1e02007-12-16 13:45:43 -0800890 if (ipv4_is_multicast(iph->daddr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891 if (!iph->saddr)
892 return -EINVAL;
893 dev->flags = IFF_BROADCAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700894 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895 }
896#endif
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800897 } else
Timo Teras6a5f44d2007-10-23 20:31:53 -0700898 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700899
Pravin B Shelarc5441932013-03-25 14:49:35 +0000900 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901}
902
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700903static const struct gre_protocol ipgre_protocol = {
904 .handler = gre_rcv,
905 .err_handler = gre_err,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906};
907
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000908static int __net_init ipgre_init_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700909{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000910 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700911}
912
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000913static void __net_exit ipgre_exit_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700914{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000915 struct ip_tunnel_net *itn = net_generic(net, ipgre_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200916 ip_tunnel_delete_net(itn, &ipgre_link_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700917}
918
919static struct pernet_operations ipgre_net_ops = {
920 .init = ipgre_init_net,
921 .exit = ipgre_exit_net,
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000922 .id = &ipgre_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000923 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700924};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700925
Herbert Xuc19e6542008-10-09 11:59:55 -0700926static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
927{
928 __be16 flags;
929
930 if (!data)
931 return 0;
932
933 flags = 0;
934 if (data[IFLA_GRE_IFLAGS])
935 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
936 if (data[IFLA_GRE_OFLAGS])
937 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
938 if (flags & (GRE_VERSION|GRE_ROUTING))
939 return -EINVAL;
940
941 return 0;
942}
943
Herbert Xue1a80002008-10-09 12:00:17 -0700944static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[])
945{
946 __be32 daddr;
947
948 if (tb[IFLA_ADDRESS]) {
949 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
950 return -EINVAL;
951 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
952 return -EADDRNOTAVAIL;
953 }
954
955 if (!data)
956 goto out;
957
958 if (data[IFLA_GRE_REMOTE]) {
959 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
960 if (!daddr)
961 return -EINVAL;
962 }
963
964out:
965 return ipgre_tunnel_validate(tb, data);
966}
967
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700968static void ipgre_netlink_parms(struct net_device *dev,
969 struct nlattr *data[],
970 struct nlattr *tb[],
971 struct ip_tunnel_parm *parms)
Herbert Xuc19e6542008-10-09 11:59:55 -0700972{
Herbert Xu7bb82d92008-10-11 12:20:15 -0700973 memset(parms, 0, sizeof(*parms));
Herbert Xuc19e6542008-10-09 11:59:55 -0700974
975 parms->iph.protocol = IPPROTO_GRE;
976
977 if (!data)
978 return;
979
980 if (data[IFLA_GRE_LINK])
981 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
982
983 if (data[IFLA_GRE_IFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000984 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700985
986 if (data[IFLA_GRE_OFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000987 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700988
989 if (data[IFLA_GRE_IKEY])
990 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
991
992 if (data[IFLA_GRE_OKEY])
993 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
994
995 if (data[IFLA_GRE_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +0200996 parms->iph.saddr = nla_get_in_addr(data[IFLA_GRE_LOCAL]);
Herbert Xuc19e6542008-10-09 11:59:55 -0700997
998 if (data[IFLA_GRE_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +0200999 parms->iph.daddr = nla_get_in_addr(data[IFLA_GRE_REMOTE]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001000
1001 if (data[IFLA_GRE_TTL])
1002 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
1003
1004 if (data[IFLA_GRE_TOS])
1005 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
1006
1007 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC]))
1008 parms->iph.frag_off = htons(IP_DF);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001009
1010 if (data[IFLA_GRE_COLLECT_METADATA]) {
1011 struct ip_tunnel *t = netdev_priv(dev);
1012
1013 t->collect_md = true;
1014 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001015}
1016
Tom Herbert4565e992014-09-17 12:26:01 -07001017/* This function returns true when ENCAP attributes are present in the nl msg */
1018static bool ipgre_netlink_encap_parms(struct nlattr *data[],
1019 struct ip_tunnel_encap *ipencap)
1020{
1021 bool ret = false;
1022
1023 memset(ipencap, 0, sizeof(*ipencap));
1024
1025 if (!data)
1026 return ret;
1027
1028 if (data[IFLA_GRE_ENCAP_TYPE]) {
1029 ret = true;
1030 ipencap->type = nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]);
1031 }
1032
1033 if (data[IFLA_GRE_ENCAP_FLAGS]) {
1034 ret = true;
1035 ipencap->flags = nla_get_u16(data[IFLA_GRE_ENCAP_FLAGS]);
1036 }
1037
1038 if (data[IFLA_GRE_ENCAP_SPORT]) {
1039 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001040 ipencap->sport = nla_get_be16(data[IFLA_GRE_ENCAP_SPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001041 }
1042
1043 if (data[IFLA_GRE_ENCAP_DPORT]) {
1044 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001045 ipencap->dport = nla_get_be16(data[IFLA_GRE_ENCAP_DPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001046 }
1047
1048 return ret;
1049}
1050
Pravin B Shelarc5441932013-03-25 14:49:35 +00001051static int gre_tap_init(struct net_device *dev)
Herbert Xue1a80002008-10-09 12:00:17 -07001052{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001053 __gre_tunnel_init(dev);
stephen hemmingerbec94d42014-12-27 10:01:42 -08001054 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Herbert Xue1a80002008-10-09 12:00:17 -07001055
Pravin B Shelarc5441932013-03-25 14:49:35 +00001056 return ip_tunnel_init(dev);
Herbert Xue1a80002008-10-09 12:00:17 -07001057}
1058
Pravin B Shelarc5441932013-03-25 14:49:35 +00001059static const struct net_device_ops gre_tap_netdev_ops = {
1060 .ndo_init = gre_tap_init,
1061 .ndo_uninit = ip_tunnel_uninit,
1062 .ndo_start_xmit = gre_tap_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001063 .ndo_set_mac_address = eth_mac_addr,
1064 .ndo_validate_addr = eth_validate_addr,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001065 .ndo_change_mtu = ip_tunnel_change_mtu,
1066 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +02001067 .ndo_get_iflink = ip_tunnel_get_iflink,
Pravin B Shelarfc4099f2015-10-22 18:17:16 -07001068 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001069};
1070
Herbert Xue1a80002008-10-09 12:00:17 -07001071static void ipgre_tap_setup(struct net_device *dev)
1072{
Herbert Xue1a80002008-10-09 12:00:17 -07001073 ether_setup(dev);
Jiri Bencd13b1612016-02-17 15:32:53 +01001074 dev->netdev_ops = &gre_tap_netdev_ops;
1075 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1076 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001077 ip_tunnel_setup(dev, gre_tap_net_id);
Herbert Xue1a80002008-10-09 12:00:17 -07001078}
1079
Pravin B Shelarc5441932013-03-25 14:49:35 +00001080static int ipgre_newlink(struct net *src_net, struct net_device *dev,
1081 struct nlattr *tb[], struct nlattr *data[])
Herbert Xuc19e6542008-10-09 11:59:55 -07001082{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001083 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001084 struct ip_tunnel_encap ipencap;
1085
1086 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1087 struct ip_tunnel *t = netdev_priv(dev);
1088 int err = ip_tunnel_encap_setup(t, &ipencap);
1089
1090 if (err < 0)
1091 return err;
1092 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001093
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001094 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001095 return ip_tunnel_newlink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001096}
1097
1098static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
1099 struct nlattr *data[])
1100{
Herbert Xuc19e6542008-10-09 11:59:55 -07001101 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001102 struct ip_tunnel_encap ipencap;
1103
1104 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1105 struct ip_tunnel *t = netdev_priv(dev);
1106 int err = ip_tunnel_encap_setup(t, &ipencap);
1107
1108 if (err < 0)
1109 return err;
1110 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001111
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001112 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001113 return ip_tunnel_changelink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001114}
1115
1116static size_t ipgre_get_size(const struct net_device *dev)
1117{
1118 return
1119 /* IFLA_GRE_LINK */
1120 nla_total_size(4) +
1121 /* IFLA_GRE_IFLAGS */
1122 nla_total_size(2) +
1123 /* IFLA_GRE_OFLAGS */
1124 nla_total_size(2) +
1125 /* IFLA_GRE_IKEY */
1126 nla_total_size(4) +
1127 /* IFLA_GRE_OKEY */
1128 nla_total_size(4) +
1129 /* IFLA_GRE_LOCAL */
1130 nla_total_size(4) +
1131 /* IFLA_GRE_REMOTE */
1132 nla_total_size(4) +
1133 /* IFLA_GRE_TTL */
1134 nla_total_size(1) +
1135 /* IFLA_GRE_TOS */
1136 nla_total_size(1) +
1137 /* IFLA_GRE_PMTUDISC */
1138 nla_total_size(1) +
Tom Herbert4565e992014-09-17 12:26:01 -07001139 /* IFLA_GRE_ENCAP_TYPE */
1140 nla_total_size(2) +
1141 /* IFLA_GRE_ENCAP_FLAGS */
1142 nla_total_size(2) +
1143 /* IFLA_GRE_ENCAP_SPORT */
1144 nla_total_size(2) +
1145 /* IFLA_GRE_ENCAP_DPORT */
1146 nla_total_size(2) +
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001147 /* IFLA_GRE_COLLECT_METADATA */
1148 nla_total_size(0) +
Herbert Xuc19e6542008-10-09 11:59:55 -07001149 0;
1150}
1151
1152static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
1153{
1154 struct ip_tunnel *t = netdev_priv(dev);
1155 struct ip_tunnel_parm *p = &t->parms;
1156
David S. Millerf3756b72012-04-01 20:39:02 -04001157 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
Pravin B Shelarc5441932013-03-25 14:49:35 +00001158 nla_put_be16(skb, IFLA_GRE_IFLAGS, tnl_flags_to_gre_flags(p->i_flags)) ||
1159 nla_put_be16(skb, IFLA_GRE_OFLAGS, tnl_flags_to_gre_flags(p->o_flags)) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001160 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
1161 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
Jiri Benc930345e2015-03-29 16:59:25 +02001162 nla_put_in_addr(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
1163 nla_put_in_addr(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001164 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
1165 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
1166 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
1167 !!(p->iph.frag_off & htons(IP_DF))))
1168 goto nla_put_failure;
Tom Herbert4565e992014-09-17 12:26:01 -07001169
1170 if (nla_put_u16(skb, IFLA_GRE_ENCAP_TYPE,
1171 t->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001172 nla_put_be16(skb, IFLA_GRE_ENCAP_SPORT,
1173 t->encap.sport) ||
1174 nla_put_be16(skb, IFLA_GRE_ENCAP_DPORT,
1175 t->encap.dport) ||
Tom Herbert4565e992014-09-17 12:26:01 -07001176 nla_put_u16(skb, IFLA_GRE_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -08001177 t->encap.flags))
Tom Herbert4565e992014-09-17 12:26:01 -07001178 goto nla_put_failure;
1179
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001180 if (t->collect_md) {
1181 if (nla_put_flag(skb, IFLA_GRE_COLLECT_METADATA))
1182 goto nla_put_failure;
1183 }
1184
Herbert Xuc19e6542008-10-09 11:59:55 -07001185 return 0;
1186
1187nla_put_failure:
1188 return -EMSGSIZE;
1189}
1190
1191static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
1192 [IFLA_GRE_LINK] = { .type = NLA_U32 },
1193 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
1194 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
1195 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
1196 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001197 [IFLA_GRE_LOCAL] = { .len = FIELD_SIZEOF(struct iphdr, saddr) },
1198 [IFLA_GRE_REMOTE] = { .len = FIELD_SIZEOF(struct iphdr, daddr) },
Herbert Xuc19e6542008-10-09 11:59:55 -07001199 [IFLA_GRE_TTL] = { .type = NLA_U8 },
1200 [IFLA_GRE_TOS] = { .type = NLA_U8 },
1201 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert4565e992014-09-17 12:26:01 -07001202 [IFLA_GRE_ENCAP_TYPE] = { .type = NLA_U16 },
1203 [IFLA_GRE_ENCAP_FLAGS] = { .type = NLA_U16 },
1204 [IFLA_GRE_ENCAP_SPORT] = { .type = NLA_U16 },
1205 [IFLA_GRE_ENCAP_DPORT] = { .type = NLA_U16 },
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001206 [IFLA_GRE_COLLECT_METADATA] = { .type = NLA_FLAG },
Herbert Xuc19e6542008-10-09 11:59:55 -07001207};
1208
1209static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
1210 .kind = "gre",
1211 .maxtype = IFLA_GRE_MAX,
1212 .policy = ipgre_policy,
1213 .priv_size = sizeof(struct ip_tunnel),
1214 .setup = ipgre_tunnel_setup,
1215 .validate = ipgre_tunnel_validate,
1216 .newlink = ipgre_newlink,
1217 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001218 .dellink = ip_tunnel_dellink,
Herbert Xuc19e6542008-10-09 11:59:55 -07001219 .get_size = ipgre_get_size,
1220 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001221 .get_link_net = ip_tunnel_get_link_net,
Herbert Xuc19e6542008-10-09 11:59:55 -07001222};
1223
Herbert Xue1a80002008-10-09 12:00:17 -07001224static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
1225 .kind = "gretap",
1226 .maxtype = IFLA_GRE_MAX,
1227 .policy = ipgre_policy,
1228 .priv_size = sizeof(struct ip_tunnel),
1229 .setup = ipgre_tap_setup,
1230 .validate = ipgre_tap_validate,
1231 .newlink = ipgre_newlink,
1232 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001233 .dellink = ip_tunnel_dellink,
Herbert Xue1a80002008-10-09 12:00:17 -07001234 .get_size = ipgre_get_size,
1235 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001236 .get_link_net = ip_tunnel_get_link_net,
Herbert Xue1a80002008-10-09 12:00:17 -07001237};
1238
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001239struct net_device *gretap_fb_dev_create(struct net *net, const char *name,
1240 u8 name_assign_type)
1241{
1242 struct nlattr *tb[IFLA_MAX + 1];
1243 struct net_device *dev;
1244 struct ip_tunnel *t;
1245 int err;
1246
1247 memset(&tb, 0, sizeof(tb));
1248
1249 dev = rtnl_create_link(net, name, name_assign_type,
1250 &ipgre_tap_ops, tb);
1251 if (IS_ERR(dev))
1252 return dev;
1253
1254 /* Configure flow based GRE device. */
1255 t = netdev_priv(dev);
1256 t->collect_md = true;
1257
1258 err = ipgre_newlink(net, dev, tb, NULL);
1259 if (err < 0)
1260 goto out;
David Wragg7e059152016-02-10 00:05:58 +00001261
1262 /* openvswitch users expect packet sizes to be unrestricted,
1263 * so set the largest MTU we can.
1264 */
1265 err = __ip_tunnel_change_mtu(dev, IP_MAX_MTU, false);
1266 if (err)
1267 goto out;
1268
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001269 return dev;
1270out:
1271 free_netdev(dev);
1272 return ERR_PTR(err);
1273}
1274EXPORT_SYMBOL_GPL(gretap_fb_dev_create);
1275
Pravin B Shelarc5441932013-03-25 14:49:35 +00001276static int __net_init ipgre_tap_init_net(struct net *net)
1277{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001278 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, "gretap0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001279}
1280
1281static void __net_exit ipgre_tap_exit_net(struct net *net)
1282{
1283 struct ip_tunnel_net *itn = net_generic(net, gre_tap_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001284 ip_tunnel_delete_net(itn, &ipgre_tap_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001285}
1286
1287static struct pernet_operations ipgre_tap_net_ops = {
1288 .init = ipgre_tap_init_net,
1289 .exit = ipgre_tap_exit_net,
1290 .id = &gre_tap_net_id,
1291 .size = sizeof(struct ip_tunnel_net),
1292};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293
1294static int __init ipgre_init(void)
1295{
1296 int err;
1297
Joe Perches058bd4d2012-03-11 18:36:11 +00001298 pr_info("GRE over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001299
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +00001300 err = register_pernet_device(&ipgre_net_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -07001301 if (err < 0)
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001302 return err;
1303
Pravin B Shelarc5441932013-03-25 14:49:35 +00001304 err = register_pernet_device(&ipgre_tap_net_ops);
1305 if (err < 0)
1306 goto pnet_tap_faied;
1307
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001308 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001309 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +00001310 pr_info("%s: can't add protocol\n", __func__);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001311 goto add_proto_failed;
1312 }
Pavel Emelyanov7daa0002008-04-16 01:10:05 -07001313
Herbert Xuc19e6542008-10-09 11:59:55 -07001314 err = rtnl_link_register(&ipgre_link_ops);
1315 if (err < 0)
1316 goto rtnl_link_failed;
1317
Herbert Xue1a80002008-10-09 12:00:17 -07001318 err = rtnl_link_register(&ipgre_tap_ops);
1319 if (err < 0)
1320 goto tap_ops_failed;
1321
Pravin B Shelarc5441932013-03-25 14:49:35 +00001322 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001323
Herbert Xue1a80002008-10-09 12:00:17 -07001324tap_ops_failed:
1325 rtnl_link_unregister(&ipgre_link_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001326rtnl_link_failed:
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001327 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001328add_proto_failed:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001329 unregister_pernet_device(&ipgre_tap_net_ops);
1330pnet_tap_faied:
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001331 unregister_pernet_device(&ipgre_net_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001332 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001333}
1334
Alexey Kuznetsovdb445752005-07-30 17:46:44 -07001335static void __exit ipgre_fini(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001336{
Herbert Xue1a80002008-10-09 12:00:17 -07001337 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001338 rtnl_link_unregister(&ipgre_link_ops);
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001339 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001340 unregister_pernet_device(&ipgre_tap_net_ops);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001341 unregister_pernet_device(&ipgre_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001342}
1343
1344module_init(ipgre_init);
1345module_exit(ipgre_fini);
1346MODULE_LICENSE("GPL");
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001347MODULE_ALIAS_RTNL_LINK("gre");
1348MODULE_ALIAS_RTNL_LINK("gretap");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +03001349MODULE_ALIAS_NETDEV("gre0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001350MODULE_ALIAS_NETDEV("gretap0");