blob: af5d1f38217f4e4dcb977b6410d0d9a6a6c1e87c [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: GRE over IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Joe Perchesafd465032012-03-12 07:03:32 +000013#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14
Randy Dunlap4fc268d2006-01-11 12:17:47 -080015#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/module.h>
17#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090019#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <asm/uaccess.h>
21#include <linux/skbuff.h>
22#include <linux/netdevice.h>
23#include <linux/in.h>
24#include <linux/tcp.h>
25#include <linux/udp.h>
26#include <linux/if_arp.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070027#include <linux/if_vlan.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/init.h>
29#include <linux/in6.h>
30#include <linux/inetdevice.h>
31#include <linux/igmp.h>
32#include <linux/netfilter_ipv4.h>
Herbert Xue1a80002008-10-09 12:00:17 -070033#include <linux/etherdevice.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080034#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#include <net/sock.h>
37#include <net/ip.h>
38#include <net/icmp.h>
39#include <net/protocol.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000040#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/arp.h>
42#include <net/checksum.h>
43#include <net/dsfield.h>
44#include <net/inet_ecn.h>
45#include <net/xfrm.h>
Pavel Emelyanov59a4c752008-04-16 01:08:53 -070046#include <net/net_namespace.h>
47#include <net/netns/generic.h>
Herbert Xuc19e6542008-10-09 11:59:55 -070048#include <net/rtnetlink.h>
Dmitry Kozlov00959ad2010-08-21 23:05:39 -070049#include <net/gre.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070050#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
Eric Dumazetdfd56b82011-12-10 09:48:31 +000052#if IS_ENABLED(CONFIG_IPV6)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053#include <net/ipv6.h>
54#include <net/ip6_fib.h>
55#include <net/ip6_route.h>
56#endif
57
58/*
59 Problems & solutions
60 --------------------
61
62 1. The most important issue is detecting local dead loops.
63 They would cause complete host lockup in transmit, which
64 would be "resolved" by stack overflow or, if queueing is enabled,
65 with infinite looping in net_bh.
66
67 We cannot track such dead loops during route installation,
68 it is infeasible task. The most general solutions would be
69 to keep skb->encapsulation counter (sort of local ttl),
Eric Dumazet6d0722a2010-09-29 23:35:10 -070070 and silently drop packet when it expires. It is a good
stephen hemmingerbff52852012-02-24 08:08:20 +000071 solution, but it supposes maintaining new variable in ALL
Linus Torvalds1da177e2005-04-16 15:20:36 -070072 skb, even if no tunneling is used.
73
Eric Dumazet6d0722a2010-09-29 23:35:10 -070074 Current solution: xmit_recursion breaks dead loops. This is a percpu
75 counter, since when we enter the first ndo_xmit(), cpu migration is
76 forbidden. We force an exit if this counter reaches RECURSION_LIMIT
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78 2. Networking dead loops would not kill routers, but would really
79 kill network. IP hop limit plays role of "t->recursion" in this case,
80 if we copy it from packet being encapsulated to upper header.
81 It is very good solution, but it introduces two problems:
82
83 - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
84 do not work over tunnels.
85 - traceroute does not work. I planned to relay ICMP from tunnel,
86 so that this problem would be solved and traceroute output
     would be even more informative. This idea appeared to be wrong:
88 only Linux complies to rfc1812 now (yes, guys, Linux is the only
89 true router now :-)), all routers (at least, in neighbourhood of mine)
90 return only 8 bytes of payload. It is the end.
91
92 Hence, if we want that OSPF worked or traceroute said something reasonable,
93 we should search for another solution.
94
95 One of them is to parse packet trying to detect inner encapsulation
96 made by our node. It is difficult or even impossible, especially,
   taking into account fragmentation. To be short, TTL is not a solution at all.
Linus Torvalds1da177e2005-04-16 15:20:36 -070098
99 Current solution: The solution was UNEXPECTEDLY SIMPLE.
100 We force DF flag on tunnels with preconfigured hop limit,
101 that is ALL. :-) Well, it does not remove the problem completely,
102 but exponential growth of network traffic is changed to linear
103 (branches, that exceed pmtu are pruned) and tunnel mtu
stephen hemmingerbff52852012-02-24 08:08:20 +0000104 rapidly degrades to value <68, where looping stops.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 Yes, it is not good if there exists a router in the loop,
106 which does not force DF, even when encapsulating packets have DF set.
107 But it is not our problem! Nobody could accuse us, we made
108 all that we could make. Even if it is your gated who injected
109 fatal route to network, even if it were you who configured
110 fatal static route: you are innocent. :-)
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 Alexey Kuznetsov.
113 */
114
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000115static bool log_ecn_error = true;
116module_param(log_ecn_error, bool, 0644);
117MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
118
Herbert Xuc19e6542008-10-09 11:59:55 -0700119static struct rtnl_link_ops ipgre_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120static int ipgre_tunnel_init(struct net_device *dev);
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700121
Eric Dumazetf99189b2009-11-17 10:42:49 +0000122static int ipgre_net_id __read_mostly;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000123static int gre_tap_net_id __read_mostly;
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700124
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700125static int ip_gre_calc_hlen(__be16 o_flags)
126{
127 int addend = 4;
128
129 if (o_flags & TUNNEL_CSUM)
130 addend += 4;
131 if (o_flags & TUNNEL_KEY)
132 addend += 4;
133 if (o_flags & TUNNEL_SEQ)
134 addend += 4;
135 return addend;
136}
137
138static __be16 gre_flags_to_tnl_flags(__be16 flags)
139{
140 __be16 tflags = 0;
141
142 if (flags & GRE_CSUM)
143 tflags |= TUNNEL_CSUM;
144 if (flags & GRE_ROUTING)
145 tflags |= TUNNEL_ROUTING;
146 if (flags & GRE_KEY)
147 tflags |= TUNNEL_KEY;
148 if (flags & GRE_SEQ)
149 tflags |= TUNNEL_SEQ;
150 if (flags & GRE_STRICT)
151 tflags |= TUNNEL_STRICT;
152 if (flags & GRE_REC)
153 tflags |= TUNNEL_REC;
154 if (flags & GRE_VERSION)
155 tflags |= TUNNEL_VERSION;
156
157 return tflags;
158}
159
160static __be16 tnl_flags_to_gre_flags(__be16 tflags)
161{
162 __be16 flags = 0;
163
164 if (tflags & TUNNEL_CSUM)
165 flags |= GRE_CSUM;
166 if (tflags & TUNNEL_ROUTING)
167 flags |= GRE_ROUTING;
168 if (tflags & TUNNEL_KEY)
169 flags |= GRE_KEY;
170 if (tflags & TUNNEL_SEQ)
171 flags |= GRE_SEQ;
172 if (tflags & TUNNEL_STRICT)
173 flags |= GRE_STRICT;
174 if (tflags & TUNNEL_REC)
175 flags |= GRE_REC;
176 if (tflags & TUNNEL_VERSION)
177 flags |= GRE_VERSION;
178
179 return flags;
180}
181
182static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
183 bool *csum_err)
184{
185 const struct gre_base_hdr *greh;
186 __be32 *options;
187 int hdr_len;
188
189 if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
190 return -EINVAL;
191
192 greh = (struct gre_base_hdr *)skb_transport_header(skb);
193 if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
194 return -EINVAL;
195
196 tpi->flags = gre_flags_to_tnl_flags(greh->flags);
197 hdr_len = ip_gre_calc_hlen(tpi->flags);
198
199 if (!pskb_may_pull(skb, hdr_len))
200 return -EINVAL;
201
202 greh = (struct gre_base_hdr *)skb_transport_header(skb);
203 tpi->proto = greh->protocol;
204
205 options = (__be32 *)(greh + 1);
206 if (greh->flags & GRE_CSUM) {
207 if (skb_checksum_simple_validate(skb)) {
208 *csum_err = true;
209 return -EINVAL;
210 }
211
212 skb_checksum_try_convert(skb, IPPROTO_GRE, 0,
213 null_compute_pseudo);
214 options++;
215 }
216
217 if (greh->flags & GRE_KEY) {
218 tpi->key = *options;
219 options++;
220 } else {
221 tpi->key = 0;
222 }
223 if (unlikely(greh->flags & GRE_SEQ)) {
224 tpi->seq = *options;
225 options++;
226 } else {
227 tpi->seq = 0;
228 }
229 /* WCCP version 1 and 2 protocol decoding.
230 * - Change protocol to IP
231 * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
232 */
233 if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
234 tpi->proto = htons(ETH_P_IP);
235 if ((*(u8 *)options & 0xF0) != 0x40) {
236 hdr_len += 4;
237 if (!pskb_may_pull(skb, hdr_len))
238 return -EINVAL;
239 }
240 }
Jiri Benc7f290c92016-02-18 11:22:52 +0100241 return iptunnel_pull_header(skb, hdr_len, tpi->proto, false);
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700242}
243
244static void ipgre_err(struct sk_buff *skb, u32 info,
245 const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Pravin B Shelarc5441932013-03-25 14:49:35 +0000248 /* All the routers (except for Linux) return only
249 8 bytes of packet payload. It means, that precise relaying of
250 ICMP in the real Internet is absolutely infeasible.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Pravin B Shelarc5441932013-03-25 14:49:35 +0000252 Moreover, Cisco "wise men" put GRE key to the third word
253 in GRE header. It makes impossible maintaining even soft
254 state for keyed GRE tunnels with enabled checksum. Tell
255 them "thank you".
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256
Pravin B Shelarc5441932013-03-25 14:49:35 +0000257 Well, I wonder, rfc1812 was written by Cisco employee,
258 what the hell these idiots break standards established
259 by themselves???
260 */
261 struct net *net = dev_net(skb->dev);
262 struct ip_tunnel_net *itn;
Eric Dumazet96f5a842013-05-18 08:36:03 +0000263 const struct iphdr *iph;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300264 const int type = icmp_hdr(skb)->type;
265 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 struct ip_tunnel *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268 switch (type) {
269 default:
270 case ICMP_PARAMETERPROB:
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700271 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
273 case ICMP_DEST_UNREACH:
274 switch (code) {
275 case ICMP_SR_FAILED:
276 case ICMP_PORT_UNREACH:
277 /* Impossible event. */
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700278 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 default:
280 /* All others are translated to HOST_UNREACH.
281 rfc2003 contains "deep thoughts" about NET_UNREACH,
282 I believe they are just ether pollution. --ANK
283 */
284 break;
285 }
286 break;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 case ICMP_TIME_EXCEEDED:
289 if (code != ICMP_EXC_TTL)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700290 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700292
293 case ICMP_REDIRECT:
294 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 }
296
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700297 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000298 itn = net_generic(net, gre_tap_net_id);
299 else
300 itn = net_generic(net, ipgre_net_id);
301
Duan Jiongc0c0c502014-01-28 11:49:43 +0800302 iph = (const struct iphdr *)(icmp_hdr(skb) + 1);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700303 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
304 iph->daddr, iph->saddr, tpi->key);
stephen hemmingerd2083282012-09-24 18:12:23 +0000305
Ian Morris51456b22015-04-03 09:17:26 +0100306 if (!t)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700307 return;
David S. Miller36393392012-06-14 22:21:46 -0700308
David S. Miller36393392012-06-14 22:21:46 -0700309 if (t->parms.iph.daddr == 0 ||
Joe Perchesf97c1e02007-12-16 13:45:43 -0800310 ipv4_is_multicast(t->parms.iph.daddr))
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700311 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
313 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700314 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Wei Yongjunda6185d82009-02-24 23:34:48 -0800316 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317 t->err_count++;
318 else
319 t->err_count = 1;
320 t->err_time = jiffies;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700321}
322
323static void gre_err(struct sk_buff *skb, u32 info)
324{
325 /* All the routers (except for Linux) return only
326 * 8 bytes of packet payload. It means, that precise relaying of
327 * ICMP in the real Internet is absolutely infeasible.
328 *
329 * Moreover, Cisco "wise men" put GRE key to the third word
330 * in GRE header. It makes impossible maintaining even soft
331 * state for keyed
332 * GRE tunnels with enabled checksum. Tell them "thank you".
333 *
334 * Well, I wonder, rfc1812 was written by Cisco employee,
335 * what the hell these idiots break standards established
336 * by themselves???
337 */
338
339 const int type = icmp_hdr(skb)->type;
340 const int code = icmp_hdr(skb)->code;
341 struct tnl_ptk_info tpi;
342 bool csum_err = false;
343
344 if (parse_gre_header(skb, &tpi, &csum_err)) {
345 if (!csum_err) /* ignore csum errors. */
346 return;
347 }
348
349 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
350 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
351 skb->dev->ifindex, 0, IPPROTO_GRE, 0);
352 return;
353 }
354 if (type == ICMP_REDIRECT) {
355 ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
356 IPPROTO_GRE, 0);
357 return;
358 }
359
360 ipgre_err(skb, info, &tpi);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361}
362
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700363static __be64 key_to_tunnel_id(__be32 key)
364{
365#ifdef __BIG_ENDIAN
366 return (__force __be64)((__force u32)key);
367#else
368 return (__force __be64)((__force u64)key << 32);
369#endif
370}
371
372/* Returns the least-significant 32 bits of a __be64. */
373static __be32 tunnel_id_to_key(__be64 x)
374{
375#ifdef __BIG_ENDIAN
376 return (__force __be32)x;
377#else
378 return (__force __be32)((__force u64)x >> 32);
379#endif
380}
381
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700382static int ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000384 struct net *net = dev_net(skb->dev);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700385 struct metadata_dst *tun_dst = NULL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000386 struct ip_tunnel_net *itn;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000387 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388 struct ip_tunnel *tunnel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700390 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000391 itn = net_generic(net, gre_tap_net_id);
392 else
393 itn = net_generic(net, ipgre_net_id);
394
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700395 iph = ip_hdr(skb);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700396 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
397 iph->saddr, iph->daddr, tpi->key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
stephen hemmingerd2083282012-09-24 18:12:23 +0000399 if (tunnel) {
Timo Teräs0e3da5b2013-12-16 11:02:09 +0200400 skb_pop_mac_header(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700401 if (tunnel->collect_md) {
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700402 __be16 flags;
403 __be64 tun_id;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700404
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700405 flags = tpi->flags & (TUNNEL_CSUM | TUNNEL_KEY);
406 tun_id = key_to_tunnel_id(tpi->key);
407 tun_dst = ip_tun_rx_dst(skb, flags, tun_id, 0);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700408 if (!tun_dst)
409 return PACKET_REJECT;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700410 }
411
412 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700413 return PACKET_RCVD;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 }
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700415 return PACKET_REJECT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416}
417
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700418static int gre_rcv(struct sk_buff *skb)
419{
420 struct tnl_ptk_info tpi;
421 bool csum_err = false;
422
423#ifdef CONFIG_NET_IPGRE_BROADCAST
424 if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
425 /* Looped back packet, drop it! */
426 if (rt_is_output_route(skb_rtable(skb)))
427 goto drop;
428 }
429#endif
430
431 if (parse_gre_header(skb, &tpi, &csum_err) < 0)
432 goto drop;
433
434 if (ipgre_rcv(skb, &tpi) == PACKET_RCVD)
435 return 0;
436
437 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
438drop:
439 kfree_skb(skb);
440 return 0;
441}
442
Edward Cree53936102016-02-11 21:01:07 +0000443static __sum16 gre_checksum(struct sk_buff *skb)
444{
445 __wsum csum;
446
447 if (skb->ip_summed == CHECKSUM_PARTIAL)
448 csum = lco_csum(skb);
449 else
450 csum = skb_checksum(skb, 0, skb->len, 0);
451 return csum_fold(csum);
452}
453
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700454static void build_header(struct sk_buff *skb, int hdr_len, __be16 flags,
455 __be16 proto, __be32 key, __be32 seq)
456{
457 struct gre_base_hdr *greh;
458
459 skb_push(skb, hdr_len);
460
461 skb_reset_transport_header(skb);
462 greh = (struct gre_base_hdr *)skb->data;
463 greh->flags = tnl_flags_to_gre_flags(flags);
464 greh->protocol = proto;
465
466 if (flags & (TUNNEL_KEY | TUNNEL_CSUM | TUNNEL_SEQ)) {
467 __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
468
469 if (flags & TUNNEL_SEQ) {
470 *ptr = seq;
471 ptr--;
472 }
473 if (flags & TUNNEL_KEY) {
474 *ptr = key;
475 ptr--;
476 }
477 if (flags & TUNNEL_CSUM &&
478 !(skb_shinfo(skb)->gso_type &
479 (SKB_GSO_GRE | SKB_GSO_GRE_CSUM))) {
480 *ptr = 0;
Edward Cree53936102016-02-11 21:01:07 +0000481 *(__sum16 *)ptr = gre_checksum(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700482 }
483 }
484}
485
Pravin B Shelarc5441932013-03-25 14:49:35 +0000486static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
487 const struct iphdr *tnl_params,
488 __be16 proto)
489{
490 struct ip_tunnel *tunnel = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000491
Pravin B Shelarc5441932013-03-25 14:49:35 +0000492 if (tunnel->parms.o_flags & TUNNEL_SEQ)
493 tunnel->o_seqno++;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000494
Pravin B Shelarc5441932013-03-25 14:49:35 +0000495 /* Push GRE header. */
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700496 build_header(skb, tunnel->tun_hlen, tunnel->parms.o_flags,
497 proto, tunnel->parms.o_key, htonl(tunnel->o_seqno));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700499 skb_set_inner_protocol(skb, proto);
Nicolas Dichtelbf3d6a82013-05-27 23:48:15 +0000500 ip_tunnel_xmit(skb, dev, tnl_params, tnl_params->protocol);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501}
502
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700503static struct sk_buff *gre_handle_offloads(struct sk_buff *skb,
504 bool csum)
505{
Edward Cree6fa79662016-02-11 21:02:31 +0000506 return iptunnel_handle_offloads(skb, csum ? SKB_GSO_GRE_CSUM : SKB_GSO_GRE);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700507}
508
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700509static struct rtable *gre_get_rt(struct sk_buff *skb,
510 struct net_device *dev,
511 struct flowi4 *fl,
512 const struct ip_tunnel_key *key)
513{
514 struct net *net = dev_net(dev);
515
516 memset(fl, 0, sizeof(*fl));
517 fl->daddr = key->u.ipv4.dst;
518 fl->saddr = key->u.ipv4.src;
519 fl->flowi4_tos = RT_TOS(key->tos);
520 fl->flowi4_mark = skb->mark;
521 fl->flowi4_proto = IPPROTO_GRE;
522
523 return ip_route_output_key(net, fl);
524}
525
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700526static void gre_fb_xmit(struct sk_buff *skb, struct net_device *dev)
527{
528 struct ip_tunnel_info *tun_info;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700529 const struct ip_tunnel_key *key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100530 struct rtable *rt = NULL;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700531 struct flowi4 fl;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700532 int min_headroom;
533 int tunnel_hlen;
534 __be16 df, flags;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100535 bool use_cache;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700536 int err;
537
Jiri Benc61adedf2015-08-20 13:56:25 +0200538 tun_info = skb_tunnel_info(skb);
Jiri Benc7f9562a2015-08-28 20:48:20 +0200539 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
540 ip_tunnel_info_af(tun_info) != AF_INET))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700541 goto err_free_skb;
542
543 key = &tun_info->key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100544 use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
545 if (use_cache)
546 rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl.saddr);
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100547 if (!rt) {
548 rt = gre_get_rt(skb, dev, &fl, key);
549 if (IS_ERR(rt))
550 goto err_free_skb;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100551 if (use_cache)
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100552 dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
553 fl.saddr);
554 }
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700555
556 tunnel_hlen = ip_gre_calc_hlen(key->tun_flags);
557
558 min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len
559 + tunnel_hlen + sizeof(struct iphdr);
560 if (skb_headroom(skb) < min_headroom || skb_header_cloned(skb)) {
561 int head_delta = SKB_DATA_ALIGN(min_headroom -
562 skb_headroom(skb) +
563 16);
564 err = pskb_expand_head(skb, max_t(int, head_delta, 0),
565 0, GFP_ATOMIC);
566 if (unlikely(err))
567 goto err_free_rt;
568 }
569
570 /* Push Tunnel header. */
571 skb = gre_handle_offloads(skb, !!(tun_info->key.tun_flags & TUNNEL_CSUM));
572 if (IS_ERR(skb)) {
573 skb = NULL;
574 goto err_free_rt;
575 }
576
577 flags = tun_info->key.tun_flags & (TUNNEL_CSUM | TUNNEL_KEY);
578 build_header(skb, tunnel_hlen, flags, htons(ETH_P_TEB),
579 tunnel_id_to_key(tun_info->key.tun_id), 0);
580
581 df = key->tun_flags & TUNNEL_DONT_FRAGMENT ? htons(IP_DF) : 0;
Pravin B Shelar039f5062015-12-24 14:34:54 -0800582
583 iptunnel_xmit(skb->sk, rt, skb, fl.saddr, key->u.ipv4.dst, IPPROTO_GRE,
584 key->tos, key->ttl, df, false);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700585 return;
586
587err_free_rt:
588 ip_rt_put(rt);
589err_free_skb:
590 kfree_skb(skb);
591 dev->stats.tx_dropped++;
592}
593
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700594static int gre_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb)
595{
596 struct ip_tunnel_info *info = skb_tunnel_info(skb);
597 struct rtable *rt;
598 struct flowi4 fl4;
599
600 if (ip_tunnel_info_af(info) != AF_INET)
601 return -EINVAL;
602
603 rt = gre_get_rt(skb, dev, &fl4, &info->key);
604 if (IS_ERR(rt))
605 return PTR_ERR(rt);
606
607 ip_rt_put(rt);
608 info->key.u.ipv4.src = fl4.saddr;
609 return 0;
610}
611
Pravin B Shelarc5441932013-03-25 14:49:35 +0000612static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
613 struct net_device *dev)
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800614{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000615 struct ip_tunnel *tunnel = netdev_priv(dev);
616 const struct iphdr *tnl_params;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800617
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700618 if (tunnel->collect_md) {
619 gre_fb_xmit(skb, dev);
620 return NETDEV_TX_OK;
621 }
622
Pravin B Shelarc5441932013-03-25 14:49:35 +0000623 if (dev->header_ops) {
624 /* Need space for new headers */
625 if (skb_cow_head(skb, dev->needed_headroom -
Chen Gang2bac7cb2013-04-22 20:45:42 +0000626 (tunnel->hlen + sizeof(struct iphdr))))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000627 goto free_skb;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800628
Pravin B Shelarc5441932013-03-25 14:49:35 +0000629 tnl_params = (const struct iphdr *)skb->data;
Eric Dumazete985aad2010-09-27 03:57:11 +0000630
Pravin B Shelarc5441932013-03-25 14:49:35 +0000631 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
632 * to gre header.
633 */
634 skb_pull(skb, tunnel->hlen + sizeof(struct iphdr));
Timo Teräs8a0033a2014-12-15 09:24:13 +0200635 skb_reset_mac_header(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000636 } else {
637 if (skb_cow_head(skb, dev->needed_headroom))
638 goto free_skb;
Herbert Xue1a80002008-10-09 12:00:17 -0700639
Pravin B Shelarc5441932013-03-25 14:49:35 +0000640 tnl_params = &tunnel->parms.iph;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800641 }
642
Timo Teräs8a0033a2014-12-15 09:24:13 +0200643 skb = gre_handle_offloads(skb, !!(tunnel->parms.o_flags&TUNNEL_CSUM));
644 if (IS_ERR(skb))
645 goto out;
646
Pravin B Shelarc5441932013-03-25 14:49:35 +0000647 __gre_xmit(skb, dev, tnl_params, skb->protocol);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000648 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800649
Pravin B Shelarc5441932013-03-25 14:49:35 +0000650free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800651 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000652out:
653 dev->stats.tx_dropped++;
654 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800655}
656
Pravin B Shelarc5441932013-03-25 14:49:35 +0000657static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
658 struct net_device *dev)
659{
660 struct ip_tunnel *tunnel = netdev_priv(dev);
661
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700662 if (tunnel->collect_md) {
663 gre_fb_xmit(skb, dev);
664 return NETDEV_TX_OK;
665 }
666
Pravin B Shelar45f2e992013-06-17 17:49:51 -0700667 skb = gre_handle_offloads(skb, !!(tunnel->parms.o_flags&TUNNEL_CSUM));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000668 if (IS_ERR(skb))
669 goto out;
670
671 if (skb_cow_head(skb, dev->needed_headroom))
672 goto free_skb;
673
674 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000675 return NETDEV_TX_OK;
676
677free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800678 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000679out:
680 dev->stats.tx_dropped++;
681 return NETDEV_TX_OK;
682}
683
684static int ipgre_tunnel_ioctl(struct net_device *dev,
685 struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700686{
Tom Herbert4565e992014-09-17 12:26:01 -0700687 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689
Pravin B Shelarc5441932013-03-25 14:49:35 +0000690 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
691 return -EFAULT;
Cong Wang6c734fb2013-06-29 12:02:59 +0800692 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
693 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_GRE ||
694 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)) ||
695 ((p.i_flags|p.o_flags)&(GRE_VERSION|GRE_ROUTING)))
696 return -EINVAL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000697 }
698 p.i_flags = gre_flags_to_tnl_flags(p.i_flags);
699 p.o_flags = gre_flags_to_tnl_flags(p.o_flags);
700
701 err = ip_tunnel_ioctl(dev, &p, cmd);
702 if (err)
703 return err;
704
705 p.i_flags = tnl_flags_to_gre_flags(p.i_flags);
706 p.o_flags = tnl_flags_to_gre_flags(p.o_flags);
707
708 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
709 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 return 0;
711}
712
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713/* Nice toy. Unfortunately, useless in real life :-)
714 It allows to construct virtual multiprotocol broadcast "LAN"
715 over the Internet, provided multicast routing is tuned.
716
717
718 I have no idea was this bicycle invented before me,
719 so that I had to set ARPHRD_IPGRE to a random value.
720 I have an impression, that Cisco could make something similar,
721 but this feature is apparently missing in IOS<=11.2(8).
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900722
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
724 with broadcast 224.66.66.66. If you have access to mbone, play with me :-)
725
726 ping -t 255 224.66.66.66
727
728 If nobody answers, mbone does not work.
729
730 ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
731 ip addr add 10.66.66.<somewhat>/24 dev Universe
732 ifconfig Universe up
733 ifconfig Universe add fe80::<Your_real_addr>/10
734 ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
735 ftp 10.66.66.66
736 ...
737 ftp fec0:6666:6666::193.233.7.65
738 ...
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739 */
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700740static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
741 unsigned short type,
Eric Dumazet15078502010-09-15 11:07:53 +0000742 const void *daddr, const void *saddr, unsigned int len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743{
Patrick McHardy2941a482006-01-08 22:05:26 -0800744 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000745 struct iphdr *iph;
746 struct gre_base_hdr *greh;
747
748 iph = (struct iphdr *)skb_push(skb, t->hlen + sizeof(*iph));
749 greh = (struct gre_base_hdr *)(iph+1);
750 greh->flags = tnl_flags_to_gre_flags(t->parms.o_flags);
751 greh->protocol = htons(type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752
753 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754
Pravin B Shelarc5441932013-03-25 14:49:35 +0000755 /* Set the source hardware address. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756 if (saddr)
757 memcpy(&iph->saddr, saddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000758 if (daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 memcpy(&iph->daddr, daddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000760 if (iph->daddr)
Timo Teräs77a482b2013-08-06 13:45:43 +0300761 return t->hlen + sizeof(*iph);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900762
Pravin B Shelarc5441932013-03-25 14:49:35 +0000763 return -(t->hlen + sizeof(*iph));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764}
765
Timo Teras6a5f44d2007-10-23 20:31:53 -0700766static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
767{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000768 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
Timo Teras6a5f44d2007-10-23 20:31:53 -0700769 memcpy(haddr, &iph->saddr, 4);
770 return 4;
771}
772
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700773static const struct header_ops ipgre_header_ops = {
774 .create = ipgre_header,
Timo Teras6a5f44d2007-10-23 20:31:53 -0700775 .parse = ipgre_header_parse,
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700776};
777
Timo Teras6a5f44d2007-10-23 20:31:53 -0700778#ifdef CONFIG_NET_IPGRE_BROADCAST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779static int ipgre_open(struct net_device *dev)
780{
Patrick McHardy2941a482006-01-08 22:05:26 -0800781 struct ip_tunnel *t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782
Joe Perchesf97c1e02007-12-16 13:45:43 -0800783 if (ipv4_is_multicast(t->parms.iph.daddr)) {
David S. Millercbb1e852011-05-04 12:33:34 -0700784 struct flowi4 fl4;
785 struct rtable *rt;
Eric Dumazete985aad2010-09-27 03:57:11 +0000786
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200787 rt = ip_route_output_gre(t->net, &fl4,
David S. Millercbb1e852011-05-04 12:33:34 -0700788 t->parms.iph.daddr,
789 t->parms.iph.saddr,
790 t->parms.o_key,
791 RT_TOS(t->parms.iph.tos),
792 t->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800793 if (IS_ERR(rt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700794 return -EADDRNOTAVAIL;
Changli Gaod8d1f302010-06-10 23:31:35 -0700795 dev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796 ip_rt_put(rt);
Ian Morris51456b22015-04-03 09:17:26 +0100797 if (!__in_dev_get_rtnl(dev))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798 return -EADDRNOTAVAIL;
799 t->mlink = dev->ifindex;
Herbert Xue5ed6392005-10-03 14:35:55 -0700800 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700801 }
802 return 0;
803}
804
805static int ipgre_close(struct net_device *dev)
806{
Patrick McHardy2941a482006-01-08 22:05:26 -0800807 struct ip_tunnel *t = netdev_priv(dev);
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800808
Joe Perchesf97c1e02007-12-16 13:45:43 -0800809 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800810 struct in_device *in_dev;
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200811 in_dev = inetdev_by_index(t->net, t->mlink);
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000812 if (in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814 }
815 return 0;
816}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817#endif
818
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800819static const struct net_device_ops ipgre_netdev_ops = {
820 .ndo_init = ipgre_tunnel_init,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000821 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800822#ifdef CONFIG_NET_IPGRE_BROADCAST
823 .ndo_open = ipgre_open,
824 .ndo_stop = ipgre_close,
825#endif
Pravin B Shelarc5441932013-03-25 14:49:35 +0000826 .ndo_start_xmit = ipgre_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800827 .ndo_do_ioctl = ipgre_tunnel_ioctl,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000828 .ndo_change_mtu = ip_tunnel_change_mtu,
829 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200830 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800831};
832
/* Feature bits that __gre_tunnel_init() sets in both dev->features and
 * dev->hw_features.
 */
#define GRE_FEATURES	(NETIF_F_HW_CSUM | NETIF_F_HIGHDMA | \
			 NETIF_F_FRAGLIST | NETIF_F_SG)
837
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838static void ipgre_tunnel_setup(struct net_device *dev)
839{
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800840 dev->netdev_ops = &ipgre_netdev_ops;
Nicolas Dichtel5a455272014-04-11 15:51:18 +0200841 dev->type = ARPHRD_IPGRE;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000842 ip_tunnel_setup(dev, ipgre_net_id);
843}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844
Pravin B Shelarc5441932013-03-25 14:49:35 +0000845static void __gre_tunnel_init(struct net_device *dev)
846{
847 struct ip_tunnel *tunnel;
Tom Herbert4565e992014-09-17 12:26:01 -0700848 int t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000849
850 tunnel = netdev_priv(dev);
Tom Herbert4565e992014-09-17 12:26:01 -0700851 tunnel->tun_hlen = ip_gre_calc_hlen(tunnel->parms.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000852 tunnel->parms.iph.protocol = IPPROTO_GRE;
853
Tom Herbert4565e992014-09-17 12:26:01 -0700854 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
855
856 t_hlen = tunnel->hlen + sizeof(struct iphdr);
857
858 dev->needed_headroom = LL_MAX_HEADER + t_hlen + 4;
859 dev->mtu = ETH_DATA_LEN - t_hlen - 4;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000860
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200861 dev->features |= GRE_FEATURES;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000862 dev->hw_features |= GRE_FEATURES;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000863
864 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
Alexander Duycka0ca1532016-04-05 09:13:39 -0700865 /* TCP offload with GRE SEQ is not supported, nor
866 * can we support 2 levels of outer headers requiring
867 * an update.
868 */
869 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
870 (tunnel->encap.type == TUNNEL_ENCAP_NONE)) {
871 dev->features |= NETIF_F_GSO_SOFTWARE;
872 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
873 }
874
Pravin B Shelarc5441932013-03-25 14:49:35 +0000875 /* Can use a lockless transmit, unless we generate
876 * output sequences
877 */
878 dev->features |= NETIF_F_LLTX;
879 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880}
881
882static int ipgre_tunnel_init(struct net_device *dev)
883{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000884 struct ip_tunnel *tunnel = netdev_priv(dev);
885 struct iphdr *iph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700886
Pravin B Shelarc5441932013-03-25 14:49:35 +0000887 __gre_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700888
Pravin B Shelarc5441932013-03-25 14:49:35 +0000889 memcpy(dev->dev_addr, &iph->saddr, 4);
890 memcpy(dev->broadcast, &iph->daddr, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891
Pravin B Shelarc5441932013-03-25 14:49:35 +0000892 dev->flags = IFF_NOARP;
Eric Dumazet02875872014-10-05 18:38:35 -0700893 netif_keep_dst(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000894 dev->addr_len = 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
Linus Torvalds1da177e2005-04-16 15:20:36 -0700896 if (iph->daddr) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897#ifdef CONFIG_NET_IPGRE_BROADCAST
Joe Perchesf97c1e02007-12-16 13:45:43 -0800898 if (ipv4_is_multicast(iph->daddr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700899 if (!iph->saddr)
900 return -EINVAL;
901 dev->flags = IFF_BROADCAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700902 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700903 }
904#endif
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800905 } else
Timo Teras6a5f44d2007-10-23 20:31:53 -0700906 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700907
Pravin B Shelarc5441932013-03-25 14:49:35 +0000908 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700909}
910
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700911static const struct gre_protocol ipgre_protocol = {
912 .handler = gre_rcv,
913 .err_handler = gre_err,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914};
915
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000916static int __net_init ipgre_init_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700917{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000918 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700919}
920
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000921static void __net_exit ipgre_exit_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700922{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000923 struct ip_tunnel_net *itn = net_generic(net, ipgre_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200924 ip_tunnel_delete_net(itn, &ipgre_link_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700925}
926
927static struct pernet_operations ipgre_net_ops = {
928 .init = ipgre_init_net,
929 .exit = ipgre_exit_net,
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000930 .id = &ipgre_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000931 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700932};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933
Herbert Xuc19e6542008-10-09 11:59:55 -0700934static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
935{
936 __be16 flags;
937
938 if (!data)
939 return 0;
940
941 flags = 0;
942 if (data[IFLA_GRE_IFLAGS])
943 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
944 if (data[IFLA_GRE_OFLAGS])
945 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
946 if (flags & (GRE_VERSION|GRE_ROUTING))
947 return -EINVAL;
948
949 return 0;
950}
951
Herbert Xue1a80002008-10-09 12:00:17 -0700952static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[])
953{
954 __be32 daddr;
955
956 if (tb[IFLA_ADDRESS]) {
957 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
958 return -EINVAL;
959 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
960 return -EADDRNOTAVAIL;
961 }
962
963 if (!data)
964 goto out;
965
966 if (data[IFLA_GRE_REMOTE]) {
967 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
968 if (!daddr)
969 return -EINVAL;
970 }
971
972out:
973 return ipgre_tunnel_validate(tb, data);
974}
975
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700976static void ipgre_netlink_parms(struct net_device *dev,
977 struct nlattr *data[],
978 struct nlattr *tb[],
979 struct ip_tunnel_parm *parms)
Herbert Xuc19e6542008-10-09 11:59:55 -0700980{
Herbert Xu7bb82d92008-10-11 12:20:15 -0700981 memset(parms, 0, sizeof(*parms));
Herbert Xuc19e6542008-10-09 11:59:55 -0700982
983 parms->iph.protocol = IPPROTO_GRE;
984
985 if (!data)
986 return;
987
988 if (data[IFLA_GRE_LINK])
989 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
990
991 if (data[IFLA_GRE_IFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000992 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700993
994 if (data[IFLA_GRE_OFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000995 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700996
997 if (data[IFLA_GRE_IKEY])
998 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
999
1000 if (data[IFLA_GRE_OKEY])
1001 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
1002
1003 if (data[IFLA_GRE_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +02001004 parms->iph.saddr = nla_get_in_addr(data[IFLA_GRE_LOCAL]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001005
1006 if (data[IFLA_GRE_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +02001007 parms->iph.daddr = nla_get_in_addr(data[IFLA_GRE_REMOTE]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001008
1009 if (data[IFLA_GRE_TTL])
1010 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
1011
1012 if (data[IFLA_GRE_TOS])
1013 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
1014
1015 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC]))
1016 parms->iph.frag_off = htons(IP_DF);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001017
1018 if (data[IFLA_GRE_COLLECT_METADATA]) {
1019 struct ip_tunnel *t = netdev_priv(dev);
1020
1021 t->collect_md = true;
1022 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001023}
1024
Tom Herbert4565e992014-09-17 12:26:01 -07001025/* This function returns true when ENCAP attributes are present in the nl msg */
1026static bool ipgre_netlink_encap_parms(struct nlattr *data[],
1027 struct ip_tunnel_encap *ipencap)
1028{
1029 bool ret = false;
1030
1031 memset(ipencap, 0, sizeof(*ipencap));
1032
1033 if (!data)
1034 return ret;
1035
1036 if (data[IFLA_GRE_ENCAP_TYPE]) {
1037 ret = true;
1038 ipencap->type = nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]);
1039 }
1040
1041 if (data[IFLA_GRE_ENCAP_FLAGS]) {
1042 ret = true;
1043 ipencap->flags = nla_get_u16(data[IFLA_GRE_ENCAP_FLAGS]);
1044 }
1045
1046 if (data[IFLA_GRE_ENCAP_SPORT]) {
1047 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001048 ipencap->sport = nla_get_be16(data[IFLA_GRE_ENCAP_SPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001049 }
1050
1051 if (data[IFLA_GRE_ENCAP_DPORT]) {
1052 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001053 ipencap->dport = nla_get_be16(data[IFLA_GRE_ENCAP_DPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001054 }
1055
1056 return ret;
1057}
1058
Pravin B Shelarc5441932013-03-25 14:49:35 +00001059static int gre_tap_init(struct net_device *dev)
Herbert Xue1a80002008-10-09 12:00:17 -07001060{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001061 __gre_tunnel_init(dev);
stephen hemmingerbec94d42014-12-27 10:01:42 -08001062 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Herbert Xue1a80002008-10-09 12:00:17 -07001063
Pravin B Shelarc5441932013-03-25 14:49:35 +00001064 return ip_tunnel_init(dev);
Herbert Xue1a80002008-10-09 12:00:17 -07001065}
1066
Pravin B Shelarc5441932013-03-25 14:49:35 +00001067static const struct net_device_ops gre_tap_netdev_ops = {
1068 .ndo_init = gre_tap_init,
1069 .ndo_uninit = ip_tunnel_uninit,
1070 .ndo_start_xmit = gre_tap_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001071 .ndo_set_mac_address = eth_mac_addr,
1072 .ndo_validate_addr = eth_validate_addr,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001073 .ndo_change_mtu = ip_tunnel_change_mtu,
1074 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +02001075 .ndo_get_iflink = ip_tunnel_get_iflink,
Pravin B Shelarfc4099f2015-10-22 18:17:16 -07001076 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001077};
1078
Herbert Xue1a80002008-10-09 12:00:17 -07001079static void ipgre_tap_setup(struct net_device *dev)
1080{
Herbert Xue1a80002008-10-09 12:00:17 -07001081 ether_setup(dev);
Jiri Bencd13b1612016-02-17 15:32:53 +01001082 dev->netdev_ops = &gre_tap_netdev_ops;
1083 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1084 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001085 ip_tunnel_setup(dev, gre_tap_net_id);
Herbert Xue1a80002008-10-09 12:00:17 -07001086}
1087
Pravin B Shelarc5441932013-03-25 14:49:35 +00001088static int ipgre_newlink(struct net *src_net, struct net_device *dev,
1089 struct nlattr *tb[], struct nlattr *data[])
Herbert Xuc19e6542008-10-09 11:59:55 -07001090{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001091 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001092 struct ip_tunnel_encap ipencap;
1093
1094 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1095 struct ip_tunnel *t = netdev_priv(dev);
1096 int err = ip_tunnel_encap_setup(t, &ipencap);
1097
1098 if (err < 0)
1099 return err;
1100 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001101
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001102 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001103 return ip_tunnel_newlink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001104}
1105
1106static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
1107 struct nlattr *data[])
1108{
Herbert Xuc19e6542008-10-09 11:59:55 -07001109 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001110 struct ip_tunnel_encap ipencap;
1111
1112 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1113 struct ip_tunnel *t = netdev_priv(dev);
1114 int err = ip_tunnel_encap_setup(t, &ipencap);
1115
1116 if (err < 0)
1117 return err;
1118 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001119
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001120 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001121 return ip_tunnel_changelink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001122}
1123
1124static size_t ipgre_get_size(const struct net_device *dev)
1125{
1126 return
1127 /* IFLA_GRE_LINK */
1128 nla_total_size(4) +
1129 /* IFLA_GRE_IFLAGS */
1130 nla_total_size(2) +
1131 /* IFLA_GRE_OFLAGS */
1132 nla_total_size(2) +
1133 /* IFLA_GRE_IKEY */
1134 nla_total_size(4) +
1135 /* IFLA_GRE_OKEY */
1136 nla_total_size(4) +
1137 /* IFLA_GRE_LOCAL */
1138 nla_total_size(4) +
1139 /* IFLA_GRE_REMOTE */
1140 nla_total_size(4) +
1141 /* IFLA_GRE_TTL */
1142 nla_total_size(1) +
1143 /* IFLA_GRE_TOS */
1144 nla_total_size(1) +
1145 /* IFLA_GRE_PMTUDISC */
1146 nla_total_size(1) +
Tom Herbert4565e992014-09-17 12:26:01 -07001147 /* IFLA_GRE_ENCAP_TYPE */
1148 nla_total_size(2) +
1149 /* IFLA_GRE_ENCAP_FLAGS */
1150 nla_total_size(2) +
1151 /* IFLA_GRE_ENCAP_SPORT */
1152 nla_total_size(2) +
1153 /* IFLA_GRE_ENCAP_DPORT */
1154 nla_total_size(2) +
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001155 /* IFLA_GRE_COLLECT_METADATA */
1156 nla_total_size(0) +
Herbert Xuc19e6542008-10-09 11:59:55 -07001157 0;
1158}
1159
1160static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
1161{
1162 struct ip_tunnel *t = netdev_priv(dev);
1163 struct ip_tunnel_parm *p = &t->parms;
1164
David S. Millerf3756b72012-04-01 20:39:02 -04001165 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
Pravin B Shelarc5441932013-03-25 14:49:35 +00001166 nla_put_be16(skb, IFLA_GRE_IFLAGS, tnl_flags_to_gre_flags(p->i_flags)) ||
1167 nla_put_be16(skb, IFLA_GRE_OFLAGS, tnl_flags_to_gre_flags(p->o_flags)) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001168 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
1169 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
Jiri Benc930345e2015-03-29 16:59:25 +02001170 nla_put_in_addr(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
1171 nla_put_in_addr(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001172 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
1173 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
1174 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
1175 !!(p->iph.frag_off & htons(IP_DF))))
1176 goto nla_put_failure;
Tom Herbert4565e992014-09-17 12:26:01 -07001177
1178 if (nla_put_u16(skb, IFLA_GRE_ENCAP_TYPE,
1179 t->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001180 nla_put_be16(skb, IFLA_GRE_ENCAP_SPORT,
1181 t->encap.sport) ||
1182 nla_put_be16(skb, IFLA_GRE_ENCAP_DPORT,
1183 t->encap.dport) ||
Tom Herbert4565e992014-09-17 12:26:01 -07001184 nla_put_u16(skb, IFLA_GRE_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -08001185 t->encap.flags))
Tom Herbert4565e992014-09-17 12:26:01 -07001186 goto nla_put_failure;
1187
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001188 if (t->collect_md) {
1189 if (nla_put_flag(skb, IFLA_GRE_COLLECT_METADATA))
1190 goto nla_put_failure;
1191 }
1192
Herbert Xuc19e6542008-10-09 11:59:55 -07001193 return 0;
1194
1195nla_put_failure:
1196 return -EMSGSIZE;
1197}
1198
1199static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
1200 [IFLA_GRE_LINK] = { .type = NLA_U32 },
1201 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
1202 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
1203 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
1204 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001205 [IFLA_GRE_LOCAL] = { .len = FIELD_SIZEOF(struct iphdr, saddr) },
1206 [IFLA_GRE_REMOTE] = { .len = FIELD_SIZEOF(struct iphdr, daddr) },
Herbert Xuc19e6542008-10-09 11:59:55 -07001207 [IFLA_GRE_TTL] = { .type = NLA_U8 },
1208 [IFLA_GRE_TOS] = { .type = NLA_U8 },
1209 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert4565e992014-09-17 12:26:01 -07001210 [IFLA_GRE_ENCAP_TYPE] = { .type = NLA_U16 },
1211 [IFLA_GRE_ENCAP_FLAGS] = { .type = NLA_U16 },
1212 [IFLA_GRE_ENCAP_SPORT] = { .type = NLA_U16 },
1213 [IFLA_GRE_ENCAP_DPORT] = { .type = NLA_U16 },
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001214 [IFLA_GRE_COLLECT_METADATA] = { .type = NLA_FLAG },
Herbert Xuc19e6542008-10-09 11:59:55 -07001215};
1216
1217static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
1218 .kind = "gre",
1219 .maxtype = IFLA_GRE_MAX,
1220 .policy = ipgre_policy,
1221 .priv_size = sizeof(struct ip_tunnel),
1222 .setup = ipgre_tunnel_setup,
1223 .validate = ipgre_tunnel_validate,
1224 .newlink = ipgre_newlink,
1225 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001226 .dellink = ip_tunnel_dellink,
Herbert Xuc19e6542008-10-09 11:59:55 -07001227 .get_size = ipgre_get_size,
1228 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001229 .get_link_net = ip_tunnel_get_link_net,
Herbert Xuc19e6542008-10-09 11:59:55 -07001230};
1231
Herbert Xue1a80002008-10-09 12:00:17 -07001232static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
1233 .kind = "gretap",
1234 .maxtype = IFLA_GRE_MAX,
1235 .policy = ipgre_policy,
1236 .priv_size = sizeof(struct ip_tunnel),
1237 .setup = ipgre_tap_setup,
1238 .validate = ipgre_tap_validate,
1239 .newlink = ipgre_newlink,
1240 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001241 .dellink = ip_tunnel_dellink,
Herbert Xue1a80002008-10-09 12:00:17 -07001242 .get_size = ipgre_get_size,
1243 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001244 .get_link_net = ip_tunnel_get_link_net,
Herbert Xue1a80002008-10-09 12:00:17 -07001245};
1246
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001247struct net_device *gretap_fb_dev_create(struct net *net, const char *name,
1248 u8 name_assign_type)
1249{
1250 struct nlattr *tb[IFLA_MAX + 1];
1251 struct net_device *dev;
1252 struct ip_tunnel *t;
1253 int err;
1254
1255 memset(&tb, 0, sizeof(tb));
1256
1257 dev = rtnl_create_link(net, name, name_assign_type,
1258 &ipgre_tap_ops, tb);
1259 if (IS_ERR(dev))
1260 return dev;
1261
1262 /* Configure flow based GRE device. */
1263 t = netdev_priv(dev);
1264 t->collect_md = true;
1265
1266 err = ipgre_newlink(net, dev, tb, NULL);
1267 if (err < 0)
1268 goto out;
David Wragg7e059152016-02-10 00:05:58 +00001269
1270 /* openvswitch users expect packet sizes to be unrestricted,
1271 * so set the largest MTU we can.
1272 */
1273 err = __ip_tunnel_change_mtu(dev, IP_MAX_MTU, false);
1274 if (err)
1275 goto out;
1276
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001277 return dev;
1278out:
1279 free_netdev(dev);
1280 return ERR_PTR(err);
1281}
1282EXPORT_SYMBOL_GPL(gretap_fb_dev_create);
1283
Pravin B Shelarc5441932013-03-25 14:49:35 +00001284static int __net_init ipgre_tap_init_net(struct net *net)
1285{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001286 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, "gretap0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001287}
1288
1289static void __net_exit ipgre_tap_exit_net(struct net *net)
1290{
1291 struct ip_tunnel_net *itn = net_generic(net, gre_tap_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001292 ip_tunnel_delete_net(itn, &ipgre_tap_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001293}
1294
1295static struct pernet_operations ipgre_tap_net_ops = {
1296 .init = ipgre_tap_init_net,
1297 .exit = ipgre_tap_exit_net,
1298 .id = &gre_tap_net_id,
1299 .size = sizeof(struct ip_tunnel_net),
1300};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301
1302static int __init ipgre_init(void)
1303{
1304 int err;
1305
Joe Perches058bd4d2012-03-11 18:36:11 +00001306 pr_info("GRE over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001307
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +00001308 err = register_pernet_device(&ipgre_net_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -07001309 if (err < 0)
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001310 return err;
1311
Pravin B Shelarc5441932013-03-25 14:49:35 +00001312 err = register_pernet_device(&ipgre_tap_net_ops);
1313 if (err < 0)
1314 goto pnet_tap_faied;
1315
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001316 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001317 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +00001318 pr_info("%s: can't add protocol\n", __func__);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001319 goto add_proto_failed;
1320 }
Pavel Emelyanov7daa0002008-04-16 01:10:05 -07001321
Herbert Xuc19e6542008-10-09 11:59:55 -07001322 err = rtnl_link_register(&ipgre_link_ops);
1323 if (err < 0)
1324 goto rtnl_link_failed;
1325
Herbert Xue1a80002008-10-09 12:00:17 -07001326 err = rtnl_link_register(&ipgre_tap_ops);
1327 if (err < 0)
1328 goto tap_ops_failed;
1329
Pravin B Shelarc5441932013-03-25 14:49:35 +00001330 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001331
Herbert Xue1a80002008-10-09 12:00:17 -07001332tap_ops_failed:
1333 rtnl_link_unregister(&ipgre_link_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001334rtnl_link_failed:
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001335 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001336add_proto_failed:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001337 unregister_pernet_device(&ipgre_tap_net_ops);
1338pnet_tap_faied:
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001339 unregister_pernet_device(&ipgre_net_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001340 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001341}
1342
Alexey Kuznetsovdb445752005-07-30 17:46:44 -07001343static void __exit ipgre_fini(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344{
Herbert Xue1a80002008-10-09 12:00:17 -07001345 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001346 rtnl_link_unregister(&ipgre_link_ops);
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001347 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001348 unregister_pernet_device(&ipgre_tap_net_ops);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001349 unregister_pernet_device(&ipgre_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001350}
1351
1352module_init(ipgre_init);
1353module_exit(ipgre_fini);
1354MODULE_LICENSE("GPL");
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001355MODULE_ALIAS_RTNL_LINK("gre");
1356MODULE_ALIAS_RTNL_LINK("gretap");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +03001357MODULE_ALIAS_NETDEV("gre0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001358MODULE_ALIAS_NETDEV("gretap0");