blob: d0abde4236af48ce1b655d12da71303f36da1e02 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: GRE over IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Joe Perchesafd465032012-03-12 07:03:32 +000013#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14
Randy Dunlap4fc268d2006-01-11 12:17:47 -080015#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/module.h>
17#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090019#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <asm/uaccess.h>
21#include <linux/skbuff.h>
22#include <linux/netdevice.h>
23#include <linux/in.h>
24#include <linux/tcp.h>
25#include <linux/udp.h>
26#include <linux/if_arp.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070027#include <linux/if_vlan.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/init.h>
29#include <linux/in6.h>
30#include <linux/inetdevice.h>
31#include <linux/igmp.h>
32#include <linux/netfilter_ipv4.h>
Herbert Xue1a80002008-10-09 12:00:17 -070033#include <linux/etherdevice.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080034#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#include <net/sock.h>
37#include <net/ip.h>
38#include <net/icmp.h>
39#include <net/protocol.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000040#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/arp.h>
42#include <net/checksum.h>
43#include <net/dsfield.h>
44#include <net/inet_ecn.h>
45#include <net/xfrm.h>
Pavel Emelyanov59a4c752008-04-16 01:08:53 -070046#include <net/net_namespace.h>
47#include <net/netns/generic.h>
Herbert Xuc19e6542008-10-09 11:59:55 -070048#include <net/rtnetlink.h>
Dmitry Kozlov00959ad2010-08-21 23:05:39 -070049#include <net/gre.h>
Pravin B Shelar2e15ea32015-08-07 23:51:42 -070050#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
Eric Dumazetdfd56b82011-12-10 09:48:31 +000052#if IS_ENABLED(CONFIG_IPV6)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053#include <net/ipv6.h>
54#include <net/ip6_fib.h>
55#include <net/ip6_route.h>
56#endif
57
58/*
59 Problems & solutions
60 --------------------
61
62 1. The most important issue is detecting local dead loops.
63 They would cause complete host lockup in transmit, which
64 would be "resolved" by stack overflow or, if queueing is enabled,
65 with infinite looping in net_bh.
66
67 We cannot track such dead loops during route installation,
68 it is infeasible task. The most general solutions would be
69 to keep skb->encapsulation counter (sort of local ttl),
Eric Dumazet6d0722a2010-09-29 23:35:10 -070070 and silently drop packet when it expires. It is a good
stephen hemmingerbff52852012-02-24 08:08:20 +000071 solution, but it supposes maintaining new variable in ALL
Linus Torvalds1da177e2005-04-16 15:20:36 -070072 skb, even if no tunneling is used.
73
Eric Dumazet6d0722a2010-09-29 23:35:10 -070074 Current solution: xmit_recursion breaks dead loops. This is a percpu
75 counter, since when we enter the first ndo_xmit(), cpu migration is
76 forbidden. We force an exit if this counter reaches RECURSION_LIMIT
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78 2. Networking dead loops would not kill routers, but would really
79 kill network. IP hop limit plays role of "t->recursion" in this case,
80 if we copy it from packet being encapsulated to upper header.
81 It is very good solution, but it introduces two problems:
82
83 - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
84 do not work over tunnels.
85 - traceroute does not work. I planned to relay ICMP from tunnel,
86 so that this problem would be solved and traceroute output
87 would be even more informative. This idea appeared to be wrong:
88 only Linux complies to rfc1812 now (yes, guys, Linux is the only
89 true router now :-)), all routers (at least, in neighbourhood of mine)
90 return only 8 bytes of payload. It is the end.
91
92 Hence, if we want that OSPF worked or traceroute said something reasonable,
93 we should search for another solution.
94
95 One of them is to parse packet trying to detect inner encapsulation
96 made by our node. It is difficult or even impossible, especially,
stephen hemmingerbff52852012-02-24 08:08:20 +000097 taking into account fragmentation. To be short, ttl is not a solution at all.
Linus Torvalds1da177e2005-04-16 15:20:36 -070098
99 Current solution: The solution was UNEXPECTEDLY SIMPLE.
100 We force DF flag on tunnels with preconfigured hop limit,
101 that is ALL. :-) Well, it does not remove the problem completely,
102 but exponential growth of network traffic is changed to linear
103 (branches, that exceed pmtu are pruned) and tunnel mtu
stephen hemmingerbff52852012-02-24 08:08:20 +0000104 rapidly degrades to value <68, where looping stops.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 Yes, it is not good if there exists a router in the loop,
106 which does not force DF, even when encapsulating packets have DF set.
107 But it is not our problem! Nobody could accuse us, we made
108 all that we could make. Even if it is your gated who injected
109 fatal route to network, even if it were you who configured
110 fatal static route: you are innocent. :-)
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 Alexey Kuznetsov.
113 */
114
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000115static bool log_ecn_error = true;
116module_param(log_ecn_error, bool, 0644);
117MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
118
Herbert Xuc19e6542008-10-09 11:59:55 -0700119static struct rtnl_link_ops ipgre_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120static int ipgre_tunnel_init(struct net_device *dev);
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700121
Eric Dumazetf99189b2009-11-17 10:42:49 +0000122static int ipgre_net_id __read_mostly;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000123static int gre_tap_net_id __read_mostly;
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700124
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700125static int ip_gre_calc_hlen(__be16 o_flags)
126{
127 int addend = 4;
128
129 if (o_flags & TUNNEL_CSUM)
130 addend += 4;
131 if (o_flags & TUNNEL_KEY)
132 addend += 4;
133 if (o_flags & TUNNEL_SEQ)
134 addend += 4;
135 return addend;
136}
137
138static __be16 gre_flags_to_tnl_flags(__be16 flags)
139{
140 __be16 tflags = 0;
141
142 if (flags & GRE_CSUM)
143 tflags |= TUNNEL_CSUM;
144 if (flags & GRE_ROUTING)
145 tflags |= TUNNEL_ROUTING;
146 if (flags & GRE_KEY)
147 tflags |= TUNNEL_KEY;
148 if (flags & GRE_SEQ)
149 tflags |= TUNNEL_SEQ;
150 if (flags & GRE_STRICT)
151 tflags |= TUNNEL_STRICT;
152 if (flags & GRE_REC)
153 tflags |= TUNNEL_REC;
154 if (flags & GRE_VERSION)
155 tflags |= TUNNEL_VERSION;
156
157 return tflags;
158}
159
160static __be16 tnl_flags_to_gre_flags(__be16 tflags)
161{
162 __be16 flags = 0;
163
164 if (tflags & TUNNEL_CSUM)
165 flags |= GRE_CSUM;
166 if (tflags & TUNNEL_ROUTING)
167 flags |= GRE_ROUTING;
168 if (tflags & TUNNEL_KEY)
169 flags |= GRE_KEY;
170 if (tflags & TUNNEL_SEQ)
171 flags |= GRE_SEQ;
172 if (tflags & TUNNEL_STRICT)
173 flags |= GRE_STRICT;
174 if (tflags & TUNNEL_REC)
175 flags |= GRE_REC;
176 if (tflags & TUNNEL_VERSION)
177 flags |= GRE_VERSION;
178
179 return flags;
180}
181
182static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
183 bool *csum_err)
184{
185 const struct gre_base_hdr *greh;
186 __be32 *options;
187 int hdr_len;
188
189 if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
190 return -EINVAL;
191
192 greh = (struct gre_base_hdr *)skb_transport_header(skb);
193 if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
194 return -EINVAL;
195
196 tpi->flags = gre_flags_to_tnl_flags(greh->flags);
197 hdr_len = ip_gre_calc_hlen(tpi->flags);
198
199 if (!pskb_may_pull(skb, hdr_len))
200 return -EINVAL;
201
202 greh = (struct gre_base_hdr *)skb_transport_header(skb);
203 tpi->proto = greh->protocol;
204
205 options = (__be32 *)(greh + 1);
206 if (greh->flags & GRE_CSUM) {
207 if (skb_checksum_simple_validate(skb)) {
208 *csum_err = true;
209 return -EINVAL;
210 }
211
212 skb_checksum_try_convert(skb, IPPROTO_GRE, 0,
213 null_compute_pseudo);
214 options++;
215 }
216
217 if (greh->flags & GRE_KEY) {
218 tpi->key = *options;
219 options++;
220 } else {
221 tpi->key = 0;
222 }
223 if (unlikely(greh->flags & GRE_SEQ)) {
224 tpi->seq = *options;
225 options++;
226 } else {
227 tpi->seq = 0;
228 }
229 /* WCCP version 1 and 2 protocol decoding.
230 * - Change protocol to IP
231 * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
232 */
233 if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
234 tpi->proto = htons(ETH_P_IP);
235 if ((*(u8 *)options & 0xF0) != 0x40) {
236 hdr_len += 4;
237 if (!pskb_may_pull(skb, hdr_len))
238 return -EINVAL;
239 }
240 }
Jiri Benc7f290c92016-02-18 11:22:52 +0100241 return iptunnel_pull_header(skb, hdr_len, tpi->proto, false);
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700242}
243
244static void ipgre_err(struct sk_buff *skb, u32 info,
245 const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Pravin B Shelarc5441932013-03-25 14:49:35 +0000248 /* All the routers (except for Linux) return only
249 8 bytes of packet payload. It means, that precise relaying of
250 ICMP in the real Internet is absolutely infeasible.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Pravin B Shelarc5441932013-03-25 14:49:35 +0000252 Moreover, Cisco "wise men" put GRE key to the third word
253 in GRE header. It makes impossible maintaining even soft
254 state for keyed GRE tunnels with enabled checksum. Tell
255 them "thank you".
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256
Pravin B Shelarc5441932013-03-25 14:49:35 +0000257 Well, I wonder, rfc1812 was written by Cisco employee,
258 what the hell these idiots break standards established
259 by themselves???
260 */
261 struct net *net = dev_net(skb->dev);
262 struct ip_tunnel_net *itn;
Eric Dumazet96f5a842013-05-18 08:36:03 +0000263 const struct iphdr *iph;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300264 const int type = icmp_hdr(skb)->type;
265 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 struct ip_tunnel *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268 switch (type) {
269 default:
270 case ICMP_PARAMETERPROB:
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700271 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
273 case ICMP_DEST_UNREACH:
274 switch (code) {
275 case ICMP_SR_FAILED:
276 case ICMP_PORT_UNREACH:
277 /* Impossible event. */
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700278 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 default:
280 /* All others are translated to HOST_UNREACH.
281 rfc2003 contains "deep thoughts" about NET_UNREACH,
282 I believe they are just ether pollution. --ANK
283 */
284 break;
285 }
286 break;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 case ICMP_TIME_EXCEEDED:
289 if (code != ICMP_EXC_TTL)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700290 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700292
293 case ICMP_REDIRECT:
294 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 }
296
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700297 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000298 itn = net_generic(net, gre_tap_net_id);
299 else
300 itn = net_generic(net, ipgre_net_id);
301
Duan Jiongc0c0c502014-01-28 11:49:43 +0800302 iph = (const struct iphdr *)(icmp_hdr(skb) + 1);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700303 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
304 iph->daddr, iph->saddr, tpi->key);
stephen hemmingerd2083282012-09-24 18:12:23 +0000305
Ian Morris51456b22015-04-03 09:17:26 +0100306 if (!t)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700307 return;
David S. Miller36393392012-06-14 22:21:46 -0700308
David S. Miller36393392012-06-14 22:21:46 -0700309 if (t->parms.iph.daddr == 0 ||
Joe Perchesf97c1e02007-12-16 13:45:43 -0800310 ipv4_is_multicast(t->parms.iph.daddr))
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700311 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
313 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700314 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Wei Yongjunda6185d82009-02-24 23:34:48 -0800316 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317 t->err_count++;
318 else
319 t->err_count = 1;
320 t->err_time = jiffies;
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700321}
322
323static void gre_err(struct sk_buff *skb, u32 info)
324{
325 /* All the routers (except for Linux) return only
326 * 8 bytes of packet payload. It means, that precise relaying of
327 * ICMP in the real Internet is absolutely infeasible.
328 *
329 * Moreover, Cisco "wise men" put GRE key to the third word
330 * in GRE header. It makes impossible maintaining even soft
331 * state for keyed
332 * GRE tunnels with enabled checksum. Tell them "thank you".
333 *
334 * Well, I wonder, rfc1812 was written by Cisco employee,
335 * what the hell these idiots break standards established
336 * by themselves???
337 */
338
339 const int type = icmp_hdr(skb)->type;
340 const int code = icmp_hdr(skb)->code;
341 struct tnl_ptk_info tpi;
342 bool csum_err = false;
343
344 if (parse_gre_header(skb, &tpi, &csum_err)) {
345 if (!csum_err) /* ignore csum errors. */
346 return;
347 }
348
349 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
350 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
351 skb->dev->ifindex, 0, IPPROTO_GRE, 0);
352 return;
353 }
354 if (type == ICMP_REDIRECT) {
355 ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
356 IPPROTO_GRE, 0);
357 return;
358 }
359
360 ipgre_err(skb, info, &tpi);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361}
362
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700363static __be64 key_to_tunnel_id(__be32 key)
364{
365#ifdef __BIG_ENDIAN
366 return (__force __be64)((__force u32)key);
367#else
368 return (__force __be64)((__force u64)key << 32);
369#endif
370}
371
372/* Returns the least-significant 32 bits of a __be64. */
373static __be32 tunnel_id_to_key(__be64 x)
374{
375#ifdef __BIG_ENDIAN
376 return (__force __be32)x;
377#else
378 return (__force __be32)((__force u64)x >> 32);
379#endif
380}
381
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700382static int ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000384 struct net *net = dev_net(skb->dev);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700385 struct metadata_dst *tun_dst = NULL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000386 struct ip_tunnel_net *itn;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000387 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388 struct ip_tunnel *tunnel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700390 if (tpi->proto == htons(ETH_P_TEB))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000391 itn = net_generic(net, gre_tap_net_id);
392 else
393 itn = net_generic(net, ipgre_net_id);
394
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700395 iph = ip_hdr(skb);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700396 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
397 iph->saddr, iph->daddr, tpi->key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
stephen hemmingerd2083282012-09-24 18:12:23 +0000399 if (tunnel) {
Timo Teräs0e3da5b2013-12-16 11:02:09 +0200400 skb_pop_mac_header(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700401 if (tunnel->collect_md) {
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700402 __be16 flags;
403 __be64 tun_id;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700404
Pravin B Shelarc29a70d2015-08-26 23:46:50 -0700405 flags = tpi->flags & (TUNNEL_CSUM | TUNNEL_KEY);
406 tun_id = key_to_tunnel_id(tpi->key);
407 tun_dst = ip_tun_rx_dst(skb, flags, tun_id, 0);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700408 if (!tun_dst)
409 return PACKET_REJECT;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700410 }
411
412 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700413 return PACKET_RCVD;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 }
Pravin B Shelarbda7bb42013-06-17 17:49:38 -0700415 return PACKET_REJECT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416}
417
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700418static int gre_rcv(struct sk_buff *skb)
419{
420 struct tnl_ptk_info tpi;
421 bool csum_err = false;
422
423#ifdef CONFIG_NET_IPGRE_BROADCAST
424 if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
425 /* Looped back packet, drop it! */
426 if (rt_is_output_route(skb_rtable(skb)))
427 goto drop;
428 }
429#endif
430
431 if (parse_gre_header(skb, &tpi, &csum_err) < 0)
432 goto drop;
433
434 if (ipgre_rcv(skb, &tpi) == PACKET_RCVD)
435 return 0;
436
437 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
438drop:
439 kfree_skb(skb);
440 return 0;
441}
442
Edward Cree53936102016-02-11 21:01:07 +0000443static __sum16 gre_checksum(struct sk_buff *skb)
444{
445 __wsum csum;
446
447 if (skb->ip_summed == CHECKSUM_PARTIAL)
448 csum = lco_csum(skb);
449 else
450 csum = skb_checksum(skb, 0, skb->len, 0);
451 return csum_fold(csum);
452}
453
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700454static void build_header(struct sk_buff *skb, int hdr_len, __be16 flags,
455 __be16 proto, __be32 key, __be32 seq)
456{
457 struct gre_base_hdr *greh;
458
459 skb_push(skb, hdr_len);
460
461 skb_reset_transport_header(skb);
462 greh = (struct gre_base_hdr *)skb->data;
463 greh->flags = tnl_flags_to_gre_flags(flags);
464 greh->protocol = proto;
465
466 if (flags & (TUNNEL_KEY | TUNNEL_CSUM | TUNNEL_SEQ)) {
467 __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
468
469 if (flags & TUNNEL_SEQ) {
470 *ptr = seq;
471 ptr--;
472 }
473 if (flags & TUNNEL_KEY) {
474 *ptr = key;
475 ptr--;
476 }
477 if (flags & TUNNEL_CSUM &&
478 !(skb_shinfo(skb)->gso_type &
479 (SKB_GSO_GRE | SKB_GSO_GRE_CSUM))) {
480 *ptr = 0;
Edward Cree53936102016-02-11 21:01:07 +0000481 *(__sum16 *)ptr = gre_checksum(skb);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700482 }
483 }
484}
485
Pravin B Shelarc5441932013-03-25 14:49:35 +0000486static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
487 const struct iphdr *tnl_params,
488 __be16 proto)
489{
490 struct ip_tunnel *tunnel = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000491
Pravin B Shelarc5441932013-03-25 14:49:35 +0000492 if (tunnel->parms.o_flags & TUNNEL_SEQ)
493 tunnel->o_seqno++;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000494
Pravin B Shelarc5441932013-03-25 14:49:35 +0000495 /* Push GRE header. */
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700496 build_header(skb, tunnel->tun_hlen, tunnel->parms.o_flags,
497 proto, tunnel->parms.o_key, htonl(tunnel->o_seqno));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700499 skb_set_inner_protocol(skb, proto);
Nicolas Dichtelbf3d6a82013-05-27 23:48:15 +0000500 ip_tunnel_xmit(skb, dev, tnl_params, tnl_params->protocol);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501}
502
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700503static struct sk_buff *gre_handle_offloads(struct sk_buff *skb,
504 bool csum)
505{
Edward Cree6fa79662016-02-11 21:02:31 +0000506 return iptunnel_handle_offloads(skb, csum ? SKB_GSO_GRE_CSUM : SKB_GSO_GRE);
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -0700507}
508
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700509static struct rtable *gre_get_rt(struct sk_buff *skb,
510 struct net_device *dev,
511 struct flowi4 *fl,
512 const struct ip_tunnel_key *key)
513{
514 struct net *net = dev_net(dev);
515
516 memset(fl, 0, sizeof(*fl));
517 fl->daddr = key->u.ipv4.dst;
518 fl->saddr = key->u.ipv4.src;
519 fl->flowi4_tos = RT_TOS(key->tos);
520 fl->flowi4_mark = skb->mark;
521 fl->flowi4_proto = IPPROTO_GRE;
522
523 return ip_route_output_key(net, fl);
524}
525
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700526static void gre_fb_xmit(struct sk_buff *skb, struct net_device *dev)
527{
528 struct ip_tunnel_info *tun_info;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700529 const struct ip_tunnel_key *key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100530 struct rtable *rt = NULL;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700531 struct flowi4 fl;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700532 int min_headroom;
533 int tunnel_hlen;
534 __be16 df, flags;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100535 bool use_cache;
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700536 int err;
537
Jiri Benc61adedf2015-08-20 13:56:25 +0200538 tun_info = skb_tunnel_info(skb);
Jiri Benc7f9562a2015-08-28 20:48:20 +0200539 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
540 ip_tunnel_info_af(tun_info) != AF_INET))
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700541 goto err_free_skb;
542
543 key = &tun_info->key;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100544 use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
545 if (use_cache)
546 rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl.saddr);
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100547 if (!rt) {
548 rt = gre_get_rt(skb, dev, &fl, key);
549 if (IS_ERR(rt))
550 goto err_free_skb;
Daniel Borkmanndb3c6132016-03-04 15:15:07 +0100551 if (use_cache)
Paolo Abeni3c1cb4d2016-02-12 15:43:59 +0100552 dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
553 fl.saddr);
554 }
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700555
556 tunnel_hlen = ip_gre_calc_hlen(key->tun_flags);
557
558 min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len
559 + tunnel_hlen + sizeof(struct iphdr);
560 if (skb_headroom(skb) < min_headroom || skb_header_cloned(skb)) {
561 int head_delta = SKB_DATA_ALIGN(min_headroom -
562 skb_headroom(skb) +
563 16);
564 err = pskb_expand_head(skb, max_t(int, head_delta, 0),
565 0, GFP_ATOMIC);
566 if (unlikely(err))
567 goto err_free_rt;
568 }
569
570 /* Push Tunnel header. */
571 skb = gre_handle_offloads(skb, !!(tun_info->key.tun_flags & TUNNEL_CSUM));
572 if (IS_ERR(skb)) {
573 skb = NULL;
574 goto err_free_rt;
575 }
576
577 flags = tun_info->key.tun_flags & (TUNNEL_CSUM | TUNNEL_KEY);
578 build_header(skb, tunnel_hlen, flags, htons(ETH_P_TEB),
579 tunnel_id_to_key(tun_info->key.tun_id), 0);
580
581 df = key->tun_flags & TUNNEL_DONT_FRAGMENT ? htons(IP_DF) : 0;
Pravin B Shelar039f5062015-12-24 14:34:54 -0800582
583 iptunnel_xmit(skb->sk, rt, skb, fl.saddr, key->u.ipv4.dst, IPPROTO_GRE,
584 key->tos, key->ttl, df, false);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700585 return;
586
587err_free_rt:
588 ip_rt_put(rt);
589err_free_skb:
590 kfree_skb(skb);
591 dev->stats.tx_dropped++;
592}
593
Pravin B Shelarfc4099f2015-10-22 18:17:16 -0700594static int gre_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb)
595{
596 struct ip_tunnel_info *info = skb_tunnel_info(skb);
597 struct rtable *rt;
598 struct flowi4 fl4;
599
600 if (ip_tunnel_info_af(info) != AF_INET)
601 return -EINVAL;
602
603 rt = gre_get_rt(skb, dev, &fl4, &info->key);
604 if (IS_ERR(rt))
605 return PTR_ERR(rt);
606
607 ip_rt_put(rt);
608 info->key.u.ipv4.src = fl4.saddr;
609 return 0;
610}
611
Pravin B Shelarc5441932013-03-25 14:49:35 +0000612static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
613 struct net_device *dev)
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800614{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000615 struct ip_tunnel *tunnel = netdev_priv(dev);
616 const struct iphdr *tnl_params;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800617
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700618 if (tunnel->collect_md) {
619 gre_fb_xmit(skb, dev);
620 return NETDEV_TX_OK;
621 }
622
Pravin B Shelarc5441932013-03-25 14:49:35 +0000623 if (dev->header_ops) {
624 /* Need space for new headers */
625 if (skb_cow_head(skb, dev->needed_headroom -
Chen Gang2bac7cb2013-04-22 20:45:42 +0000626 (tunnel->hlen + sizeof(struct iphdr))))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000627 goto free_skb;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800628
Pravin B Shelarc5441932013-03-25 14:49:35 +0000629 tnl_params = (const struct iphdr *)skb->data;
Eric Dumazete985aad2010-09-27 03:57:11 +0000630
Pravin B Shelarc5441932013-03-25 14:49:35 +0000631 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
632 * to gre header.
633 */
634 skb_pull(skb, tunnel->hlen + sizeof(struct iphdr));
Timo Teräs8a0033a2014-12-15 09:24:13 +0200635 skb_reset_mac_header(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000636 } else {
637 if (skb_cow_head(skb, dev->needed_headroom))
638 goto free_skb;
Herbert Xue1a80002008-10-09 12:00:17 -0700639
Pravin B Shelarc5441932013-03-25 14:49:35 +0000640 tnl_params = &tunnel->parms.iph;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800641 }
642
Timo Teräs8a0033a2014-12-15 09:24:13 +0200643 skb = gre_handle_offloads(skb, !!(tunnel->parms.o_flags&TUNNEL_CSUM));
644 if (IS_ERR(skb))
645 goto out;
646
Pravin B Shelarc5441932013-03-25 14:49:35 +0000647 __gre_xmit(skb, dev, tnl_params, skb->protocol);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000648 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800649
Pravin B Shelarc5441932013-03-25 14:49:35 +0000650free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800651 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000652out:
653 dev->stats.tx_dropped++;
654 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800655}
656
Pravin B Shelarc5441932013-03-25 14:49:35 +0000657static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
658 struct net_device *dev)
659{
660 struct ip_tunnel *tunnel = netdev_priv(dev);
661
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700662 if (tunnel->collect_md) {
663 gre_fb_xmit(skb, dev);
664 return NETDEV_TX_OK;
665 }
666
Pravin B Shelar45f2e992013-06-17 17:49:51 -0700667 skb = gre_handle_offloads(skb, !!(tunnel->parms.o_flags&TUNNEL_CSUM));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000668 if (IS_ERR(skb))
669 goto out;
670
671 if (skb_cow_head(skb, dev->needed_headroom))
672 goto free_skb;
673
674 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
Pravin B Shelarc5441932013-03-25 14:49:35 +0000675 return NETDEV_TX_OK;
676
677free_skb:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800678 kfree_skb(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000679out:
680 dev->stats.tx_dropped++;
681 return NETDEV_TX_OK;
682}
683
684static int ipgre_tunnel_ioctl(struct net_device *dev,
685 struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700686{
Tom Herbert4565e992014-09-17 12:26:01 -0700687 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689
Pravin B Shelarc5441932013-03-25 14:49:35 +0000690 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
691 return -EFAULT;
Cong Wang6c734fb2013-06-29 12:02:59 +0800692 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
693 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_GRE ||
694 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)) ||
695 ((p.i_flags|p.o_flags)&(GRE_VERSION|GRE_ROUTING)))
696 return -EINVAL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000697 }
698 p.i_flags = gre_flags_to_tnl_flags(p.i_flags);
699 p.o_flags = gre_flags_to_tnl_flags(p.o_flags);
700
701 err = ip_tunnel_ioctl(dev, &p, cmd);
702 if (err)
703 return err;
704
705 p.i_flags = tnl_flags_to_gre_flags(p.i_flags);
706 p.o_flags = tnl_flags_to_gre_flags(p.o_flags);
707
708 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
709 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 return 0;
711}
712
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713/* Nice toy. Unfortunately, useless in real life :-)
714 It allows to construct virtual multiprotocol broadcast "LAN"
715 over the Internet, provided multicast routing is tuned.
716
717
718 I have no idea was this bicycle invented before me,
719 so that I had to set ARPHRD_IPGRE to a random value.
720 I have an impression, that Cisco could make something similar,
721 but this feature is apparently missing in IOS<=11.2(8).
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900722
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
724 with broadcast 224.66.66.66. If you have access to mbone, play with me :-)
725
726 ping -t 255 224.66.66.66
727
728 If nobody answers, mbone does not work.
729
730 ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
731 ip addr add 10.66.66.<somewhat>/24 dev Universe
732 ifconfig Universe up
733 ifconfig Universe add fe80::<Your_real_addr>/10
734 ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
735 ftp 10.66.66.66
736 ...
737 ftp fec0:6666:6666::193.233.7.65
738 ...
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739 */
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700740static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
741 unsigned short type,
Eric Dumazet15078502010-09-15 11:07:53 +0000742 const void *daddr, const void *saddr, unsigned int len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743{
Patrick McHardy2941a482006-01-08 22:05:26 -0800744 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000745 struct iphdr *iph;
746 struct gre_base_hdr *greh;
747
748 iph = (struct iphdr *)skb_push(skb, t->hlen + sizeof(*iph));
749 greh = (struct gre_base_hdr *)(iph+1);
750 greh->flags = tnl_flags_to_gre_flags(t->parms.o_flags);
751 greh->protocol = htons(type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752
753 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754
Pravin B Shelarc5441932013-03-25 14:49:35 +0000755 /* Set the source hardware address. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756 if (saddr)
757 memcpy(&iph->saddr, saddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000758 if (daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 memcpy(&iph->daddr, daddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000760 if (iph->daddr)
Timo Teräs77a482b2013-08-06 13:45:43 +0300761 return t->hlen + sizeof(*iph);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900762
Pravin B Shelarc5441932013-03-25 14:49:35 +0000763 return -(t->hlen + sizeof(*iph));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764}
765
Timo Teras6a5f44d2007-10-23 20:31:53 -0700766static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
767{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000768 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
Timo Teras6a5f44d2007-10-23 20:31:53 -0700769 memcpy(haddr, &iph->saddr, 4);
770 return 4;
771}
772
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700773static const struct header_ops ipgre_header_ops = {
774 .create = ipgre_header,
Timo Teras6a5f44d2007-10-23 20:31:53 -0700775 .parse = ipgre_header_parse,
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700776};
777
Timo Teras6a5f44d2007-10-23 20:31:53 -0700778#ifdef CONFIG_NET_IPGRE_BROADCAST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779static int ipgre_open(struct net_device *dev)
780{
Patrick McHardy2941a482006-01-08 22:05:26 -0800781 struct ip_tunnel *t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782
Joe Perchesf97c1e02007-12-16 13:45:43 -0800783 if (ipv4_is_multicast(t->parms.iph.daddr)) {
David S. Millercbb1e852011-05-04 12:33:34 -0700784 struct flowi4 fl4;
785 struct rtable *rt;
Eric Dumazete985aad2010-09-27 03:57:11 +0000786
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200787 rt = ip_route_output_gre(t->net, &fl4,
David S. Millercbb1e852011-05-04 12:33:34 -0700788 t->parms.iph.daddr,
789 t->parms.iph.saddr,
790 t->parms.o_key,
791 RT_TOS(t->parms.iph.tos),
792 t->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800793 if (IS_ERR(rt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700794 return -EADDRNOTAVAIL;
Changli Gaod8d1f302010-06-10 23:31:35 -0700795 dev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796 ip_rt_put(rt);
Ian Morris51456b22015-04-03 09:17:26 +0100797 if (!__in_dev_get_rtnl(dev))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798 return -EADDRNOTAVAIL;
799 t->mlink = dev->ifindex;
Herbert Xue5ed6392005-10-03 14:35:55 -0700800 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700801 }
802 return 0;
803}
804
805static int ipgre_close(struct net_device *dev)
806{
Patrick McHardy2941a482006-01-08 22:05:26 -0800807 struct ip_tunnel *t = netdev_priv(dev);
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800808
Joe Perchesf97c1e02007-12-16 13:45:43 -0800809 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800810 struct in_device *in_dev;
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200811 in_dev = inetdev_by_index(t->net, t->mlink);
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000812 if (in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814 }
815 return 0;
816}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817#endif
818
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800819static const struct net_device_ops ipgre_netdev_ops = {
820 .ndo_init = ipgre_tunnel_init,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000821 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800822#ifdef CONFIG_NET_IPGRE_BROADCAST
823 .ndo_open = ipgre_open,
824 .ndo_stop = ipgre_close,
825#endif
Pravin B Shelarc5441932013-03-25 14:49:35 +0000826 .ndo_start_xmit = ipgre_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800827 .ndo_do_ioctl = ipgre_tunnel_ioctl,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000828 .ndo_change_mtu = ip_tunnel_change_mtu,
829 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200830 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800831};
832
/* Feature bits that __gre_tunnel_init() sets on every GRE device. */
#define GRE_FEATURES	(NETIF_F_SG | NETIF_F_FRAGLIST | \
			 NETIF_F_HIGHDMA | NETIF_F_HW_CSUM)
837
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838static void ipgre_tunnel_setup(struct net_device *dev)
839{
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800840 dev->netdev_ops = &ipgre_netdev_ops;
Nicolas Dichtel5a455272014-04-11 15:51:18 +0200841 dev->type = ARPHRD_IPGRE;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000842 ip_tunnel_setup(dev, ipgre_net_id);
843}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844
Pravin B Shelarc5441932013-03-25 14:49:35 +0000845static void __gre_tunnel_init(struct net_device *dev)
846{
847 struct ip_tunnel *tunnel;
Tom Herbert4565e992014-09-17 12:26:01 -0700848 int t_hlen;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000849
850 tunnel = netdev_priv(dev);
Tom Herbert4565e992014-09-17 12:26:01 -0700851 tunnel->tun_hlen = ip_gre_calc_hlen(tunnel->parms.o_flags);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000852 tunnel->parms.iph.protocol = IPPROTO_GRE;
853
Tom Herbert4565e992014-09-17 12:26:01 -0700854 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
855
856 t_hlen = tunnel->hlen + sizeof(struct iphdr);
857
858 dev->needed_headroom = LL_MAX_HEADER + t_hlen + 4;
859 dev->mtu = ETH_DATA_LEN - t_hlen - 4;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000860
Nicolas Dichtelb57708a2014-04-22 10:15:23 +0200861 dev->features |= GRE_FEATURES;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000862 dev->hw_features |= GRE_FEATURES;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000863
864 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
Alexander Duycka0ca1532016-04-05 09:13:39 -0700865 /* TCP offload with GRE SEQ is not supported, nor
866 * can we support 2 levels of outer headers requiring
867 * an update.
868 */
869 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
870 (tunnel->encap.type == TUNNEL_ENCAP_NONE)) {
871 dev->features |= NETIF_F_GSO_SOFTWARE;
872 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
873 }
874
Pravin B Shelarc5441932013-03-25 14:49:35 +0000875 /* Can use a lockless transmit, unless we generate
876 * output sequences
877 */
878 dev->features |= NETIF_F_LLTX;
879 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880}
881
882static int ipgre_tunnel_init(struct net_device *dev)
883{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000884 struct ip_tunnel *tunnel = netdev_priv(dev);
885 struct iphdr *iph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700886
Pravin B Shelarc5441932013-03-25 14:49:35 +0000887 __gre_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700888
Pravin B Shelarc5441932013-03-25 14:49:35 +0000889 memcpy(dev->dev_addr, &iph->saddr, 4);
890 memcpy(dev->broadcast, &iph->daddr, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891
Pravin B Shelarc5441932013-03-25 14:49:35 +0000892 dev->flags = IFF_NOARP;
Eric Dumazet02875872014-10-05 18:38:35 -0700893 netif_keep_dst(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000894 dev->addr_len = 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
Jiri Benca64b04d2016-04-27 11:29:06 +0200896 if (iph->daddr && !tunnel->collect_md) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897#ifdef CONFIG_NET_IPGRE_BROADCAST
Joe Perchesf97c1e02007-12-16 13:45:43 -0800898 if (ipv4_is_multicast(iph->daddr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700899 if (!iph->saddr)
900 return -EINVAL;
901 dev->flags = IFF_BROADCAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700902 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700903 }
904#endif
Jiri Benca64b04d2016-04-27 11:29:06 +0200905 } else if (!tunnel->collect_md) {
Timo Teras6a5f44d2007-10-23 20:31:53 -0700906 dev->header_ops = &ipgre_header_ops;
Jiri Benca64b04d2016-04-27 11:29:06 +0200907 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700908
Pravin B Shelarc5441932013-03-25 14:49:35 +0000909 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700910}
911
Pravin B Shelar9f57c672015-08-07 23:51:52 -0700912static const struct gre_protocol ipgre_protocol = {
913 .handler = gre_rcv,
914 .err_handler = gre_err,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700915};
916
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000917static int __net_init ipgre_init_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700918{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000919 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700920}
921
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000922static void __net_exit ipgre_exit_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700923{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000924 struct ip_tunnel_net *itn = net_generic(net, ipgre_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200925 ip_tunnel_delete_net(itn, &ipgre_link_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700926}
927
928static struct pernet_operations ipgre_net_ops = {
929 .init = ipgre_init_net,
930 .exit = ipgre_exit_net,
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000931 .id = &ipgre_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000932 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700933};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700934
Herbert Xuc19e6542008-10-09 11:59:55 -0700935static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
936{
937 __be16 flags;
938
939 if (!data)
940 return 0;
941
942 flags = 0;
943 if (data[IFLA_GRE_IFLAGS])
944 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
945 if (data[IFLA_GRE_OFLAGS])
946 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
947 if (flags & (GRE_VERSION|GRE_ROUTING))
948 return -EINVAL;
949
950 return 0;
951}
952
Herbert Xue1a80002008-10-09 12:00:17 -0700953static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[])
954{
955 __be32 daddr;
956
957 if (tb[IFLA_ADDRESS]) {
958 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
959 return -EINVAL;
960 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
961 return -EADDRNOTAVAIL;
962 }
963
964 if (!data)
965 goto out;
966
967 if (data[IFLA_GRE_REMOTE]) {
968 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
969 if (!daddr)
970 return -EINVAL;
971 }
972
973out:
974 return ipgre_tunnel_validate(tb, data);
975}
976
Pravin B Shelar2e15ea32015-08-07 23:51:42 -0700977static void ipgre_netlink_parms(struct net_device *dev,
978 struct nlattr *data[],
979 struct nlattr *tb[],
980 struct ip_tunnel_parm *parms)
Herbert Xuc19e6542008-10-09 11:59:55 -0700981{
Herbert Xu7bb82d92008-10-11 12:20:15 -0700982 memset(parms, 0, sizeof(*parms));
Herbert Xuc19e6542008-10-09 11:59:55 -0700983
984 parms->iph.protocol = IPPROTO_GRE;
985
986 if (!data)
987 return;
988
989 if (data[IFLA_GRE_LINK])
990 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
991
992 if (data[IFLA_GRE_IFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000993 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700994
995 if (data[IFLA_GRE_OFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000996 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700997
998 if (data[IFLA_GRE_IKEY])
999 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
1000
1001 if (data[IFLA_GRE_OKEY])
1002 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
1003
1004 if (data[IFLA_GRE_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +02001005 parms->iph.saddr = nla_get_in_addr(data[IFLA_GRE_LOCAL]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001006
1007 if (data[IFLA_GRE_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +02001008 parms->iph.daddr = nla_get_in_addr(data[IFLA_GRE_REMOTE]);
Herbert Xuc19e6542008-10-09 11:59:55 -07001009
1010 if (data[IFLA_GRE_TTL])
1011 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
1012
1013 if (data[IFLA_GRE_TOS])
1014 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
1015
1016 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC]))
1017 parms->iph.frag_off = htons(IP_DF);
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001018
1019 if (data[IFLA_GRE_COLLECT_METADATA]) {
1020 struct ip_tunnel *t = netdev_priv(dev);
1021
1022 t->collect_md = true;
1023 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001024}
1025
Tom Herbert4565e992014-09-17 12:26:01 -07001026/* This function returns true when ENCAP attributes are present in the nl msg */
1027static bool ipgre_netlink_encap_parms(struct nlattr *data[],
1028 struct ip_tunnel_encap *ipencap)
1029{
1030 bool ret = false;
1031
1032 memset(ipencap, 0, sizeof(*ipencap));
1033
1034 if (!data)
1035 return ret;
1036
1037 if (data[IFLA_GRE_ENCAP_TYPE]) {
1038 ret = true;
1039 ipencap->type = nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]);
1040 }
1041
1042 if (data[IFLA_GRE_ENCAP_FLAGS]) {
1043 ret = true;
1044 ipencap->flags = nla_get_u16(data[IFLA_GRE_ENCAP_FLAGS]);
1045 }
1046
1047 if (data[IFLA_GRE_ENCAP_SPORT]) {
1048 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001049 ipencap->sport = nla_get_be16(data[IFLA_GRE_ENCAP_SPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001050 }
1051
1052 if (data[IFLA_GRE_ENCAP_DPORT]) {
1053 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001054 ipencap->dport = nla_get_be16(data[IFLA_GRE_ENCAP_DPORT]);
Tom Herbert4565e992014-09-17 12:26:01 -07001055 }
1056
1057 return ret;
1058}
1059
Pravin B Shelarc5441932013-03-25 14:49:35 +00001060static int gre_tap_init(struct net_device *dev)
Herbert Xue1a80002008-10-09 12:00:17 -07001061{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001062 __gre_tunnel_init(dev);
stephen hemmingerbec94d42014-12-27 10:01:42 -08001063 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Herbert Xue1a80002008-10-09 12:00:17 -07001064
Pravin B Shelarc5441932013-03-25 14:49:35 +00001065 return ip_tunnel_init(dev);
Herbert Xue1a80002008-10-09 12:00:17 -07001066}
1067
Pravin B Shelarc5441932013-03-25 14:49:35 +00001068static const struct net_device_ops gre_tap_netdev_ops = {
1069 .ndo_init = gre_tap_init,
1070 .ndo_uninit = ip_tunnel_uninit,
1071 .ndo_start_xmit = gre_tap_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001072 .ndo_set_mac_address = eth_mac_addr,
1073 .ndo_validate_addr = eth_validate_addr,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001074 .ndo_change_mtu = ip_tunnel_change_mtu,
1075 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +02001076 .ndo_get_iflink = ip_tunnel_get_iflink,
Pravin B Shelarfc4099f2015-10-22 18:17:16 -07001077 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -08001078};
1079
Herbert Xue1a80002008-10-09 12:00:17 -07001080static void ipgre_tap_setup(struct net_device *dev)
1081{
Herbert Xue1a80002008-10-09 12:00:17 -07001082 ether_setup(dev);
Jiri Bencd13b1612016-02-17 15:32:53 +01001083 dev->netdev_ops = &gre_tap_netdev_ops;
1084 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1085 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
Pravin B Shelarc5441932013-03-25 14:49:35 +00001086 ip_tunnel_setup(dev, gre_tap_net_id);
Herbert Xue1a80002008-10-09 12:00:17 -07001087}
1088
Pravin B Shelarc5441932013-03-25 14:49:35 +00001089static int ipgre_newlink(struct net *src_net, struct net_device *dev,
1090 struct nlattr *tb[], struct nlattr *data[])
Herbert Xuc19e6542008-10-09 11:59:55 -07001091{
Pravin B Shelarc5441932013-03-25 14:49:35 +00001092 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001093 struct ip_tunnel_encap ipencap;
1094
1095 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1096 struct ip_tunnel *t = netdev_priv(dev);
1097 int err = ip_tunnel_encap_setup(t, &ipencap);
1098
1099 if (err < 0)
1100 return err;
1101 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001102
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001103 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001104 return ip_tunnel_newlink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001105}
1106
1107static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
1108 struct nlattr *data[])
1109{
Herbert Xuc19e6542008-10-09 11:59:55 -07001110 struct ip_tunnel_parm p;
Tom Herbert4565e992014-09-17 12:26:01 -07001111 struct ip_tunnel_encap ipencap;
1112
1113 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1114 struct ip_tunnel *t = netdev_priv(dev);
1115 int err = ip_tunnel_encap_setup(t, &ipencap);
1116
1117 if (err < 0)
1118 return err;
1119 }
Herbert Xuc19e6542008-10-09 11:59:55 -07001120
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001121 ipgre_netlink_parms(dev, data, tb, &p);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001122 return ip_tunnel_changelink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -07001123}
1124
1125static size_t ipgre_get_size(const struct net_device *dev)
1126{
1127 return
1128 /* IFLA_GRE_LINK */
1129 nla_total_size(4) +
1130 /* IFLA_GRE_IFLAGS */
1131 nla_total_size(2) +
1132 /* IFLA_GRE_OFLAGS */
1133 nla_total_size(2) +
1134 /* IFLA_GRE_IKEY */
1135 nla_total_size(4) +
1136 /* IFLA_GRE_OKEY */
1137 nla_total_size(4) +
1138 /* IFLA_GRE_LOCAL */
1139 nla_total_size(4) +
1140 /* IFLA_GRE_REMOTE */
1141 nla_total_size(4) +
1142 /* IFLA_GRE_TTL */
1143 nla_total_size(1) +
1144 /* IFLA_GRE_TOS */
1145 nla_total_size(1) +
1146 /* IFLA_GRE_PMTUDISC */
1147 nla_total_size(1) +
Tom Herbert4565e992014-09-17 12:26:01 -07001148 /* IFLA_GRE_ENCAP_TYPE */
1149 nla_total_size(2) +
1150 /* IFLA_GRE_ENCAP_FLAGS */
1151 nla_total_size(2) +
1152 /* IFLA_GRE_ENCAP_SPORT */
1153 nla_total_size(2) +
1154 /* IFLA_GRE_ENCAP_DPORT */
1155 nla_total_size(2) +
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001156 /* IFLA_GRE_COLLECT_METADATA */
1157 nla_total_size(0) +
Herbert Xuc19e6542008-10-09 11:59:55 -07001158 0;
1159}
1160
1161static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
1162{
1163 struct ip_tunnel *t = netdev_priv(dev);
1164 struct ip_tunnel_parm *p = &t->parms;
1165
David S. Millerf3756b72012-04-01 20:39:02 -04001166 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
Pravin B Shelarc5441932013-03-25 14:49:35 +00001167 nla_put_be16(skb, IFLA_GRE_IFLAGS, tnl_flags_to_gre_flags(p->i_flags)) ||
1168 nla_put_be16(skb, IFLA_GRE_OFLAGS, tnl_flags_to_gre_flags(p->o_flags)) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001169 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
1170 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
Jiri Benc930345e2015-03-29 16:59:25 +02001171 nla_put_in_addr(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
1172 nla_put_in_addr(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
David S. Millerf3756b72012-04-01 20:39:02 -04001173 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
1174 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
1175 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
1176 !!(p->iph.frag_off & htons(IP_DF))))
1177 goto nla_put_failure;
Tom Herbert4565e992014-09-17 12:26:01 -07001178
1179 if (nla_put_u16(skb, IFLA_GRE_ENCAP_TYPE,
1180 t->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +01001181 nla_put_be16(skb, IFLA_GRE_ENCAP_SPORT,
1182 t->encap.sport) ||
1183 nla_put_be16(skb, IFLA_GRE_ENCAP_DPORT,
1184 t->encap.dport) ||
Tom Herbert4565e992014-09-17 12:26:01 -07001185 nla_put_u16(skb, IFLA_GRE_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -08001186 t->encap.flags))
Tom Herbert4565e992014-09-17 12:26:01 -07001187 goto nla_put_failure;
1188
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001189 if (t->collect_md) {
1190 if (nla_put_flag(skb, IFLA_GRE_COLLECT_METADATA))
1191 goto nla_put_failure;
1192 }
1193
Herbert Xuc19e6542008-10-09 11:59:55 -07001194 return 0;
1195
1196nla_put_failure:
1197 return -EMSGSIZE;
1198}
1199
1200static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
1201 [IFLA_GRE_LINK] = { .type = NLA_U32 },
1202 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
1203 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
1204 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
1205 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001206 [IFLA_GRE_LOCAL] = { .len = FIELD_SIZEOF(struct iphdr, saddr) },
1207 [IFLA_GRE_REMOTE] = { .len = FIELD_SIZEOF(struct iphdr, daddr) },
Herbert Xuc19e6542008-10-09 11:59:55 -07001208 [IFLA_GRE_TTL] = { .type = NLA_U8 },
1209 [IFLA_GRE_TOS] = { .type = NLA_U8 },
1210 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert4565e992014-09-17 12:26:01 -07001211 [IFLA_GRE_ENCAP_TYPE] = { .type = NLA_U16 },
1212 [IFLA_GRE_ENCAP_FLAGS] = { .type = NLA_U16 },
1213 [IFLA_GRE_ENCAP_SPORT] = { .type = NLA_U16 },
1214 [IFLA_GRE_ENCAP_DPORT] = { .type = NLA_U16 },
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001215 [IFLA_GRE_COLLECT_METADATA] = { .type = NLA_FLAG },
Herbert Xuc19e6542008-10-09 11:59:55 -07001216};
1217
1218static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
1219 .kind = "gre",
1220 .maxtype = IFLA_GRE_MAX,
1221 .policy = ipgre_policy,
1222 .priv_size = sizeof(struct ip_tunnel),
1223 .setup = ipgre_tunnel_setup,
1224 .validate = ipgre_tunnel_validate,
1225 .newlink = ipgre_newlink,
1226 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001227 .dellink = ip_tunnel_dellink,
Herbert Xuc19e6542008-10-09 11:59:55 -07001228 .get_size = ipgre_get_size,
1229 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001230 .get_link_net = ip_tunnel_get_link_net,
Herbert Xuc19e6542008-10-09 11:59:55 -07001231};
1232
Herbert Xue1a80002008-10-09 12:00:17 -07001233static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
1234 .kind = "gretap",
1235 .maxtype = IFLA_GRE_MAX,
1236 .policy = ipgre_policy,
1237 .priv_size = sizeof(struct ip_tunnel),
1238 .setup = ipgre_tap_setup,
1239 .validate = ipgre_tap_validate,
1240 .newlink = ipgre_newlink,
1241 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +00001242 .dellink = ip_tunnel_dellink,
Herbert Xue1a80002008-10-09 12:00:17 -07001243 .get_size = ipgre_get_size,
1244 .fill_info = ipgre_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +01001245 .get_link_net = ip_tunnel_get_link_net,
Herbert Xue1a80002008-10-09 12:00:17 -07001246};
1247
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001248struct net_device *gretap_fb_dev_create(struct net *net, const char *name,
1249 u8 name_assign_type)
1250{
1251 struct nlattr *tb[IFLA_MAX + 1];
1252 struct net_device *dev;
1253 struct ip_tunnel *t;
1254 int err;
1255
1256 memset(&tb, 0, sizeof(tb));
1257
1258 dev = rtnl_create_link(net, name, name_assign_type,
1259 &ipgre_tap_ops, tb);
1260 if (IS_ERR(dev))
1261 return dev;
1262
1263 /* Configure flow based GRE device. */
1264 t = netdev_priv(dev);
1265 t->collect_md = true;
1266
1267 err = ipgre_newlink(net, dev, tb, NULL);
1268 if (err < 0)
1269 goto out;
David Wragg7e059152016-02-10 00:05:58 +00001270
1271 /* openvswitch users expect packet sizes to be unrestricted,
1272 * so set the largest MTU we can.
1273 */
1274 err = __ip_tunnel_change_mtu(dev, IP_MAX_MTU, false);
1275 if (err)
1276 goto out;
1277
Pravin B Shelarb2acd1d2015-08-07 23:51:47 -07001278 return dev;
1279out:
1280 free_netdev(dev);
1281 return ERR_PTR(err);
1282}
1283EXPORT_SYMBOL_GPL(gretap_fb_dev_create);
1284
Pravin B Shelarc5441932013-03-25 14:49:35 +00001285static int __net_init ipgre_tap_init_net(struct net *net)
1286{
Pravin B Shelar2e15ea32015-08-07 23:51:42 -07001287 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, "gretap0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001288}
1289
1290static void __net_exit ipgre_tap_exit_net(struct net *net)
1291{
1292 struct ip_tunnel_net *itn = net_generic(net, gre_tap_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +02001293 ip_tunnel_delete_net(itn, &ipgre_tap_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001294}
1295
1296static struct pernet_operations ipgre_tap_net_ops = {
1297 .init = ipgre_tap_init_net,
1298 .exit = ipgre_tap_exit_net,
1299 .id = &gre_tap_net_id,
1300 .size = sizeof(struct ip_tunnel_net),
1301};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001302
1303static int __init ipgre_init(void)
1304{
1305 int err;
1306
Joe Perches058bd4d2012-03-11 18:36:11 +00001307 pr_info("GRE over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +00001309 err = register_pernet_device(&ipgre_net_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -07001310 if (err < 0)
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001311 return err;
1312
Pravin B Shelarc5441932013-03-25 14:49:35 +00001313 err = register_pernet_device(&ipgre_tap_net_ops);
1314 if (err < 0)
1315 goto pnet_tap_faied;
1316
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001317 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001318 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +00001319 pr_info("%s: can't add protocol\n", __func__);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001320 goto add_proto_failed;
1321 }
Pavel Emelyanov7daa0002008-04-16 01:10:05 -07001322
Herbert Xuc19e6542008-10-09 11:59:55 -07001323 err = rtnl_link_register(&ipgre_link_ops);
1324 if (err < 0)
1325 goto rtnl_link_failed;
1326
Herbert Xue1a80002008-10-09 12:00:17 -07001327 err = rtnl_link_register(&ipgre_tap_ops);
1328 if (err < 0)
1329 goto tap_ops_failed;
1330
Pravin B Shelarc5441932013-03-25 14:49:35 +00001331 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -07001332
Herbert Xue1a80002008-10-09 12:00:17 -07001333tap_ops_failed:
1334 rtnl_link_unregister(&ipgre_link_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001335rtnl_link_failed:
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001336 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001337add_proto_failed:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001338 unregister_pernet_device(&ipgre_tap_net_ops);
1339pnet_tap_faied:
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001340 unregister_pernet_device(&ipgre_net_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001341 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001342}
1343
Alexey Kuznetsovdb445752005-07-30 17:46:44 -07001344static void __exit ipgre_fini(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001345{
Herbert Xue1a80002008-10-09 12:00:17 -07001346 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001347 rtnl_link_unregister(&ipgre_link_ops);
Pravin B Shelar9f57c672015-08-07 23:51:52 -07001348 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001349 unregister_pernet_device(&ipgre_tap_net_ops);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001350 unregister_pernet_device(&ipgre_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001351}
1352
1353module_init(ipgre_init);
1354module_exit(ipgre_fini);
1355MODULE_LICENSE("GPL");
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001356MODULE_ALIAS_RTNL_LINK("gre");
1357MODULE_ALIAS_RTNL_LINK("gretap");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +03001358MODULE_ALIAS_NETDEV("gre0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001359MODULE_ALIAS_NETDEV("gretap0");