blob: c625e4dad4b05066d92fe02d1778b555234d0f2a [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: GRE over IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Joe Perchesafd465032012-03-12 07:03:32 +000013#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14
Randy Dunlap4fc268d2006-01-11 12:17:47 -080015#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/module.h>
17#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090019#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <asm/uaccess.h>
21#include <linux/skbuff.h>
22#include <linux/netdevice.h>
23#include <linux/in.h>
24#include <linux/tcp.h>
25#include <linux/udp.h>
26#include <linux/if_arp.h>
27#include <linux/mroute.h>
28#include <linux/init.h>
29#include <linux/in6.h>
30#include <linux/inetdevice.h>
31#include <linux/igmp.h>
32#include <linux/netfilter_ipv4.h>
Herbert Xue1a80002008-10-09 12:00:17 -070033#include <linux/etherdevice.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080034#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#include <net/sock.h>
37#include <net/ip.h>
38#include <net/icmp.h>
39#include <net/protocol.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +000040#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/arp.h>
42#include <net/checksum.h>
43#include <net/dsfield.h>
44#include <net/inet_ecn.h>
45#include <net/xfrm.h>
Pavel Emelyanov59a4c752008-04-16 01:08:53 -070046#include <net/net_namespace.h>
47#include <net/netns/generic.h>
Herbert Xuc19e6542008-10-09 11:59:55 -070048#include <net/rtnetlink.h>
Dmitry Kozlov00959ad2010-08-21 23:05:39 -070049#include <net/gre.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070050
Eric Dumazetdfd56b82011-12-10 09:48:31 +000051#if IS_ENABLED(CONFIG_IPV6)
Linus Torvalds1da177e2005-04-16 15:20:36 -070052#include <net/ipv6.h>
53#include <net/ip6_fib.h>
54#include <net/ip6_route.h>
55#endif
56
57/*
58 Problems & solutions
59 --------------------
60
61 1. The most important issue is detecting local dead loops.
62 They would cause complete host lockup in transmit, which
63 would be "resolved" by stack overflow or, if queueing is enabled,
64 with infinite looping in net_bh.
65
66 We cannot track such dead loops during route installation,
67 it is infeasible task. The most general solutions would be
68 to keep skb->encapsulation counter (sort of local ttl),
Eric Dumazet6d0722a2010-09-29 23:35:10 -070069 and silently drop packet when it expires. It is a good
stephen hemmingerbff52852012-02-24 08:08:20 +000070 solution, but it supposes maintaining new variable in ALL
Linus Torvalds1da177e2005-04-16 15:20:36 -070071 skb, even if no tunneling is used.
72
Eric Dumazet6d0722a2010-09-29 23:35:10 -070073 Current solution: xmit_recursion breaks dead loops. This is a percpu
74 counter, since when we enter the first ndo_xmit(), cpu migration is
75 forbidden. We force an exit if this counter reaches RECURSION_LIMIT
Linus Torvalds1da177e2005-04-16 15:20:36 -070076
77 2. Networking dead loops would not kill routers, but would really
78 kill network. IP hop limit plays role of "t->recursion" in this case,
79 if we copy it from packet being encapsulated to upper header.
80 It is very good solution, but it introduces two problems:
81
82 - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
83 do not work over tunnels.
84 - traceroute does not work. I planned to relay ICMP from tunnel,
85 so that this problem would be solved and traceroute output
     would be even more informative. This idea appeared to be wrong:
87 only Linux complies to rfc1812 now (yes, guys, Linux is the only
88 true router now :-)), all routers (at least, in neighbourhood of mine)
89 return only 8 bytes of payload. It is the end.
90
   Hence, if we want OSPF to work or traceroute to say something reasonable,
92 we should search for another solution.
93
94 One of them is to parse packet trying to detect inner encapsulation
95 made by our node. It is difficult or even impossible, especially,
   taking into account fragmentation. To be short, ttl is not a solution at all.
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
98 Current solution: The solution was UNEXPECTEDLY SIMPLE.
99 We force DF flag on tunnels with preconfigured hop limit,
100 that is ALL. :-) Well, it does not remove the problem completely,
101 but exponential growth of network traffic is changed to linear
102 (branches, that exceed pmtu are pruned) and tunnel mtu
stephen hemmingerbff52852012-02-24 08:08:20 +0000103 rapidly degrades to value <68, where looping stops.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104 Yes, it is not good if there exists a router in the loop,
105 which does not force DF, even when encapsulating packets have DF set.
106 But it is not our problem! Nobody could accuse us, we made
107 all that we could make. Even if it is your gated who injected
108 fatal route to network, even if it were you who configured
109 fatal static route: you are innocent. :-)
110
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 Alexey Kuznetsov.
112 */
113
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000114static bool log_ecn_error = true;
115module_param(log_ecn_error, bool, 0644);
116MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
117
Herbert Xuc19e6542008-10-09 11:59:55 -0700118static struct rtnl_link_ops ipgre_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119static int ipgre_tunnel_init(struct net_device *dev);
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700120
Eric Dumazetf99189b2009-11-17 10:42:49 +0000121static int ipgre_net_id __read_mostly;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000122static int gre_tap_net_id __read_mostly;
Pavel Emelyanoveb8ce742008-04-16 01:10:26 -0700123
Pravin B Shelarc5441932013-03-25 14:49:35 +0000124static __sum16 check_checksum(struct sk_buff *skb)
Eric Dumazete985aad2010-09-27 03:57:11 +0000125{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000126 __sum16 csum = 0;
Eric Dumazete985aad2010-09-27 03:57:11 +0000127
Pravin B Shelarc5441932013-03-25 14:49:35 +0000128 switch (skb->ip_summed) {
129 case CHECKSUM_COMPLETE:
130 csum = csum_fold(skb->csum);
Eric Dumazete985aad2010-09-27 03:57:11 +0000131
Pravin B Shelarc5441932013-03-25 14:49:35 +0000132 if (!csum)
133 break;
134 /* Fall through. */
stephen hemminger87b6d212012-04-12 06:31:16 +0000135
Pravin B Shelarc5441932013-03-25 14:49:35 +0000136 case CHECKSUM_NONE:
137 skb->csum = 0;
138 csum = __skb_checksum_complete(skb);
139 skb->ip_summed = CHECKSUM_COMPLETE;
140 break;
Eric Dumazete985aad2010-09-27 03:57:11 +0000141 }
stephen hemminger87b6d212012-04-12 06:31:16 +0000142
Pravin B Shelarc5441932013-03-25 14:49:35 +0000143 return csum;
Eric Dumazete985aad2010-09-27 03:57:11 +0000144}
145
Pravin B Shelarc5441932013-03-25 14:49:35 +0000146static int ip_gre_calc_hlen(__be16 o_flags)
stephen hemmingerd2083282012-09-24 18:12:23 +0000147{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000148 int addend = 4;
149
150 if (o_flags&TUNNEL_CSUM)
151 addend += 4;
152 if (o_flags&TUNNEL_KEY)
153 addend += 4;
154 if (o_flags&TUNNEL_SEQ)
155 addend += 4;
156 return addend;
157}
158
159static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
160 bool *csum_err, int *hdr_len)
161{
Eric Dumazet22251c72013-04-04 15:41:27 +0000162 unsigned int ip_hlen = ip_hdrlen(skb);
163 const struct gre_base_hdr *greh;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000164 __be32 *options;
165
166 if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
167 return -EINVAL;
168
Eric Dumazet22251c72013-04-04 15:41:27 +0000169 greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000170 if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
171 return -EINVAL;
172
173 tpi->flags = gre_flags_to_tnl_flags(greh->flags);
174 *hdr_len = ip_gre_calc_hlen(tpi->flags);
175
176 if (!pskb_may_pull(skb, *hdr_len))
177 return -EINVAL;
178
Eric Dumazet22251c72013-04-04 15:41:27 +0000179 greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
180
Pravin B Shelarc5441932013-03-25 14:49:35 +0000181 tpi->proto = greh->protocol;
182
183 options = (__be32 *)(greh + 1);
184 if (greh->flags & GRE_CSUM) {
185 if (check_checksum(skb)) {
186 *csum_err = true;
187 return -EINVAL;
188 }
189 options++;
190 }
191
192 if (greh->flags & GRE_KEY) {
193 tpi->key = *options;
194 options++;
stephen hemmingerd2083282012-09-24 18:12:23 +0000195 } else
Pravin B Shelarc5441932013-03-25 14:49:35 +0000196 tpi->key = 0;
stephen hemmingerd2083282012-09-24 18:12:23 +0000197
Pravin B Shelarc5441932013-03-25 14:49:35 +0000198 if (unlikely(greh->flags & GRE_SEQ)) {
199 tpi->seq = *options;
200 options++;
201 } else
202 tpi->seq = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Pravin B Shelarc5441932013-03-25 14:49:35 +0000204 /* WCCP version 1 and 2 protocol decoding.
205 * - Change protocol to IP
206 * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
207 */
208 if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
209 tpi->proto = htons(ETH_P_IP);
210 if ((*(u8 *)options & 0xF0) != 0x40) {
211 *hdr_len += 4;
212 if (!pskb_may_pull(skb, *hdr_len))
213 return -EINVAL;
Timo Terasafcf1242009-01-26 20:56:10 -0800214 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215 }
Herbert Xue1a80002008-10-09 12:00:17 -0700216
Pravin B Shelarc5441932013-03-25 14:49:35 +0000217 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700218}
219
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220static void ipgre_err(struct sk_buff *skb, u32 info)
221{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222
Pravin B Shelarc5441932013-03-25 14:49:35 +0000223 /* All the routers (except for Linux) return only
224 8 bytes of packet payload. It means, that precise relaying of
225 ICMP in the real Internet is absolutely infeasible.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226
Pravin B Shelarc5441932013-03-25 14:49:35 +0000227 Moreover, Cisco "wise men" put GRE key to the third word
228 in GRE header. It makes impossible maintaining even soft
229 state for keyed GRE tunnels with enabled checksum. Tell
230 them "thank you".
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231
Pravin B Shelarc5441932013-03-25 14:49:35 +0000232 Well, I wonder, rfc1812 was written by Cisco employee,
233 what the hell these idiots break standards established
234 by themselves???
235 */
236 struct net *net = dev_net(skb->dev);
237 struct ip_tunnel_net *itn;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000238 const struct iphdr *iph = (const struct iphdr *)skb->data;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300239 const int type = icmp_hdr(skb)->type;
240 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 struct ip_tunnel *t;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000242 struct tnl_ptk_info tpi;
243 int hdr_len;
244 bool csum_err = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245
Pravin B Shelarc5441932013-03-25 14:49:35 +0000246 if (parse_gre_header(skb, &tpi, &csum_err, &hdr_len)) {
247 if (!csum_err) /* ignore csum errors. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 }
250
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251 switch (type) {
252 default:
253 case ICMP_PARAMETERPROB:
254 return;
255
256 case ICMP_DEST_UNREACH:
257 switch (code) {
258 case ICMP_SR_FAILED:
259 case ICMP_PORT_UNREACH:
260 /* Impossible event. */
261 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 default:
263 /* All others are translated to HOST_UNREACH.
264 rfc2003 contains "deep thoughts" about NET_UNREACH,
265 I believe they are just ether pollution. --ANK
266 */
267 break;
268 }
269 break;
270 case ICMP_TIME_EXCEEDED:
271 if (code != ICMP_EXC_TTL)
272 return;
273 break;
David S. Miller55be7a92012-07-11 21:27:49 -0700274
275 case ICMP_REDIRECT:
276 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277 }
278
Pravin B Shelarc5441932013-03-25 14:49:35 +0000279 if (tpi.proto == htons(ETH_P_TEB))
280 itn = net_generic(net, gre_tap_net_id);
281 else
282 itn = net_generic(net, ipgre_net_id);
283
284 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi.flags,
285 iph->daddr, iph->saddr, tpi.key);
stephen hemmingerd2083282012-09-24 18:12:23 +0000286
David S. Miller36393392012-06-14 22:21:46 -0700287 if (t == NULL)
stephen hemminger0c5794a2012-09-24 18:12:24 +0000288 return;
David S. Miller36393392012-06-14 22:21:46 -0700289
290 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
291 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
292 t->parms.link, 0, IPPROTO_GRE, 0);
stephen hemminger0c5794a2012-09-24 18:12:24 +0000293 return;
David S. Miller36393392012-06-14 22:21:46 -0700294 }
David S. Miller55be7a92012-07-11 21:27:49 -0700295 if (type == ICMP_REDIRECT) {
296 ipv4_redirect(skb, dev_net(skb->dev), t->parms.link, 0,
297 IPPROTO_GRE, 0);
stephen hemminger0c5794a2012-09-24 18:12:24 +0000298 return;
David S. Miller55be7a92012-07-11 21:27:49 -0700299 }
David S. Miller36393392012-06-14 22:21:46 -0700300 if (t->parms.iph.daddr == 0 ||
Joe Perchesf97c1e02007-12-16 13:45:43 -0800301 ipv4_is_multicast(t->parms.iph.daddr))
stephen hemminger0c5794a2012-09-24 18:12:24 +0000302 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
304 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
stephen hemminger0c5794a2012-09-24 18:12:24 +0000305 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
Wei Yongjunda6185d82009-02-24 23:34:48 -0800307 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308 t->err_count++;
309 else
310 t->err_count = 1;
311 t->err_time = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312}
313
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314static int ipgre_rcv(struct sk_buff *skb)
315{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000316 struct net *net = dev_net(skb->dev);
317 struct ip_tunnel_net *itn;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000318 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319 struct ip_tunnel *tunnel;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000320 struct tnl_ptk_info tpi;
321 int hdr_len;
322 bool csum_err = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
Pravin B Shelarc5441932013-03-25 14:49:35 +0000324 if (parse_gre_header(skb, &tpi, &csum_err, &hdr_len) < 0)
stephen hemminger0c5794a2012-09-24 18:12:24 +0000325 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326
Pravin B Shelarc5441932013-03-25 14:49:35 +0000327 if (tpi.proto == htons(ETH_P_TEB))
328 itn = net_generic(net, gre_tap_net_id);
329 else
330 itn = net_generic(net, ipgre_net_id);
331
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700332 iph = ip_hdr(skb);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000333 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi.flags,
334 iph->saddr, iph->daddr, tpi.key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335
stephen hemmingerd2083282012-09-24 18:12:23 +0000336 if (tunnel) {
Pravin B Shelarc5441932013-03-25 14:49:35 +0000337 ip_tunnel_rcv(tunnel, skb, &tpi, log_ecn_error);
Eric Dumazet8990f462010-09-20 00:12:11 +0000338 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 }
Herbert Xu45af08b2006-04-05 22:31:19 -0700340 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341drop:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 kfree_skb(skb);
Eric Dumazeta02cec22010-09-22 20:43:57 +0000343 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344}
345
Pravin B Shelar8f100982013-02-24 20:05:05 +0000346static struct sk_buff *handle_offloads(struct ip_tunnel *tunnel, struct sk_buff *skb)
Pravin B Shelar68c33162013-02-14 14:02:41 +0000347{
348 int err;
349
350 if (skb_is_gso(skb)) {
351 err = skb_unclone(skb, GFP_ATOMIC);
352 if (unlikely(err))
353 goto error;
354 skb_shinfo(skb)->gso_type |= SKB_GSO_GRE;
355 return skb;
Pravin B Shelar8f100982013-02-24 20:05:05 +0000356 } else if (skb->ip_summed == CHECKSUM_PARTIAL &&
Pravin B Shelarc5441932013-03-25 14:49:35 +0000357 tunnel->parms.o_flags&TUNNEL_CSUM) {
Pravin B Shelar8f100982013-02-24 20:05:05 +0000358 err = skb_checksum_help(skb);
359 if (unlikely(err))
360 goto error;
361 } else if (skb->ip_summed != CHECKSUM_PARTIAL)
Dmitry Kravkovaa0e51c2013-02-18 09:50:52 +0000362 skb->ip_summed = CHECKSUM_NONE;
Pravin B Shelar68c33162013-02-14 14:02:41 +0000363
364 return skb;
365
366error:
367 kfree_skb(skb);
368 return ERR_PTR(err);
369}
370
Pravin B Shelarc5441932013-03-25 14:49:35 +0000371static struct sk_buff *gre_build_header(struct sk_buff *skb,
372 const struct tnl_ptk_info *tpi,
373 int hdr_len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000375 struct gre_base_hdr *greh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376
Pravin B Shelarc5441932013-03-25 14:49:35 +0000377 skb_push(skb, hdr_len);
378
379 greh = (struct gre_base_hdr *)skb->data;
380 greh->flags = tnl_flags_to_gre_flags(tpi->flags);
381 greh->protocol = tpi->proto;
382
383 if (tpi->flags&(TUNNEL_KEY|TUNNEL_CSUM|TUNNEL_SEQ)) {
384 __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
385
386 if (tpi->flags&TUNNEL_SEQ) {
387 *ptr = tpi->seq;
388 ptr--;
389 }
390 if (tpi->flags&TUNNEL_KEY) {
391 *ptr = tpi->key;
392 ptr--;
393 }
394 if (tpi->flags&TUNNEL_CSUM &&
395 !(skb_shinfo(skb)->gso_type & SKB_GSO_GRE)) {
396 *(__sum16 *)ptr = 0;
397 *(__sum16 *)ptr = csum_fold(skb_checksum(skb, 0,
398 skb->len, 0));
399 }
Pravin B Shelar68c33162013-02-14 14:02:41 +0000400 }
401
Pravin B Shelarc5441932013-03-25 14:49:35 +0000402 return skb;
403}
404
405static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
406 const struct iphdr *tnl_params,
407 __be16 proto)
408{
409 struct ip_tunnel *tunnel = netdev_priv(dev);
410 struct tnl_ptk_info tpi;
411
412 if (likely(!skb->encapsulation)) {
Pravin B Shelar68c33162013-02-14 14:02:41 +0000413 skb_reset_inner_headers(skb);
414 skb->encapsulation = 1;
415 }
Eric Dumazet6b78f162012-09-13 21:25:33 +0000416
Pravin B Shelarc5441932013-03-25 14:49:35 +0000417 tpi.flags = tunnel->parms.o_flags;
418 tpi.proto = proto;
419 tpi.key = tunnel->parms.o_key;
420 if (tunnel->parms.o_flags & TUNNEL_SEQ)
421 tunnel->o_seqno++;
422 tpi.seq = htonl(tunnel->o_seqno);
Eric Dumazetcef401d2013-01-25 20:34:37 +0000423
Pravin B Shelarc5441932013-03-25 14:49:35 +0000424 /* Push GRE header. */
425 skb = gre_build_header(skb, &tpi, tunnel->hlen);
426 if (unlikely(!skb)) {
427 dev->stats.tx_dropped++;
428 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429 }
430
Pravin B Shelarc5441932013-03-25 14:49:35 +0000431 ip_tunnel_xmit(skb, dev, tnl_params);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432}
433
Pravin B Shelarc5441932013-03-25 14:49:35 +0000434static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
435 struct net_device *dev)
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800436{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000437 struct ip_tunnel *tunnel = netdev_priv(dev);
438 const struct iphdr *tnl_params;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800439
Pravin B Shelarc5441932013-03-25 14:49:35 +0000440 skb = handle_offloads(tunnel, skb);
441 if (IS_ERR(skb))
442 goto out;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800443
Pravin B Shelarc5441932013-03-25 14:49:35 +0000444 if (dev->header_ops) {
445 /* Need space for new headers */
446 if (skb_cow_head(skb, dev->needed_headroom -
Chen Gang2bac7cb2013-04-22 20:45:42 +0000447 (tunnel->hlen + sizeof(struct iphdr))))
Pravin B Shelarc5441932013-03-25 14:49:35 +0000448 goto free_skb;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800449
Pravin B Shelarc5441932013-03-25 14:49:35 +0000450 tnl_params = (const struct iphdr *)skb->data;
Eric Dumazete985aad2010-09-27 03:57:11 +0000451
Pravin B Shelarc5441932013-03-25 14:49:35 +0000452 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
453 * to gre header.
454 */
455 skb_pull(skb, tunnel->hlen + sizeof(struct iphdr));
456 } else {
457 if (skb_cow_head(skb, dev->needed_headroom))
458 goto free_skb;
Herbert Xue1a80002008-10-09 12:00:17 -0700459
Pravin B Shelarc5441932013-03-25 14:49:35 +0000460 tnl_params = &tunnel->parms.iph;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800461 }
462
Pravin B Shelarc5441932013-03-25 14:49:35 +0000463 __gre_xmit(skb, dev, tnl_params, skb->protocol);
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800464
Pravin B Shelarc5441932013-03-25 14:49:35 +0000465 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800466
Pravin B Shelarc5441932013-03-25 14:49:35 +0000467free_skb:
468 dev_kfree_skb(skb);
469out:
470 dev->stats.tx_dropped++;
471 return NETDEV_TX_OK;
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800472}
473
Pravin B Shelarc5441932013-03-25 14:49:35 +0000474static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
475 struct net_device *dev)
476{
477 struct ip_tunnel *tunnel = netdev_priv(dev);
478
479 skb = handle_offloads(tunnel, skb);
480 if (IS_ERR(skb))
481 goto out;
482
483 if (skb_cow_head(skb, dev->needed_headroom))
484 goto free_skb;
485
486 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
487
488 return NETDEV_TX_OK;
489
490free_skb:
491 dev_kfree_skb(skb);
492out:
493 dev->stats.tx_dropped++;
494 return NETDEV_TX_OK;
495}
496
497static int ipgre_tunnel_ioctl(struct net_device *dev,
498 struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499{
500 int err = 0;
501 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700502
Pravin B Shelarc5441932013-03-25 14:49:35 +0000503 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
504 return -EFAULT;
505 if (p.iph.version != 4 || p.iph.protocol != IPPROTO_GRE ||
506 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)) ||
507 ((p.i_flags|p.o_flags)&(GRE_VERSION|GRE_ROUTING))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 return -EINVAL;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000509 }
510 p.i_flags = gre_flags_to_tnl_flags(p.i_flags);
511 p.o_flags = gre_flags_to_tnl_flags(p.o_flags);
512
513 err = ip_tunnel_ioctl(dev, &p, cmd);
514 if (err)
515 return err;
516
517 p.i_flags = tnl_flags_to_gre_flags(p.i_flags);
518 p.o_flags = tnl_flags_to_gre_flags(p.o_flags);
519
520 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
521 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700522 return 0;
523}
524
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525/* Nice toy. Unfortunately, useless in real life :-)
526 It allows to construct virtual multiprotocol broadcast "LAN"
527 over the Internet, provided multicast routing is tuned.
528
529
530 I have no idea was this bicycle invented before me,
531 so that I had to set ARPHRD_IPGRE to a random value.
532 I have an impression, that Cisco could make something similar,
533 but this feature is apparently missing in IOS<=11.2(8).
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900534
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535 I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
536 with broadcast 224.66.66.66. If you have access to mbone, play with me :-)
537
538 ping -t 255 224.66.66.66
539
540 If nobody answers, mbone does not work.
541
542 ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
543 ip addr add 10.66.66.<somewhat>/24 dev Universe
544 ifconfig Universe up
545 ifconfig Universe add fe80::<Your_real_addr>/10
546 ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
547 ftp 10.66.66.66
548 ...
549 ftp fec0:6666:6666::193.233.7.65
550 ...
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 */
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700552static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
553 unsigned short type,
Eric Dumazet15078502010-09-15 11:07:53 +0000554 const void *daddr, const void *saddr, unsigned int len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555{
Patrick McHardy2941a482006-01-08 22:05:26 -0800556 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000557 struct iphdr *iph;
558 struct gre_base_hdr *greh;
559
560 iph = (struct iphdr *)skb_push(skb, t->hlen + sizeof(*iph));
561 greh = (struct gre_base_hdr *)(iph+1);
562 greh->flags = tnl_flags_to_gre_flags(t->parms.o_flags);
563 greh->protocol = htons(type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700564
565 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700566
Pravin B Shelarc5441932013-03-25 14:49:35 +0000567 /* Set the source hardware address. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 if (saddr)
569 memcpy(&iph->saddr, saddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000570 if (daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 memcpy(&iph->daddr, daddr, 4);
Timo Teräs6d55cb92010-03-03 04:01:13 +0000572 if (iph->daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573 return t->hlen;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900574
Pravin B Shelarc5441932013-03-25 14:49:35 +0000575 return -(t->hlen + sizeof(*iph));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576}
577
Timo Teras6a5f44d2007-10-23 20:31:53 -0700578static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
579{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000580 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
Timo Teras6a5f44d2007-10-23 20:31:53 -0700581 memcpy(haddr, &iph->saddr, 4);
582 return 4;
583}
584
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700585static const struct header_ops ipgre_header_ops = {
586 .create = ipgre_header,
Timo Teras6a5f44d2007-10-23 20:31:53 -0700587 .parse = ipgre_header_parse,
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700588};
589
Timo Teras6a5f44d2007-10-23 20:31:53 -0700590#ifdef CONFIG_NET_IPGRE_BROADCAST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591static int ipgre_open(struct net_device *dev)
592{
Patrick McHardy2941a482006-01-08 22:05:26 -0800593 struct ip_tunnel *t = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594
Joe Perchesf97c1e02007-12-16 13:45:43 -0800595 if (ipv4_is_multicast(t->parms.iph.daddr)) {
David S. Millercbb1e852011-05-04 12:33:34 -0700596 struct flowi4 fl4;
597 struct rtable *rt;
Eric Dumazete985aad2010-09-27 03:57:11 +0000598
David S. Millercbb1e852011-05-04 12:33:34 -0700599 rt = ip_route_output_gre(dev_net(dev), &fl4,
600 t->parms.iph.daddr,
601 t->parms.iph.saddr,
602 t->parms.o_key,
603 RT_TOS(t->parms.iph.tos),
604 t->parms.link);
David S. Millerb23dd4f2011-03-02 14:31:35 -0800605 if (IS_ERR(rt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 return -EADDRNOTAVAIL;
Changli Gaod8d1f302010-06-10 23:31:35 -0700607 dev = rt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700608 ip_rt_put(rt);
Herbert Xue5ed6392005-10-03 14:35:55 -0700609 if (__in_dev_get_rtnl(dev) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610 return -EADDRNOTAVAIL;
611 t->mlink = dev->ifindex;
Herbert Xue5ed6392005-10-03 14:35:55 -0700612 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 }
614 return 0;
615}
616
617static int ipgre_close(struct net_device *dev)
618{
Patrick McHardy2941a482006-01-08 22:05:26 -0800619 struct ip_tunnel *t = netdev_priv(dev);
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800620
Joe Perchesf97c1e02007-12-16 13:45:43 -0800621 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800622 struct in_device *in_dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900623 in_dev = inetdev_by_index(dev_net(dev), t->mlink);
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000624 if (in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 }
627 return 0;
628}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700629#endif
630
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800631static const struct net_device_ops ipgre_netdev_ops = {
632 .ndo_init = ipgre_tunnel_init,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000633 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800634#ifdef CONFIG_NET_IPGRE_BROADCAST
635 .ndo_open = ipgre_open,
636 .ndo_stop = ipgre_close,
637#endif
Pravin B Shelarc5441932013-03-25 14:49:35 +0000638 .ndo_start_xmit = ipgre_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800639 .ndo_do_ioctl = ipgre_tunnel_ioctl,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000640 .ndo_change_mtu = ip_tunnel_change_mtu,
641 .ndo_get_stats64 = ip_tunnel_get_stats64,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800642};
643
/* Feature bits that __gre_tunnel_init() sets on every GRE device. */
#define GRE_FEATURES (NETIF_F_HW_CSUM |		\
		      NETIF_F_HIGHDMA |		\
		      NETIF_F_FRAGLIST |	\
		      NETIF_F_SG)
648
Linus Torvalds1da177e2005-04-16 15:20:36 -0700649static void ipgre_tunnel_setup(struct net_device *dev)
650{
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800651 dev->netdev_ops = &ipgre_netdev_ops;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000652 ip_tunnel_setup(dev, ipgre_net_id);
653}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700654
Pravin B Shelarc5441932013-03-25 14:49:35 +0000655static void __gre_tunnel_init(struct net_device *dev)
656{
657 struct ip_tunnel *tunnel;
658
659 tunnel = netdev_priv(dev);
660 tunnel->hlen = ip_gre_calc_hlen(tunnel->parms.o_flags);
661 tunnel->parms.iph.protocol = IPPROTO_GRE;
662
663 dev->needed_headroom = LL_MAX_HEADER + sizeof(struct iphdr) + 4;
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800664 dev->mtu = ETH_DATA_LEN - sizeof(struct iphdr) - 4;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000665
Pravin B Shelarc5441932013-03-25 14:49:35 +0000666 dev->features |= NETIF_F_NETNS_LOCAL | GRE_FEATURES;
Eric Dumazet6b78f162012-09-13 21:25:33 +0000667 dev->hw_features |= GRE_FEATURES;
Pravin B Shelarc5441932013-03-25 14:49:35 +0000668
669 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
670 /* TCP offload with GRE SEQ is not supported. */
671 dev->features |= NETIF_F_GSO_SOFTWARE;
672 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
673 /* Can use a lockless transmit, unless we generate
674 * output sequences
675 */
676 dev->features |= NETIF_F_LLTX;
677 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700678}
679
680static int ipgre_tunnel_init(struct net_device *dev)
681{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000682 struct ip_tunnel *tunnel = netdev_priv(dev);
683 struct iphdr *iph = &tunnel->parms.iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684
Pravin B Shelarc5441932013-03-25 14:49:35 +0000685 __gre_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700686
Pravin B Shelarc5441932013-03-25 14:49:35 +0000687 memcpy(dev->dev_addr, &iph->saddr, 4);
688 memcpy(dev->broadcast, &iph->daddr, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689
Pravin B Shelarc5441932013-03-25 14:49:35 +0000690 dev->type = ARPHRD_IPGRE;
691 dev->flags = IFF_NOARP;
692 dev->priv_flags &= ~IFF_XMIT_DST_RELEASE;
693 dev->addr_len = 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695 if (iph->daddr) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696#ifdef CONFIG_NET_IPGRE_BROADCAST
Joe Perchesf97c1e02007-12-16 13:45:43 -0800697 if (ipv4_is_multicast(iph->daddr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 if (!iph->saddr)
699 return -EINVAL;
700 dev->flags = IFF_BROADCAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700701 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700702 }
703#endif
Michal Schmidtee34c1e2007-12-13 09:46:32 -0800704 } else
Timo Teras6a5f44d2007-10-23 20:31:53 -0700705 dev->header_ops = &ipgre_header_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706
Pravin B Shelarc5441932013-03-25 14:49:35 +0000707 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700708}
709
Dmitry Kozlov00959ad2010-08-21 23:05:39 -0700710static const struct gre_protocol ipgre_protocol = {
711 .handler = ipgre_rcv,
712 .err_handler = ipgre_err,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713};
714
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000715static int __net_init ipgre_init_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700716{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000717 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700718}
719
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000720static void __net_exit ipgre_exit_net(struct net *net)
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700721{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000722 struct ip_tunnel_net *itn = net_generic(net, ipgre_net_id);
723 ip_tunnel_delete_net(itn);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700724}
725
726static struct pernet_operations ipgre_net_ops = {
727 .init = ipgre_init_net,
728 .exit = ipgre_exit_net,
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000729 .id = &ipgre_net_id,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000730 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700731};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732
Herbert Xuc19e6542008-10-09 11:59:55 -0700733static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
734{
735 __be16 flags;
736
737 if (!data)
738 return 0;
739
740 flags = 0;
741 if (data[IFLA_GRE_IFLAGS])
742 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
743 if (data[IFLA_GRE_OFLAGS])
744 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
745 if (flags & (GRE_VERSION|GRE_ROUTING))
746 return -EINVAL;
747
748 return 0;
749}
750
Herbert Xue1a80002008-10-09 12:00:17 -0700751static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[])
752{
753 __be32 daddr;
754
755 if (tb[IFLA_ADDRESS]) {
756 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
757 return -EINVAL;
758 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
759 return -EADDRNOTAVAIL;
760 }
761
762 if (!data)
763 goto out;
764
765 if (data[IFLA_GRE_REMOTE]) {
766 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
767 if (!daddr)
768 return -EINVAL;
769 }
770
771out:
772 return ipgre_tunnel_validate(tb, data);
773}
774
Pravin B Shelarc5441932013-03-25 14:49:35 +0000775static void ipgre_netlink_parms(struct nlattr *data[], struct nlattr *tb[],
776 struct ip_tunnel_parm *parms)
Herbert Xuc19e6542008-10-09 11:59:55 -0700777{
Herbert Xu7bb82d92008-10-11 12:20:15 -0700778 memset(parms, 0, sizeof(*parms));
Herbert Xuc19e6542008-10-09 11:59:55 -0700779
780 parms->iph.protocol = IPPROTO_GRE;
781
782 if (!data)
783 return;
784
785 if (data[IFLA_GRE_LINK])
786 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
787
788 if (data[IFLA_GRE_IFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000789 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700790
791 if (data[IFLA_GRE_OFLAGS])
Pravin B Shelarc5441932013-03-25 14:49:35 +0000792 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
Herbert Xuc19e6542008-10-09 11:59:55 -0700793
794 if (data[IFLA_GRE_IKEY])
795 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
796
797 if (data[IFLA_GRE_OKEY])
798 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
799
800 if (data[IFLA_GRE_LOCAL])
Patrick McHardy4d74f8b2008-10-10 12:11:06 -0700801 parms->iph.saddr = nla_get_be32(data[IFLA_GRE_LOCAL]);
Herbert Xuc19e6542008-10-09 11:59:55 -0700802
803 if (data[IFLA_GRE_REMOTE])
Patrick McHardy4d74f8b2008-10-10 12:11:06 -0700804 parms->iph.daddr = nla_get_be32(data[IFLA_GRE_REMOTE]);
Herbert Xuc19e6542008-10-09 11:59:55 -0700805
806 if (data[IFLA_GRE_TTL])
807 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
808
809 if (data[IFLA_GRE_TOS])
810 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
811
812 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC]))
813 parms->iph.frag_off = htons(IP_DF);
814}
815
/*
 * ->ndo_init for "gretap" devices: common GRE device setup followed by
 * ip_tunnel_init(), whose result is returned unchanged.
 */
static int gre_tap_init(struct net_device *dev)
{
	int err;

	__gre_tunnel_init(dev);
	err = ip_tunnel_init(dev);

	return err;
}
822
Pravin B Shelarc5441932013-03-25 14:49:35 +0000823static const struct net_device_ops gre_tap_netdev_ops = {
824 .ndo_init = gre_tap_init,
825 .ndo_uninit = ip_tunnel_uninit,
826 .ndo_start_xmit = gre_tap_xmit,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800827 .ndo_set_mac_address = eth_mac_addr,
828 .ndo_validate_addr = eth_validate_addr,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000829 .ndo_change_mtu = ip_tunnel_change_mtu,
830 .ndo_get_stats64 = ip_tunnel_get_stats64,
Stephen Hemmingerb8c26a32008-11-20 20:34:29 -0800831};
832
Herbert Xue1a80002008-10-09 12:00:17 -0700833static void ipgre_tap_setup(struct net_device *dev)
834{
Herbert Xue1a80002008-10-09 12:00:17 -0700835 ether_setup(dev);
Pravin B Shelarc5441932013-03-25 14:49:35 +0000836 dev->netdev_ops = &gre_tap_netdev_ops;
837 ip_tunnel_setup(dev, gre_tap_net_id);
Herbert Xue1a80002008-10-09 12:00:17 -0700838}
839
Pravin B Shelarc5441932013-03-25 14:49:35 +0000840static int ipgre_newlink(struct net *src_net, struct net_device *dev,
841 struct nlattr *tb[], struct nlattr *data[])
Herbert Xuc19e6542008-10-09 11:59:55 -0700842{
Pravin B Shelarc5441932013-03-25 14:49:35 +0000843 struct ip_tunnel_parm p;
Herbert Xuc19e6542008-10-09 11:59:55 -0700844
Pravin B Shelarc5441932013-03-25 14:49:35 +0000845 ipgre_netlink_parms(data, tb, &p);
846 return ip_tunnel_newlink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -0700847}
848
849static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
850 struct nlattr *data[])
851{
Herbert Xuc19e6542008-10-09 11:59:55 -0700852 struct ip_tunnel_parm p;
Herbert Xuc19e6542008-10-09 11:59:55 -0700853
Pravin B Shelarc5441932013-03-25 14:49:35 +0000854 ipgre_netlink_parms(data, tb, &p);
855 return ip_tunnel_changelink(dev, tb, &p);
Herbert Xuc19e6542008-10-09 11:59:55 -0700856}
857
858static size_t ipgre_get_size(const struct net_device *dev)
859{
860 return
861 /* IFLA_GRE_LINK */
862 nla_total_size(4) +
863 /* IFLA_GRE_IFLAGS */
864 nla_total_size(2) +
865 /* IFLA_GRE_OFLAGS */
866 nla_total_size(2) +
867 /* IFLA_GRE_IKEY */
868 nla_total_size(4) +
869 /* IFLA_GRE_OKEY */
870 nla_total_size(4) +
871 /* IFLA_GRE_LOCAL */
872 nla_total_size(4) +
873 /* IFLA_GRE_REMOTE */
874 nla_total_size(4) +
875 /* IFLA_GRE_TTL */
876 nla_total_size(1) +
877 /* IFLA_GRE_TOS */
878 nla_total_size(1) +
879 /* IFLA_GRE_PMTUDISC */
880 nla_total_size(1) +
881 0;
882}
883
884static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
885{
886 struct ip_tunnel *t = netdev_priv(dev);
887 struct ip_tunnel_parm *p = &t->parms;
888
David S. Millerf3756b72012-04-01 20:39:02 -0400889 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
Pravin B Shelarc5441932013-03-25 14:49:35 +0000890 nla_put_be16(skb, IFLA_GRE_IFLAGS, tnl_flags_to_gre_flags(p->i_flags)) ||
891 nla_put_be16(skb, IFLA_GRE_OFLAGS, tnl_flags_to_gre_flags(p->o_flags)) ||
David S. Millerf3756b72012-04-01 20:39:02 -0400892 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
893 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
894 nla_put_be32(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
895 nla_put_be32(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
896 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
897 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
898 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
899 !!(p->iph.frag_off & htons(IP_DF))))
900 goto nla_put_failure;
Herbert Xuc19e6542008-10-09 11:59:55 -0700901 return 0;
902
903nla_put_failure:
904 return -EMSGSIZE;
905}
906
907static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
908 [IFLA_GRE_LINK] = { .type = NLA_U32 },
909 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
910 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
911 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
912 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
Patrick McHardy4d74f8b2008-10-10 12:11:06 -0700913 [IFLA_GRE_LOCAL] = { .len = FIELD_SIZEOF(struct iphdr, saddr) },
914 [IFLA_GRE_REMOTE] = { .len = FIELD_SIZEOF(struct iphdr, daddr) },
Herbert Xuc19e6542008-10-09 11:59:55 -0700915 [IFLA_GRE_TTL] = { .type = NLA_U8 },
916 [IFLA_GRE_TOS] = { .type = NLA_U8 },
917 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
918};
919
920static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
921 .kind = "gre",
922 .maxtype = IFLA_GRE_MAX,
923 .policy = ipgre_policy,
924 .priv_size = sizeof(struct ip_tunnel),
925 .setup = ipgre_tunnel_setup,
926 .validate = ipgre_tunnel_validate,
927 .newlink = ipgre_newlink,
928 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000929 .dellink = ip_tunnel_dellink,
Herbert Xuc19e6542008-10-09 11:59:55 -0700930 .get_size = ipgre_get_size,
931 .fill_info = ipgre_fill_info,
932};
933
Herbert Xue1a80002008-10-09 12:00:17 -0700934static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
935 .kind = "gretap",
936 .maxtype = IFLA_GRE_MAX,
937 .policy = ipgre_policy,
938 .priv_size = sizeof(struct ip_tunnel),
939 .setup = ipgre_tap_setup,
940 .validate = ipgre_tap_validate,
941 .newlink = ipgre_newlink,
942 .changelink = ipgre_changelink,
Pravin B Shelarc5441932013-03-25 14:49:35 +0000943 .dellink = ip_tunnel_dellink,
Herbert Xue1a80002008-10-09 12:00:17 -0700944 .get_size = ipgre_get_size,
945 .fill_info = ipgre_fill_info,
946};
947
Pravin B Shelarc5441932013-03-25 14:49:35 +0000948static int __net_init ipgre_tap_init_net(struct net *net)
949{
950 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, NULL);
951}
952
953static void __net_exit ipgre_tap_exit_net(struct net *net)
954{
955 struct ip_tunnel_net *itn = net_generic(net, gre_tap_net_id);
956 ip_tunnel_delete_net(itn);
957}
958
959static struct pernet_operations ipgre_tap_net_ops = {
960 .init = ipgre_tap_init_net,
961 .exit = ipgre_tap_exit_net,
962 .id = &gre_tap_net_id,
963 .size = sizeof(struct ip_tunnel_net),
964};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700965
966static int __init ipgre_init(void)
967{
968 int err;
969
Joe Perches058bd4d2012-03-11 18:36:11 +0000970 pr_info("GRE over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971
Eric W. Biedermancfb8fbf2009-11-29 15:46:13 +0000972 err = register_pernet_device(&ipgre_net_ops);
Pavel Emelyanov59a4c752008-04-16 01:08:53 -0700973 if (err < 0)
Alexey Dobriyanc2892f02010-02-16 07:57:44 +0000974 return err;
975
Pravin B Shelarc5441932013-03-25 14:49:35 +0000976 err = register_pernet_device(&ipgre_tap_net_ops);
977 if (err < 0)
978 goto pnet_tap_faied;
979
Dmitry Kozlov00959ad2010-08-21 23:05:39 -0700980 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +0000981 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +0000982 pr_info("%s: can't add protocol\n", __func__);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +0000983 goto add_proto_failed;
984 }
Pavel Emelyanov7daa0002008-04-16 01:10:05 -0700985
Herbert Xuc19e6542008-10-09 11:59:55 -0700986 err = rtnl_link_register(&ipgre_link_ops);
987 if (err < 0)
988 goto rtnl_link_failed;
989
Herbert Xue1a80002008-10-09 12:00:17 -0700990 err = rtnl_link_register(&ipgre_tap_ops);
991 if (err < 0)
992 goto tap_ops_failed;
993
Pravin B Shelarc5441932013-03-25 14:49:35 +0000994 return 0;
Herbert Xuc19e6542008-10-09 11:59:55 -0700995
Herbert Xue1a80002008-10-09 12:00:17 -0700996tap_ops_failed:
997 rtnl_link_unregister(&ipgre_link_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -0700998rtnl_link_failed:
Dmitry Kozlov00959ad2010-08-21 23:05:39 -0700999 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001000add_proto_failed:
Pravin B Shelarc5441932013-03-25 14:49:35 +00001001 unregister_pernet_device(&ipgre_tap_net_ops);
1002pnet_tap_faied:
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001003 unregister_pernet_device(&ipgre_net_ops);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001004 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001005}
1006
Alexey Kuznetsovdb445752005-07-30 17:46:44 -07001007static void __exit ipgre_fini(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008{
Herbert Xue1a80002008-10-09 12:00:17 -07001009 rtnl_link_unregister(&ipgre_tap_ops);
Herbert Xuc19e6542008-10-09 11:59:55 -07001010 rtnl_link_unregister(&ipgre_link_ops);
Dmitry Kozlov00959ad2010-08-21 23:05:39 -07001011 if (gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO) < 0)
Joe Perches058bd4d2012-03-11 18:36:11 +00001012 pr_info("%s: can't remove protocol\n", __func__);
Pravin B Shelarc5441932013-03-25 14:49:35 +00001013 unregister_pernet_device(&ipgre_tap_net_ops);
Alexey Dobriyanc2892f02010-02-16 07:57:44 +00001014 unregister_pernet_device(&ipgre_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015}
1016
1017module_init(ipgre_init);
1018module_exit(ipgre_fini);
1019MODULE_LICENSE("GPL");
Patrick McHardy4d74f8b2008-10-10 12:11:06 -07001020MODULE_ALIAS_RTNL_LINK("gre");
1021MODULE_ALIAS_RTNL_LINK("gretap");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +03001022MODULE_ALIAS_NETDEV("gre0");
Pravin B Shelarc5441932013-03-25 14:49:35 +00001023MODULE_ALIAS_NETDEV("gretap0");