blob: c9392589c4157e4ac5d4c2e619b6f3ed265165be [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002 * Linux NET3: IP/IP protocol decoder.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 * Authors:
5 * Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
6 *
7 * Fixes:
8 * Alan Cox : Merged and made usable non modular (its so tiny its silly as
9 * a module taking up 2 pages).
10 * Alan Cox : Fixed bug with 1.3.18 and IPIP not working (now needs to set skb->h.iph)
11 * to keep ip_forward happy.
12 * Alan Cox : More fixes for 1.3.21, and firewall fix. Maybe this will work soon 8).
13 * Kai Schulte : Fixed #defines for IP_FIREWALL->FIREWALL
14 * David Woodhouse : Perform some basic ICMP handling.
15 * IPIP Routing without decapsulation.
16 * Carlos Picoto : GRE over IP support
17 * Alexey Kuznetsov: Reworked. Really, now it is truncated version of ipv4/ip_gre.c.
18 * I do not want to merge them together.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 *
25 */
26
27/* tunnel.c: an IP tunnel driver
28
29 The purpose of this driver is to provide an IP tunnel through
30 which you can tunnel network traffic transparently across subnets.
31
32 This was written by looking at Nick Holloway's dummy driver
33 Thanks for the great code!
34
35 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090036
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 Minor tweaks:
38 Cleaned up the code a little and added some pre-1.3.0 tweaks.
39 dev->hard_header/hard_header_len changed to use no headers.
40 Comments/bracketing tweaked.
41 Made the tunnels use dev->name not tunnel: when error reporting.
42 Added tx_dropped stat
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090043
Alan Cox113aa832008-10-13 19:01:08 -070044 -Alan Cox (alan@lxorguk.ukuu.org.uk) 21 March 95
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46 Reworked:
47 Changed to tunnel to destination gateway in addition to the
48 tunnel's pointopoint address
49 Almost completely rewritten
50 Note: There is currently no firewall or ICMP handling done.
51
52 -Sam Lantinga (slouken@cs.ucdavis.edu) 02/13/96
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090053
Linus Torvalds1da177e2005-04-16 15:20:36 -070054*/
55
56/* Things I wish I had known when writing the tunnel driver:
57
58 When the tunnel_xmit() function is called, the skb contains the
59 packet to be sent (plus a great deal of extra info), and dev
60 contains the tunnel device that _we_ are.
61
62 When we are passed a packet, we are expected to fill in the
63 source address with our source IP address.
64
65 What is the proper way to allocate, copy and free a buffer?
66 After you allocate it, it is a "0 length" chunk of memory
67 starting at zero. If you want to add headers to the buffer
68 later, you'll have to call "skb_reserve(skb, amount)" with
69 the amount of memory you want reserved. Then, you call
70 "skb_put(skb, amount)" with the amount of space you want in
71 the buffer. skb_put() returns a pointer to the top (#0) of
72 that buffer. skb->len is set to the amount of space you have
73 "allocated" with skb_put(). You can then write up to skb->len
74 bytes to that buffer. If you need more, you can call skb_put()
75 again with the additional amount of space you need. You can
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090076 find out how much more space you can allocate by calling
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 "skb_tailroom(skb)".
78 Now, to add header space, call "skb_push(skb, header_len)".
79 This creates space at the beginning of the buffer and returns
80 a pointer to this new space. If later you need to strip a
81 header from a buffer, call "skb_pull(skb, header_len)".
82 skb_headroom() will return how much space is left at the top
83 of the buffer (before the main data). Remember, this headroom
84 space must be reserved before the skb_put() function is called.
85 */
86
87/*
88 This version of net/ipv4/ipip.c is cloned of net/ipv4/ip_gre.c
89
90 For comments look at net/ipv4/ip_gre.c --ANK
91 */
92
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090093
Randy Dunlap4fc268d2006-01-11 12:17:47 -080094#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070095#include <linux/module.h>
96#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070097#include <linux/kernel.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090098#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070099#include <asm/uaccess.h>
100#include <linux/skbuff.h>
101#include <linux/netdevice.h>
102#include <linux/in.h>
103#include <linux/tcp.h>
104#include <linux/udp.h>
105#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106#include <linux/init.h>
107#include <linux/netfilter_ipv4.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800108#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
110#include <net/sock.h>
111#include <net/ip.h>
112#include <net/icmp.h>
Pravin B Shelarc5441932013-03-25 14:49:35 +0000113#include <net/ip_tunnels.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114#include <net/inet_ecn.h>
115#include <net/xfrm.h>
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700116#include <net/net_namespace.h>
117#include <net/netns/generic.h>
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700118#include <net/dst_metadata.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000120static bool log_ecn_error = true;
121module_param(log_ecn_error, bool, 0644);
122MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
123
Eric Dumazetf99189b2009-11-17 10:42:49 +0000124static int ipip_net_id __read_mostly;
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700125
Eric Dumazet3c97af92010-09-27 00:35:50 +0000126static int ipip_tunnel_init(struct net_device *dev);
Nicolas Dichtel09746582012-11-09 06:09:59 +0000127static struct rtnl_link_ops ipip_link_ops __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
Herbert Xud2acc342006-03-28 01:12:13 -0800129static int ipip_err(struct sk_buff *skb, u32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131
Rami Rosen071f92d2008-05-21 17:47:54 -0700132/* All the routers (except for Linux) return only
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133 8 bytes of packet payload. It means, that precise relaying of
134 ICMP in the real Internet is absolutely infeasible.
135 */
Pravin B Shelarfd581562013-03-25 14:49:41 +0000136 struct net *net = dev_net(skb->dev);
137 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000138 const struct iphdr *iph = (const struct iphdr *)skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 struct ip_tunnel *t;
Herbert Xud2acc342006-03-28 01:12:13 -0800140 int err;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000141 const int type = icmp_hdr(skb)->type;
142 const int code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Herbert Xud2acc342006-03-28 01:12:13 -0800144 err = -ENOENT;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000145 t = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
146 iph->daddr, iph->saddr, 0);
Ian Morris51456b22015-04-03 09:17:26 +0100147 if (!t)
David S. Miller36393392012-06-14 22:21:46 -0700148 goto out;
149
150 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
151 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200152 t->parms.link, 0, iph->protocol, 0);
David S. Miller36393392012-06-14 22:21:46 -0700153 err = 0;
154 goto out;
155 }
156
David S. Miller55be7a92012-07-11 21:27:49 -0700157 if (type == ICMP_REDIRECT) {
Dmitry Popov23468292014-06-06 23:19:21 +0400158 ipv4_redirect(skb, dev_net(skb->dev), t->parms.link, 0,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200159 iph->protocol, 0);
David S. Miller55be7a92012-07-11 21:27:49 -0700160 err = 0;
161 goto out;
162 }
163
David S. Miller36393392012-06-14 22:21:46 -0700164 if (t->parms.iph.daddr == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 goto out;
Herbert Xud2acc342006-03-28 01:12:13 -0800166
167 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
169 goto out;
170
Wei Yongjun26d94b42009-02-24 23:36:47 -0800171 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 t->err_count++;
173 else
174 t->err_count = 1;
175 t->err_time = jiffies;
stephen hemmingerb0558ef2012-09-24 18:12:25 +0000176
Pravin B Shelarfd581562013-03-25 14:49:41 +0000177out:
Herbert Xud2acc342006-03-28 01:12:13 -0800178 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179}
180
Simon Horman1b69e7e2016-07-07 07:56:14 +0200181static const struct tnl_ptk_info ipip_tpi = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000182 /* no tunnel info required for ipip. */
183 .proto = htons(ETH_P_IP),
184};
185
Simon Horman1b69e7e2016-07-07 07:56:14 +0200186#if IS_ENABLED(CONFIG_MPLS)
187static const struct tnl_ptk_info mplsip_tpi = {
188 /* no tunnel info required for mplsip. */
189 .proto = htons(ETH_P_MPLS_UC),
190};
191#endif
192
193static int ipip_tunnel_rcv(struct sk_buff *skb, u8 ipproto)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000195 struct net *net = dev_net(skb->dev);
196 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700197 struct metadata_dst *tun_dst = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 struct ip_tunnel *tunnel;
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700199 const struct iphdr *iph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
Pravin B Shelar3d7b46c2013-06-17 17:50:02 -0700201 iph = ip_hdr(skb);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000202 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY,
203 iph->saddr, iph->daddr, 0);
204 if (tunnel) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200205 const struct tnl_ptk_info *tpi;
206
207 if (tunnel->parms.iph.protocol != ipproto &&
208 tunnel->parms.iph.protocol != 0)
209 goto drop;
210
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000211 if (!xfrm4_policy_check(NULL, XFRM_POLICY_IN, skb))
212 goto drop;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200213#if IS_ENABLED(CONFIG_MPLS)
214 if (ipproto == IPPROTO_MPLS)
215 tpi = &mplsip_tpi;
216 else
217#endif
218 tpi = &ipip_tpi;
219 if (iptunnel_pull_header(skb, 0, tpi->proto, false))
Li Hongjun737e8282013-08-28 11:54:50 +0200220 goto drop;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700221 if (tunnel->collect_md) {
222 tun_dst = ip_tun_rx_dst(skb, 0, 0, 0);
223 if (!tun_dst)
224 return 0;
225 }
226 return ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 return -1;
stephen hemmingereccc1bb2012-09-25 11:02:48 +0000230
231drop:
232 kfree_skb(skb);
233 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234}
235
Simon Horman1b69e7e2016-07-07 07:56:14 +0200236static int ipip_rcv(struct sk_buff *skb)
237{
238 return ipip_tunnel_rcv(skb, IPPROTO_IPIP);
239}
240
241#if IS_ENABLED(CONFIG_MPLS)
242static int mplsip_rcv(struct sk_buff *skb)
243{
244 return ipip_tunnel_rcv(skb, IPPROTO_MPLS);
245}
246#endif
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248/*
249 * This function assumes it is being called from dev_queue_xmit()
250 * and that skb is filled properly by that function.
251 */
Simon Horman1b69e7e2016-07-07 07:56:14 +0200252static netdev_tx_t ipip_tunnel_xmit(struct sk_buff *skb,
253 struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254{
Patrick McHardy2941a482006-01-08 22:05:26 -0800255 struct ip_tunnel *tunnel = netdev_priv(dev);
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000256 const struct iphdr *tiph = &tunnel->parms.iph;
Simon Horman1b69e7e2016-07-07 07:56:14 +0200257 u8 ipproto;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258
Simon Horman1b69e7e2016-07-07 07:56:14 +0200259 switch (skb->protocol) {
260 case htons(ETH_P_IP):
261 ipproto = IPPROTO_IPIP;
262 break;
263#if IS_ENABLED(CONFIG_MPLS)
264 case htons(ETH_P_MPLS_UC):
265 ipproto = IPPROTO_MPLS;
266 break;
267#endif
268 default:
269 goto tx_error;
270 }
271
272 if (tiph->protocol != ipproto && tiph->protocol != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273 goto tx_error;
Eric Dumazetcef401d2013-01-25 20:34:37 +0000274
Tom Herbert7e133182016-05-18 09:06:10 -0700275 if (iptunnel_handle_offloads(skb, SKB_GSO_IPXIP4))
Alexander Duyckaed069d2016-04-14 15:33:37 -0400276 goto tx_error;
Pravin B Shelar4f3ed922013-03-08 15:12:52 +0000277
Simon Horman1b69e7e2016-07-07 07:56:14 +0200278 skb_set_inner_ipproto(skb, ipproto);
Tom Herbert077c5a02014-09-29 20:22:31 -0700279
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700280 if (tunnel->collect_md)
281 ip_md_tunnel_xmit(skb, dev, ipproto);
282 else
283 ip_tunnel_xmit(skb, dev, tiph, ipproto);
Patrick McHardy6ed10652009-06-23 06:03:08 +0000284 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286tx_error:
Eric Dumazet3acfa1e2014-01-18 18:27:49 -0800287 kfree_skb(skb);
Alexander Duyckaed069d2016-04-14 15:33:37 -0400288
Eric Dumazetcb32f512013-10-19 11:42:57 -0700289 dev->stats.tx_errors++;
Patrick McHardy6ed10652009-06-23 06:03:08 +0000290 return NETDEV_TX_OK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291}
292
Simon Horman1b69e7e2016-07-07 07:56:14 +0200293static bool ipip_tunnel_ioctl_verify_protocol(u8 ipproto)
294{
295 switch (ipproto) {
296 case 0:
297 case IPPROTO_IPIP:
298#if IS_ENABLED(CONFIG_MPLS)
299 case IPPROTO_MPLS:
300#endif
301 return true;
302 }
303
304 return false;
305}
306
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307static int
Pravin B Shelarfd581562013-03-25 14:49:41 +0000308ipip_tunnel_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309{
310 int err = 0;
311 struct ip_tunnel_parm p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
Pravin B Shelarfd581562013-03-25 14:49:41 +0000313 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p)))
314 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315
Cong Wang3b7b5142013-07-02 14:49:34 +0800316 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
Simon Horman1b69e7e2016-07-07 07:56:14 +0200317 if (p.iph.version != 4 ||
318 !ipip_tunnel_ioctl_verify_protocol(p.iph.protocol) ||
Cong Wang3b7b5142013-07-02 14:49:34 +0800319 p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF)))
320 return -EINVAL;
321 }
322
Eric Dumazet252a8fb2015-05-15 08:58:45 -0700323 p.i_key = p.o_key = 0;
324 p.i_flags = p.o_flags = 0;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000325 err = ip_tunnel_ioctl(dev, &p, cmd);
326 if (err)
327 return err;
328
329 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p)))
330 return -EFAULT;
331
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 return 0;
333}
334
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800335static const struct net_device_ops ipip_netdev_ops = {
Pravin B Shelarfd581562013-03-25 14:49:41 +0000336 .ndo_init = ipip_tunnel_init,
337 .ndo_uninit = ip_tunnel_uninit,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800338 .ndo_start_xmit = ipip_tunnel_xmit,
339 .ndo_do_ioctl = ipip_tunnel_ioctl,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000340 .ndo_change_mtu = ip_tunnel_change_mtu,
341 .ndo_get_stats64 = ip_tunnel_get_stats64,
Nicolas Dichtel1e995842015-04-02 17:07:02 +0200342 .ndo_get_iflink = ip_tunnel_get_iflink,
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800343};
344
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000345#define IPIP_FEATURES (NETIF_F_SG | \
346 NETIF_F_FRAGLIST | \
347 NETIF_F_HIGHDMA | \
Eric Dumazetcb32f512013-10-19 11:42:57 -0700348 NETIF_F_GSO_SOFTWARE | \
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000349 NETIF_F_HW_CSUM)
350
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351static void ipip_tunnel_setup(struct net_device *dev)
352{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800353 dev->netdev_ops = &ipip_netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354
355 dev->type = ARPHRD_TUNNEL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 dev->flags = IFF_NOARP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 dev->addr_len = 4;
Eric Dumazet153f0942010-09-28 00:17:17 +0000358 dev->features |= NETIF_F_LLTX;
Eric Dumazet02875872014-10-05 18:38:35 -0700359 netif_keep_dst(dev);
Eric Dumazetc3b89fb2012-11-08 09:59:52 +0000360
361 dev->features |= IPIP_FEATURES;
362 dev->hw_features |= IPIP_FEATURES;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000363 ip_tunnel_setup(dev, ipip_net_id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364}
365
Eric Dumazet3c97af92010-09-27 00:35:50 +0000366static int ipip_tunnel_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367{
Stephen Hemminger23a12b12008-11-20 20:33:21 -0800368 struct ip_tunnel *tunnel = netdev_priv(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700369
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370 memcpy(dev->dev_addr, &tunnel->parms.iph.saddr, 4);
371 memcpy(dev->broadcast, &tunnel->parms.iph.daddr, 4);
372
Tom Herbert473ab822014-09-17 12:26:00 -0700373 tunnel->tun_hlen = 0;
374 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
Pravin B Shelarfd581562013-03-25 14:49:41 +0000375 return ip_tunnel_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376}
377
Simon Horman1b69e7e2016-07-07 07:56:14 +0200378static int ipip_tunnel_validate(struct nlattr *tb[], struct nlattr *data[])
379{
380 u8 proto;
381
382 if (!data || !data[IFLA_IPTUN_PROTO])
383 return 0;
384
385 proto = nla_get_u8(data[IFLA_IPTUN_PROTO]);
386 if (proto != IPPROTO_IPIP && proto != IPPROTO_MPLS && proto != 0)
387 return -EINVAL;
388
389 return 0;
390}
391
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000392static void ipip_netlink_parms(struct nlattr *data[],
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700393 struct ip_tunnel_parm *parms, bool *collect_md)
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000394{
395 memset(parms, 0, sizeof(*parms));
396
397 parms->iph.version = 4;
398 parms->iph.protocol = IPPROTO_IPIP;
399 parms->iph.ihl = 5;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700400 *collect_md = false;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000401
402 if (!data)
403 return;
404
405 if (data[IFLA_IPTUN_LINK])
406 parms->link = nla_get_u32(data[IFLA_IPTUN_LINK]);
407
408 if (data[IFLA_IPTUN_LOCAL])
Jiri Benc67b61f62015-03-29 16:59:26 +0200409 parms->iph.saddr = nla_get_in_addr(data[IFLA_IPTUN_LOCAL]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000410
411 if (data[IFLA_IPTUN_REMOTE])
Jiri Benc67b61f62015-03-29 16:59:26 +0200412 parms->iph.daddr = nla_get_in_addr(data[IFLA_IPTUN_REMOTE]);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000413
414 if (data[IFLA_IPTUN_TTL]) {
415 parms->iph.ttl = nla_get_u8(data[IFLA_IPTUN_TTL]);
416 if (parms->iph.ttl)
417 parms->iph.frag_off = htons(IP_DF);
418 }
419
420 if (data[IFLA_IPTUN_TOS])
421 parms->iph.tos = nla_get_u8(data[IFLA_IPTUN_TOS]);
422
Simon Horman1b69e7e2016-07-07 07:56:14 +0200423 if (data[IFLA_IPTUN_PROTO])
424 parms->iph.protocol = nla_get_u8(data[IFLA_IPTUN_PROTO]);
425
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000426 if (!data[IFLA_IPTUN_PMTUDISC] || nla_get_u8(data[IFLA_IPTUN_PMTUDISC]))
427 parms->iph.frag_off = htons(IP_DF);
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700428
429 if (data[IFLA_IPTUN_COLLECT_METADATA])
430 *collect_md = true;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000431}
432
Tom Herbert473ab822014-09-17 12:26:00 -0700433/* This function returns true when ENCAP attributes are present in the nl msg */
434static bool ipip_netlink_encap_parms(struct nlattr *data[],
435 struct ip_tunnel_encap *ipencap)
436{
437 bool ret = false;
438
439 memset(ipencap, 0, sizeof(*ipencap));
440
441 if (!data)
442 return ret;
443
444 if (data[IFLA_IPTUN_ENCAP_TYPE]) {
445 ret = true;
446 ipencap->type = nla_get_u16(data[IFLA_IPTUN_ENCAP_TYPE]);
447 }
448
449 if (data[IFLA_IPTUN_ENCAP_FLAGS]) {
450 ret = true;
451 ipencap->flags = nla_get_u16(data[IFLA_IPTUN_ENCAP_FLAGS]);
452 }
453
454 if (data[IFLA_IPTUN_ENCAP_SPORT]) {
455 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100456 ipencap->sport = nla_get_be16(data[IFLA_IPTUN_ENCAP_SPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700457 }
458
459 if (data[IFLA_IPTUN_ENCAP_DPORT]) {
460 ret = true;
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100461 ipencap->dport = nla_get_be16(data[IFLA_IPTUN_ENCAP_DPORT]);
Tom Herbert473ab822014-09-17 12:26:00 -0700462 }
463
464 return ret;
465}
466
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000467static int ipip_newlink(struct net *src_net, struct net_device *dev,
468 struct nlattr *tb[], struct nlattr *data[])
469{
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700470 struct ip_tunnel *t = netdev_priv(dev);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000471 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700472 struct ip_tunnel_encap ipencap;
473
474 if (ipip_netlink_encap_parms(data, &ipencap)) {
Tom Herbert473ab822014-09-17 12:26:00 -0700475 int err = ip_tunnel_encap_setup(t, &ipencap);
476
477 if (err < 0)
478 return err;
479 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000480
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700481 ipip_netlink_parms(data, &p, &t->collect_md);
Pravin B Shelarfd581562013-03-25 14:49:41 +0000482 return ip_tunnel_newlink(dev, tb, &p);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000483}
484
485static int ipip_changelink(struct net_device *dev, struct nlattr *tb[],
486 struct nlattr *data[])
487{
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000488 struct ip_tunnel_parm p;
Tom Herbert473ab822014-09-17 12:26:00 -0700489 struct ip_tunnel_encap ipencap;
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700490 bool collect_md;
Tom Herbert473ab822014-09-17 12:26:00 -0700491
492 if (ipip_netlink_encap_parms(data, &ipencap)) {
493 struct ip_tunnel *t = netdev_priv(dev);
494 int err = ip_tunnel_encap_setup(t, &ipencap);
495
496 if (err < 0)
497 return err;
498 }
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000499
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700500 ipip_netlink_parms(data, &p, &collect_md);
501 if (collect_md)
502 return -EINVAL;
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000503
504 if (((dev->flags & IFF_POINTOPOINT) && !p.iph.daddr) ||
505 (!(dev->flags & IFF_POINTOPOINT) && p.iph.daddr))
506 return -EINVAL;
507
Pravin B Shelarfd581562013-03-25 14:49:41 +0000508 return ip_tunnel_changelink(dev, tb, &p);
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000509}
510
Nicolas Dichtel09746582012-11-09 06:09:59 +0000511static size_t ipip_get_size(const struct net_device *dev)
512{
513 return
514 /* IFLA_IPTUN_LINK */
515 nla_total_size(4) +
516 /* IFLA_IPTUN_LOCAL */
517 nla_total_size(4) +
518 /* IFLA_IPTUN_REMOTE */
519 nla_total_size(4) +
520 /* IFLA_IPTUN_TTL */
521 nla_total_size(1) +
522 /* IFLA_IPTUN_TOS */
523 nla_total_size(1) +
Simon Horman1b69e7e2016-07-07 07:56:14 +0200524 /* IFLA_IPTUN_PROTO */
525 nla_total_size(1) +
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000526 /* IFLA_IPTUN_PMTUDISC */
527 nla_total_size(1) +
Tom Herbert473ab822014-09-17 12:26:00 -0700528 /* IFLA_IPTUN_ENCAP_TYPE */
529 nla_total_size(2) +
530 /* IFLA_IPTUN_ENCAP_FLAGS */
531 nla_total_size(2) +
532 /* IFLA_IPTUN_ENCAP_SPORT */
533 nla_total_size(2) +
534 /* IFLA_IPTUN_ENCAP_DPORT */
535 nla_total_size(2) +
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700536 /* IFLA_IPTUN_COLLECT_METADATA */
537 nla_total_size(0) +
Nicolas Dichtel09746582012-11-09 06:09:59 +0000538 0;
539}
540
541static int ipip_fill_info(struct sk_buff *skb, const struct net_device *dev)
542{
543 struct ip_tunnel *tunnel = netdev_priv(dev);
544 struct ip_tunnel_parm *parm = &tunnel->parms;
545
546 if (nla_put_u32(skb, IFLA_IPTUN_LINK, parm->link) ||
Jiri Benc930345e2015-03-29 16:59:25 +0200547 nla_put_in_addr(skb, IFLA_IPTUN_LOCAL, parm->iph.saddr) ||
548 nla_put_in_addr(skb, IFLA_IPTUN_REMOTE, parm->iph.daddr) ||
Nicolas Dichtel09746582012-11-09 06:09:59 +0000549 nla_put_u8(skb, IFLA_IPTUN_TTL, parm->iph.ttl) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000550 nla_put_u8(skb, IFLA_IPTUN_TOS, parm->iph.tos) ||
Simon Horman1b69e7e2016-07-07 07:56:14 +0200551 nla_put_u8(skb, IFLA_IPTUN_PROTO, parm->iph.protocol) ||
Nicolas Dichtelbefe2aa2012-11-14 05:14:02 +0000552 nla_put_u8(skb, IFLA_IPTUN_PMTUDISC,
553 !!(parm->iph.frag_off & htons(IP_DF))))
Nicolas Dichtel09746582012-11-09 06:09:59 +0000554 goto nla_put_failure;
Tom Herbert473ab822014-09-17 12:26:00 -0700555
556 if (nla_put_u16(skb, IFLA_IPTUN_ENCAP_TYPE,
557 tunnel->encap.type) ||
Sabrina Dubroca3e97fa72015-02-06 17:22:22 +0100558 nla_put_be16(skb, IFLA_IPTUN_ENCAP_SPORT,
559 tunnel->encap.sport) ||
560 nla_put_be16(skb, IFLA_IPTUN_ENCAP_DPORT,
561 tunnel->encap.dport) ||
Tom Herbert473ab822014-09-17 12:26:00 -0700562 nla_put_u16(skb, IFLA_IPTUN_ENCAP_FLAGS,
Tom Herberte1b2cb62014-11-05 16:49:38 -0800563 tunnel->encap.flags))
Tom Herbert473ab822014-09-17 12:26:00 -0700564 goto nla_put_failure;
565
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700566 if (tunnel->collect_md)
567 if (nla_put_flag(skb, IFLA_IPTUN_COLLECT_METADATA))
568 goto nla_put_failure;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000569 return 0;
570
571nla_put_failure:
572 return -EMSGSIZE;
573}
574
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000575static const struct nla_policy ipip_policy[IFLA_IPTUN_MAX + 1] = {
576 [IFLA_IPTUN_LINK] = { .type = NLA_U32 },
577 [IFLA_IPTUN_LOCAL] = { .type = NLA_U32 },
578 [IFLA_IPTUN_REMOTE] = { .type = NLA_U32 },
579 [IFLA_IPTUN_TTL] = { .type = NLA_U8 },
580 [IFLA_IPTUN_TOS] = { .type = NLA_U8 },
Simon Horman1b69e7e2016-07-07 07:56:14 +0200581 [IFLA_IPTUN_PROTO] = { .type = NLA_U8 },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000582 [IFLA_IPTUN_PMTUDISC] = { .type = NLA_U8 },
Tom Herbert473ab822014-09-17 12:26:00 -0700583 [IFLA_IPTUN_ENCAP_TYPE] = { .type = NLA_U16 },
584 [IFLA_IPTUN_ENCAP_FLAGS] = { .type = NLA_U16 },
585 [IFLA_IPTUN_ENCAP_SPORT] = { .type = NLA_U16 },
586 [IFLA_IPTUN_ENCAP_DPORT] = { .type = NLA_U16 },
Alexei Starovoitovcfc73812016-09-15 13:00:29 -0700587 [IFLA_IPTUN_COLLECT_METADATA] = { .type = NLA_FLAG },
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000588};
589
Nicolas Dichtel09746582012-11-09 06:09:59 +0000590static struct rtnl_link_ops ipip_link_ops __read_mostly = {
591 .kind = "ipip",
592 .maxtype = IFLA_IPTUN_MAX,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000593 .policy = ipip_policy,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000594 .priv_size = sizeof(struct ip_tunnel),
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000595 .setup = ipip_tunnel_setup,
Simon Horman1b69e7e2016-07-07 07:56:14 +0200596 .validate = ipip_tunnel_validate,
Nicolas Dichtelbe42da02012-11-14 05:14:03 +0000597 .newlink = ipip_newlink,
598 .changelink = ipip_changelink,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000599 .dellink = ip_tunnel_dellink,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000600 .get_size = ipip_get_size,
601 .fill_info = ipip_fill_info,
Nicolas Dichtel1728d4f2015-01-15 15:11:17 +0100602 .get_link_net = ip_tunnel_get_link_net,
Nicolas Dichtel09746582012-11-09 06:09:59 +0000603};
604
Eric Dumazet6dcd8142010-08-30 07:04:14 +0000605static struct xfrm_tunnel ipip_handler __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 .handler = ipip_rcv,
607 .err_handler = ipip_err,
Herbert Xud2acc342006-03-28 01:12:13 -0800608 .priority = 1,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609};
610
Simon Horman1b69e7e2016-07-07 07:56:14 +0200611#if IS_ENABLED(CONFIG_MPLS)
612static struct xfrm_tunnel mplsip_handler __read_mostly = {
613 .handler = mplsip_rcv,
614 .err_handler = ipip_err,
615 .priority = 1,
616};
617#endif
618
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000619static int __net_init ipip_init_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700620{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000621 return ip_tunnel_init_net(net, ipip_net_id, &ipip_link_ops, "tunl0");
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700622}
623
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +0000624static void __net_exit ipip_exit_net(struct net *net)
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700625{
Pravin B Shelarfd581562013-03-25 14:49:41 +0000626 struct ip_tunnel_net *itn = net_generic(net, ipip_net_id);
Nicolas Dichtel6c742e72013-08-13 17:51:11 +0200627 ip_tunnel_delete_net(itn, &ipip_link_ops);
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700628}
629
630static struct pernet_operations ipip_net_ops = {
631 .init = ipip_init_net,
632 .exit = ipip_exit_net,
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000633 .id = &ipip_net_id,
Pravin B Shelarfd581562013-03-25 14:49:41 +0000634 .size = sizeof(struct ip_tunnel_net),
Pavel Emelyanov10dc4c72008-04-16 01:03:13 -0700635};
636
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637static int __init ipip_init(void)
638{
639 int err;
640
Simon Horman1b69e7e2016-07-07 07:56:14 +0200641 pr_info("ipip: IPv4 and MPLS over IPv4 tunneling driver\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700642
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000643 err = register_pernet_device(&ipip_net_ops);
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000644 if (err < 0)
645 return err;
646 err = xfrm4_tunnel_register(&ipip_handler, AF_INET);
647 if (err < 0) {
Joe Perches058bd4d2012-03-11 18:36:11 +0000648 pr_info("%s: can't register tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200649 goto xfrm_tunnel_ipip_failed;
Alexey Dobriyand5aa4072010-02-16 09:05:04 +0000650 }
Simon Horman1b69e7e2016-07-07 07:56:14 +0200651#if IS_ENABLED(CONFIG_MPLS)
652 err = xfrm4_tunnel_register(&mplsip_handler, AF_MPLS);
653 if (err < 0) {
654 pr_info("%s: can't register tunnel\n", __func__);
655 goto xfrm_tunnel_mplsip_failed;
656 }
657#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000658 err = rtnl_link_register(&ipip_link_ops);
659 if (err < 0)
660 goto rtnl_link_failed;
661
662out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663 return err;
Nicolas Dichtel09746582012-11-09 06:09:59 +0000664
665rtnl_link_failed:
Simon Horman1b69e7e2016-07-07 07:56:14 +0200666#if IS_ENABLED(CONFIG_MPLS)
667 xfrm4_tunnel_deregister(&mplsip_handler, AF_INET);
668xfrm_tunnel_mplsip_failed:
669
670#endif
Nicolas Dichtel09746582012-11-09 06:09:59 +0000671 xfrm4_tunnel_deregister(&ipip_handler, AF_INET);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200672xfrm_tunnel_ipip_failed:
Nicolas Dichtel09746582012-11-09 06:09:59 +0000673 unregister_pernet_device(&ipip_net_ops);
674 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675}
676
677static void __exit ipip_fini(void)
678{
Nicolas Dichtel09746582012-11-09 06:09:59 +0000679 rtnl_link_unregister(&ipip_link_ops);
Kazunori MIYAZAWAc0d56402007-02-13 12:54:47 -0800680 if (xfrm4_tunnel_deregister(&ipip_handler, AF_INET))
Joe Perches058bd4d2012-03-11 18:36:11 +0000681 pr_info("%s: can't deregister tunnel\n", __func__);
Simon Horman1b69e7e2016-07-07 07:56:14 +0200682#if IS_ENABLED(CONFIG_MPLS)
683 if (xfrm4_tunnel_deregister(&mplsip_handler, AF_MPLS))
684 pr_info("%s: can't deregister tunnel\n", __func__);
685#endif
Eric W. Biederman86de8a62009-11-29 15:46:14 +0000686 unregister_pernet_device(&ipip_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687}
688
689module_init(ipip_init);
690module_exit(ipip_fini);
691MODULE_LICENSE("GPL");
Tom Gundersenf98f89a2014-05-15 23:21:30 +0200692MODULE_ALIAS_RTNL_LINK("ipip");
Vasiliy Kulikov8909c9a2011-03-02 00:33:13 +0300693MODULE_ALIAS_NETDEV("tunl0");