blob: eba1271b9735cec24b5a9b986b9958ee95337332 [file] [log] [blame]
/*
 *  TUN - Universal TUN/TAP device driver.
 *  Copyright (C) 1999-2002 Maxim Krasnyansky <maxk@qualcomm.com>
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 *  GNU General Public License for more details.
 *
 *  $Id: tun.c,v 1.15 2002/03/01 02:44:24 maxk Exp $
 */
17
/*
 *  Changes:
 *
 *  Brian Braunstein <linuxkernel@bristyle.com> 2007/03/23
 *    Fixed hw address handling.  Now net_device.dev_addr is kept consistent
 *    with tun.dev_addr when the address is set by this module.
 *
 *  Mike Kershaw <dragorn@kismetwireless.net> 2005/08/14
 *    Add TUNSETLINK ioctl to set the link encapsulation
 *
 *  Mark Smith <markzzzsmith@yahoo.com.au>
 *    Use random_ether_addr() for tap MAC address.
 *
 *  Harald Roelle <harald.roelle@ifi.lmu.de>  2004/04/20
 *    Fixes in packet dropping, queue length setting and queue wakeup.
 *    Increased default tx queue length.
 *    Added ethtool API.
 *    Minor cleanups
 *
 *  Daniel Podlejski <underley@underley.eu.org>
 *    Modifications for 2.3.99-pre5 kernel.
 */
40
41#define DRV_NAME "tun"
42#define DRV_VERSION "1.6"
43#define DRV_DESCRIPTION "Universal TUN/TAP device driver"
44#define DRV_COPYRIGHT "(C) 1999-2004 Max Krasnyansky <maxk@qualcomm.com>"
45
Linus Torvalds1da177e2005-04-16 15:20:36 -070046#include <linux/module.h>
47#include <linux/errno.h>
48#include <linux/kernel.h>
49#include <linux/major.h>
50#include <linux/slab.h>
Arnd Bergmannfd3e05b2008-05-20 19:16:24 +020051#include <linux/smp_lock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070052#include <linux/poll.h>
53#include <linux/fcntl.h>
54#include <linux/init.h>
55#include <linux/skbuff.h>
56#include <linux/netdevice.h>
57#include <linux/etherdevice.h>
58#include <linux/miscdevice.h>
59#include <linux/ethtool.h>
60#include <linux/rtnetlink.h>
61#include <linux/if.h>
62#include <linux/if_arp.h>
63#include <linux/if_ether.h>
64#include <linux/if_tun.h>
65#include <linux/crc32.h>
Pavel Emelyanovd647a592008-04-16 00:41:16 -070066#include <linux/nsproxy.h>
Eric W. Biederman881d9662007-09-17 11:56:21 -070067#include <net/net_namespace.h>
Pavel Emelyanov79d17602008-04-16 00:40:46 -070068#include <net/netns/generic.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070069
70#include <asm/system.h>
71#include <asm/uaccess.h>
72
Rusty Russell14daa022008-04-12 18:48:58 -070073/* Uncomment to enable debugging */
74/* #define TUN_DEBUG 1 */
75
/*
 * Debug helpers.
 *
 * DBG() prints when the per-device tun->debug flag is set and therefore
 * needs a variable named "tun" in scope at the call site; DBG1() prints
 * when the file-wide "debug" level equals 2.  Both compile to nothing
 * unless TUN_DEBUG is defined.
 *
 * Every variant expands to a single do { } while (0) statement so that a
 * call can be used as the body of an if/else without capturing a
 * following "else".
 */
#ifdef TUN_DEBUG
static int debug;

#define DBG(a...)	do { if (tun->debug) printk(a); } while (0)
#define DBG1(a...)	do { if (debug == 2) printk(a); } while (0)
#else
#define DBG(a...)	do { } while (0)
#define DBG1(a...)	do { } while (0)
#endif
85
Rusty Russell14daa022008-04-12 18:48:58 -070086struct tun_struct {
87 struct list_head list;
88 unsigned long flags;
89 int attached;
90 uid_t owner;
91 gid_t group;
92
93 wait_queue_head_t read_wait;
94 struct sk_buff_head readq;
95
96 struct net_device *dev;
97
98 struct fasync_struct *fasync;
99
100 unsigned long if_flags;
101 u8 dev_addr[ETH_ALEN];
102 u32 chr_filter[2];
103 u32 net_filter[2];
104
105#ifdef TUN_DEBUG
106 int debug;
107#endif
108};
109
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110/* Network device part of the driver */
111
Pavel Emelyanov79d17602008-04-16 00:40:46 -0700112static unsigned int tun_net_id;
113struct tun_net {
114 struct list_head dev_list;
115};
116
Jeff Garzik7282d492006-09-13 14:30:00 -0400117static const struct ethtool_ops tun_ethtool_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118
/*
 * Net device open (installed as dev->open by tun_setup()).
 * Allows the stack to start handing packets to tun_net_xmit().
 * Always returns 0.
 */
static int tun_net_open(struct net_device *dev)
{
	netif_start_queue(dev);

	return 0;
}
125
/*
 * Net device close (installed as dev->stop by tun_setup()).
 * Stops the transmit queue.  Always returns 0.
 */
static int tun_net_close(struct net_device *dev)
{
	netif_stop_queue(dev);

	return 0;
}
132
133/* Net device start xmit */
134static int tun_net_xmit(struct sk_buff *skb, struct net_device *dev)
135{
136 struct tun_struct *tun = netdev_priv(dev);
137
138 DBG(KERN_INFO "%s: tun_net_xmit %d\n", tun->dev->name, skb->len);
139
140 /* Drop packet if interface is not attached */
141 if (!tun->attached)
142 goto drop;
143
144 /* Packet dropping */
145 if (skb_queue_len(&tun->readq) >= dev->tx_queue_len) {
146 if (!(tun->flags & TUN_ONE_QUEUE)) {
147 /* Normal queueing mode. */
148 /* Packet scheduler handles dropping of further packets. */
149 netif_stop_queue(dev);
150
151 /* We won't see all dropped packets individually, so overrun
152 * error is more appropriate. */
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700153 dev->stats.tx_fifo_errors++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 } else {
155 /* Single queue mode.
156 * Driver handles dropping of all packets itself. */
157 goto drop;
158 }
159 }
160
161 /* Queue packet */
162 skb_queue_tail(&tun->readq, skb);
163 dev->trans_start = jiffies;
164
165 /* Notify and wake up reader process */
166 if (tun->flags & TUN_FASYNC)
167 kill_fasync(&tun->fasync, SIGIO, POLL_IN);
168 wake_up_interruptible(&tun->read_wait);
169 return 0;
170
171drop:
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700172 dev->stats.tx_dropped++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 kfree_skb(skb);
174 return 0;
175}
176
177/** Add the specified Ethernet address to this multicast filter. */
178static void
179add_multi(u32* filter, const u8* addr)
180{
181 int bit_nr = ether_crc(ETH_ALEN, addr) >> 26;
182 filter[bit_nr >> 5] |= 1 << (bit_nr & 31);
183}
184
185/** Remove the specified Ethernet addres from this multicast filter. */
186static void
187del_multi(u32* filter, const u8* addr)
188{
189 int bit_nr = ether_crc(ETH_ALEN, addr) >> 26;
190 filter[bit_nr >> 5] &= ~(1 << (bit_nr & 31));
191}
192
193/** Update the list of multicast groups to which the network device belongs.
194 * This list is used to filter packets being sent from the character device to
195 * the network device. */
196static void
197tun_net_mclist(struct net_device *dev)
198{
199 struct tun_struct *tun = netdev_priv(dev);
200 const struct dev_mc_list *mclist;
201 int i;
Joe Perches0795af52007-10-03 17:59:30 -0700202 DECLARE_MAC_BUF(mac);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 DBG(KERN_DEBUG "%s: tun_net_mclist: mc_count %d\n",
204 dev->name, dev->mc_count);
205 memset(tun->chr_filter, 0, sizeof tun->chr_filter);
206 for (i = 0, mclist = dev->mc_list; i < dev->mc_count && mclist != NULL;
207 i++, mclist = mclist->next) {
208 add_multi(tun->net_filter, mclist->dmi_addr);
Joe Perches0795af52007-10-03 17:59:30 -0700209 DBG(KERN_DEBUG "%s: tun_net_mclist: %s\n",
210 dev->name, print_mac(mac, mclist->dmi_addr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211 }
212}
213
Ed Swierk4885a502007-09-16 12:21:38 -0700214#define MIN_MTU 68
215#define MAX_MTU 65535
216
217static int
218tun_net_change_mtu(struct net_device *dev, int new_mtu)
219{
220 if (new_mtu < MIN_MTU || new_mtu + dev->hard_header_len > MAX_MTU)
221 return -EINVAL;
222 dev->mtu = new_mtu;
223 return 0;
224}
225
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226/* Initialize net device. */
227static void tun_net_init(struct net_device *dev)
228{
229 struct tun_struct *tun = netdev_priv(dev);
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400230
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231 switch (tun->flags & TUN_TYPE_MASK) {
232 case TUN_TUN_DEV:
233 /* Point-to-Point TUN Device */
234 dev->hard_header_len = 0;
235 dev->addr_len = 0;
236 dev->mtu = 1500;
Ed Swierk4885a502007-09-16 12:21:38 -0700237 dev->change_mtu = tun_net_change_mtu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238
239 /* Zero header length */
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400240 dev->type = ARPHRD_NONE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 dev->flags = IFF_POINTOPOINT | IFF_NOARP | IFF_MULTICAST;
242 dev->tx_queue_len = TUN_READQ_SIZE; /* We prefer our own queue length */
243 break;
244
245 case TUN_TAP_DEV:
246 /* Ethernet TAP Device */
247 dev->set_multicast_list = tun_net_mclist;
248
249 ether_setup(dev);
Ed Swierk4885a502007-09-16 12:21:38 -0700250 dev->change_mtu = tun_net_change_mtu;
Brian Braunstein36226a82007-04-26 01:00:55 -0700251
252 /* random address already created for us by tun_set_iff, use it */
253 memcpy(dev->dev_addr, tun->dev_addr, min(sizeof(tun->dev_addr), sizeof(dev->dev_addr)) );
254
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 dev->tx_queue_len = TUN_READQ_SIZE; /* We prefer our own queue length */
256 break;
257 }
258}
259
260/* Character device part */
261
262/* Poll */
263static unsigned int tun_chr_poll(struct file *file, poll_table * wait)
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400264{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265 struct tun_struct *tun = file->private_data;
266 unsigned int mask = POLLOUT | POLLWRNORM;
267
268 if (!tun)
269 return -EBADFD;
270
271 DBG(KERN_INFO "%s: tun_chr_poll\n", tun->dev->name);
272
273 poll_wait(file, &tun->read_wait, wait);
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400274
David S. Millerb03efcf2005-07-08 14:57:23 -0700275 if (!skb_queue_empty(&tun->readq))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 mask |= POLLIN | POLLRDNORM;
277
278 return mask;
279}
280
281/* Get packet from user space buffer */
282static __inline__ ssize_t tun_get_user(struct tun_struct *tun, struct iovec *iv, size_t count)
283{
284 struct tun_pi pi = { 0, __constant_htons(ETH_P_IP) };
285 struct sk_buff *skb;
286 size_t len = count, align = 0;
287
288 if (!(tun->flags & TUN_NO_PI)) {
289 if ((len -= sizeof(pi)) > count)
290 return -EINVAL;
291
292 if(memcpy_fromiovec((void *)&pi, iv, sizeof(pi)))
293 return -EFAULT;
294 }
295
Rusty Russelle01bf1c2008-04-12 18:49:30 -0700296 if ((tun->flags & TUN_TYPE_MASK) == TUN_TAP_DEV) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 align = NET_IP_ALIGN;
Rusty Russelle01bf1c2008-04-12 18:49:30 -0700298 if (unlikely(len < ETH_HLEN))
299 return -EINVAL;
300 }
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400301
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 if (!(skb = alloc_skb(len + align, GFP_KERNEL))) {
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700303 tun->dev->stats.rx_dropped++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304 return -ENOMEM;
305 }
306
307 if (align)
308 skb_reserve(skb, align);
Dave Jones8f227572006-03-11 18:49:13 -0800309 if (memcpy_fromiovec(skb_put(skb, len), iv, len)) {
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700310 tun->dev->stats.rx_dropped++;
Dave Jones8f227572006-03-11 18:49:13 -0800311 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 return -EFAULT;
Dave Jones8f227572006-03-11 18:49:13 -0800313 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 switch (tun->flags & TUN_TYPE_MASK) {
316 case TUN_TUN_DEV:
Ang Way Chuangf09f7ee2008-06-17 21:10:33 -0700317 if (tun->flags & TUN_NO_PI) {
318 switch (skb->data[0] & 0xf0) {
319 case 0x40:
320 pi.proto = htons(ETH_P_IP);
321 break;
322 case 0x60:
323 pi.proto = htons(ETH_P_IPV6);
324 break;
325 default:
326 tun->dev->stats.rx_dropped++;
327 kfree_skb(skb);
328 return -EINVAL;
329 }
330 }
331
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -0700332 skb_reset_mac_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 skb->protocol = pi.proto;
Arnaldo Carvalho de Melo4c13eb62007-04-25 17:40:23 -0700334 skb->dev = tun->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 break;
336 case TUN_TAP_DEV:
337 skb->protocol = eth_type_trans(skb, tun->dev);
338 break;
339 };
340
341 if (tun->flags & TUN_NOCHECKSUM)
342 skb->ip_summed = CHECKSUM_UNNECESSARY;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400343
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 netif_rx_ni(skb);
345 tun->dev->last_rx = jiffies;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400346
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700347 tun->dev->stats.rx_packets++;
348 tun->dev->stats.rx_bytes += len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 return count;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400351}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352
Badari Pulavartyee0b3e62006-09-30 23:28:47 -0700353static ssize_t tun_chr_aio_write(struct kiocb *iocb, const struct iovec *iv,
354 unsigned long count, loff_t pos)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355{
Badari Pulavartyee0b3e62006-09-30 23:28:47 -0700356 struct tun_struct *tun = iocb->ki_filp->private_data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357
358 if (!tun)
359 return -EBADFD;
360
361 DBG(KERN_INFO "%s: tun_chr_write %ld\n", tun->dev->name, count);
362
Akinobu Mita52427c92007-11-19 22:46:51 -0800363 return tun_get_user(tun, (struct iovec *) iv, iov_length(iv, count));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364}
365
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366/* Put packet to the user space buffer */
367static __inline__ ssize_t tun_put_user(struct tun_struct *tun,
368 struct sk_buff *skb,
369 struct iovec *iv, int len)
370{
371 struct tun_pi pi = { 0, skb->protocol };
372 ssize_t total = 0;
373
374 if (!(tun->flags & TUN_NO_PI)) {
375 if ((len -= sizeof(pi)) < 0)
376 return -EINVAL;
377
378 if (len < skb->len) {
379 /* Packet will be striped */
380 pi.flags |= TUN_PKT_STRIP;
381 }
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400382
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383 if (memcpy_toiovec(iv, (void *) &pi, sizeof(pi)))
384 return -EFAULT;
385 total += sizeof(pi);
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400386 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700387
388 len = min_t(int, skb->len, len);
389
390 skb_copy_datagram_iovec(skb, 0, iv, len);
391 total += len;
392
Jeff Garzik09f75cd2007-10-03 17:41:50 -0700393 tun->dev->stats.tx_packets++;
394 tun->dev->stats.tx_bytes += len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395
396 return total;
397}
398
Badari Pulavartyee0b3e62006-09-30 23:28:47 -0700399static ssize_t tun_chr_aio_read(struct kiocb *iocb, const struct iovec *iv,
400 unsigned long count, loff_t pos)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700401{
Badari Pulavartyee0b3e62006-09-30 23:28:47 -0700402 struct file *file = iocb->ki_filp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403 struct tun_struct *tun = file->private_data;
404 DECLARE_WAITQUEUE(wait, current);
405 struct sk_buff *skb;
406 ssize_t len, ret = 0;
Joe Perches0795af52007-10-03 17:59:30 -0700407 DECLARE_MAC_BUF(mac);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408
409 if (!tun)
410 return -EBADFD;
411
412 DBG(KERN_INFO "%s: tun_chr_read\n", tun->dev->name);
413
Akinobu Mita52427c92007-11-19 22:46:51 -0800414 len = iov_length(iv, count);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 if (len < 0)
416 return -EINVAL;
417
418 add_wait_queue(&tun->read_wait, &wait);
419 while (len) {
420 const u8 ones[ ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
421 u8 addr[ ETH_ALEN];
422 int bit_nr;
423
424 current->state = TASK_INTERRUPTIBLE;
425
426 /* Read frames from the queue */
427 if (!(skb=skb_dequeue(&tun->readq))) {
428 if (file->f_flags & O_NONBLOCK) {
429 ret = -EAGAIN;
430 break;
431 }
432 if (signal_pending(current)) {
433 ret = -ERESTARTSYS;
434 break;
435 }
436
437 /* Nothing to read, let's sleep */
438 schedule();
439 continue;
440 }
441 netif_wake_queue(tun->dev);
442
443 /** Decide whether to accept this packet. This code is designed to
444 * behave identically to an Ethernet interface. Accept the packet if
445 * - we are promiscuous.
446 * - the packet is addressed to us.
447 * - the packet is broadcast.
448 * - the packet is multicast and
449 * - we are multicast promiscous.
450 * - we belong to the multicast group.
451 */
Arnaldo Carvalho de Melod626f622007-03-27 18:55:52 -0300452 skb_copy_from_linear_data(skb, addr, min_t(size_t, sizeof addr,
453 skb->len));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 bit_nr = ether_crc(sizeof addr, addr) >> 26;
455 if ((tun->if_flags & IFF_PROMISC) ||
456 memcmp(addr, tun->dev_addr, sizeof addr) == 0 ||
457 memcmp(addr, ones, sizeof addr) == 0 ||
458 (((addr[0] == 1 && addr[1] == 0 && addr[2] == 0x5e) ||
459 (addr[0] == 0x33 && addr[1] == 0x33)) &&
460 ((tun->if_flags & IFF_ALLMULTI) ||
461 (tun->chr_filter[bit_nr >> 5] & (1 << (bit_nr & 31)))))) {
Joe Perches0795af52007-10-03 17:59:30 -0700462 DBG(KERN_DEBUG "%s: tun_chr_readv: accepted: %s\n",
463 tun->dev->name, print_mac(mac, addr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700464 ret = tun_put_user(tun, skb, (struct iovec *) iv, len);
465 kfree_skb(skb);
466 break;
467 } else {
Joe Perches0795af52007-10-03 17:59:30 -0700468 DBG(KERN_DEBUG "%s: tun_chr_readv: rejected: %s\n",
469 tun->dev->name, print_mac(mac, addr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700470 kfree_skb(skb);
471 continue;
472 }
473 }
474
475 current->state = TASK_RUNNING;
476 remove_wait_queue(&tun->read_wait, &wait);
477
478 return ret;
479}
480
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481static void tun_setup(struct net_device *dev)
482{
483 struct tun_struct *tun = netdev_priv(dev);
484
485 skb_queue_head_init(&tun->readq);
486 init_waitqueue_head(&tun->read_wait);
487
488 tun->owner = -1;
Guido Guenther8c644622007-07-02 22:50:25 -0700489 tun->group = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
Linus Torvalds1da177e2005-04-16 15:20:36 -0700491 dev->open = tun_net_open;
492 dev->hard_start_xmit = tun_net_xmit;
493 dev->stop = tun_net_close;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494 dev->ethtool_ops = &tun_ethtool_ops;
495 dev->destructor = free_netdev;
Pavel Emelyanovfc54c652008-04-16 00:41:53 -0700496 dev->features |= NETIF_F_NETNS_LOCAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497}
498
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700499static struct tun_struct *tun_get_by_name(struct tun_net *tn, const char *name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500{
501 struct tun_struct *tun;
502
503 ASSERT_RTNL();
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700504 list_for_each_entry(tun, &tn->dev_list, list) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505 if (!strncmp(tun->dev->name, name, IFNAMSIZ))
506 return tun;
507 }
508
509 return NULL;
510}
511
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700512static int tun_set_iff(struct net *net, struct file *file, struct ifreq *ifr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513{
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700514 struct tun_net *tn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 struct tun_struct *tun;
516 struct net_device *dev;
517 int err;
518
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700519 tn = net_generic(net, tun_net_id);
520 tun = tun_get_by_name(tn, ifr->ifr_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 if (tun) {
522 if (tun->attached)
523 return -EBUSY;
524
525 /* Check permissions */
Guido Guenther8c644622007-07-02 22:50:25 -0700526 if (((tun->owner != -1 &&
527 current->euid != tun->owner) ||
528 (tun->group != -1 &&
529 current->egid != tun->group)) &&
530 !capable(CAP_NET_ADMIN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700531 return -EPERM;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400532 }
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700533 else if (__dev_get_by_name(net, ifr->ifr_name))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 return -EINVAL;
535 else {
536 char *name;
537 unsigned long flags = 0;
538
539 err = -EINVAL;
540
David Woodhouseca6bb5d2006-06-22 16:07:52 -0700541 if (!capable(CAP_NET_ADMIN))
542 return -EPERM;
543
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 /* Set dev type */
545 if (ifr->ifr_flags & IFF_TUN) {
546 /* TUN device */
547 flags |= TUN_TUN_DEV;
548 name = "tun%d";
549 } else if (ifr->ifr_flags & IFF_TAP) {
550 /* TAP device */
551 flags |= TUN_TAP_DEV;
552 name = "tap%d";
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400553 } else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554 goto failed;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400555
Linus Torvalds1da177e2005-04-16 15:20:36 -0700556 if (*ifr->ifr_name)
557 name = ifr->ifr_name;
558
559 dev = alloc_netdev(sizeof(struct tun_struct), name,
560 tun_setup);
561 if (!dev)
562 return -ENOMEM;
563
Pavel Emelyanovfc54c652008-04-16 00:41:53 -0700564 dev_net_set(dev, net);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565 tun = netdev_priv(dev);
566 tun->dev = dev;
567 tun->flags = flags;
568 /* Be promiscuous by default to maintain previous behaviour. */
569 tun->if_flags = IFF_PROMISC;
570 /* Generate random Ethernet address. */
Al Viroa3edb082007-12-22 17:52:42 +0000571 *(__be16 *)tun->dev_addr = htons(0x00FF);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700572 get_random_bytes(tun->dev_addr + sizeof(u16), 4);
573 memset(tun->chr_filter, 0, sizeof tun->chr_filter);
574
575 tun_net_init(dev);
576
577 if (strchr(dev->name, '%')) {
578 err = dev_alloc_name(dev, dev->name);
579 if (err < 0)
580 goto err_free_dev;
581 }
582
583 err = register_netdevice(tun->dev);
584 if (err < 0)
585 goto err_free_dev;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400586
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700587 list_add(&tun->list, &tn->dev_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 }
589
590 DBG(KERN_INFO "%s: tun_set_iff\n", tun->dev->name);
591
592 if (ifr->ifr_flags & IFF_NO_PI)
593 tun->flags |= TUN_NO_PI;
Nathaniel Filardoa26af1e2008-02-05 03:05:07 -0800594 else
595 tun->flags &= ~TUN_NO_PI;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596
597 if (ifr->ifr_flags & IFF_ONE_QUEUE)
598 tun->flags |= TUN_ONE_QUEUE;
Nathaniel Filardoa26af1e2008-02-05 03:05:07 -0800599 else
600 tun->flags &= ~TUN_ONE_QUEUE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601
602 file->private_data = tun;
603 tun->attached = 1;
Pavel Emelyanovfc54c652008-04-16 00:41:53 -0700604 get_net(dev_net(tun->dev));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605
Max Krasnyanskye35259a2008-07-10 16:59:11 -0700606 /* Make sure persistent devices do not get stuck in
607 * xoff state.
608 */
609 if (netif_running(tun->dev))
610 netif_wake_queue(tun->dev);
611
Linus Torvalds1da177e2005-04-16 15:20:36 -0700612 strcpy(ifr->ifr_name, tun->dev->name);
613 return 0;
614
615 err_free_dev:
616 free_netdev(dev);
617 failed:
618 return err;
619}
620
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400621static int tun_chr_ioctl(struct inode *inode, struct file *file,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622 unsigned int cmd, unsigned long arg)
623{
624 struct tun_struct *tun = file->private_data;
625 void __user* argp = (void __user*)arg;
626 struct ifreq ifr;
Joe Perches0795af52007-10-03 17:59:30 -0700627 DECLARE_MAC_BUF(mac);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700628
629 if (cmd == TUNSETIFF || _IOC_TYPE(cmd) == 0x89)
630 if (copy_from_user(&ifr, argp, sizeof ifr))
631 return -EFAULT;
632
633 if (cmd == TUNSETIFF && !tun) {
634 int err;
635
636 ifr.ifr_name[IFNAMSIZ-1] = '\0';
637
638 rtnl_lock();
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700639 err = tun_set_iff(current->nsproxy->net_ns, file, &ifr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 rtnl_unlock();
641
642 if (err)
643 return err;
644
645 if (copy_to_user(argp, &ifr, sizeof(ifr)))
646 return -EFAULT;
647 return 0;
648 }
649
650 if (!tun)
651 return -EBADFD;
652
653 DBG(KERN_INFO "%s: tun_chr_ioctl cmd %d\n", tun->dev->name, cmd);
654
655 switch (cmd) {
656 case TUNSETNOCSUM:
657 /* Disable/Enable checksum */
658 if (arg)
659 tun->flags |= TUN_NOCHECKSUM;
660 else
661 tun->flags &= ~TUN_NOCHECKSUM;
662
663 DBG(KERN_INFO "%s: checksum %s\n",
664 tun->dev->name, arg ? "disabled" : "enabled");
665 break;
666
667 case TUNSETPERSIST:
668 /* Disable/Enable persist mode */
669 if (arg)
670 tun->flags |= TUN_PERSIST;
671 else
672 tun->flags &= ~TUN_PERSIST;
673
674 DBG(KERN_INFO "%s: persist %s\n",
Toyo Abec6e991d2007-12-24 21:29:35 -0800675 tun->dev->name, arg ? "enabled" : "disabled");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700676 break;
677
678 case TUNSETOWNER:
679 /* Set owner of the device */
680 tun->owner = (uid_t) arg;
681
682 DBG(KERN_INFO "%s: owner set to %d\n", tun->dev->name, tun->owner);
683 break;
684
Guido Guenther8c644622007-07-02 22:50:25 -0700685 case TUNSETGROUP:
686 /* Set group of the device */
687 tun->group= (gid_t) arg;
688
689 DBG(KERN_INFO "%s: group set to %d\n", tun->dev->name, tun->group);
690 break;
691
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700692 case TUNSETLINK:
David S. Miller48abfe02008-04-23 19:37:58 -0700693 {
694 int ret;
695
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700696 /* Only allow setting the type when the interface is down */
David S. Miller48abfe02008-04-23 19:37:58 -0700697 rtnl_lock();
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700698 if (tun->dev->flags & IFF_UP) {
699 DBG(KERN_INFO "%s: Linktype set failed because interface is up\n",
700 tun->dev->name);
David S. Miller48abfe02008-04-23 19:37:58 -0700701 ret = -EBUSY;
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700702 } else {
703 tun->dev->type = (int) arg;
704 DBG(KERN_INFO "%s: linktype set to %d\n", tun->dev->name, tun->dev->type);
David S. Miller48abfe02008-04-23 19:37:58 -0700705 ret = 0;
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700706 }
David S. Miller48abfe02008-04-23 19:37:58 -0700707 rtnl_unlock();
708 return ret;
709 }
Mike Kershawff4cc3a2005-09-01 17:40:05 -0700710
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711#ifdef TUN_DEBUG
712 case TUNSETDEBUG:
713 tun->debug = arg;
714 break;
715#endif
716
717 case SIOCGIFFLAGS:
718 ifr.ifr_flags = tun->if_flags;
719 if (copy_to_user( argp, &ifr, sizeof ifr))
720 return -EFAULT;
721 return 0;
722
723 case SIOCSIFFLAGS:
724 /** Set the character device's interface flags. Currently only
725 * IFF_PROMISC and IFF_ALLMULTI are used. */
726 tun->if_flags = ifr.ifr_flags;
727 DBG(KERN_INFO "%s: interface flags 0x%lx\n",
728 tun->dev->name, tun->if_flags);
729 return 0;
730
731 case SIOCGIFHWADDR:
Brian Braunstein36226a82007-04-26 01:00:55 -0700732 /* Note: the actual net device's address may be different */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 memcpy(ifr.ifr_hwaddr.sa_data, tun->dev_addr,
734 min(sizeof ifr.ifr_hwaddr.sa_data, sizeof tun->dev_addr));
735 if (copy_to_user( argp, &ifr, sizeof ifr))
736 return -EFAULT;
737 return 0;
738
739 case SIOCSIFHWADDR:
Brian Braunstein36226a82007-04-26 01:00:55 -0700740 {
741 /* try to set the actual net device's hw address */
Kim B. Heino40102372008-02-29 12:26:21 -0800742 int ret;
743
744 rtnl_lock();
745 ret = dev_set_mac_address(tun->dev, &ifr.ifr_hwaddr);
746 rtnl_unlock();
Brian Braunstein36226a82007-04-26 01:00:55 -0700747
748 if (ret == 0) {
749 /** Set the character device's hardware address. This is used when
750 * filtering packets being sent from the network device to the character
751 * device. */
752 memcpy(tun->dev_addr, ifr.ifr_hwaddr.sa_data,
753 min(sizeof ifr.ifr_hwaddr.sa_data, sizeof tun->dev_addr));
754 DBG(KERN_DEBUG "%s: set hardware address: %x:%x:%x:%x:%x:%x\n",
755 tun->dev->name,
756 tun->dev_addr[0], tun->dev_addr[1], tun->dev_addr[2],
757 tun->dev_addr[3], tun->dev_addr[4], tun->dev_addr[5]);
758 }
759
760 return ret;
761 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762
763 case SIOCADDMULTI:
764 /** Add the specified group to the character device's multicast filter
765 * list. */
David S. Miller9edb74c2008-04-24 03:44:43 -0700766 rtnl_lock();
767 netif_tx_lock_bh(tun->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768 add_multi(tun->chr_filter, ifr.ifr_hwaddr.sa_data);
David S. Miller9edb74c2008-04-24 03:44:43 -0700769 netif_tx_unlock_bh(tun->dev);
770 rtnl_unlock();
771
Joe Perches0795af52007-10-03 17:59:30 -0700772 DBG(KERN_DEBUG "%s: add multi: %s\n",
773 tun->dev->name, print_mac(mac, ifr.ifr_hwaddr.sa_data));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774 return 0;
775
776 case SIOCDELMULTI:
777 /** Remove the specified group from the character device's multicast
778 * filter list. */
David S. Miller9edb74c2008-04-24 03:44:43 -0700779 rtnl_lock();
780 netif_tx_lock_bh(tun->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700781 del_multi(tun->chr_filter, ifr.ifr_hwaddr.sa_data);
David S. Miller9edb74c2008-04-24 03:44:43 -0700782 netif_tx_unlock_bh(tun->dev);
783 rtnl_unlock();
784
Joe Perches0795af52007-10-03 17:59:30 -0700785 DBG(KERN_DEBUG "%s: del multi: %s\n",
786 tun->dev->name, print_mac(mac, ifr.ifr_hwaddr.sa_data));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700787 return 0;
788
789 default:
790 return -EINVAL;
791 };
792
793 return 0;
794}
795
796static int tun_chr_fasync(int fd, struct file *file, int on)
797{
798 struct tun_struct *tun = file->private_data;
799 int ret;
800
801 if (!tun)
802 return -EBADFD;
803
804 DBG(KERN_INFO "%s: tun_chr_fasync %d\n", tun->dev->name, on);
805
Jonathan Corbet9d319522008-06-19 15:50:37 -0600806 lock_kernel();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700807 if ((ret = fasync_helper(fd, file, on, &tun->fasync)) < 0)
Jonathan Corbet9d319522008-06-19 15:50:37 -0600808 goto out;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400809
Linus Torvalds1da177e2005-04-16 15:20:36 -0700810 if (on) {
Eric W. Biederman609d7fa2006-10-02 02:17:15 -0700811 ret = __f_setown(file, task_pid(current), PIDTYPE_PID, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812 if (ret)
Jonathan Corbet9d319522008-06-19 15:50:37 -0600813 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814 tun->flags |= TUN_FASYNC;
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400815 } else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816 tun->flags &= ~TUN_FASYNC;
Jonathan Corbet9d319522008-06-19 15:50:37 -0600817 ret = 0;
818out:
819 unlock_kernel();
820 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821}
822
823static int tun_chr_open(struct inode *inode, struct file * file)
824{
Arnd Bergmannfd3e05b2008-05-20 19:16:24 +0200825 cycle_kernel_lock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826 DBG1(KERN_INFO "tunX: tun_chr_open\n");
827 file->private_data = NULL;
828 return 0;
829}
830
831static int tun_chr_close(struct inode *inode, struct file *file)
832{
833 struct tun_struct *tun = file->private_data;
834
835 if (!tun)
836 return 0;
837
838 DBG(KERN_INFO "%s: tun_chr_close\n", tun->dev->name);
839
840 tun_chr_fasync(-1, file, 0);
841
842 rtnl_lock();
843
844 /* Detach from net device */
845 file->private_data = NULL;
846 tun->attached = 0;
Pavel Emelyanovfc54c652008-04-16 00:41:53 -0700847 put_net(dev_net(tun->dev));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700848
849 /* Drop read queue */
850 skb_queue_purge(&tun->readq);
851
852 if (!(tun->flags & TUN_PERSIST)) {
853 list_del(&tun->list);
854 unregister_netdevice(tun->dev);
855 }
856
857 rtnl_unlock();
858
859 return 0;
860}
861
Arjan van de Vend54b1fd2007-02-12 00:55:34 -0800862static const struct file_operations tun_fops = {
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400863 .owner = THIS_MODULE,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864 .llseek = no_llseek,
Badari Pulavartyee0b3e62006-09-30 23:28:47 -0700865 .read = do_sync_read,
866 .aio_read = tun_chr_aio_read,
867 .write = do_sync_write,
868 .aio_write = tun_chr_aio_write,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869 .poll = tun_chr_poll,
870 .ioctl = tun_chr_ioctl,
871 .open = tun_chr_open,
872 .release = tun_chr_close,
Jeff Garzik6aa20a22006-09-13 13:24:59 -0400873 .fasync = tun_chr_fasync
Linus Torvalds1da177e2005-04-16 15:20:36 -0700874};
875
876static struct miscdevice tun_miscdev = {
877 .minor = TUN_MINOR,
878 .name = "tun",
879 .fops = &tun_fops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880};
881
882/* ethtool interface */
883
884static int tun_get_settings(struct net_device *dev, struct ethtool_cmd *cmd)
885{
886 cmd->supported = 0;
887 cmd->advertising = 0;
888 cmd->speed = SPEED_10;
889 cmd->duplex = DUPLEX_FULL;
890 cmd->port = PORT_TP;
891 cmd->phy_address = 0;
892 cmd->transceiver = XCVR_INTERNAL;
893 cmd->autoneg = AUTONEG_DISABLE;
894 cmd->maxtxpkt = 0;
895 cmd->maxrxpkt = 0;
896 return 0;
897}
898
899static void tun_get_drvinfo(struct net_device *dev, struct ethtool_drvinfo *info)
900{
901 struct tun_struct *tun = netdev_priv(dev);
902
903 strcpy(info->driver, DRV_NAME);
904 strcpy(info->version, DRV_VERSION);
905 strcpy(info->fw_version, "N/A");
906
907 switch (tun->flags & TUN_TYPE_MASK) {
908 case TUN_TUN_DEV:
909 strcpy(info->bus_info, "tun");
910 break;
911 case TUN_TAP_DEV:
912 strcpy(info->bus_info, "tap");
913 break;
914 }
915}
916
917static u32 tun_get_msglevel(struct net_device *dev)
918{
919#ifdef TUN_DEBUG
920 struct tun_struct *tun = netdev_priv(dev);
921 return tun->debug;
922#else
923 return -EOPNOTSUPP;
924#endif
925}
926
927static void tun_set_msglevel(struct net_device *dev, u32 value)
928{
929#ifdef TUN_DEBUG
930 struct tun_struct *tun = netdev_priv(dev);
931 tun->debug = value;
932#endif
933}
934
935static u32 tun_get_link(struct net_device *dev)
936{
937 struct tun_struct *tun = netdev_priv(dev);
938 return tun->attached;
939}
940
941static u32 tun_get_rx_csum(struct net_device *dev)
942{
943 struct tun_struct *tun = netdev_priv(dev);
944 return (tun->flags & TUN_NOCHECKSUM) == 0;
945}
946
947static int tun_set_rx_csum(struct net_device *dev, u32 data)
948{
949 struct tun_struct *tun = netdev_priv(dev);
950 if (data)
951 tun->flags &= ~TUN_NOCHECKSUM;
952 else
953 tun->flags |= TUN_NOCHECKSUM;
954 return 0;
955}
956
Jeff Garzik7282d492006-09-13 14:30:00 -0400957static const struct ethtool_ops tun_ethtool_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700958 .get_settings = tun_get_settings,
959 .get_drvinfo = tun_get_drvinfo,
960 .get_msglevel = tun_get_msglevel,
961 .set_msglevel = tun_set_msglevel,
962 .get_link = tun_get_link,
963 .get_rx_csum = tun_get_rx_csum,
964 .set_rx_csum = tun_set_rx_csum
965};
966
Pavel Emelyanov79d17602008-04-16 00:40:46 -0700967static int tun_init_net(struct net *net)
968{
969 struct tun_net *tn;
970
971 tn = kmalloc(sizeof(*tn), GFP_KERNEL);
972 if (tn == NULL)
973 return -ENOMEM;
974
975 INIT_LIST_HEAD(&tn->dev_list);
976
977 if (net_assign_generic(net, tun_net_id, tn)) {
978 kfree(tn);
979 return -ENOMEM;
980 }
981
982 return 0;
983}
984
985static void tun_exit_net(struct net *net)
986{
987 struct tun_net *tn;
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700988 struct tun_struct *tun, *nxt;
Pavel Emelyanov79d17602008-04-16 00:40:46 -0700989
990 tn = net_generic(net, tun_net_id);
Pavel Emelyanovd647a592008-04-16 00:41:16 -0700991
992 rtnl_lock();
993 list_for_each_entry_safe(tun, nxt, &tn->dev_list, list) {
994 DBG(KERN_INFO "%s cleaned up\n", tun->dev->name);
995 unregister_netdevice(tun->dev);
996 }
997 rtnl_unlock();
998
Pavel Emelyanov79d17602008-04-16 00:40:46 -0700999 kfree(tn);
1000}
1001
1002static struct pernet_operations tun_net_ops = {
1003 .init = tun_init_net,
1004 .exit = tun_exit_net,
1005};
1006
Linus Torvalds1da177e2005-04-16 15:20:36 -07001007static int __init tun_init(void)
1008{
1009 int ret = 0;
1010
1011 printk(KERN_INFO "tun: %s, %s\n", DRV_DESCRIPTION, DRV_VERSION);
1012 printk(KERN_INFO "tun: %s\n", DRV_COPYRIGHT);
1013
Pavel Emelyanov79d17602008-04-16 00:40:46 -07001014 ret = register_pernet_gen_device(&tun_net_id, &tun_net_ops);
1015 if (ret) {
1016 printk(KERN_ERR "tun: Can't register pernet ops\n");
1017 goto err_pernet;
1018 }
1019
Linus Torvalds1da177e2005-04-16 15:20:36 -07001020 ret = misc_register(&tun_miscdev);
Pavel Emelyanov79d17602008-04-16 00:40:46 -07001021 if (ret) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001022 printk(KERN_ERR "tun: Can't register misc device %d\n", TUN_MINOR);
Pavel Emelyanov79d17602008-04-16 00:40:46 -07001023 goto err_misc;
1024 }
1025 return 0;
1026
1027err_misc:
1028 unregister_pernet_gen_device(tun_net_id, &tun_net_ops);
1029err_pernet:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001030 return ret;
1031}
1032
1033static void tun_cleanup(void)
1034{
Jeff Garzik6aa20a22006-09-13 13:24:59 -04001035 misc_deregister(&tun_miscdev);
Pavel Emelyanov79d17602008-04-16 00:40:46 -07001036 unregister_pernet_gen_device(tun_net_id, &tun_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001037}
1038
1039module_init(tun_init);
1040module_exit(tun_cleanup);
1041MODULE_DESCRIPTION(DRV_DESCRIPTION);
1042MODULE_AUTHOR(DRV_COPYRIGHT);
1043MODULE_LICENSE("GPL");
1044MODULE_ALIAS_MISCDEV(TUN_MINOR);