blob: 43af9e9b26525ad1fcc4f96df93168d4bfe1990c [file] [log] [blame]
Pavel Emelyanove314dbd2007-09-25 16:14:46 -07001/*
2 * drivers/net/veth.c
3 *
4 * Copyright (C) 2007 OpenVZ http://openvz.org, SWsoft Inc
5 *
6 * Author: Pavel Emelianov <xemul@openvz.org>
7 * Ethtool interface from: Eric W. Biederman <ebiederm@xmission.com>
8 *
9 */
10
11#include <linux/list.h>
12#include <linux/netdevice.h>
13#include <linux/ethtool.h>
14#include <linux/etherdevice.h>
15
16#include <net/dst.h>
17#include <net/xfrm.h>
Stephen Hemmingerecef9692007-12-25 17:23:59 -080018#include <linux/veth.h>
Pavel Emelyanove314dbd2007-09-25 16:14:46 -070019
/* Driver name: reported via ethtool, used as the rtnl link kind and as the
 * stem of automatically generated interface names. */
#define DRV_NAME	"veth"
/* Driver version string reported via ethtool. */
#define DRV_VERSION	"1.0"
22
/*
 * Traffic counters of one veth device.  An instance is kept per CPU
 * (see alloc_percpu() in veth_dev_init()); veth_get_stats() adds the
 * per-CPU copies together.
 */
struct veth_net_stats {
	unsigned long	rx_packets;	/* packets received from the peer */
	unsigned long	tx_packets;	/* packets passed on to the peer */
	unsigned long	rx_bytes;	/* bytes received from the peer */
	unsigned long	tx_bytes;	/* bytes passed on to the peer */
	unsigned long	tx_dropped;	/* packets freed because the peer was down */
};
30
31struct veth_priv {
32 struct net_device *peer;
33 struct net_device *dev;
34 struct list_head list;
35 struct veth_net_stats *stats;
36 unsigned ip_summed;
37};
38
39static LIST_HEAD(veth_list);
40
41/*
42 * ethtool interface
43 */
44
45static struct {
46 const char string[ETH_GSTRING_LEN];
47} ethtool_stats_keys[] = {
48 { "peer_ifindex" },
49};
50
51static int veth_get_settings(struct net_device *dev, struct ethtool_cmd *cmd)
52{
53 cmd->supported = 0;
54 cmd->advertising = 0;
55 cmd->speed = SPEED_10000;
56 cmd->duplex = DUPLEX_FULL;
57 cmd->port = PORT_TP;
58 cmd->phy_address = 0;
59 cmd->transceiver = XCVR_INTERNAL;
60 cmd->autoneg = AUTONEG_DISABLE;
61 cmd->maxtxpkt = 0;
62 cmd->maxrxpkt = 0;
63 return 0;
64}
65
66static void veth_get_drvinfo(struct net_device *dev, struct ethtool_drvinfo *info)
67{
68 strcpy(info->driver, DRV_NAME);
69 strcpy(info->version, DRV_VERSION);
70 strcpy(info->fw_version, "N/A");
71}
72
73static void veth_get_strings(struct net_device *dev, u32 stringset, u8 *buf)
74{
75 switch(stringset) {
76 case ETH_SS_STATS:
77 memcpy(buf, &ethtool_stats_keys, sizeof(ethtool_stats_keys));
78 break;
79 }
80}
81
Jeff Garzikb9f2c042007-10-03 18:07:32 -070082static int veth_get_sset_count(struct net_device *dev, int sset)
Pavel Emelyanove314dbd2007-09-25 16:14:46 -070083{
Jeff Garzikb9f2c042007-10-03 18:07:32 -070084 switch (sset) {
85 case ETH_SS_STATS:
86 return ARRAY_SIZE(ethtool_stats_keys);
87 default:
88 return -EOPNOTSUPP;
89 }
Pavel Emelyanove314dbd2007-09-25 16:14:46 -070090}
91
92static void veth_get_ethtool_stats(struct net_device *dev,
93 struct ethtool_stats *stats, u64 *data)
94{
95 struct veth_priv *priv;
96
97 priv = netdev_priv(dev);
98 data[0] = priv->peer->ifindex;
99}
100
101static u32 veth_get_rx_csum(struct net_device *dev)
102{
103 struct veth_priv *priv;
104
105 priv = netdev_priv(dev);
106 return priv->ip_summed == CHECKSUM_UNNECESSARY;
107}
108
109static int veth_set_rx_csum(struct net_device *dev, u32 data)
110{
111 struct veth_priv *priv;
112
113 priv = netdev_priv(dev);
114 priv->ip_summed = data ? CHECKSUM_UNNECESSARY : CHECKSUM_NONE;
115 return 0;
116}
117
118static u32 veth_get_tx_csum(struct net_device *dev)
119{
120 return (dev->features & NETIF_F_NO_CSUM) != 0;
121}
122
123static int veth_set_tx_csum(struct net_device *dev, u32 data)
124{
125 if (data)
126 dev->features |= NETIF_F_NO_CSUM;
127 else
128 dev->features &= ~NETIF_F_NO_CSUM;
129 return 0;
130}
131
132static struct ethtool_ops veth_ethtool_ops = {
133 .get_settings = veth_get_settings,
134 .get_drvinfo = veth_get_drvinfo,
135 .get_link = ethtool_op_get_link,
136 .get_rx_csum = veth_get_rx_csum,
137 .set_rx_csum = veth_set_rx_csum,
138 .get_tx_csum = veth_get_tx_csum,
139 .set_tx_csum = veth_set_tx_csum,
140 .get_sg = ethtool_op_get_sg,
141 .set_sg = ethtool_op_set_sg,
142 .get_strings = veth_get_strings,
Jeff Garzikb9f2c042007-10-03 18:07:32 -0700143 .get_sset_count = veth_get_sset_count,
Pavel Emelyanove314dbd2007-09-25 16:14:46 -0700144 .get_ethtool_stats = veth_get_ethtool_stats,
145};
146
147/*
148 * xmit
149 */
150
151static int veth_xmit(struct sk_buff *skb, struct net_device *dev)
152{
153 struct net_device *rcv = NULL;
154 struct veth_priv *priv, *rcv_priv;
155 struct veth_net_stats *stats;
156 int length, cpu;
157
158 skb_orphan(skb);
159
160 priv = netdev_priv(dev);
161 rcv = priv->peer;
162 rcv_priv = netdev_priv(rcv);
163
164 cpu = smp_processor_id();
165 stats = per_cpu_ptr(priv->stats, cpu);
166
167 if (!(rcv->flags & IFF_UP))
168 goto outf;
169
170 skb->pkt_type = PACKET_HOST;
171 skb->protocol = eth_type_trans(skb, rcv);
172 if (dev->features & NETIF_F_NO_CSUM)
173 skb->ip_summed = rcv_priv->ip_summed;
174
175 dst_release(skb->dst);
176 skb->dst = NULL;
177 skb->mark = 0;
178 secpath_reset(skb);
179 nf_reset(skb);
180
181 length = skb->len;
182
183 stats->tx_bytes += length;
184 stats->tx_packets++;
185
186 stats = per_cpu_ptr(rcv_priv->stats, cpu);
187 stats->rx_bytes += length;
188 stats->rx_packets++;
189
190 netif_rx(skb);
191 return 0;
192
193outf:
194 kfree_skb(skb);
195 stats->tx_dropped++;
196 return 0;
197}
198
199/*
200 * general routines
201 */
202
203static struct net_device_stats *veth_get_stats(struct net_device *dev)
204{
205 struct veth_priv *priv;
206 struct net_device_stats *dev_stats;
207 int cpu;
208 struct veth_net_stats *stats;
209
210 priv = netdev_priv(dev);
211 dev_stats = &dev->stats;
212
213 dev_stats->rx_packets = 0;
214 dev_stats->tx_packets = 0;
215 dev_stats->rx_bytes = 0;
216 dev_stats->tx_bytes = 0;
217 dev_stats->tx_dropped = 0;
218
219 for_each_online_cpu(cpu) {
220 stats = per_cpu_ptr(priv->stats, cpu);
221
222 dev_stats->rx_packets += stats->rx_packets;
223 dev_stats->tx_packets += stats->tx_packets;
224 dev_stats->rx_bytes += stats->rx_bytes;
225 dev_stats->tx_bytes += stats->tx_bytes;
226 dev_stats->tx_dropped += stats->tx_dropped;
227 }
228
229 return dev_stats;
230}
231
232static int veth_open(struct net_device *dev)
233{
234 struct veth_priv *priv;
235
236 priv = netdev_priv(dev);
237 if (priv->peer == NULL)
238 return -ENOTCONN;
239
240 if (priv->peer->flags & IFF_UP) {
241 netif_carrier_on(dev);
242 netif_carrier_on(priv->peer);
243 }
244 return 0;
245}
246
247static int veth_close(struct net_device *dev)
248{
249 struct veth_priv *priv;
250
251 if (netif_carrier_ok(dev)) {
252 priv = netdev_priv(dev);
253 netif_carrier_off(dev);
254 netif_carrier_off(priv->peer);
255 }
256 return 0;
257}
258
259static int veth_dev_init(struct net_device *dev)
260{
261 struct veth_net_stats *stats;
262 struct veth_priv *priv;
263
264 stats = alloc_percpu(struct veth_net_stats);
265 if (stats == NULL)
266 return -ENOMEM;
267
268 priv = netdev_priv(dev);
269 priv->stats = stats;
270 return 0;
271}
272
273static void veth_dev_free(struct net_device *dev)
274{
275 struct veth_priv *priv;
276
277 priv = netdev_priv(dev);
278 free_percpu(priv->stats);
279 free_netdev(dev);
280}
281
282static void veth_setup(struct net_device *dev)
283{
284 ether_setup(dev);
285
286 dev->hard_start_xmit = veth_xmit;
287 dev->get_stats = veth_get_stats;
288 dev->open = veth_open;
289 dev->stop = veth_close;
290 dev->ethtool_ops = &veth_ethtool_ops;
291 dev->features |= NETIF_F_LLTX;
292 dev->init = veth_dev_init;
293 dev->destructor = veth_dev_free;
294}
295
296/*
297 * netlink interface
298 */
299
300static int veth_validate(struct nlattr *tb[], struct nlattr *data[])
301{
302 if (tb[IFLA_ADDRESS]) {
303 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
304 return -EINVAL;
305 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
306 return -EADDRNOTAVAIL;
307 }
308 return 0;
309}
310
311static struct rtnl_link_ops veth_link_ops;
312
313static int veth_newlink(struct net_device *dev,
314 struct nlattr *tb[], struct nlattr *data[])
315{
316 int err;
317 struct net_device *peer;
318 struct veth_priv *priv;
319 char ifname[IFNAMSIZ];
320 struct nlattr *peer_tb[IFLA_MAX + 1], **tbp;
321
322 /*
323 * create and register peer first
324 *
325 * struct ifinfomsg is at the head of VETH_INFO_PEER, but we
326 * skip it since no info from it is useful yet
327 */
328
329 if (data != NULL && data[VETH_INFO_PEER] != NULL) {
330 struct nlattr *nla_peer;
331
332 nla_peer = data[VETH_INFO_PEER];
333 err = nla_parse(peer_tb, IFLA_MAX,
334 nla_data(nla_peer) + sizeof(struct ifinfomsg),
335 nla_len(nla_peer) - sizeof(struct ifinfomsg),
336 ifla_policy);
337 if (err < 0)
338 return err;
339
340 err = veth_validate(peer_tb, NULL);
341 if (err < 0)
342 return err;
343
344 tbp = peer_tb;
345 } else
346 tbp = tb;
347
348 if (tbp[IFLA_IFNAME])
349 nla_strlcpy(ifname, tbp[IFLA_IFNAME], IFNAMSIZ);
350 else
351 snprintf(ifname, IFNAMSIZ, DRV_NAME "%%d");
352
Eric W. Biederman881d9662007-09-17 11:56:21 -0700353 peer = rtnl_create_link(dev->nd_net, ifname, &veth_link_ops, tbp);
Pavel Emelyanove314dbd2007-09-25 16:14:46 -0700354 if (IS_ERR(peer))
355 return PTR_ERR(peer);
356
357 if (tbp[IFLA_ADDRESS] == NULL)
358 random_ether_addr(peer->dev_addr);
359
360 err = register_netdevice(peer);
361 if (err < 0)
362 goto err_register_peer;
363
364 netif_carrier_off(peer);
365
366 /*
367 * register dev last
368 *
369 * note, that since we've registered new device the dev's name
370 * should be re-allocated
371 */
372
373 if (tb[IFLA_ADDRESS] == NULL)
374 random_ether_addr(dev->dev_addr);
375
376 if (tb[IFLA_IFNAME])
377 nla_strlcpy(dev->name, tb[IFLA_IFNAME], IFNAMSIZ);
378 else
379 snprintf(dev->name, IFNAMSIZ, DRV_NAME "%%d");
380
381 if (strchr(dev->name, '%')) {
382 err = dev_alloc_name(dev, dev->name);
383 if (err < 0)
384 goto err_alloc_name;
385 }
386
387 err = register_netdevice(dev);
388 if (err < 0)
389 goto err_register_dev;
390
391 netif_carrier_off(dev);
392
393 /*
394 * tie the deviced together
395 */
396
397 priv = netdev_priv(dev);
398 priv->dev = dev;
399 priv->peer = peer;
400 list_add(&priv->list, &veth_list);
401
402 priv = netdev_priv(peer);
403 priv->dev = peer;
404 priv->peer = dev;
405 INIT_LIST_HEAD(&priv->list);
406 return 0;
407
408err_register_dev:
409 /* nothing to do */
410err_alloc_name:
411 unregister_netdevice(peer);
412 return err;
413
414err_register_peer:
415 free_netdev(peer);
416 return err;
417}
418
419static void veth_dellink(struct net_device *dev)
420{
421 struct veth_priv *priv;
422 struct net_device *peer;
423
424 priv = netdev_priv(dev);
425 peer = priv->peer;
426
427 if (!list_empty(&priv->list))
428 list_del(&priv->list);
429
430 priv = netdev_priv(peer);
431 if (!list_empty(&priv->list))
432 list_del(&priv->list);
433
434 unregister_netdevice(dev);
435 unregister_netdevice(peer);
436}
437
438static const struct nla_policy veth_policy[VETH_INFO_MAX + 1];
439
440static struct rtnl_link_ops veth_link_ops = {
441 .kind = DRV_NAME,
442 .priv_size = sizeof(struct veth_priv),
443 .setup = veth_setup,
444 .validate = veth_validate,
445 .newlink = veth_newlink,
446 .dellink = veth_dellink,
447 .policy = veth_policy,
448 .maxtype = VETH_INFO_MAX,
449};
450
451/*
452 * init/fini
453 */
454
455static __init int veth_init(void)
456{
457 return rtnl_link_register(&veth_link_ops);
458}
459
460static __exit void veth_exit(void)
461{
462 struct veth_priv *priv, *next;
463
464 rtnl_lock();
465 /*
466 * cannot trust __rtnl_link_unregister() to unregister all
467 * devices, as each ->dellink call will remove two devices
468 * from the list at once.
469 */
470 list_for_each_entry_safe(priv, next, &veth_list, list)
471 veth_dellink(priv->dev);
472
473 __rtnl_link_unregister(&veth_link_ops);
474 rtnl_unlock();
475}
476
477module_init(veth_init);
478module_exit(veth_exit);
479
480MODULE_DESCRIPTION("Virtual Ethernet Tunnel");
481MODULE_LICENSE("GPL v2");
482MODULE_ALIAS_RTNL_LINK(DRV_NAME);