/*
 * Userspace interface
 * Linux ethernet bridge
 *
 * Authors:
 * Lennert Buytenhek <buytenh@gnu.org>
 *
 * $Id: br_if.c,v 1.7 2001/12/24 00:59:55 davem Exp $
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
15
16#include <linux/kernel.h>
17#include <linux/netdevice.h>
18#include <linux/ethtool.h>
19#include <linux/if_arp.h>
20#include <linux/module.h>
21#include <linux/init.h>
22#include <linux/rtnetlink.h>
Kris Katterjohn46f25df2006-01-05 16:35:42 -080023#include <linux/if_ether.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <net/sock.h>
25
26#include "br_private.h"
27
28/*
29 * Determine initial path cost based on speed.
30 * using recommendations from 802.1d standard
31 *
32 * Need to simulate user ioctl because not all device's that support
33 * ethtool, use ethtool_ops. Also, since driver might sleep need to
34 * not be holding any locks.
35 */
Stephen Hemminger4433f422005-12-20 15:19:51 -080036static int port_cost(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -070037{
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 struct ethtool_cmd ecmd = { ETHTOOL_GSET };
39 struct ifreq ifr;
40 mm_segment_t old_fs;
41 int err;
42
43 strncpy(ifr.ifr_name, dev->name, IFNAMSIZ);
44 ifr.ifr_data = (void __user *) &ecmd;
45
46 old_fs = get_fs();
47 set_fs(KERNEL_DS);
48 err = dev_ethtool(&ifr);
49 set_fs(old_fs);
50
51 if (!err) {
52 switch(ecmd.speed) {
53 case SPEED_100:
54 return 19;
55 case SPEED_1000:
56 return 4;
57 case SPEED_10000:
58 return 2;
59 case SPEED_10:
60 return 100;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 }
62 }
63
64 /* Old silly heuristics based on name */
65 if (!strncmp(dev->name, "lec", 3))
66 return 7;
67
68 if (!strncmp(dev->name, "plip", 4))
69 return 2500;
70
71 return 100; /* assume old 10Mbps */
72}
73
Stephen Hemminger4433f422005-12-20 15:19:51 -080074
75/*
76 * Check for port carrier transistions.
77 * Called from work queue to allow for calling functions that
78 * might sleep (such as speed check), and to debounce.
79 */
80static void port_carrier_check(void *arg)
81{
82 struct net_bridge_port *p = arg;
83
84 rtnl_lock();
85 if (netif_carrier_ok(p->dev)) {
86 u32 cost = port_cost(p->dev);
87
88 spin_lock_bh(&p->br->lock);
89 if (p->state == BR_STATE_DISABLED) {
90 p->path_cost = cost;
91 br_stp_enable_port(p);
92 }
93 spin_unlock_bh(&p->br->lock);
94 } else {
95 spin_lock_bh(&p->br->lock);
96 if (p->state != BR_STATE_DISABLED)
97 br_stp_disable_port(p);
98 spin_unlock_bh(&p->br->lock);
99 }
100 rtnl_unlock();
101}
102
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103static void destroy_nbp(struct net_bridge_port *p)
104{
105 struct net_device *dev = p->dev;
106
Stephen Hemminger3f4cfc22006-01-31 17:44:07 -0800107 dev->br_port = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700108 p->br = NULL;
109 p->dev = NULL;
110 dev_put(dev);
111
112 br_sysfs_freeif(p);
113}
114
115static void destroy_nbp_rcu(struct rcu_head *head)
116{
117 struct net_bridge_port *p =
118 container_of(head, struct net_bridge_port, rcu);
119 destroy_nbp(p);
120}
121
Stephen Hemminger3f4cfc22006-01-31 17:44:07 -0800122/* Delete port(interface) from bridge is done in two steps.
123 * via RCU. First step, marks device as down. That deletes
124 * all the timers and stops new packets from flowing through.
125 *
126 * Final cleanup doesn't occur until after all CPU's finished
127 * processing packets.
128 *
129 * Protected from multiple admin operations by RTNL mutex
130 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131static void del_nbp(struct net_bridge_port *p)
132{
133 struct net_bridge *br = p->br;
134 struct net_device *dev = p->dev;
135
Stephen Hemminger3f4cfc22006-01-31 17:44:07 -0800136 /* Race between RTNL notify and RCU callback */
137 if (p->deleted)
138 return;
139
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140 dev_set_promiscuity(dev, -1);
141
Stephen Hemminger4433f422005-12-20 15:19:51 -0800142 cancel_delayed_work(&p->carrier_check);
143 flush_scheduled_work();
144
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 spin_lock_bh(&br->lock);
146 br_stp_disable_port(p);
Stephen Hemminger3f4cfc22006-01-31 17:44:07 -0800147 p->deleted = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148 spin_unlock_bh(&br->lock);
149
150 br_fdb_delete_by_port(br, p);
151
152 list_del_rcu(&p->list);
153
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 call_rcu(&p->rcu, destroy_nbp_rcu);
155}
156
157/* called with RTNL */
158static void del_br(struct net_bridge *br)
159{
160 struct net_bridge_port *p, *n;
161
162 list_for_each_entry_safe(p, n, &br->port_list, list) {
163 br_sysfs_removeif(p);
164 del_nbp(p);
165 }
166
167 del_timer_sync(&br->gc_timer);
168
169 br_sysfs_delbr(br->dev);
170 unregister_netdevice(br->dev);
171}
172
173static struct net_device *new_bridge_dev(const char *name)
174{
175 struct net_bridge *br;
176 struct net_device *dev;
177
178 dev = alloc_netdev(sizeof(struct net_bridge), name,
179 br_dev_setup);
180
181 if (!dev)
182 return NULL;
183
184 br = netdev_priv(dev);
185 br->dev = dev;
186
187 spin_lock_init(&br->lock);
188 INIT_LIST_HEAD(&br->port_list);
189 spin_lock_init(&br->hash_lock);
190
191 br->bridge_id.prio[0] = 0x80;
192 br->bridge_id.prio[1] = 0x00;
193 memset(br->bridge_id.addr, 0, ETH_ALEN);
194
Stephen Hemmingeredb5e462005-12-21 19:00:58 -0800195 br->feature_mask = dev->features;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 br->stp_enabled = 0;
197 br->designated_root = br->bridge_id;
198 br->root_path_cost = 0;
199 br->root_port = 0;
200 br->bridge_max_age = br->max_age = 20 * HZ;
201 br->bridge_hello_time = br->hello_time = 2 * HZ;
202 br->bridge_forward_delay = br->forward_delay = 15 * HZ;
203 br->topology_change = 0;
204 br->topology_change_detected = 0;
205 br->ageing_time = 300 * HZ;
206 INIT_LIST_HEAD(&br->age_list);
207
208 br_stp_timer_init(br);
209
210 return dev;
211}
212
213/* find an available port number */
214static int find_portno(struct net_bridge *br)
215{
216 int index;
217 struct net_bridge_port *p;
218 unsigned long *inuse;
219
220 inuse = kmalloc(BITS_TO_LONGS(BR_MAX_PORTS)*sizeof(unsigned long),
221 GFP_KERNEL);
222 if (!inuse)
223 return -ENOMEM;
224
225 memset(inuse, 0, BITS_TO_LONGS(BR_MAX_PORTS)*sizeof(unsigned long));
226 set_bit(0, inuse); /* zero is reserved */
227 list_for_each_entry(p, &br->port_list, list) {
228 set_bit(p->port_no, inuse);
229 }
230 index = find_first_zero_bit(inuse, BR_MAX_PORTS);
231 kfree(inuse);
232
233 return (index >= BR_MAX_PORTS) ? -EXFULL : index;
234}
235
Stephen Hemminger4433f422005-12-20 15:19:51 -0800236/* called with RTNL but without bridge lock */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237static struct net_bridge_port *new_nbp(struct net_bridge *br,
Stephen Hemminger4433f422005-12-20 15:19:51 -0800238 struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239{
240 int index;
241 struct net_bridge_port *p;
242
243 index = find_portno(br);
244 if (index < 0)
245 return ERR_PTR(index);
246
247 p = kmalloc(sizeof(*p), GFP_KERNEL);
248 if (p == NULL)
249 return ERR_PTR(-ENOMEM);
250
251 memset(p, 0, sizeof(*p));
252 p->br = br;
253 dev_hold(dev);
254 p->dev = dev;
Stephen Hemminger4433f422005-12-20 15:19:51 -0800255 p->path_cost = port_cost(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256 p->priority = 0x8000 >> BR_PORT_BITS;
257 dev->br_port = p;
258 p->port_no = index;
259 br_init_port(p);
260 p->state = BR_STATE_DISABLED;
Stephen Hemminger4433f422005-12-20 15:19:51 -0800261 INIT_WORK(&p->carrier_check, port_carrier_check, p);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 kobject_init(&p->kobj);
263
264 return p;
265}
266
267int br_add_bridge(const char *name)
268{
269 struct net_device *dev;
270 int ret;
271
272 dev = new_bridge_dev(name);
273 if (!dev)
274 return -ENOMEM;
275
276 rtnl_lock();
277 if (strchr(dev->name, '%')) {
278 ret = dev_alloc_name(dev, dev->name);
279 if (ret < 0)
280 goto err1;
281 }
282
283 ret = register_netdevice(dev);
284 if (ret)
285 goto err2;
286
287 /* network device kobject is not setup until
288 * after rtnl_unlock does it's hotplug magic.
289 * so hold reference to avoid race.
290 */
291 dev_hold(dev);
292 rtnl_unlock();
293
294 ret = br_sysfs_addbr(dev);
295 dev_put(dev);
296
297 if (ret)
298 unregister_netdev(dev);
299 out:
300 return ret;
301
302 err2:
303 free_netdev(dev);
304 err1:
305 rtnl_unlock();
306 goto out;
307}
308
309int br_del_bridge(const char *name)
310{
311 struct net_device *dev;
312 int ret = 0;
313
314 rtnl_lock();
315 dev = __dev_get_by_name(name);
316 if (dev == NULL)
317 ret = -ENXIO; /* Could not find device */
318
319 else if (!(dev->priv_flags & IFF_EBRIDGE)) {
320 /* Attempt to delete non bridge device! */
321 ret = -EPERM;
322 }
323
324 else if (dev->flags & IFF_UP) {
325 /* Not shutdown yet. */
326 ret = -EBUSY;
327 }
328
329 else
330 del_br(netdev_priv(dev));
331
332 rtnl_unlock();
333 return ret;
334}
335
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800336/* MTU of the bridge pseudo-device: ETH_DATA_LEN or the minimum of the ports */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337int br_min_mtu(const struct net_bridge *br)
338{
339 const struct net_bridge_port *p;
340 int mtu = 0;
341
342 ASSERT_RTNL();
343
344 if (list_empty(&br->port_list))
Kris Katterjohn46f25df2006-01-05 16:35:42 -0800345 mtu = ETH_DATA_LEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 else {
347 list_for_each_entry(p, &br->port_list, list) {
348 if (!mtu || p->dev->mtu < mtu)
349 mtu = p->dev->mtu;
350 }
351 }
352 return mtu;
353}
354
Stephen Hemminger81d35302005-05-29 14:15:17 -0700355/*
356 * Recomputes features using slave's features
357 */
358void br_features_recompute(struct net_bridge *br)
359{
360 struct net_bridge_port *p;
361 unsigned long features, checksum;
362
Stephen Hemmingeredb5e462005-12-21 19:00:58 -0800363 features = br->feature_mask &~ NETIF_F_IP_CSUM;
364 checksum = br->feature_mask & NETIF_F_IP_CSUM;
Stephen Hemminger81d35302005-05-29 14:15:17 -0700365
366 list_for_each_entry(p, &br->port_list, list) {
367 if (!(p->dev->features
368 & (NETIF_F_IP_CSUM|NETIF_F_NO_CSUM|NETIF_F_HW_CSUM)))
369 checksum = 0;
370 features &= p->dev->features;
371 }
372
373 br->dev->features = features | checksum | NETIF_F_LLTX;
374}
375
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376/* called with RTNL */
377int br_add_if(struct net_bridge *br, struct net_device *dev)
378{
379 struct net_bridge_port *p;
380 int err = 0;
381
382 if (dev->flags & IFF_LOOPBACK || dev->type != ARPHRD_ETHER)
383 return -EINVAL;
384
385 if (dev->hard_start_xmit == br_dev_xmit)
386 return -ELOOP;
387
388 if (dev->br_port != NULL)
389 return -EBUSY;
390
Stephen Hemminger4433f422005-12-20 15:19:51 -0800391 if (IS_ERR(p = new_nbp(br, dev)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 return PTR_ERR(p);
393
394 if ((err = br_fdb_insert(br, p, dev->dev_addr)))
395 destroy_nbp(p);
396
397 else if ((err = br_sysfs_addif(p)))
398 del_nbp(p);
399 else {
400 dev_set_promiscuity(dev, 1);
401
402 list_add_rcu(&p->list, &br->port_list);
403
404 spin_lock_bh(&br->lock);
405 br_stp_recalculate_bridge_id(br);
Olaf Rempel133747e2005-11-23 19:04:08 -0800406 br_features_recompute(br);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700407 if ((br->dev->flags & IFF_UP)
408 && (dev->flags & IFF_UP) && netif_carrier_ok(dev))
409 br_stp_enable_port(p);
410 spin_unlock_bh(&br->lock);
411
412 dev_set_mtu(br->dev, br_min_mtu(br));
413 }
414
415 return err;
416}
417
418/* called with RTNL */
419int br_del_if(struct net_bridge *br, struct net_device *dev)
420{
421 struct net_bridge_port *p = dev->br_port;
422
423 if (!p || p->br != br)
424 return -EINVAL;
425
426 br_sysfs_removeif(p);
427 del_nbp(p);
428
429 spin_lock_bh(&br->lock);
430 br_stp_recalculate_bridge_id(br);
Stephen Hemminger81d35302005-05-29 14:15:17 -0700431 br_features_recompute(br);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432 spin_unlock_bh(&br->lock);
433
434 return 0;
435}
436
437void __exit br_cleanup_bridges(void)
438{
439 struct net_device *dev, *nxt;
440
441 rtnl_lock();
442 for (dev = dev_base; dev; dev = nxt) {
443 nxt = dev->next;
444 if (dev->priv_flags & IFF_EBRIDGE)
445 del_br(dev->priv);
446 }
447 rtnl_unlock();
448
449}