blob: 31fe980e4e28e5c102780aa6d9ae8450cc224763 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Bond several ethernet interfaces into a Cisco, running 'Etherchannel'.
3 *
4 * Portions are (c) Copyright 1995 Simon "Guru Aleph-Null" Janes
5 * NCM: Network and Communications Management, Inc.
6 *
7 * BUT, I'm the one who modified it for ethernet, so:
8 * (c) Copyright 1999, Thomas Davis, tadavis@lbl.gov
9 *
10 * This software may be used and distributed according to the terms
11 * of the GNU Public License, incorporated herein by reference.
12 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 */
14
15#ifndef _LINUX_BONDING_H
16#define _LINUX_BONDING_H
17
18#include <linux/timer.h>
19#include <linux/proc_fs.h>
20#include <linux/if_bonding.h>
Neil Hormane843fa52010-10-13 16:01:50 +000021#include <linux/cpumask.h>
Brian Haley305d5522008-11-04 17:51:14 -080022#include <linux/in6.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include "bond_3ad.h"
24#include "bond_alb.h"
25
Andy Gospodarekbb1d9122010-06-02 08:40:18 +000026#define DRV_VERSION "3.7.0"
27#define DRV_RELDATE "June 2, 2010"
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#define DRV_NAME "bonding"
29#define DRV_DESCRIPTION "Ethernet Channel Bonding Driver"
30
31#define BOND_MAX_ARP_TARGETS 16
32
/*
 * IS_UP - non-zero when @dev has IFF_UP set in ->flags and both
 * netif_running() and netif_carrier_ok() report true for it.
 */
#define IS_UP(dev)						\
	(((dev)->flags & IFF_UP) == IFF_UP &&			\
	 netif_running(dev) &&					\
	 netif_carrier_ok(dev))
37
/*
 * BOND_IS_OK - checks whether bond is ready for transmit.
 *
 * Non-zero when the bond's own device has IFF_UP set, is
 * netif_running(), and the bond holds at least one slave.
 *
 * Caller must hold bond->lock
 */
#define BOND_IS_OK(bond)					\
	(((bond)->dev->flags & IFF_UP) &&			\
	 netif_running((bond)->dev) &&				\
	 (bond)->slave_cnt > 0)
47
/*
 * SLAVE_IS_OK - checks whether slave is ready for transmit.
 *
 * Non-zero when the slave's device has IFF_UP set and is
 * netif_running(), the slave's link is BOND_LINK_UP and its state is
 * BOND_STATE_ACTIVE.
 */
#define SLAVE_IS_OK(slave)					\
	(((slave)->dev->flags & IFF_UP) &&			\
	 netif_running((slave)->dev) &&				\
	 (slave)->link == BOND_LINK_UP &&			\
	 (slave)->state == BOND_STATE_ACTIVE)
56
57
/*
 * USES_PRIMARY - non-zero when @mode is active-backup, TLB or ALB.
 * Note that @mode is evaluated up to three times.
 */
#define USES_PRIMARY(mode)					\
	((mode) == BOND_MODE_ACTIVEBACKUP ||			\
	 (mode) == BOND_MODE_TLB ||				\
	 (mode) == BOND_MODE_ALB)
62
/*
 * TX_QUEUE_OVERRIDE - non-zero when @mode is active-backup or round-robin.
 * Note that @mode is evaluated up to two times.
 */
#define TX_QUEUE_OVERRIDE(mode)					\
	((mode) == BOND_MODE_ACTIVEBACKUP ||			\
	 (mode) == BOND_MODE_ROUNDROBIN)
/*
 * Less bad way to call ioctl from within the kernel; this needs to be
 * done some other way to get the call out of interrupt context.
 * Needs "ioctl" variable to be supplied by calling context.
 *
 * The current address limit is saved with get_fs(), switched to
 * get_ds() for the duration of the call, and restored afterwards.
 * The statement expression evaluates to the value returned by ioctl().
 */
#define IOCTL(dev, arg, cmd) ({					\
	int ioctl_ret;						\
	mm_segment_t saved_fs = get_fs();			\
								\
	set_fs(get_ds());					\
	ioctl_ret = ioctl(dev, arg, cmd);			\
	set_fs(saved_fs);					\
	ioctl_ret; })
78
/**
 * bond_for_each_slave_from - iterate the slaves list from a starting point
 * @bond:	the bond holding this list.
 * @pos:	current slave (loop cursor, advanced through ->next).
 * @cnt:	counter for max number of moves; runs from 0 up to
 *		(bond)->slave_cnt.
 * @start:	starting point.
 *
 * The loop is bounded by @cnt only, so it performs exactly
 * (bond)->slave_cnt iterations unless the body leaves it early.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave_from(bond, pos, cnt, start)		\
	for (cnt = 0, pos = (start);				\
	     cnt < (bond)->slave_cnt;				\
	     cnt++, pos = (pos)->next)
92
/**
 * bond_for_each_slave_from_to - iterate the slaves list from start point to stop point
 * @bond:	the bond holding this list.
 * @pos:	current slave (loop cursor, advanced through ->next).
 * @cnt:	counter for max number of moves.
 * @start:	start point.
 * @stop:	stop point; the loop ends once @pos equals (stop)->next.
 *
 * The termination test runs before the first iteration as well, so no
 * iteration happens when @start already equals (stop)->next.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave_from_to(bond, pos, cnt, start, stop)	\
	for (cnt = 0, pos = (start);					\
	     cnt < (bond)->slave_cnt && pos != (stop)->next;		\
	     cnt++, pos = (pos)->next)
107
/**
 * bond_for_each_slave - iterate the slaves list from head
 * @bond:	the bond holding this list.
 * @pos:	current slave.
 * @cnt:	counter for max number of moves
 *
 * Shorthand for bond_for_each_slave_from() starting at
 * (bond)->first_slave.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave(bond, pos, cnt)				\
	bond_for_each_slave_from(bond, pos, cnt, (bond)->first_slave)
118
119
#ifdef CONFIG_NET_POLL_CONTROLLER
/* Counter read by is_netpoll_tx_blocked(); only declared here. */
extern atomic_t netpoll_block_tx;

/* Increment netpoll_block_tx. */
static inline void block_netpoll_tx(void)
{
	atomic_inc(&netpoll_block_tx);
}

/* Decrement netpoll_block_tx. */
static inline void unblock_netpoll_tx(void)
{
	atomic_dec(&netpoll_block_tx);
}

/*
 * Returns the current value of netpoll_block_tx when @dev has
 * IFF_IN_NETPOLL set in ->priv_flags, and 0 otherwise.
 */
static inline int is_netpoll_tx_blocked(struct net_device *dev)
{
	return unlikely(dev->priv_flags & IFF_IN_NETPOLL) ?
		atomic_read(&netpoll_block_tx) : 0;
}
#else
/* Without CONFIG_NET_POLL_CONTROLLER these expand to nothing / constant 0. */
#define block_netpoll_tx()
#define unblock_netpoll_tx()
#define is_netpoll_tx_blocked(dev) (0)
#endif
144
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145struct bond_params {
146 int mode;
Jay Vosburgh169a3e62005-06-26 17:54:11 -0400147 int xmit_policy;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148 int miimon;
Moni Shoua7893b242008-05-17 21:10:12 -0700149 int num_grat_arp;
Brian Haley305d5522008-11-04 17:51:14 -0800150 int num_unsol_na;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 int arp_interval;
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700152 int arp_validate;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 int use_carrier;
Jay Vosburghdd957c52007-10-09 19:57:24 -0700154 int fail_over_mac;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 int updelay;
156 int downdelay;
157 int lacp_fast;
Jay Vosburghfd989c82008-11-04 17:51:16 -0800158 int ad_select;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159 char primary[IFNAMSIZ];
Jiri Pirkoa5499522009-09-25 03:28:09 +0000160 int primary_reselect;
Al Virod3bb52b2007-08-22 20:06:58 -0400161 __be32 arp_targets[BOND_MAX_ARP_TARGETS];
Andy Gospodarekbb1d9122010-06-02 08:40:18 +0000162 int tx_queues;
Andy Gospodarekebd8e492010-06-02 08:39:21 +0000163 int all_slaves_active;
Flavio Leitnerc2952c32010-10-05 14:23:59 +0000164 int resend_igmp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165};
166
/*
 * One entry of a parameter lookup table (see the bond_*_tbl[] arrays
 * declared in this header): a name string paired with an integer value.
 */
struct bond_parm_tbl {
	char	*modename;
	int	mode;
};
171
Jay Vosburghece95f72008-01-17 16:25:01 -0800172#define BOND_MAX_MODENAME_LEN 20
173
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174struct vlan_entry {
175 struct list_head vlan_list;
Al Virod3bb52b2007-08-22 20:06:58 -0400176 __be32 vlan_ip;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 unsigned short vlan_id;
Brian Haley305d5522008-11-04 17:51:14 -0800178#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
179 struct in6_addr vlan_ipv6;
180#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181};
182
183struct slave {
Mitch Williamse944ef72005-11-09 10:36:50 -0800184 struct net_device *dev; /* first - useful for panic debug */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185 struct slave *next;
186 struct slave *prev;
Jay Vosburgh8bb5f962006-09-22 21:52:51 -0700187 int delay;
Andy Gospodarekf8a8ccd2007-01-29 12:08:38 -0800188 unsigned long jiffies;
189 unsigned long last_arp_rx;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 s8 link; /* one of BOND_LINK_XXXX */
Jay Vosburghb2220ca2008-05-17 21:10:13 -0700191 s8 new_link;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192 s8 state; /* one of BOND_STATE_XXXX */
Moni Shoua3158bf72007-10-09 19:43:41 -0700193 u32 original_mtu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194 u32 link_failure_count;
Eric Dumazet885a1362009-09-01 06:31:18 +0000195 u8 perm_hwaddr[ETH_ALEN];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 u16 speed;
197 u8 duplex;
Andy Gospodarekbb1d9122010-06-02 08:40:18 +0000198 u16 queue_id;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199 struct ad_slave_info ad_info; /* HUGE - better to dynamically alloc */
200 struct tlb_slave_info tlb_info;
201};
202
/*
 * Link pseudo-state only used internally by monitors.
 * Parenthesized so the negative literal stays one operand wherever
 * the macro is expanded.
 */
#define BOND_LINK_NOCHANGE	(-1)
207
208/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700209 * Here are the locking policies for the two bonding locks:
210 *
211 * 1) Get bond->lock when reading/writing slave list.
212 * 2) Get bond->curr_slave_lock when reading/writing bond->curr_active_slave.
213 * (It is unnecessary when the write-lock is put with bond->lock.)
214 * 3) When we lock with bond->curr_slave_lock, we must lock with bond->lock
215 * beforehand.
216 */
217struct bonding {
Mitch Williamse944ef72005-11-09 10:36:50 -0800218 struct net_device *dev; /* first - useful for panic debug */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 struct slave *first_slave;
220 struct slave *curr_active_slave;
221 struct slave *current_arp_slave;
222 struct slave *primary_slave;
Jiri Pirkoa5499522009-09-25 03:28:09 +0000223 bool force_primary;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224 s32 slave_cnt; /* never change this value outside the attach/detach wrappers */
225 rwlock_t lock;
226 rwlock_t curr_slave_lock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 s8 kill_timers;
Moni Shoua1053f622007-10-09 19:43:42 -0700228 s8 send_grat_arp;
Brian Haley305d5522008-11-04 17:51:14 -0800229 s8 send_unsol_na;
Moni Shouad90a1622007-10-09 19:43:43 -0700230 s8 setup_by_slave;
Flavio Leitnerc2952c32010-10-05 14:23:59 +0000231 s8 igmp_retrans;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232#ifdef CONFIG_PROC_FS
233 struct proc_dir_entry *proc_entry;
234 char proc_file_name[IFNAMSIZ];
235#endif /* CONFIG_PROC_FS */
236 struct list_head bond_list;
Jiri Pirko22bedad32010-04-01 21:22:57 +0000237 struct netdev_hw_addr_list mc_list;
Jasper Spaansa361c832009-10-23 04:09:24 +0000238 int (*xmit_hash_policy)(struct sk_buff *, int);
Al Virod3bb52b2007-08-22 20:06:58 -0400239 __be32 master_ip;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240 u16 flags;
Jay Vosburghcf5f9042007-10-17 17:37:47 -0700241 u16 rr_tx_counter;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 struct ad_bond_info ad_info;
243 struct alb_bond_info alb_info;
244 struct bond_params params;
245 struct list_head vlan_list;
246 struct vlan_group *vlgrp;
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700247 struct packet_type arp_mon_pt;
Jay Vosburgh1b76b312007-10-17 17:37:45 -0700248 struct workqueue_struct *wq;
249 struct delayed_work mii_work;
250 struct delayed_work arp_work;
251 struct delayed_work alb_work;
252 struct delayed_work ad_work;
Flavio Leitner5a37e8c2010-10-05 14:23:57 +0000253 struct delayed_work mcast_work;
Brian Haley305d5522008-11-04 17:51:14 -0800254#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
255 struct in6_addr master_ipv6;
256#endif
Taku Izumif073c7c2010-12-09 15:17:13 +0000257#ifdef CONFIG_DEBUG_FS
258 /* debugging suport via debugfs */
259 struct dentry *debug_dir;
260#endif /* CONFIG_DEBUG_FS */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261};
262
263/**
264 * Returns NULL if the net_device does not belong to any of the bond's slaves
265 *
266 * Caller must hold bond lock for read
267 */
Adrian Bunkcceb9042006-01-05 22:45:42 -0800268static inline struct slave *bond_get_slave_by_dev(struct bonding *bond, struct net_device *slave_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269{
270 struct slave *slave = NULL;
271 int i;
272
273 bond_for_each_slave(bond, slave, i) {
274 if (slave->dev == slave_dev) {
Hillf Dantonaf3e5bd2010-12-10 18:54:11 +0000275 return slave;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 }
277 }
278
Hillf Dantonaf3e5bd2010-12-10 18:54:11 +0000279 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280}
281
Adrian Bunkcceb9042006-01-05 22:45:42 -0800282static inline struct bonding *bond_get_bond_by_slave(struct slave *slave)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283{
284 if (!slave || !slave->dev->master) {
285 return NULL;
286 }
287
Joe Perchesc04914a2010-11-15 11:12:25 +0000288 return netdev_priv(slave->dev->master);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289}
290
Holger Eitzenberger58402052008-12-09 23:07:13 -0800291static inline bool bond_is_lb(const struct bonding *bond)
292{
Joe Perches8e95a202009-12-03 07:58:21 +0000293 return (bond->params.mode == BOND_MODE_TLB ||
294 bond->params.mode == BOND_MODE_ALB);
Holger Eitzenberger58402052008-12-09 23:07:13 -0800295}
296
/* presumably the values of bond_params.primary_reselect — confirm in bond_main.c */
#define BOND_PRI_RESELECT_ALWAYS	0
#define BOND_PRI_RESELECT_BETTER	1
#define BOND_PRI_RESELECT_FAILURE	2

/* presumably the values of bond_params.fail_over_mac — confirm in bond_main.c */
#define BOND_FOM_NONE			0
#define BOND_FOM_ACTIVE			1
#define BOND_FOM_FOLLOW			2

/*
 * Bit values for bond_params.arp_validate: one bit per slave state, so
 * that slave_do_arp_validate() can test (1 << slave->state) directly.
 */
#define BOND_ARP_VALIDATE_NONE		0
#define BOND_ARP_VALIDATE_ACTIVE	(1 << BOND_STATE_ACTIVE)
#define BOND_ARP_VALIDATE_BACKUP	(1 << BOND_STATE_BACKUP)
#define BOND_ARP_VALIDATE_ALL		(BOND_ARP_VALIDATE_ACTIVE | \
					 BOND_ARP_VALIDATE_BACKUP)
310
Adrian Bunk079ca7d2006-12-12 17:24:39 +0100311static inline int slave_do_arp_validate(struct bonding *bond,
312 struct slave *slave)
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700313{
314 return bond->params.arp_validate & (1 << slave->state);
315}
316
Adrian Bunk079ca7d2006-12-12 17:24:39 +0100317static inline unsigned long slave_last_rx(struct bonding *bond,
Andy Gospodarekf8a8ccd2007-01-29 12:08:38 -0800318 struct slave *slave)
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700319{
320 if (slave_do_arp_validate(bond, slave))
321 return slave->last_arp_rx;
322
323 return slave->dev->last_rx;
324}
325
Adrian Bunkcceb9042006-01-05 22:45:42 -0800326static inline void bond_set_slave_inactive_flags(struct slave *slave)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327{
Wang Chen454d7c92008-11-12 23:37:49 -0800328 struct bonding *bond = netdev_priv(slave->dev->master);
Jiri Pirkoae63e802009-05-27 05:42:36 +0000329 if (!bond_is_lb(bond))
Jay Vosburgh8f903c72006-02-21 16:36:44 -0800330 slave->state = BOND_STATE_BACKUP;
Andy Gospodarekebd8e492010-06-02 08:39:21 +0000331 if (!bond->params.all_slaves_active)
332 slave->dev->priv_flags |= IFF_SLAVE_INACTIVE;
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700333 if (slave_do_arp_validate(bond, slave))
334 slave->dev->priv_flags |= IFF_SLAVE_NEEDARP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335}
336
Adrian Bunkcceb9042006-01-05 22:45:42 -0800337static inline void bond_set_slave_active_flags(struct slave *slave)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338{
339 slave->state = BOND_STATE_ACTIVE;
Jay Vosburghf5b2b962006-09-22 21:54:53 -0700340 slave->dev->priv_flags &= ~(IFF_SLAVE_INACTIVE | IFF_SLAVE_NEEDARP);
Jay Vosburgh8f903c72006-02-21 16:36:44 -0800341}
342
343static inline void bond_set_master_3ad_flags(struct bonding *bond)
344{
345 bond->dev->priv_flags |= IFF_MASTER_8023AD;
346}
347
348static inline void bond_unset_master_3ad_flags(struct bonding *bond)
349{
350 bond->dev->priv_flags &= ~IFF_MASTER_8023AD;
351}
352
353static inline void bond_set_master_alb_flags(struct bonding *bond)
354{
355 bond->dev->priv_flags |= IFF_MASTER_ALB;
356}
357
358static inline void bond_unset_master_alb_flags(struct bonding *bond)
359{
360 bond->dev->priv_flags &= ~IFF_MASTER_ALB;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361}
362
/* Functions declared here and defined in other bonding source files. */
struct vlan_entry *bond_next_vlan(struct bonding *bond, struct vlan_entry *curr);
int bond_dev_queue_xmit(struct bonding *bond, struct sk_buff *skb, struct net_device *slave_dev);
int bond_create(struct net *net, const char *name);

int bond_create_sysfs(void);
void bond_destroy_sysfs(void);
void bond_prepare_sysfs_group(struct bonding *bond);
int bond_create_slave_symlinks(struct net_device *master, struct net_device *slave);
void bond_destroy_slave_symlinks(struct net_device *master, struct net_device *slave);

int bond_enslave(struct net_device *bond_dev, struct net_device *slave_dev);
int bond_release(struct net_device *bond_dev, struct net_device *slave_dev);

void bond_mii_monitor(struct work_struct *work);
void bond_loadbalance_arp_mon(struct work_struct *work);
void bond_activebackup_arp_mon(struct work_struct *work);

void bond_set_mode_ops(struct bonding *bond, int mode);
int bond_parse_parm(const char *mode_arg, const struct bond_parm_tbl *tbl);
void bond_select_active_slave(struct bonding *bond);
void bond_change_active_slave(struct bonding *bond, struct slave *new_active);
void bond_register_arp(struct bonding *bond);
void bond_unregister_arp(struct bonding *bond);

void bond_create_debugfs(void);
void bond_destroy_debugfs(void);
void bond_debug_register(struct bonding *bond);
void bond_debug_unregister(struct bonding *bond);
void bond_debug_reregister(struct bonding *bond);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700387
Eric W. Biedermanec87fd32009-10-29 14:18:26 +0000388struct bond_net {
389 struct net * net; /* Associated network namespace */
390 struct list_head dev_list;
391#ifdef CONFIG_PROC_FS
392 struct proc_dir_entry * proc_dir;
393#endif
394};
395
Ben Dooksb2259672008-09-14 16:56:12 +0100396/* exported from bond_main.c */
Eric W. Biedermanec87fd32009-10-29 14:18:26 +0000397extern int bond_net_id;
Holger Eitzenbergere97fd7c2008-12-09 23:10:38 -0800398extern const struct bond_parm_tbl bond_lacp_tbl[];
399extern const struct bond_parm_tbl bond_mode_tbl[];
400extern const struct bond_parm_tbl xmit_hashtype_tbl[];
401extern const struct bond_parm_tbl arp_validate_tbl[];
402extern const struct bond_parm_tbl fail_over_mac_tbl[];
Jiri Pirkoa5499522009-09-25 03:28:09 +0000403extern const struct bond_parm_tbl pri_reselect_tbl[];
Hannes Ederb06715b2008-12-25 23:58:57 -0800404extern struct bond_parm_tbl ad_select_tbl[];
405
/*
 * IPv6 hooks: real implementations are declared when IPv6 is built in or
 * built as a module; otherwise empty inline stubs are provided so that
 * callers need no #ifdef.
 */
#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
void bond_send_unsolicited_na(struct bonding *bond);
void bond_register_ipv6_notifier(void);
void bond_unregister_ipv6_notifier(void);
#else
static inline void bond_send_unsolicited_na(struct bonding *bond)
{
}

static inline void bond_register_ipv6_notifier(void)
{
}

static inline void bond_unregister_ipv6_notifier(void)
{
}
#endif
424
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425#endif /* _LINUX_BONDING_H */