1 /*
2 * Bond several ethernet interfaces into a Cisco, running 'Etherchannel'.
3 *
4 * Portions are (c) Copyright 1995 Simon "Guru Aleph-Null" Janes
5 * NCM: Network and Communications Management, Inc.
6 *
7 * BUT, I'm the one who modified it for ethernet, so:
8 * (c) Copyright 1999, Thomas Davis, tadavis@lbl.gov
9 *
10 * This software may be used and distributed according to the terms
11 * of the GNU Public License, incorporated herein by reference.
12 *
13 */
14
15 #ifndef _LINUX_BONDING_H
16 #define _LINUX_BONDING_H
17
18 #include <linux/timer.h>
19 #include <linux/proc_fs.h>
20 #include <linux/if_bonding.h>
21 #include <linux/etherdevice.h>
22 #include <linux/cpumask.h>
23 #include <linux/in6.h>
24 #include <linux/netpoll.h>
25 #include <linux/inetdevice.h>
26 #include "bond_3ad.h"
27 #include "bond_alb.h"
28
/* Driver identification strings. */
#define DRV_NAME		"bonding"
#define DRV_DESCRIPTION		"Ethernet Channel Bonding Driver"
#define DRV_VERSION		"3.7.1"
#define DRV_RELDATE		"April 27, 2011"

/* One-line banner built from the strings above; it ends with a newline. */
#define bond_version DRV_DESCRIPTION ": v" DRV_VERSION " (" DRV_RELDATE ")\n"

/* Number of entries in the arp_targets[] array of struct bond_params. */
#define BOND_MAX_ARP_TARGETS	16
37
/*
 * IS_UP - true when @dev has IFF_UP set in its flags, netif_running()
 * accepts it and netif_carrier_ok() accepts it.
 *
 * Note that @dev is evaluated more than once.
 */
#define IS_UP(dev)						\
	(((dev)->flags & IFF_UP) == IFF_UP &&			\
	 netif_running(dev) &&					\
	 netif_carrier_ok(dev))
42
/*
 * SLAVE_IS_OK - check whether @slave is ready for transmit.
 *
 * All of the following must hold: the slave's device has IFF_UP set,
 * netif_running() accepts the device, the slave's link is BOND_LINK_UP,
 * and bond_is_active_slave() accepts the slave.
 *
 * Note that @slave is evaluated more than once.
 */
#define SLAVE_IS_OK(slave)					\
	(((slave)->dev->flags & IFF_UP) &&			\
	 netif_running((slave)->dev) &&				\
	 (slave)->link == BOND_LINK_UP &&			\
	 bond_is_active_slave(slave))
51
52
/*
 * USES_PRIMARY - true when @mode is one of BOND_MODE_ACTIVEBACKUP,
 * BOND_MODE_TLB or BOND_MODE_ALB.
 */
#define USES_PRIMARY(mode)					\
	((mode) == BOND_MODE_ACTIVEBACKUP ||			\
	 (mode) == BOND_MODE_TLB ||				\
	 (mode) == BOND_MODE_ALB)
57
/*
 * TX_QUEUE_OVERRIDE - true when @mode is BOND_MODE_ACTIVEBACKUP or
 * BOND_MODE_ROUNDROBIN.
 */
#define TX_QUEUE_OVERRIDE(mode)					\
	((mode) == BOND_MODE_ACTIVEBACKUP ||			\
	 (mode) == BOND_MODE_ROUNDROBIN)
/*
 * Less bad way to call ioctl from within the kernel; this needs to be
 * done some other way to get the call out of interrupt context.
 * Needs "ioctl" variable to be supplied by calling context.
 *
 * The address limit returned by get_fs() is saved, replaced with get_ds()
 * for the duration of the call, and restored afterwards.  The macro
 * evaluates to the value returned by ioctl(dev, arg, cmd).
 *
 * The temporaries carry a bond_ioctl_ prefix so that caller arguments that
 * happen to be named "res" or "fs" are not captured by the macro's locals.
 */
#define IOCTL(dev, arg, cmd) ({					\
	int bond_ioctl_res;					\
	mm_segment_t bond_ioctl_fs = get_fs();			\
	set_fs(get_ds());					\
	bond_ioctl_res = ioctl(dev, arg, cmd);			\
	set_fs(bond_ioctl_fs);					\
	bond_ioctl_res; })
73
/**
 * bond_for_each_slave_from - iterate the slaves list from a starting point
 * @bond:	the bond holding this list.
 * @pos:	current slave (loop cursor, advanced through ->next).
 * @cnt:	counter for max number of moves
 * @start:	starting point.
 *
 * The body runs until @cnt reaches (bond)->slave_cnt, which is re-read on
 * every pass.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave_from(bond, pos, cnt, start)		\
	for ((cnt) = 0, (pos) = (start);			\
	     (cnt) < (bond)->slave_cnt;				\
	     (cnt)++, (pos) = (pos)->next)
87
/**
 * bond_for_each_slave_from_to - iterate the slaves list from start point to stop point
 * @bond:	the bond holding this list.
 * @pos:	current slave (loop cursor, advanced through ->next).
 * @cnt:	counter for max number of moves
 * @start:	start point.
 * @stop:	stop point.
 *
 * The loop ends as soon as @pos equals (stop)->next or @cnt reaches
 * (bond)->slave_cnt, whichever happens first.  Consequently the body does
 * not run at all when @start is already (stop)->next.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave_from_to(bond, pos, cnt, start, stop)	\
	for ((cnt) = 0, (pos) = (start);				\
	     (cnt) < (bond)->slave_cnt && (pos) != (stop)->next;	\
	     (cnt)++, (pos) = (pos)->next)
102
/**
 * bond_for_each_slave - iterate the slaves list from head
 * @bond:	the bond holding this list.
 * @pos:	current slave (loop cursor).
 * @cnt:	counter for max number of moves
 *
 * Shorthand for bond_for_each_slave_from() starting at (bond)->first_slave.
 *
 * Caller must hold bond->lock
 */
#define bond_for_each_slave(bond, pos, cnt)				\
	bond_for_each_slave_from(bond, pos, cnt, (bond)->first_slave)
113
114
115 #ifdef CONFIG_NET_POLL_CONTROLLER
116 extern atomic_t netpoll_block_tx;
117
block_netpoll_tx(void)118 static inline void block_netpoll_tx(void)
119 {
120 atomic_inc(&netpoll_block_tx);
121 }
122
unblock_netpoll_tx(void)123 static inline void unblock_netpoll_tx(void)
124 {
125 atomic_dec(&netpoll_block_tx);
126 }
127
is_netpoll_tx_blocked(struct net_device * dev)128 static inline int is_netpoll_tx_blocked(struct net_device *dev)
129 {
130 if (unlikely(netpoll_tx_running(dev)))
131 return atomic_read(&netpoll_block_tx);
132 return 0;
133 }
134 #else
/*
 * No-op variants used when CONFIG_NET_POLL_CONTROLLER is not set.
 *
 * These are static inline stubs rather than empty macros so that the
 * argument of is_netpoll_tx_blocked() is still type-checked, in line with
 * the other stubs in this header (e.g. bond_netpoll_send_skb()).
 */
struct net_device;

static inline void block_netpoll_tx(void)
{
}

static inline void unblock_netpoll_tx(void)
{
}

/* Always reports "not blocked". */
static inline int is_netpoll_tx_blocked(struct net_device *dev)
{
	return 0;
}
138 #endif
139
140 struct bond_params {
141 int mode;
142 int xmit_policy;
143 int miimon;
144 u8 num_peer_notif;
145 int arp_interval;
146 int arp_validate;
147 int use_carrier;
148 int fail_over_mac;
149 int updelay;
150 int downdelay;
151 int lacp_fast;
152 unsigned int min_links;
153 int ad_select;
154 char primary[IFNAMSIZ];
155 int primary_reselect;
156 __be32 arp_targets[BOND_MAX_ARP_TARGETS];
157 int tx_queues;
158 int all_slaves_active;
159 int resend_igmp;
160 };
161
/* One row of a parameter lookup table: a name string paired with an int. */
struct bond_parm_tbl {
	char	*modename;
	int	mode;
};

/* NOTE(review): presumably bounds the length of a modename - confirm at users. */
#define BOND_MAX_MODENAME_LEN	20
168
169 struct vlan_entry {
170 struct list_head vlan_list;
171 unsigned short vlan_id;
172 };
173
174 struct slave {
175 struct net_device *dev; /* first - useful for panic debug */
176 struct slave *next;
177 struct slave *prev;
178 struct bonding *bond; /* our master */
179 int delay;
180 unsigned long jiffies;
181 unsigned long last_arp_rx;
182 s8 link; /* one of BOND_LINK_XXXX */
183 s8 new_link;
184 u8 backup:1, /* indicates backup slave. Value corresponds with
185 BOND_STATE_ACTIVE and BOND_STATE_BACKUP */
186 inactive:1; /* indicates inactive slave */
187 u8 duplex;
188 u32 original_mtu;
189 u32 link_failure_count;
190 u32 speed;
191 u16 queue_id;
192 u8 perm_hwaddr[ETH_ALEN];
193 struct ad_slave_info ad_info; /* HUGE - better to dynamically alloc */
194 struct tlb_slave_info tlb_info;
195 #ifdef CONFIG_NET_POLL_CONTROLLER
196 struct netpoll *np;
197 #endif
198 };
199
/*
 * Link pseudo-state only used internally by monitors.
 *
 * Parenthesized so that the negative literal remains a single operand
 * wherever the macro is expanded.
 */
#define BOND_LINK_NOCHANGE (-1)
204
205 /*
206 * Here are the locking policies for the two bonding locks:
207 *
208 * 1) Get bond->lock when reading/writing slave list.
209 * 2) Get bond->curr_slave_lock when reading/writing bond->curr_active_slave.
210 * (It is unnecessary when the write-lock is put with bond->lock.)
211 * 3) When we lock with bond->curr_slave_lock, we must lock with bond->lock
212 * beforehand.
213 */
214 struct bonding {
215 struct net_device *dev; /* first - useful for panic debug */
216 struct slave *first_slave;
217 struct slave *curr_active_slave;
218 struct slave *current_arp_slave;
219 struct slave *primary_slave;
220 bool force_primary;
221 s32 slave_cnt; /* never change this value outside the attach/detach wrappers */
222 int (*recv_probe)(struct sk_buff *, struct bonding *,
223 struct slave *);
224 rwlock_t lock;
225 rwlock_t curr_slave_lock;
226 u8 send_peer_notif;
227 s8 setup_by_slave;
228 s8 igmp_retrans;
229 #ifdef CONFIG_PROC_FS
230 struct proc_dir_entry *proc_entry;
231 char proc_file_name[IFNAMSIZ];
232 #endif /* CONFIG_PROC_FS */
233 struct list_head bond_list;
234 struct netdev_hw_addr_list mc_list;
235 int (*xmit_hash_policy)(struct sk_buff *, int);
236 u16 rr_tx_counter;
237 struct ad_bond_info ad_info;
238 struct alb_bond_info alb_info;
239 struct bond_params params;
240 struct list_head vlan_list;
241 struct workqueue_struct *wq;
242 struct delayed_work mii_work;
243 struct delayed_work arp_work;
244 struct delayed_work alb_work;
245 struct delayed_work ad_work;
246 struct delayed_work mcast_work;
247 #ifdef CONFIG_DEBUG_FS
248 /* debugging suport via debugfs */
249 struct dentry *debug_dir;
250 #endif /* CONFIG_DEBUG_FS */
251 };
252
bond_vlan_used(struct bonding * bond)253 static inline bool bond_vlan_used(struct bonding *bond)
254 {
255 return !list_empty(&bond->vlan_list);
256 }
257
/*
 * bond_slave_get_rcu - fetch @dev's rx_handler_data as a struct slave *.
 *
 * The pointer is read through rcu_dereference() and cast to struct slave *.
 * NOTE(review): callers are presumably inside an RCU read-side section,
 * as rcu_dereference() is used - confirm at the call sites.
 *
 * @dev is parenthesized so that arguments such as &netdev or *pdev bind
 * to the member access as intended.
 */
#define bond_slave_get_rcu(dev) \
	((struct slave *) rcu_dereference((dev)->rx_handler_data))
260
261 /**
262 * Returns NULL if the net_device does not belong to any of the bond's slaves
263 *
264 * Caller must hold bond lock for read
265 */
bond_get_slave_by_dev(struct bonding * bond,struct net_device * slave_dev)266 static inline struct slave *bond_get_slave_by_dev(struct bonding *bond,
267 struct net_device *slave_dev)
268 {
269 struct slave *slave = NULL;
270 int i;
271
272 bond_for_each_slave(bond, slave, i) {
273 if (slave->dev == slave_dev) {
274 return slave;
275 }
276 }
277
278 return NULL;
279 }
280
bond_get_bond_by_slave(struct slave * slave)281 static inline struct bonding *bond_get_bond_by_slave(struct slave *slave)
282 {
283 if (!slave || !slave->dev->master) {
284 return NULL;
285 }
286
287 return netdev_priv(slave->dev->master);
288 }
289
bond_is_lb(const struct bonding * bond)290 static inline bool bond_is_lb(const struct bonding *bond)
291 {
292 return (bond->params.mode == BOND_MODE_TLB ||
293 bond->params.mode == BOND_MODE_ALB);
294 }
295
bond_set_active_slave(struct slave * slave)296 static inline void bond_set_active_slave(struct slave *slave)
297 {
298 slave->backup = 0;
299 }
300
bond_set_backup_slave(struct slave * slave)301 static inline void bond_set_backup_slave(struct slave *slave)
302 {
303 slave->backup = 1;
304 }
305
bond_slave_state(struct slave * slave)306 static inline int bond_slave_state(struct slave *slave)
307 {
308 return slave->backup;
309 }
310
/* bond_is_active_slave - true when bond_slave_state() of @slave is zero. */
static inline bool bond_is_active_slave(struct slave *slave)
{
	return bond_slave_state(slave) == 0;
}
315
/* BOND_PRI_RESELECT_* values. */
#define BOND_PRI_RESELECT_ALWAYS	0
#define BOND_PRI_RESELECT_BETTER	1
#define BOND_PRI_RESELECT_FAILURE	2

/* BOND_FOM_* values. */
#define BOND_FOM_NONE			0
#define BOND_FOM_ACTIVE			1
#define BOND_FOM_FOLLOW			2

/*
 * ARP validation bit mask: one bit per slave state, positioned at
 * (1 << BOND_STATE_xxx).
 */
#define BOND_ARP_VALIDATE_NONE		0
#define BOND_ARP_VALIDATE_ACTIVE	(1 << BOND_STATE_ACTIVE)
#define BOND_ARP_VALIDATE_BACKUP	(1 << BOND_STATE_BACKUP)
#define BOND_ARP_VALIDATE_ALL		\
	(BOND_ARP_VALIDATE_ACTIVE | BOND_ARP_VALIDATE_BACKUP)
329
slave_do_arp_validate(struct bonding * bond,struct slave * slave)330 static inline int slave_do_arp_validate(struct bonding *bond,
331 struct slave *slave)
332 {
333 return bond->params.arp_validate & (1 << bond_slave_state(slave));
334 }
335
slave_last_rx(struct bonding * bond,struct slave * slave)336 static inline unsigned long slave_last_rx(struct bonding *bond,
337 struct slave *slave)
338 {
339 if (slave_do_arp_validate(bond, slave))
340 return slave->last_arp_rx;
341
342 return slave->dev->last_rx;
343 }
344
#ifdef CONFIG_NET_POLL_CONTROLLER
/*
 * bond_netpoll_send_skb - hand @skb to netpoll_send_skb() using the
 * slave's netpoll instance; does nothing when slave->np is NULL.
 */
static inline void bond_netpoll_send_skb(const struct slave *slave,
					 struct sk_buff *skb)
{
	struct netpoll *netpoll = slave->np;

	if (!netpoll)
		return;

	netpoll_send_skb(netpoll, skb);
}
#else
/* No-op variant used when CONFIG_NET_POLL_CONTROLLER is not set. */
static inline void bond_netpoll_send_skb(const struct slave *slave,
					 struct sk_buff *skb)
{
}
#endif
360
bond_set_slave_inactive_flags(struct slave * slave)361 static inline void bond_set_slave_inactive_flags(struct slave *slave)
362 {
363 struct bonding *bond = netdev_priv(slave->dev->master);
364 if (!bond_is_lb(bond))
365 bond_set_backup_slave(slave);
366 if (!bond->params.all_slaves_active)
367 slave->inactive = 1;
368 }
369
bond_set_slave_active_flags(struct slave * slave)370 static inline void bond_set_slave_active_flags(struct slave *slave)
371 {
372 bond_set_active_slave(slave);
373 slave->inactive = 0;
374 }
375
bond_is_slave_inactive(struct slave * slave)376 static inline bool bond_is_slave_inactive(struct slave *slave)
377 {
378 return slave->inactive;
379 }
380
/*
 * bond_confirm_addr - run inet_confirm_addr() on @dev's in_device.
 *
 * The in_device is obtained with __in_dev_get_rcu() and used only inside
 * an rcu_read_lock()/rcu_read_unlock() pair.
 *
 * Returns the value of inet_confirm_addr(in_dev, @dst, @local,
 * RT_SCOPE_HOST), or 0 when @dev has no in_device.
 */
static inline __be32 bond_confirm_addr(struct net_device *dev, __be32 dst,
				       __be32 local)
{
	struct in_device *idev;
	__be32 confirmed = 0;

	rcu_read_lock();

	idev = __in_dev_get_rcu(dev);
	if (idev)
		confirmed = inet_confirm_addr(idev, dst, local, RT_SCOPE_HOST);

	rcu_read_unlock();

	return confirmed;
}
395
/* Forward declaration; the full definition appears later in this header. */
struct bond_net;

/* Functions implemented outside this header. */
struct vlan_entry *bond_next_vlan(struct bonding *bond,
				  struct vlan_entry *curr);
int bond_dev_queue_xmit(struct bonding *bond, struct sk_buff *skb,
			struct net_device *slave_dev);
int bond_create(struct net *net, const char *name);

/* sysfs */
int bond_create_sysfs(struct bond_net *net);
void bond_destroy_sysfs(struct bond_net *net);
void bond_prepare_sysfs_group(struct bonding *bond);
int bond_create_slave_symlinks(struct net_device *master,
			       struct net_device *slave);
void bond_destroy_slave_symlinks(struct net_device *master,
				 struct net_device *slave);

/* enslave / release */
int bond_enslave(struct net_device *bond_dev, struct net_device *slave_dev);
int bond_release(struct net_device *bond_dev, struct net_device *slave_dev);

/* work handlers (take a struct work_struct *) */
void bond_mii_monitor(struct work_struct *);
void bond_loadbalance_arp_mon(struct work_struct *);
void bond_activebackup_arp_mon(struct work_struct *);

/* mode and active-slave handling */
void bond_set_mode_ops(struct bonding *bond, int mode);
int bond_parse_parm(const char *mode_arg, const struct bond_parm_tbl *tbl);
void bond_select_active_slave(struct bonding *bond);
void bond_change_active_slave(struct bonding *bond, struct slave *new_active);

/* debugfs */
void bond_create_debugfs(void);
void bond_destroy_debugfs(void);
void bond_debug_register(struct bonding *bond);
void bond_debug_unregister(struct bonding *bond);
void bond_debug_reregister(struct bonding *bond);

const char *bond_mode_name(int mode);
421
422 struct bond_net {
423 struct net * net; /* Associated network namespace */
424 struct list_head dev_list;
425 #ifdef CONFIG_PROC_FS
426 struct proc_dir_entry * proc_dir;
427 #endif
428 struct class_attribute class_attr_bonding_masters;
429 };
430
/*
 * procfs helpers.  With CONFIG_PROC_FS they are only declared here and
 * implemented elsewhere; without it they are empty inline stubs, so
 * callers need no #ifdef of their own.
 */
#ifdef CONFIG_PROC_FS

void bond_create_proc_entry(struct bonding *bond);
void bond_remove_proc_entry(struct bonding *bond);
void bond_create_proc_dir(struct bond_net *bn);
void bond_destroy_proc_dir(struct bond_net *bn);

#else /* !CONFIG_PROC_FS */

static inline void bond_create_proc_entry(struct bonding *bond)
{
}

static inline void bond_remove_proc_entry(struct bonding *bond)
{
}

static inline void bond_create_proc_dir(struct bond_net *bn)
{
}

static inline void bond_destroy_proc_dir(struct bond_net *bn)
{
}

#endif /* CONFIG_PROC_FS */
453
bond_slave_has_mac(struct bonding * bond,const u8 * mac)454 static inline struct slave *bond_slave_has_mac(struct bonding *bond,
455 const u8 *mac)
456 {
457 int i = 0;
458 struct slave *tmp;
459
460 bond_for_each_slave(bond, tmp, i)
461 if (!compare_ether_addr_64bits(mac, tmp->dev->dev_addr))
462 return tmp;
463
464 return NULL;
465 }
466
467 /* exported from bond_main.c */
468 extern int bond_net_id;
469 extern const struct bond_parm_tbl bond_lacp_tbl[];
470 extern const struct bond_parm_tbl bond_mode_tbl[];
471 extern const struct bond_parm_tbl xmit_hashtype_tbl[];
472 extern const struct bond_parm_tbl arp_validate_tbl[];
473 extern const struct bond_parm_tbl fail_over_mac_tbl[];
474 extern const struct bond_parm_tbl pri_reselect_tbl[];
475 extern struct bond_parm_tbl ad_select_tbl[];
476
477 #endif /* _LINUX_BONDING_H */
478