2  * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
 
   4  * This program is free software; you can redistribute it and/or modify it
 
   5  * under the terms of the GNU General Public License as published by the
 
   6  * Free Software Foundation; either version 2 of the License, or
 
   7  * (at your option) any later version.
 
   9  * This program is distributed in the hope that it will be useful, but
 
  10  * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 
  11  * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 
  14  * You should have received a copy of the GNU General Public License along
 
  15  * with this program; if not, write to the Free Software Foundation, Inc.,
 
  16  * 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
  18  * The full GNU General Public License is included in this distribution in the
 
  19  * file called LICENSE.
 
  23 //#define BONDING_DEBUG 1
 
  25 #include <linux/skbuff.h>
 
  26 #include <linux/netdevice.h>
 
  27 #include <linux/etherdevice.h>
 
  28 #include <linux/pkt_sched.h>
 
  29 #include <linux/spinlock.h>
 
  30 #include <linux/slab.h>
 
  31 #include <linux/timer.h>
 
  33 #include <linux/ipv6.h>
 
  34 #include <linux/if_arp.h>
 
  35 #include <linux/if_ether.h>
 
  36 #include <linux/if_bonding.h>
 
  37 #include <linux/if_vlan.h>
 
  41 #include <asm/byteorder.h>
 
  /* Tunables for the ALB/TLB/RLB logic in this file: timer resolution,
   * rebalance and learning-packet intervals converted to timer ticks, hash
   * table sizes, NULL-index sentinels and burst sizes.
   * NOTE(review): RLB_UPDATE_DELAY and RLB_PROMISC_TIMEOUT expand to an
   * unparenthesized product (N*ALB_TIMER_TICKS_PER_SEC). The uses of
   * RLB_UPDATE_DELAY visible in this listing are plain assignments, so the
   * expansion is harmless there, but wrapping both in parentheses would be
   * safer - confirm against all users before changing.
   */
  46 #define ALB_TIMER_TICKS_PER_SEC     10  /* should be a divisor of HZ */
 
  47 #define BOND_TLB_REBALANCE_INTERVAL 10  /* In seconds, periodic re-balancing.
 
  48                                          * Used for division - never set
 
  51 #define BOND_ALB_LP_INTERVAL        1   /* In seconds, periodic send of
 
  52                                          * learning packets to the switch
 
  55 #define BOND_TLB_REBALANCE_TICKS (BOND_TLB_REBALANCE_INTERVAL \
 
  56                                   * ALB_TIMER_TICKS_PER_SEC)
 
  58 #define BOND_ALB_LP_TICKS (BOND_ALB_LP_INTERVAL \
 
  59                            * ALB_TIMER_TICKS_PER_SEC)
 
  61 #define TLB_HASH_TABLE_SIZE 256 /* The size of the clients hash table.
 
  62                                  * Note that this value MUST NOT be smaller
 
  63                                  * because the key hash table is BYTE wide !
 
  67 #define TLB_NULL_INDEX          0xffffffff
 
  68 #define MAX_LP_BURST            3
 
  71 #define RLB_HASH_TABLE_SIZE     256
 
  72 #define RLB_NULL_INDEX          0xffffffff
 
  73 #define RLB_UPDATE_DELAY        2*ALB_TIMER_TICKS_PER_SEC /* 2 seconds */
 
  74 #define RLB_ARP_BURST_SIZE      2
 
  75 #define RLB_UPDATE_RETRY        3       /* 3-ticks - must be smaller than the rlb
 
  76                                          * rebalance interval (5 min).
 
  78 /* RLB_PROMISC_TIMEOUT = 10 sec equals the time that the current slave is
 
  79  * promiscuous after failover
 
  81 #define RLB_PROMISC_TIMEOUT     10*ALB_TIMER_TICKS_PER_SEC
 
  /* mac_bcast: the all-ones (ff:ff:ff:ff:ff:ff) address; this file compares
   * client MAC addresses against it with memcmp().
   * alb_delta_in_ticks: HZ / ALB_TIMER_TICKS_PER_SEC - presumably the period
   * of one ALB timer tick in jiffies; its users are not visible here.
   */
  83 static const u8 mac_bcast[ETH_ALEN] = {0xff,0xff,0xff,0xff,0xff,0xff};
 
  84 static const int alb_delta_in_ticks = HZ / ALB_TIMER_TICKS_PER_SEC;
 
  91         u8 padding[ETH_ZLEN - ETH_HLEN];
 
  96         __be16  prot_addr_space;
 
 100         u8      mac_src[ETH_ALEN];      /* sender hardware address */
 
 101         __be32  ip_src;                 /* sender IP address */
 
 102         u8      mac_dst[ETH_ALEN];      /* target hardware address */
 
 103         __be32  ip_dst;                 /* target IP address */
 
 /* Return the network header of @skb reinterpreted as a struct arp_pkt.
  * No length or protocol check is visible here.
  */
 107 static inline struct arp_pkt *arp_pkt(const struct sk_buff *skb)
 
 109         return (struct arp_pkt *)skb_network_header(skb);
 
 112 /* Forward declaration */
 
 113 static void alb_send_learning_packets(struct slave *slave, u8 mac_addr[]);
 
 /* XOR-fold @hash_size bytes starting at @hash_start into a single u8.
  * The accumulator declaration and the return statement are not visible in
  * this listing.
  */
 115 static inline u8 _simple_hash(const u8 *hash_start, int hash_size)
 
 120         for (i = 0; i < hash_size; i++) {
 
 121                 hash ^= hash_start[i];
 
 127 /*********************** tlb specific functions ***************************/
 
 /* Acquire the tx hash table spinlock of @bond via spin_lock_bh(). */
 129 static inline void _lock_tx_hashtbl(struct bonding *bond)
 
 131         spin_lock_bh(&(BOND_ALB_INFO(bond).tx_hashtbl_lock));
 
 /* Release the tx hash table spinlock of @bond via spin_unlock_bh(). */
 134 static inline void _unlock_tx_hashtbl(struct bonding *bond)
 
 136         spin_unlock_bh(&(BOND_ALB_INFO(bond).tx_hashtbl_lock));
 
 139 /* Caller must hold tx_hashtbl lock */
 
 /* Reset one tx hash table entry: detach it from any slave (tx_slave NULL)
  * and from the per-slave index list (next/prev set to TLB_NULL_INDEX).
  * load_history is recomputed as 1 + tx_bytes / BOND_TLB_REBALANCE_INTERVAL;
  * the condition on @save_load that presumably guards this is not visible
  * in this listing.
  */
 140 static inline void tlb_init_table_entry(struct tlb_client_info *entry, int save_load)
 
 143                 entry->load_history = 1 + entry->tx_bytes /
 
 144                                       BOND_TLB_REBALANCE_INTERVAL;
 
 148         entry->tx_slave = NULL;
 
 149         entry->next = TLB_NULL_INDEX;
 
 150         entry->prev = TLB_NULL_INDEX;
 
 /* Reset the per-slave TLB state: zero load and an empty entry list
  * (head set to TLB_NULL_INDEX).
  */
 153 static inline void tlb_init_slave(struct slave *slave)
 
 155         SLAVE_TLB_INFO(slave).load = 0;
 
 156         SLAVE_TLB_INFO(slave).head = TLB_NULL_INDEX;
 
 159 /* Caller must hold bond lock for read */
 
 /* Detach every tx hash table entry currently assigned to @slave.
  * Under the tx hash table lock, walks the index list that starts at the
  * slave head, re-initializing each entry with tlb_init_table_entry() and
  * passing @save_load through, then resets the slave TLB info.
  * next_index is read before the entry is reset; the statement advancing
  * index is not visible in this listing.
  */
 160 static void tlb_clear_slave(struct bonding *bond, struct slave *slave, int save_load)
 
 162         struct tlb_client_info *tx_hash_table;
 
 165         _lock_tx_hashtbl(bond);
 
 167         /* clear slave from tx_hashtbl */
 
 168         tx_hash_table = BOND_ALB_INFO(bond).tx_hashtbl;
 
 170         index = SLAVE_TLB_INFO(slave).head;
 
 171         while (index != TLB_NULL_INDEX) {
 
 172                 u32 next_index = tx_hash_table[index].next;
 
 173                 tlb_init_table_entry(&tx_hash_table[index], save_load);
 
 177         tlb_init_slave(slave);
 
 179         _unlock_tx_hashtbl(bond);
 
 182 /* Must be called before starting the monitor timer */
 
 /* Set up the tx hash table of @bond.
  * Initializes the tx lock, allocates a zeroed table of TLB_HASH_TABLE_SIZE
  * entries with kzalloc(GFP_KERNEL) before the lock is taken, and logs an
  * error if the allocation fails (the failure test and return value are not
  * visible in this listing). On success the table is installed and every
  * entry is initialized with save_load = 1 while holding the tx lock.
  */
 183 static int tlb_initialize(struct bonding *bond)
 
 185         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 186         int size = TLB_HASH_TABLE_SIZE * sizeof(struct tlb_client_info);
 
 187         struct tlb_client_info *new_hashtbl;
 
 190         spin_lock_init(&(bond_info->tx_hashtbl_lock));
 
 192         new_hashtbl = kzalloc(size, GFP_KERNEL);
 
 194                 printk(KERN_ERR DRV_NAME
 
 195                        ": %s: Error: Failed to allocate TLB hash table\n",
 
 199         _lock_tx_hashtbl(bond);
 
 201         bond_info->tx_hashtbl = new_hashtbl;
 
 203         for (i = 0; i < TLB_HASH_TABLE_SIZE; i++) {
 
 204                 tlb_init_table_entry(&bond_info->tx_hashtbl[i], 1);
 
 207         _unlock_tx_hashtbl(bond);
 
 212 /* Must be called only after all slaves have been released */
 
 /* Free the tx hash table of @bond and clear the pointer, both done while
  * holding the tx hash table lock.
  */
 213 static void tlb_deinitialize(struct bonding *bond)
 
 215         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 217         _lock_tx_hashtbl(bond);
 
 219         kfree(bond_info->tx_hashtbl);
 
 220         bond_info->tx_hashtbl = NULL;
 
 222         _unlock_tx_hashtbl(bond);
 
 225 /* Caller must hold bond lock for read */
 
 /* Pick the slave with the largest gap between link speed and current load.
  * A first bond_for_each_slave() pass looks for a slave that satisfies
  * SLAVE_IS_OK(); a second pass starting from that slave compares the gap
  * of every other usable slave. The handling of the case where no slave is
  * usable and the return statement are not visible in this listing.
  * NOTE(review): the (s64) casts are applied after the shifts (speed << 20
  * and load << 3), so each shift is evaluated in the promoted type of the
  * field; if those fields are 32 bits or narrower the value can overflow
  * before it is widened - confirm the field types and consider casting
  * before shifting.
  */
 226 static struct slave *tlb_get_least_loaded_slave(struct bonding *bond)
 
 228         struct slave *slave, *least_loaded;
 
 232         /* Find the first enabled slave */
 
 233         bond_for_each_slave(bond, slave, i) {
 
 234                 if (SLAVE_IS_OK(slave)) {
 
 244         least_loaded = slave;
 
 245         max_gap = (s64)(slave->speed << 20) - /* Convert to Megabit per sec */
 
 246                         (s64)(SLAVE_TLB_INFO(slave).load << 3); /* Bytes to bits */
 
 248         /* Find the slave with the largest gap */
 
 249         bond_for_each_slave_from(bond, slave, i, least_loaded) {
 
 250                 if (SLAVE_IS_OK(slave)) {
 
 251                         s64 gap = (s64)(slave->speed << 20) -
 
 252                                         (s64)(SLAVE_TLB_INFO(slave).load << 3);
 
 254                                 least_loaded = slave;
 
 263 /* Caller must hold bond lock for read */
 
 /* Return the transmit slave for the flow that hashes to @hash_index and
  * account @skb_len bytes to that hash entry.
  * If the entry has no slave yet, the least loaded slave is chosen and the
  * entry is pushed at the head of that slave index list (next/prev/head are
  * updated). tx_bytes is only increased when a slave is assigned. Returns
  * the assigned slave, or NULL when none could be chosen.
  * All table accesses happen under the tx hash table lock.
  * NOTE(review): @hash_index indexes the table without a range check here;
  * assumes callers pass a value below TLB_HASH_TABLE_SIZE - TODO confirm.
  */
 264 static struct slave *tlb_choose_channel(struct bonding *bond, u32 hash_index, u32 skb_len)
 
 266         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 267         struct tlb_client_info *hash_table;
 
 268         struct slave *assigned_slave;
 
 270         _lock_tx_hashtbl(bond);
 
 272         hash_table = bond_info->tx_hashtbl;
 
 273         assigned_slave = hash_table[hash_index].tx_slave;
 
 274         if (!assigned_slave) {
 
 275                 assigned_slave = tlb_get_least_loaded_slave(bond);
 
 277                 if (assigned_slave) {
 
 278                         struct tlb_slave_info *slave_info =
 
 279                                 &(SLAVE_TLB_INFO(assigned_slave));
 
 280                         u32 next_index = slave_info->head;
 
 282                         hash_table[hash_index].tx_slave = assigned_slave;
 
 283                         hash_table[hash_index].next = next_index;
 
 284                         hash_table[hash_index].prev = TLB_NULL_INDEX;
 
 286                         if (next_index != TLB_NULL_INDEX) {
 
 287                                 hash_table[next_index].prev = hash_index;
 
 290                         slave_info->head = hash_index;
 
 292                                 hash_table[hash_index].load_history;
 
 296         if (assigned_slave) {
 
 297                 hash_table[hash_index].tx_bytes += skb_len;
 
 300         _unlock_tx_hashtbl(bond);
 
 302         return assigned_slave;
 
 305 /*********************** rlb specific functions ***************************/
 
 /* Acquire the rx hash table spinlock of @bond via spin_lock_bh(). */
 306 static inline void _lock_rx_hashtbl(struct bonding *bond)
 
 308         spin_lock_bh(&(BOND_ALB_INFO(bond).rx_hashtbl_lock));
 
 /* Release the rx hash table spinlock of @bond via spin_unlock_bh(). */
 311 static inline void _unlock_rx_hashtbl(struct bonding *bond)
 
 313         spin_unlock_bh(&(BOND_ALB_INFO(bond).rx_hashtbl_lock));
 
 316 /* when an ARP REPLY is received from a client update its info
 
 /* Refresh an rx hash table entry from a received ARP packet.
  * The entry is located by hashing the sender IP of @arp. When the entry is
  * assigned and its ip_src/ip_dst mirror the ARP target/sender addresses,
  * the sender MAC is copied into mac_dst and both the entry (ntt) and the
  * bond (rx_ntt) are flagged as needing a client update.
  * Runs entirely under the rx hash table lock.
  */
 319 static void rlb_update_entry_from_arp(struct bonding *bond, struct arp_pkt *arp)
 
 321         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 322         struct rlb_client_info *client_info;
 
 325         _lock_rx_hashtbl(bond);
 
 327         hash_index = _simple_hash((u8*)&(arp->ip_src), sizeof(arp->ip_src));
 
 328         client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 330         if ((client_info->assigned) &&
 
 331             (client_info->ip_src == arp->ip_dst) &&
 
 332             (client_info->ip_dst == arp->ip_src)) {
 
 333                 /* update the clients MAC address */
 
 334                 memcpy(client_info->mac_dst, arp->mac_src, ETH_ALEN);
 
 335                 client_info->ntt = 1;
 
 336                 bond_info->rx_ntt = 1;
 
 339         _unlock_rx_hashtbl(bond);
 
 /* ARP receive hook; rlb_initialize() installs it as the packet_type
  * handler for ETH_P_ARP on the bond device.
  * res starts as NET_RX_DROP and is set to NET_RX_SUCCESS once the packet
  * has passed the checks. The checks visible here are: device belongs to
  * init_net, device has IFF_MASTER set, and skb->len covers a full
  * struct arp_pkt. For an ARPOP_REPLY the rx hash table is updated via
  * rlb_update_entry_from_arp().
  * The bodies of the early-exit branches, the skb release and the return
  * statement are not visible in this listing.
  */
 342 static int rlb_arp_recv(struct sk_buff *skb, struct net_device *bond_dev, struct packet_type *ptype, struct net_device *orig_dev)
 
 344         struct bonding *bond = bond_dev->priv;
 
 345         struct arp_pkt *arp = (struct arp_pkt *)skb->data;
 
 346         int res = NET_RX_DROP;
 
 348         if (dev_net(bond_dev) != &init_net)
 
 351         if (!(bond_dev->flags & IFF_MASTER))
 
 355                 dprintk("Packet has no ARP data\n");
 
 359         if (skb->len < sizeof(struct arp_pkt)) {
 
 360                 dprintk("Packet is too small to be an ARP\n");
 
 364         if (arp->op_code == htons(ARPOP_REPLY)) {
 
 365                 /* update rx hash table for this ARP */
 
 366                 rlb_update_entry_from_arp(bond, arp);
 
 367                 dprintk("Server received an ARP Reply from client\n");
 
 370         res = NET_RX_SUCCESS;
 
 378 /* Caller must hold bond lock for read */
 
 /* Choose the slave that should receive traffic for the next client.
  * The scan starts at the remembered next_rx_slave, or at the first slave
  * of the bond when none is remembered. Only slaves passing SLAVE_IS_OK()
  * are considered, and a candidate with a higher speed replaces the current
  * choice. After a choice is made, next_rx_slave is moved to the successor
  * of the chosen slave so that later calls start from a different slave.
  * The first branch of the selection and the return statement are not
  * visible in this listing.
  */
 379 static struct slave *rlb_next_rx_slave(struct bonding *bond)
 
 381         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 382         struct slave *rx_slave, *slave, *start_at;
 
 385         if (bond_info->next_rx_slave) {
 
 386                 start_at = bond_info->next_rx_slave;
 
 388                 start_at = bond->first_slave;
 
 393         bond_for_each_slave_from(bond, slave, i, start_at) {
 
 394                 if (SLAVE_IS_OK(slave)) {
 
 397                         } else if (slave->speed > rx_slave->speed) {
 
 404                 bond_info->next_rx_slave = rx_slave->next;
 
 410 /* teach the switch the mac of a disabled slave
 
 411  * on the primary for fault tolerance
 
 413  * Caller must hold bond->curr_slave_lock for write or bond lock for write
 
 /* Advertise @addr through the current active slave.
  * When there is no current active slave the function takes an early
  * branch whose body is not visible here (presumably a return). Otherwise,
  * unless primary_is_promisc is already set, the active slave device is put
  * into promiscuous mode and primary_is_promisc records whether
  * dev_set_promiscuity() returned 0. The promiscuous timeout counter is
  * then reset and learning packets carrying @addr are sent on the active
  * slave.
  */
 415 static void rlb_teach_disabled_mac_on_primary(struct bonding *bond, u8 addr[])
 
 417         if (!bond->curr_active_slave) {
 
 421         if (!bond->alb_info.primary_is_promisc) {
 
 422                 if (!dev_set_promiscuity(bond->curr_active_slave->dev, 1))
 
 423                         bond->alb_info.primary_is_promisc = 1;
 
 425                         bond->alb_info.primary_is_promisc = 0;
 
 428         bond->alb_info.rlb_promisc_timeout_counter = 0;
 
 430         alb_send_learning_packets(bond->curr_active_slave, addr);
 
 433 /* slave being removed should not be active at this point
 
 435  * Caller must hold bond lock for read
 
 /* Move every rx hash table client off @slave.
  * Under the rx hash table lock, walks the list from rx_hashtbl_head; each
  * entry that points at @slave is reassigned to the slave returned by
  * rlb_next_rx_slave(), or to NULL when there is none. Reassigned entries
  * whose mac_dst is not the broadcast address are flagged ntt, the bond is
  * flagged rx_ntt and rlb_update_retry_counter is set (the assigned value
  * is not visible in this listing).
  * After the rx lock is dropped, curr_slave_lock is taken for write and,
  * if @slave is not the current active slave, its device address is taught
  * on the primary via rlb_teach_disabled_mac_on_primary().
  */
 437 static void rlb_clear_slave(struct bonding *bond, struct slave *slave)
 
 439         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 440         struct rlb_client_info *rx_hash_table;
 
 441         u32 index, next_index;
 
 443         /* clear slave from rx_hashtbl */
 
 444         _lock_rx_hashtbl(bond);
 
 446         rx_hash_table = bond_info->rx_hashtbl;
 
 447         index = bond_info->rx_hashtbl_head;
 
 448         for (; index != RLB_NULL_INDEX; index = next_index) {
 
 449                 next_index = rx_hash_table[index].next;
 
 450                 if (rx_hash_table[index].slave == slave) {
 
 451                         struct slave *assigned_slave = rlb_next_rx_slave(bond);
 
 453                         if (assigned_slave) {
 
 454                                 rx_hash_table[index].slave = assigned_slave;
 
 455                                 if (memcmp(rx_hash_table[index].mac_dst,
 
 456                                            mac_bcast, ETH_ALEN)) {
 
 457                                         bond_info->rx_hashtbl[index].ntt = 1;
 
 458                                         bond_info->rx_ntt = 1;
 
 459                                         /* A slave has been removed from the
 
 460                                          * table because it is either disabled
 
 461                                          * or being released. We must retry the
 
 462                                          * update to avoid clients from not
 
 463                                          * being updated & disconnecting when
 
 466                                         bond_info->rlb_update_retry_counter =
 
 469                         } else {  /* there is no active slave */
 
 470                                 rx_hash_table[index].slave = NULL;
 
 475         _unlock_rx_hashtbl(bond);
 
 477         write_lock_bh(&bond->curr_slave_lock);
 
 479         if (slave != bond->curr_active_slave) {
 
 480                 rlb_teach_disabled_mac_on_primary(bond, slave->dev->dev_addr);
 
 483         write_unlock_bh(&bond->curr_slave_lock);
 
 /* Send a burst of RLB_ARP_BURST_SIZE ARP replies for one client entry.
  * Each reply is built with arp_create(ARPOP_REPLY, ...) on the device of
  * the slave assigned to @client_info. An entry without a slave takes an
  * early branch whose body is not visible here. When the entry is tagged,
  * a VLAN tag with the entry vlan_id is inserted via vlan_put_tag().
  * Failure of either step is logged with printk(KERN_ERR).
  * The remaining arp_create() arguments and the transmit call are not
  * visible in this listing.
  */
 486 static void rlb_update_client(struct rlb_client_info *client_info)
 
 490         if (!client_info->slave) {
 
 494         for (i = 0; i < RLB_ARP_BURST_SIZE; i++) {
 
 497                 skb = arp_create(ARPOP_REPLY, ETH_P_ARP,
 
 499                                  client_info->slave->dev,
 
 501                                  client_info->mac_dst,
 
 502                                  client_info->slave->dev->dev_addr,
 
 503                                  client_info->mac_dst);
 
 505                         printk(KERN_ERR DRV_NAME
 
 506                                ": %s: Error: failed to create an ARP packet\n",
 
 507                                client_info->slave->dev->master->name);
 
 511                 skb->dev = client_info->slave->dev;
 
 513                 if (client_info->tag) {
 
 514                         skb = vlan_put_tag(skb, client_info->vlan_id);
 
 516                                 printk(KERN_ERR DRV_NAME
 
 517                                        ": %s: Error: failed to insert VLAN tag\n",
 
 518                                        client_info->slave->dev->master->name);
 
 527 /* sends ARP REPLIES that update the clients that need updating */
 
 /* Push pending updates to all clients in the rx hash table.
  * Under the rx hash table lock, walks the list from rx_hashtbl_head and
  * calls rlb_update_client() for every entry with ntt set. The ntt flag is
  * cleared only when rlb_update_retry_counter is 0, so entries stay pending
  * while retries remain. Finally rlb_update_delay_counter is re-armed to
  * RLB_UPDATE_DELAY.
  */
 528 static void rlb_update_rx_clients(struct bonding *bond)
 
 530         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 531         struct rlb_client_info *client_info;
 
 534         _lock_rx_hashtbl(bond);
 
 536         hash_index = bond_info->rx_hashtbl_head;
 
 537         for (; hash_index != RLB_NULL_INDEX; hash_index = client_info->next) {
 
 538                 client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 539                 if (client_info->ntt) {
 
 540                         rlb_update_client(client_info);
 
 541                         if (bond_info->rlb_update_retry_counter == 0) {
 
 542                                 client_info->ntt = 0;
 
 547         /* do not update the entries again untill this counter is zero so that
 
 548          * not to confuse the clients.
 
 550         bond_info->rlb_update_delay_counter = RLB_UPDATE_DELAY;
 
 552         _unlock_rx_hashtbl(bond);
 
 555 /* The slave was assigned a new mac address - update the clients */
 
 /* Mark the clients served by @slave as needing an update.
  * Under the rx hash table lock, every entry assigned to @slave whose
  * mac_dst is not the broadcast address gets ntt set. After the walk the
  * bond rx_ntt flag is set and rlb_update_retry_counter is loaded with
  * RLB_UPDATE_RETRY; the condition guarding those two assignments is not
  * visible in this listing.
  */
 556 static void rlb_req_update_slave_clients(struct bonding *bond, struct slave *slave)
 
 558         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 559         struct rlb_client_info *client_info;
 
 563         _lock_rx_hashtbl(bond);
 
 565         hash_index = bond_info->rx_hashtbl_head;
 
 566         for (; hash_index != RLB_NULL_INDEX; hash_index = client_info->next) {
 
 567                 client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 569                 if ((client_info->slave == slave) &&
 
 570                     memcmp(client_info->mac_dst, mac_bcast, ETH_ALEN)) {
 
 571                         client_info->ntt = 1;
 
 576         // update the team's flag only after the whole iteration
 
 578                 bond_info->rx_ntt = 1;
 
 580                 bond_info->rlb_update_retry_counter = RLB_UPDATE_RETRY;
 
 583         _unlock_rx_hashtbl(bond);
 
 586 /* mark all clients using src_ip to be updated */
 
 /* Flag for update every client that was recorded with source IP @src_ip.
  * Under the rx hash table lock, walks the list from rx_hashtbl_head. An
  * entry without a slave is reported with printk(KERN_ERR); the rest of
  * that branch is not visible in this listing. An entry gets ntt set (and
  * the bond gets rx_ntt set) when its ip_src equals @src_ip, the device
  * address of its slave differs from the bond device address, and its
  * mac_dst is not the broadcast address.
  */
 587 static void rlb_req_update_subnet_clients(struct bonding *bond, __be32 src_ip)
 
 589         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 590         struct rlb_client_info *client_info;
 
 593         _lock_rx_hashtbl(bond);
 
 595         hash_index = bond_info->rx_hashtbl_head;
 
 596         for (; hash_index != RLB_NULL_INDEX; hash_index = client_info->next) {
 
 597                 client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 599                 if (!client_info->slave) {
 
 600                         printk(KERN_ERR DRV_NAME
 
 601                                ": %s: Error: found a client with no channel in "
 
 602                                "the client's hash table\n",
 
 606                 /*update all clients using this src_ip, that are not assigned
 
 607                  * to the team's address (curr_active_slave) and have a known
 
 608                  * unicast mac address.
 
 610                 if ((client_info->ip_src == src_ip) &&
 
 611                     memcmp(client_info->slave->dev->dev_addr,
 
 612                            bond->dev->dev_addr, ETH_ALEN) &&
 
 613                     memcmp(client_info->mac_dst, mac_bcast, ETH_ALEN)) {
 
 614                         client_info->ntt = 1;
 
 615                         bond_info->rx_ntt = 1;
 
 619         _unlock_rx_hashtbl(bond);
 
 622 /* Caller must hold both bond and ptr locks for read */
 
 /* Select the slave that should receive traffic from the client addressed
  * by the ARP packet in @skb, creating or refreshing its rx hash entry.
  * The entry is indexed by a hash of the ARP target IP.
  *  - Entry already assigned to this (ip_src, ip_dst) pair: a non-broadcast
  *    target MAC refreshes mac_dst, and the recorded slave is returned
  *    directly when it is set.
  *  - Entry assigned to another client: if there is a current active slave
  *    and the entry is not already on it, the old client is moved there and
  *    notified through rlb_update_client().
  *  - Then a slave is taken from rlb_next_rx_slave(); when one is available
  *    the entry is filled from the ARP addresses, ntt is set for a unicast
  *    mac_dst and cleared otherwise, the VLAN id is recorded when the bond
  *    has VLANs and vlan_get_tag() succeeds, and a previously unassigned
  *    entry is linked at the head of the rx list.
  * Returns the assigned slave, or NULL when none is available. All table
  * work is done under the rx hash table lock.
  * NOTE(review): the hash covers arp->ip_dst but its length is written as
  * sizeof(arp->ip_src). The ip_src and ip_dst fields visible earlier in
  * this file are both __be32, so the sizes match, but sizeof(arp->ip_dst)
  * would be the consistent spelling - confirm before changing.
  */
 623 static struct slave *rlb_choose_channel(struct sk_buff *skb, struct bonding *bond)
 
 625         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 626         struct arp_pkt *arp = arp_pkt(skb);
 
 627         struct slave *assigned_slave;
 
 628         struct rlb_client_info *client_info;
 
 631         _lock_rx_hashtbl(bond);
 
 633         hash_index = _simple_hash((u8 *)&arp->ip_dst, sizeof(arp->ip_src));
 
 634         client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 636         if (client_info->assigned) {
 
 637                 if ((client_info->ip_src == arp->ip_src) &&
 
 638                     (client_info->ip_dst == arp->ip_dst)) {
 
 639                         /* the entry is already assigned to this client */
 
 640                         if (memcmp(arp->mac_dst, mac_bcast, ETH_ALEN)) {
 
 641                                 /* update mac address from arp */
 
 642                                 memcpy(client_info->mac_dst, arp->mac_dst, ETH_ALEN);
 
 645                         assigned_slave = client_info->slave;
 
 646                         if (assigned_slave) {
 
 647                                 _unlock_rx_hashtbl(bond);
 
 648                                 return assigned_slave;
 
 651                         /* the entry is already assigned to some other client,
 
 652                          * move the old client to primary (curr_active_slave) so
 
 653                          * that the new client can be assigned to this entry.
 
 655                         if (bond->curr_active_slave &&
 
 656                             client_info->slave != bond->curr_active_slave) {
 
 657                                 client_info->slave = bond->curr_active_slave;
 
 658                                 rlb_update_client(client_info);
 
 662         /* assign a new slave */
 
 663         assigned_slave = rlb_next_rx_slave(bond);
 
 665         if (assigned_slave) {
 
 666                 client_info->ip_src = arp->ip_src;
 
 667                 client_info->ip_dst = arp->ip_dst;
 
 668                 /* arp->mac_dst is broadcast for arp reqeusts.
 
 669                  * will be updated with clients actual unicast mac address
 
 670                  * upon receiving an arp reply.
 
 672                 memcpy(client_info->mac_dst, arp->mac_dst, ETH_ALEN);
 
 673                 client_info->slave = assigned_slave;
 
 675                 if (memcmp(client_info->mac_dst, mac_bcast, ETH_ALEN)) {
 
 676                         client_info->ntt = 1;
 
 677                         bond->alb_info.rx_ntt = 1;
 
 679                         client_info->ntt = 0;
 
 682                 if (!list_empty(&bond->vlan_list)) {
 
 683                         if (!vlan_get_tag(skb, &client_info->vlan_id))
 
 684                                 client_info->tag = 1;
 
 687                 if (!client_info->assigned) {
 
 688                         u32 prev_tbl_head = bond_info->rx_hashtbl_head;
 
 689                         bond_info->rx_hashtbl_head = hash_index;
 
 690                         client_info->next = prev_tbl_head;
 
 691                         if (prev_tbl_head != RLB_NULL_INDEX) {
 
 692                                 bond_info->rx_hashtbl[prev_tbl_head].prev =
 
 695                         client_info->assigned = 1;
 
 699         _unlock_rx_hashtbl(bond);
 
 701         return assigned_slave;
 
 704 /* chooses (and returns) transmit channel for arp reply
 
 705  * does not choose channel for other arp types since they are
 
 706  * sent on the curr_active_slave
 
 /* Transmit-side ARP handling for receive load balancing.
  * ARP reply: a slave is selected with rlb_choose_channel() and the ARP
  * sender MAC is overwritten with the device address of that slave (the
  * guard around the memcpy is not visible in this listing).
  * ARP request: rlb_choose_channel() is called only for its side effect of
  * creating or refreshing the client entry, rlb_update_delay_counter is
  * re-armed to RLB_UPDATE_DELAY, and all clients recorded with the same
  * sender IP are marked for update.
  * tx_slave starts as NULL and is only assigned in the reply branch; the
  * return statement is not visible here.
  */
 708 static struct slave *rlb_arp_xmit(struct sk_buff *skb, struct bonding *bond)
 
 710         struct arp_pkt *arp = arp_pkt(skb);
 
 711         struct slave *tx_slave = NULL;
 
 713         if (arp->op_code == __constant_htons(ARPOP_REPLY)) {
 
 714                 /* the arp must be sent on the selected
 
 717                 tx_slave = rlb_choose_channel(skb, bond);
 
 719                         memcpy(arp->mac_src,tx_slave->dev->dev_addr, ETH_ALEN);
 
 721                 dprintk("Server sent ARP Reply packet\n");
 
 722         } else if (arp->op_code == __constant_htons(ARPOP_REQUEST)) {
 
 723                 /* Create an entry in the rx_hashtbl for this client as a
 
 725                  * When the arp reply is received the entry will be updated
 
 726                  * with the correct unicast address of the client.
 
 728                 rlb_choose_channel(skb, bond);
 
 730                 /* The ARP relpy packets must be delayed so that
 
 731                  * they can cancel out the influence of the ARP request.
 
 733                 bond->alb_info.rlb_update_delay_counter = RLB_UPDATE_DELAY;
 
 735                 /* arp requests are broadcast and are sent on the primary
 
 736                  * the arp request will collapse all clients on the subnet to
 
 737                  * the primary slave. We must register these clients to be
 
 738                  * updated with their assigned mac.
 
 740                 rlb_req_update_subnet_clients(bond, arp->ip_src);
 
 741                 dprintk("Server sent ARP Request packet\n");
 
 747 /* Caller must hold bond lock for read */
 
 /* Redistribute the rx hash table clients across the slaves.
  * Under the rx hash table lock, walks the list from rx_hashtbl_head; for
  * each entry a slave is requested from rlb_next_rx_slave() and, when one
  * is returned that differs from the current slave of the entry, the entry
  * is moved to it and flagged ntt. The bond rx_ntt flag is set after the
  * walk; the condition guarding it is not visible in this listing.
  */
 748 static void rlb_rebalance(struct bonding *bond)
 
 750         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 751         struct slave *assigned_slave;
 
 752         struct rlb_client_info *client_info;
 
 756         _lock_rx_hashtbl(bond);
 
 759         hash_index = bond_info->rx_hashtbl_head;
 
 760         for (; hash_index != RLB_NULL_INDEX; hash_index = client_info->next) {
 
 761                 client_info = &(bond_info->rx_hashtbl[hash_index]);
 
 762                 assigned_slave = rlb_next_rx_slave(bond);
 
 763                 if (assigned_slave && (client_info->slave != assigned_slave)) {
 
 764                         client_info->slave = assigned_slave;
 
 765                         client_info->ntt = 1;
 
 770         /* update the team's flag only after the whole iteration */
 
 772                 bond_info->rx_ntt = 1;
 
 774         _unlock_rx_hashtbl(bond);
 
 777 /* Caller must hold rx_hashtbl lock */
 
 /* Reset one rx hash table entry: zero the whole structure with memset(),
  * then mark it unlinked by setting next and prev to RLB_NULL_INDEX.
  */
 778 static void rlb_init_table_entry(struct rlb_client_info *entry)
 
 780         memset(entry, 0, sizeof(struct rlb_client_info));
 
 781         entry->next = RLB_NULL_INDEX;
 
 782         entry->prev = RLB_NULL_INDEX;
 
 /* Set up receive load balancing state for @bond.
  * Initializes the rx lock and allocates a table of RLB_HASH_TABLE_SIZE
  * entries with kmalloc(GFP_KERNEL); the memory is not zeroed by the
  * allocator, every entry is instead reset by rlb_init_table_entry() under
  * the rx lock after the table is installed and the list head is emptied.
  * An allocation failure is logged (the failure test and return value are
  * not visible in this listing).
  * Finally the packet_type embedded in the bond info is filled in for
  * ETH_P_ARP on the bond device with rlb_arp_recv as handler and
  * registered with dev_add_pack().
  */
 785 static int rlb_initialize(struct bonding *bond)
 
 787         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 788         struct packet_type *pk_type = &(BOND_ALB_INFO(bond).rlb_pkt_type);
 
 789         struct rlb_client_info  *new_hashtbl;
 
 790         int size = RLB_HASH_TABLE_SIZE * sizeof(struct rlb_client_info);
 
 793         spin_lock_init(&(bond_info->rx_hashtbl_lock));
 
 795         new_hashtbl = kmalloc(size, GFP_KERNEL);
 
 797                 printk(KERN_ERR DRV_NAME
 
 798                        ": %s: Error: Failed to allocate RLB hash table\n",
 
 802         _lock_rx_hashtbl(bond);
 
 804         bond_info->rx_hashtbl = new_hashtbl;
 
 806         bond_info->rx_hashtbl_head = RLB_NULL_INDEX;
 
 808         for (i = 0; i < RLB_HASH_TABLE_SIZE; i++) {
 
 809                 rlb_init_table_entry(bond_info->rx_hashtbl + i);
 
 812         _unlock_rx_hashtbl(bond);
 
 814         /*initialize packet type*/
 
 815         pk_type->type = __constant_htons(ETH_P_ARP);
 
 816         pk_type->dev = bond->dev;
 
 817         pk_type->func = rlb_arp_recv;
 
 819         /* register to receive ARPs */
 
 820         dev_add_pack(pk_type);
 
 /* Tear down receive load balancing state for @bond.
  * The ARP packet handler is unregistered with dev_remove_pack() first;
  * then, under the rx hash table lock, the table is freed, its pointer is
  * cleared and the list head is reset to RLB_NULL_INDEX.
  */
 825 static void rlb_deinitialize(struct bonding *bond)
 
 827         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 829         dev_remove_pack(&(bond_info->rlb_pkt_type));
 
 831         _lock_rx_hashtbl(bond);
 
 833         kfree(bond_info->rx_hashtbl);
 
 834         bond_info->rx_hashtbl = NULL;
 
 835         bond_info->rx_hashtbl_head = RLB_NULL_INDEX;
 
 837         _unlock_rx_hashtbl(bond);
 
 /* Drop every rx hash table client that is tagged with @vlan_id.
  * Under the rx hash table lock, walks the list from rx_hashtbl_head. A
  * matching entry is unlinked from the doubly linked index list (the head,
  * the next field of its predecessor and the prev field of its successor
  * are fixed up as needed) and then reset with rlb_init_table_entry().
  * next_index and prev_index are read before the entry is reset, so the
  * walk can continue from next_index afterwards.
  */
 840 static void rlb_clear_vlan(struct bonding *bond, unsigned short vlan_id)
 
 842         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
 845         _lock_rx_hashtbl(bond);
 
 847         curr_index = bond_info->rx_hashtbl_head;
 
 848         while (curr_index != RLB_NULL_INDEX) {
 
 849                 struct rlb_client_info *curr = &(bond_info->rx_hashtbl[curr_index]);
 
 850                 u32 next_index = bond_info->rx_hashtbl[curr_index].next;
 
 851                 u32 prev_index = bond_info->rx_hashtbl[curr_index].prev;
 
 853                 if (curr->tag && (curr->vlan_id == vlan_id)) {
 
 854                         if (curr_index == bond_info->rx_hashtbl_head) {
 
 855                                 bond_info->rx_hashtbl_head = next_index;
 
 857                         if (prev_index != RLB_NULL_INDEX) {
 
 858                                 bond_info->rx_hashtbl[prev_index].next = next_index;
 
 860                         if (next_index != RLB_NULL_INDEX) {
 
 861                                 bond_info->rx_hashtbl[next_index].prev = prev_index;
 
 864                         rlb_init_table_entry(curr);
 
 867                 curr_index = next_index;
 
 870         _unlock_rx_hashtbl(bond);
 
 873 /*********************** tlb/rlb shared functions *********************/
 
 /* Send a burst of MAX_LP_BURST learning packets for @mac_addr on @slave.
  * A struct learning_pkt template is built on the stack with @mac_addr as
  * both destination and source and ETH_P_LOOP as type; for each packet an
  * skb of that size is allocated with dev_alloc_skb(), filled from the
  * template and set up with TC_PRIO_CONTROL priority and the slave device.
  * When the bond has VLANs, the next VLAN after current_alb_vlan is picked
  * with bond_next_vlan(), remembered in current_alb_vlan, and its id is
  * inserted with vlan_put_tag(); a tagging failure is logged.
  * The allocation failure handling and the transmit call are not visible
  * in this listing.
  */
 875 static void alb_send_learning_packets(struct slave *slave, u8 mac_addr[])
 
 877         struct bonding *bond = bond_get_bond_by_slave(slave);
 
 878         struct learning_pkt pkt;
 
 879         int size = sizeof(struct learning_pkt);
 
 882         memset(&pkt, 0, size);
 
 883         memcpy(pkt.mac_dst, mac_addr, ETH_ALEN);
 
 884         memcpy(pkt.mac_src, mac_addr, ETH_ALEN);
 
 885         pkt.type = __constant_htons(ETH_P_LOOP);
 
 887         for (i = 0; i < MAX_LP_BURST; i++) {
 
 891                 skb = dev_alloc_skb(size);
 
 896                 data = skb_put(skb, size);
 
 897                 memcpy(data, &pkt, size);
 
 899                 skb_reset_mac_header(skb);
 
 900                 skb->network_header = skb->mac_header + ETH_HLEN;
 
 901                 skb->protocol = pkt.type;
 
 902                 skb->priority = TC_PRIO_CONTROL;
 
 903                 skb->dev = slave->dev;
 
 905                 if (!list_empty(&bond->vlan_list)) {
 
 906                         struct vlan_entry *vlan;
 
 908                         vlan = bond_next_vlan(bond,
 
 909                                               bond->alb_info.current_alb_vlan);
 
 911                         bond->alb_info.current_alb_vlan = vlan;
 
 917                         skb = vlan_put_tag(skb, vlan->vlan_id);
 
 919                                 printk(KERN_ERR DRV_NAME
 
 920                                        ": %s: Error: failed to insert VLAN tag\n",
 
 930 /* hw is a boolean parameter that determines whether we should try and
 
 931  * set the hw address of the device as well as the hw address of the
 
 /* Assign the MAC address @addr to the device of @slave.
  * Two paths are visible: a direct memcpy() into dev->dev_addr, and a
  * dev_set_mac_address() call with a sockaddr built from @addr and
  * dev->type. The test on @hw that selects between them is not visible in
  * this listing. A dev_set_mac_address() failure is logged with
  * printk(KERN_ERR); the return values are not visible either.
  * NOTE(review): dev->addr_len bytes are copied into s_addr.sa_data; this
  * assumes addr_len never exceeds the capacity of sa_data - TODO confirm
  * for every device type that can be enslaved in this mode.
  */
 934 static int alb_set_slave_mac_addr(struct slave *slave, u8 addr[], int hw)
 
 936         struct net_device *dev = slave->dev;
 
 937         struct sockaddr s_addr;
 
 940                 memcpy(dev->dev_addr, addr, dev->addr_len);
 
 944         /* for rlb each slave must have a unique hw mac addresses so that */
 
 945         /* each slave will receive packets destined to a different mac */
 
 946         memcpy(s_addr.sa_data, addr, dev->addr_len);
 
 947         s_addr.sa_family = dev->type;
 
 948         if (dev_set_mac_address(dev, &s_addr)) {
 
 949                 printk(KERN_ERR DRV_NAME
 
 950                        ": %s: Error: dev_set_mac_address of dev %s failed! ALB "
 
 951                        "mode requires that the base driver support setting "
 
 952                        "the hw address also when the network device's "
 
 953                        "interface is open\n",
 
 954                        dev->master->name, dev->name);
 
 961  * Swap MAC addresses between two slaves.
 
 963  * Called with RTNL held, and no other locks.
 
 /* Exchange the device addresses of @slave1 and @slave2.
  * The address of @slave1 is saved in a temporary buffer, @slave1 receives
  * the address of @slave2, and @slave2 receives the saved address. The hw
  * argument of both alb_set_slave_mac_addr() calls is rlb_enabled. The
  * return values of those calls are not checked in the visible lines.
  */
 967 static void alb_swap_mac_addr(struct bonding *bond, struct slave *slave1, struct slave *slave2)
 
 969         u8 tmp_mac_addr[ETH_ALEN];
 
 971         memcpy(tmp_mac_addr, slave1->dev->dev_addr, ETH_ALEN);
 
 972         alb_set_slave_mac_addr(slave1, slave2->dev->dev_addr, bond->alb_info.rlb_enabled);
 
 973         alb_set_slave_mac_addr(slave2, tmp_mac_addr, bond->alb_info.rlb_enabled);
 
 978  * Send learning packets after MAC address swap.
 
 980  * Called with RTNL and no other locks
 
 982 static void alb_fasten_mac_swap(struct bonding *bond, struct slave *slave1,
 
 983                                 struct slave *slave2)
 
 985         int slaves_state_differ = (SLAVE_IS_OK(slave1) != SLAVE_IS_OK(slave2));
 
 986         struct slave *disabled_slave = NULL;
 
 990         /* fasten the change in the switch */
 
 991         if (SLAVE_IS_OK(slave1)) {
 
 992                 alb_send_learning_packets(slave1, slave1->dev->dev_addr);
 
 993                 if (bond->alb_info.rlb_enabled) {
 
 994                         /* inform the clients that the mac address
 
 997                         rlb_req_update_slave_clients(bond, slave1);
 
1000                 disabled_slave = slave1;
 
1003         if (SLAVE_IS_OK(slave2)) {
 
1004                 alb_send_learning_packets(slave2, slave2->dev->dev_addr);
 
1005                 if (bond->alb_info.rlb_enabled) {
 
1006                         /* inform the clients that the mac address
 
1009                         rlb_req_update_slave_clients(bond, slave2);
 
1012                 disabled_slave = slave2;
 
1015         if (bond->alb_info.rlb_enabled && slaves_state_differ) {
 
1016                 /* A disabled slave was assigned an active mac addr */
 
1017                 rlb_teach_disabled_mac_on_primary(bond,
 
1018                                                   disabled_slave->dev->dev_addr);
 
1023  * alb_change_hw_addr_on_detach
 
1024  * @bond: bonding we're working on
 
1025  * @slave: the slave that was just detached
 
1027  * We assume that @slave was already detached from the slave list.
 
1029  * If @slave's permanent hw address is different both from its current
 
1030  * address and from @bond's address, then somewhere in the bond there's
 
1031  * a slave that has @slave's permanent address as its current address.
 
1032  * We'll make sure that that slave no longer uses @slave's permanent address.
 
1034  * Caller must hold RTNL and no other locks
 
1036 static void alb_change_hw_addr_on_detach(struct bonding *bond, struct slave *slave)
 
1041         perm_curr_diff = memcmp(slave->perm_hwaddr,
 
1042                                 slave->dev->dev_addr,
 
1044         perm_bond_diff = memcmp(slave->perm_hwaddr,
 
1045                                 bond->dev->dev_addr,
 
1048         if (perm_curr_diff && perm_bond_diff) {
 
1049                 struct slave *tmp_slave;
 
1052                 bond_for_each_slave(bond, tmp_slave, i) {
 
1053                         if (!memcmp(slave->perm_hwaddr,
 
1054                                     tmp_slave->dev->dev_addr,
 
1062                         /* locking: needs RTNL and nothing else */
 
1063                         alb_swap_mac_addr(bond, slave, tmp_slave);
 
1064                         alb_fasten_mac_swap(bond, slave, tmp_slave);
 
1070  * alb_handle_addr_collision_on_attach
 
1071  * @bond: bonding we're working on
 
1072  * @slave: the slave that was just attached
 
1074  * checks uniqueness of slave's mac address and handles the case the
 
1075  * new slave uses the bond's mac address.
 
1077  * If the permanent hw address of @slave is @bond's hw address, we need to
 
1078  * find a different hw address to give @slave, that isn't in use by any other
 
1079  * slave in the bond. This address must be, of course, one of the permanent
 
1080  * addresses of the other slaves.
 
1082  * We go over the slave list, and for each slave there we compare its
 
1083  * permanent hw address with the current address of all the other slaves.
 
1084  * If no match was found, then we've found a slave with a permanent address
 
1085  * that isn't used by any other slave in the bond, so we can assign it to
 
1088  * assumption: this function is called before @slave is attached to the
 
1091  * caller must hold the bond lock for write since the mac addresses are compared
 
1092  * and may be swapped.
 
1094 static int alb_handle_addr_collision_on_attach(struct bonding *bond, struct slave *slave)
 
1096         struct slave *tmp_slave1, *tmp_slave2, *free_mac_slave;
 
1097         struct slave *has_bond_addr = bond->curr_active_slave;
 
1098         int i, j, found = 0;
 
1100         if (bond->slave_cnt == 0) {
 
1101                 /* this is the first slave */
 
1105         /* if slave's mac address differs from bond's mac address
 
1106          * check uniqueness of slave's mac address against the other
 
1107          * slaves in the bond.
 
1109         if (memcmp(slave->perm_hwaddr, bond->dev->dev_addr, ETH_ALEN)) {
 
1110                 bond_for_each_slave(bond, tmp_slave1, i) {
 
1111                         if (!memcmp(tmp_slave1->dev->dev_addr, slave->dev->dev_addr,
 
1121                 /* Try setting slave mac to bond address and fall-through
 
1122                    to code handling that situation below... */
 
1123                 alb_set_slave_mac_addr(slave, bond->dev->dev_addr,
 
1124                                        bond->alb_info.rlb_enabled);
 
1127         /* The slave's address is equal to the address of the bond.
 
1128          * Search for a spare address in the bond for this slave.
 
1130         free_mac_slave = NULL;
 
1132         bond_for_each_slave(bond, tmp_slave1, i) {
 
1134                 bond_for_each_slave(bond, tmp_slave2, j) {
 
1135                         if (!memcmp(tmp_slave1->perm_hwaddr,
 
1136                                     tmp_slave2->dev->dev_addr,
 
1144                         /* no slave has tmp_slave1's perm addr
 
1147                         free_mac_slave = tmp_slave1;
 
1151                 if (!has_bond_addr) {
 
1152                         if (!memcmp(tmp_slave1->dev->dev_addr,
 
1153                                     bond->dev->dev_addr,
 
1156                                 has_bond_addr = tmp_slave1;
 
1161         if (free_mac_slave) {
 
1162                 alb_set_slave_mac_addr(slave, free_mac_slave->perm_hwaddr,
 
1163                                        bond->alb_info.rlb_enabled);
 
1165                 printk(KERN_WARNING DRV_NAME
 
1166                        ": %s: Warning: the hw address of slave %s is in use by "
 
1167                        "the bond; giving it the hw address of %s\n",
 
1168                        bond->dev->name, slave->dev->name, free_mac_slave->dev->name);
 
1170         } else if (has_bond_addr) {
 
1171                 printk(KERN_ERR DRV_NAME
 
1172                        ": %s: Error: the hw address of slave %s is in use by the "
 
1173                        "bond; couldn't find a slave with a free hw address to "
 
1174                        "give it (this should not have happened)\n",
 
1175                        bond->dev->name, slave->dev->name);
 
1183  * alb_set_mac_address
 
1187  * In TLB mode all slaves are configured to the bond's hw address, but set
 
1188  * their dev_addr field to different addresses (based on their permanent hw
 
1191  * For each slave, this function sets the interface to the new address and then
 
1192  * changes its dev_addr field to its previous value.
 
1194  * Unwinding assumes bond's mac address has not yet changed.
 
1196 static int alb_set_mac_address(struct bonding *bond, void *addr)
 
1199         struct slave *slave, *stop_at;
 
1200         char tmp_addr[ETH_ALEN];
 
1204         if (bond->alb_info.rlb_enabled) {
 
1208         bond_for_each_slave(bond, slave, i) {
 
1209                 if (slave->dev->set_mac_address == NULL) {
 
1214                 /* save net_device's current hw address */
 
1215                 memcpy(tmp_addr, slave->dev->dev_addr, ETH_ALEN);
 
1217                 res = dev_set_mac_address(slave->dev, addr);
 
1219                 /* restore net_device's hw address */
 
1220                 memcpy(slave->dev->dev_addr, tmp_addr, ETH_ALEN);
 
1230         memcpy(sa.sa_data, bond->dev->dev_addr, bond->dev->addr_len);
 
1231         sa.sa_family = bond->dev->type;
 
1233         /* unwind from head to the slave that failed */
 
1235         bond_for_each_slave_from_to(bond, slave, i, bond->first_slave, stop_at) {
 
1236                 memcpy(tmp_addr, slave->dev->dev_addr, ETH_ALEN);
 
1237                 dev_set_mac_address(slave->dev, &sa);
 
1238                 memcpy(slave->dev->dev_addr, tmp_addr, ETH_ALEN);
 
1244 /************************ exported alb functions ************************/
 
1246 int bond_alb_initialize(struct bonding *bond, int rlb_enabled)
 
1250         res = tlb_initialize(bond);
 
1256                 bond->alb_info.rlb_enabled = 1;
 
1257                 /* initialize rlb */
 
1258                 res = rlb_initialize(bond);
 
1260                         tlb_deinitialize(bond);
 
1264                 bond->alb_info.rlb_enabled = 0;
 
1270 void bond_alb_deinitialize(struct bonding *bond)
 
1272         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
1274         tlb_deinitialize(bond);
 
1276         if (bond_info->rlb_enabled) {
 
1277                 rlb_deinitialize(bond);
 
1281 int bond_alb_xmit(struct sk_buff *skb, struct net_device *bond_dev)
 
1283         struct bonding *bond = bond_dev->priv;
 
1284         struct ethhdr *eth_data;
 
1285         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
1286         struct slave *tx_slave = NULL;
 
1287         static const __be32 ip_bcast = htonl(0xffffffff);
 
1289         int do_tx_balance = 1;
 
1291         const u8 *hash_start = NULL;
 
1294         skb_reset_mac_header(skb);
 
1295         eth_data = eth_hdr(skb);
 
1297         /* make sure that the curr_active_slave and the slaves list do
 
1298          * not change during tx
 
1300         read_lock(&bond->lock);
 
1301         read_lock(&bond->curr_slave_lock);
 
1303         if (!BOND_IS_OK(bond)) {
 
1307         switch (ntohs(skb->protocol)) {
 
1309                 const struct iphdr *iph = ip_hdr(skb);
 
1311                 if ((memcmp(eth_data->h_dest, mac_bcast, ETH_ALEN) == 0) ||
 
1312                     (iph->daddr == ip_bcast) ||
 
1313                     (iph->protocol == IPPROTO_IGMP)) {
 
1317                 hash_start = (char *)&(iph->daddr);
 
1318                 hash_size = sizeof(iph->daddr);
 
1322                 if (memcmp(eth_data->h_dest, mac_bcast, ETH_ALEN) == 0) {
 
1327                 hash_start = (char *)&(ipv6_hdr(skb)->daddr);
 
1328                 hash_size = sizeof(ipv6_hdr(skb)->daddr);
 
1331                 if (ipx_hdr(skb)->ipx_checksum != IPX_NO_CHECKSUM) {
 
1332                         /* something is wrong with this packet */
 
1337                 if (ipx_hdr(skb)->ipx_type != IPX_TYPE_NCP) {
 
1338                         /* The only protocol worth balancing in
 
1339                          * this family since it has an "ARP" like
 
1346                 hash_start = (char*)eth_data->h_dest;
 
1347                 hash_size = ETH_ALEN;
 
1351                 if (bond_info->rlb_enabled) {
 
1352                         tx_slave = rlb_arp_xmit(skb, bond);
 
1360         if (do_tx_balance) {
 
1361                 hash_index = _simple_hash(hash_start, hash_size);
 
1362                 tx_slave = tlb_choose_channel(bond, hash_index, skb->len);
 
1366                 /* unbalanced or unassigned, send through primary */
 
1367                 tx_slave = bond->curr_active_slave;
 
1368                 bond_info->unbalanced_load += skb->len;
 
1371         if (tx_slave && SLAVE_IS_OK(tx_slave)) {
 
1372                 if (tx_slave != bond->curr_active_slave) {
 
1373                         memcpy(eth_data->h_source,
 
1374                                tx_slave->dev->dev_addr,
 
1378                 res = bond_dev_queue_xmit(bond, skb, tx_slave->dev);
 
1381                         tlb_clear_slave(bond, tx_slave, 0);
 
1387                 /* no suitable interface, frame not sent */
 
1390         read_unlock(&bond->curr_slave_lock);
 
1391         read_unlock(&bond->lock);
 
1395 void bond_alb_monitor(struct work_struct *work)
 
1397         struct bonding *bond = container_of(work, struct bonding,
 
1399         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
1400         struct slave *slave;
 
1403         read_lock(&bond->lock);
 
1405         if (bond->kill_timers) {
 
1409         if (bond->slave_cnt == 0) {
 
1410                 bond_info->tx_rebalance_counter = 0;
 
1411                 bond_info->lp_counter = 0;
 
1415         bond_info->tx_rebalance_counter++;
 
1416         bond_info->lp_counter++;
 
1418         /* send learning packets */
 
1419         if (bond_info->lp_counter >= BOND_ALB_LP_TICKS) {
 
1420                 /* change of curr_active_slave involves swapping of mac addresses.
 
1421                  * in order to avoid this swapping from happening while
 
1422                  * sending the learning packets, the curr_slave_lock must be held for
 
1425                 read_lock(&bond->curr_slave_lock);
 
1427                 bond_for_each_slave(bond, slave, i) {
 
1428                         alb_send_learning_packets(slave, slave->dev->dev_addr);
 
1431                 read_unlock(&bond->curr_slave_lock);
 
1433                 bond_info->lp_counter = 0;
 
1436         /* rebalance tx traffic */
 
1437         if (bond_info->tx_rebalance_counter >= BOND_TLB_REBALANCE_TICKS) {
 
1439                 read_lock(&bond->curr_slave_lock);
 
1441                 bond_for_each_slave(bond, slave, i) {
 
1442                         tlb_clear_slave(bond, slave, 1);
 
1443                         if (slave == bond->curr_active_slave) {
 
1444                                 SLAVE_TLB_INFO(slave).load =
 
1445                                         bond_info->unbalanced_load /
 
1446                                                 BOND_TLB_REBALANCE_INTERVAL;
 
1447                                 bond_info->unbalanced_load = 0;
 
1451                 read_unlock(&bond->curr_slave_lock);
 
1453                 bond_info->tx_rebalance_counter = 0;
 
1456         /* handle rlb stuff */
 
1457         if (bond_info->rlb_enabled) {
 
1458                 if (bond_info->primary_is_promisc &&
 
1459                     (++bond_info->rlb_promisc_timeout_counter >= RLB_PROMISC_TIMEOUT)) {
 
1462                          * dev_set_promiscuity requires rtnl and
 
1465                         read_unlock(&bond->lock);
 
1468                         bond_info->rlb_promisc_timeout_counter = 0;
 
1470                         /* If the primary was set to promiscuous mode
 
1471                          * because a slave was disabled then
 
1472                          * it can now leave promiscuous mode.
 
1474                         dev_set_promiscuity(bond->curr_active_slave->dev, -1);
 
1475                         bond_info->primary_is_promisc = 0;
 
1478                         read_lock(&bond->lock);
 
1481                 if (bond_info->rlb_rebalance) {
 
1482                         bond_info->rlb_rebalance = 0;
 
1483                         rlb_rebalance(bond);
 
1486                 /* check if clients need updating */
 
1487                 if (bond_info->rx_ntt) {
 
1488                         if (bond_info->rlb_update_delay_counter) {
 
1489                                 --bond_info->rlb_update_delay_counter;
 
1491                                 rlb_update_rx_clients(bond);
 
1492                                 if (bond_info->rlb_update_retry_counter) {
 
1493                                         --bond_info->rlb_update_retry_counter;
 
1495                                         bond_info->rx_ntt = 0;
 
1502         queue_delayed_work(bond->wq, &bond->alb_work, alb_delta_in_ticks);
 
1504         read_unlock(&bond->lock);
 
1507 /* assumption: called before the slave is attached to the bond
 
1508  * and not locked by the bond lock
 
1510 int bond_alb_init_slave(struct bonding *bond, struct slave *slave)
 
1514         res = alb_set_slave_mac_addr(slave, slave->perm_hwaddr,
 
1515                                      bond->alb_info.rlb_enabled);
 
1520         /* caller must hold the bond lock for write since the mac addresses
 
1521          * are compared and may be swapped.
 
1523         read_lock(&bond->lock);
 
1525         res = alb_handle_addr_collision_on_attach(bond, slave);
 
1527         read_unlock(&bond->lock);
 
1533         tlb_init_slave(slave);
 
1535         /* order a rebalance ASAP */
 
1536         bond->alb_info.tx_rebalance_counter = BOND_TLB_REBALANCE_TICKS;
 
1538         if (bond->alb_info.rlb_enabled) {
 
1539                 bond->alb_info.rlb_rebalance = 1;
 
1546  * Remove slave from tlb and rlb hash tables, and fix up MAC addresses
 
1549  * Caller must hold RTNL and no other locks
 
1551 void bond_alb_deinit_slave(struct bonding *bond, struct slave *slave)
 
1553         if (bond->slave_cnt > 1) {
 
1554                 alb_change_hw_addr_on_detach(bond, slave);
 
1557         tlb_clear_slave(bond, slave, 0);
 
1559         if (bond->alb_info.rlb_enabled) {
 
1560                 bond->alb_info.next_rx_slave = NULL;
 
1561                 rlb_clear_slave(bond, slave);
 
1565 /* Caller must hold bond lock for read */
 
1566 void bond_alb_handle_link_change(struct bonding *bond, struct slave *slave, char link)
 
1568         struct alb_bond_info *bond_info = &(BOND_ALB_INFO(bond));
 
1570         if (link == BOND_LINK_DOWN) {
 
1571                 tlb_clear_slave(bond, slave, 0);
 
1572                 if (bond->alb_info.rlb_enabled) {
 
1573                         rlb_clear_slave(bond, slave);
 
1575         } else if (link == BOND_LINK_UP) {
 
1576                 /* order a rebalance ASAP */
 
1577                 bond_info->tx_rebalance_counter = BOND_TLB_REBALANCE_TICKS;
 
1578                 if (bond->alb_info.rlb_enabled) {
 
1579                         bond->alb_info.rlb_rebalance = 1;
 
1580                         /* If the updelay module parameter is smaller than the
 
1581                          * forwarding delay of the switch the rebalance will
 
1582                          * not work because the rebalance arp replies will
 
1583                          * not be forwarded to the clients..
 
1590  * bond_alb_handle_active_change - assign new curr_active_slave
 
1591  * @bond: our bonding struct
 
1592  * @new_slave: new slave to assign
 
1594  * Set the bond->curr_active_slave to @new_slave and handle
 
1595  * mac address swapping and promiscuity changes as needed.
 
1597  * If new_slave is NULL, caller must hold curr_slave_lock or
 
1598  * bond->lock for write.
 
1600  * If new_slave is not NULL, caller must hold RTNL, bond->lock for
 
1601  * read and curr_slave_lock for write.  Processing here may sleep, so
 
1602  * no other locks may be held.
 
1604 void bond_alb_handle_active_change(struct bonding *bond, struct slave *new_slave)
 
1606         struct slave *swap_slave;
 
1609         if (bond->curr_active_slave == new_slave) {
 
1613         if (bond->curr_active_slave && bond->alb_info.primary_is_promisc) {
 
1614                 dev_set_promiscuity(bond->curr_active_slave->dev, -1);
 
1615                 bond->alb_info.primary_is_promisc = 0;
 
1616                 bond->alb_info.rlb_promisc_timeout_counter = 0;
 
1619         swap_slave = bond->curr_active_slave;
 
1620         bond->curr_active_slave = new_slave;
 
1622         if (!new_slave || (bond->slave_cnt == 0)) {
 
1626         /* set the new curr_active_slave to the bond's mac address
 
1627          * i.e. swap mac addresses of old curr_active_slave and new curr_active_slave
 
1630                 struct slave *tmp_slave;
 
1631                 /* find slave that is holding the bond's mac address */
 
1632                 bond_for_each_slave(bond, tmp_slave, i) {
 
1633                         if (!memcmp(tmp_slave->dev->dev_addr,
 
1634                                     bond->dev->dev_addr, ETH_ALEN)) {
 
1635                                 swap_slave = tmp_slave;
 
1642          * Arrange for swap_slave and new_slave to temporarily be
 
1643          * ignored so we can mess with their MAC addresses without
 
1644          * fear of interference from transmit activity.
 
1647                 tlb_clear_slave(bond, swap_slave, 1);
 
1649         tlb_clear_slave(bond, new_slave, 1);
 
1651         write_unlock_bh(&bond->curr_slave_lock);
 
1652         read_unlock(&bond->lock);
 
1656         /* curr_active_slave must be set before calling alb_swap_mac_addr */
 
1658                 /* swap mac address */
 
1659                 alb_swap_mac_addr(bond, swap_slave, new_slave);
 
1661                 /* set the new_slave to the bond mac address */
 
1662                 alb_set_slave_mac_addr(new_slave, bond->dev->dev_addr,
 
1663                                        bond->alb_info.rlb_enabled);
 
1667                 alb_fasten_mac_swap(bond, swap_slave, new_slave);
 
1668                 read_lock(&bond->lock);
 
1670                 read_lock(&bond->lock);
 
1671                 alb_send_learning_packets(new_slave, bond->dev->dev_addr);
 
1674         write_lock_bh(&bond->curr_slave_lock);
 
1680 int bond_alb_set_mac_address(struct net_device *bond_dev, void *addr)
 
1682         struct bonding *bond = bond_dev->priv;
 
1683         struct sockaddr *sa = addr;
 
1684         struct slave *slave, *swap_slave;
 
1688         if (!is_valid_ether_addr(sa->sa_data)) {
 
1689                 return -EADDRNOTAVAIL;
 
1692         res = alb_set_mac_address(bond, addr);
 
1697         memcpy(bond_dev->dev_addr, sa->sa_data, bond_dev->addr_len);
 
1699         /* If there is no curr_active_slave there is nothing else to do.
 
1700          * Otherwise we'll need to pass the new address to it and handle
 
1703         if (!bond->curr_active_slave) {
 
1709         bond_for_each_slave(bond, slave, i) {
 
1710                 if (!memcmp(slave->dev->dev_addr, bond_dev->dev_addr, ETH_ALEN)) {
 
1716         write_unlock_bh(&bond->curr_slave_lock);
 
1717         read_unlock(&bond->lock);
 
1720                 alb_swap_mac_addr(bond, swap_slave, bond->curr_active_slave);
 
1721                 alb_fasten_mac_swap(bond, swap_slave, bond->curr_active_slave);
 
1723                 alb_set_slave_mac_addr(bond->curr_active_slave, bond_dev->dev_addr,
 
1724                                        bond->alb_info.rlb_enabled);
 
1726                 alb_send_learning_packets(bond->curr_active_slave, bond_dev->dev_addr);
 
1727                 if (bond->alb_info.rlb_enabled) {
 
1728                         /* inform clients mac address has changed */
 
1729                         rlb_req_update_slave_clients(bond, bond->curr_active_slave);
 
1733         read_lock(&bond->lock);
 
1734         write_lock_bh(&bond->curr_slave_lock);
 
1739 void bond_alb_clear_vlan(struct bonding *bond, unsigned short vlan_id)
 
1741         if (bond->alb_info.current_alb_vlan &&
 
1742             (bond->alb_info.current_alb_vlan->vlan_id == vlan_id)) {
 
1743                 bond->alb_info.current_alb_vlan = NULL;
 
1746         if (bond->alb_info.rlb_enabled) {
 
1747                 rlb_clear_vlan(bond, vlan_id);