2 * Copyright (C) 2005 - 2009 ServerEngines
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License version 2
7 * as published by the Free Software Foundation. The full GNU General
8 * Public License is included in this distribution in the file called COPYING.
10 * Contact Information:
11 * linux-drivers@serverengines.com
14 * 209 N. Fair Oaks Ave
19 #include <asm/div64.h>
21 MODULE_VERSION(DRV_VER);
22 MODULE_DEVICE_TABLE(pci, be_dev_ids);
23 MODULE_DESCRIPTION(DRV_DESC " " DRV_VER);
24 MODULE_AUTHOR("ServerEngines Corporation");
25 MODULE_LICENSE("GPL");
27 static unsigned int rx_frag_size = 2048;
28 module_param(rx_frag_size, uint, S_IRUGO);
29 MODULE_PARM_DESC(rx_frag_size, "Size of a fragment that holds rcvd data.");
31 static DEFINE_PCI_DEVICE_TABLE(be_dev_ids) = {
32 { PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID1) },
33 { PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID1) },
34 { PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID2) },
37 MODULE_DEVICE_TABLE(pci, be_dev_ids);
/*
 * be_queue_free - release the DMA memory described by q->dma_mem.
 * @adapter: adapter whose PCI device (adapter->pdev) owns the mapping
 * @q: queue whose backing memory is released with pci_free_consistent()
 */
39 static void be_queue_free(struct be_adapter *adapter, struct be_queue_info *q)
41 struct be_dma_mem *mem = &q->dma_mem;
43 pci_free_consistent(adapter->pdev, mem->size,
/*
 * be_queue_alloc - initialise a queue descriptor and allocate its ring.
 * @adapter: adapter whose PCI device the DMA memory is allocated for
 * @q: queue descriptor; it is zeroed first, so previous contents are lost
 * @len: number of entries
 * @entry_size: size of one entry in bytes
 *
 * Allocates len * entry_size bytes with pci_alloc_consistent() and zeroes
 * the ring.  NOTE(review): the return statements are not part of this
 * excerpt; confirm the error convention against callers, which treat a
 * non-zero result as failure.
 */
47 static int be_queue_alloc(struct be_adapter *adapter, struct be_queue_info *q,
48 u16 len, u16 entry_size)
50 struct be_dma_mem *mem = &q->dma_mem;
52 memset(q, 0, sizeof(*q));
54 q->entry_size = entry_size;
55 mem->size = len * entry_size;
56 mem->va = pci_alloc_consistent(adapter->pdev, mem->size, &mem->dma);
59 memset(mem->va, 0, mem->size);
/*
 * be_intr_set - switch the host-interrupt enable bit on or off.
 * @ctrl: control block; the register lives at
 *        ctrl->pcicfg + PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET
 * @enable: requested state
 *
 * Reads the register, and sets or clears
 * MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK when the current state differs from
 * the requested one.  A warning carrying the register value is printed on
 * the remaining path.  NOTE(review): the write-back of the modified value
 * is not visible in this excerpt.
 */
63 static void be_intr_set(struct be_ctrl_info *ctrl, bool enable)
65 u8 __iomem *addr = ctrl->pcicfg + PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET;
66 u32 reg = ioread32(addr);
67 u32 enabled = reg & MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
68 if (!enabled && enable) {
69 reg |= MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
70 } else if (enabled && !enable) {
71 reg &= ~MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
73 printk(KERN_WARNING DRV_NAME
74 ": bad value in membar_int_ctrl reg=0x%x\n", reg);
/*
 * be_rxq_notify - ring the RX queue doorbell.
 * @ctrl: control block providing the doorbell area (ctrl->db)
 * @qid: ring id, masked with DB_RQ_RING_ID_MASK
 * @posted: number of newly posted buffers, placed at
 *          DB_RQ_NUM_POSTED_SHIFT (not masked here)
 */
80 static void be_rxq_notify(struct be_ctrl_info *ctrl, u16 qid, u16 posted)
83 val |= qid & DB_RQ_RING_ID_MASK;
84 val |= posted << DB_RQ_NUM_POSTED_SHIFT;
85 iowrite32(val, ctrl->db + DB_RQ_OFFSET);
/*
 * be_txq_notify - ring the TX queue doorbell.
 * @ctrl: control block providing the doorbell area (ctrl->db)
 * @qid: ring id, masked with DB_TXULP_RING_ID_MASK
 * @posted: number of WRBs posted, masked with DB_TXULP_NUM_POSTED_MASK
 *          before being shifted into place
 */
88 static void be_txq_notify(struct be_ctrl_info *ctrl, u16 qid, u16 posted)
91 val |= qid & DB_TXULP_RING_ID_MASK;
92 val |= (posted & DB_TXULP_NUM_POSTED_MASK) << DB_TXULP_NUM_POSTED_SHIFT;
93 iowrite32(val, ctrl->db + DB_TXULP1_OFFSET);
/*
 * be_eq_notify - ring the event queue doorbell.
 * @ctrl: control block providing the doorbell area (ctrl->db)
 * @qid: event queue id, masked with DB_EQ_RING_ID_MASK
 * @arm: request re-arming of the EQ
 * @clear_int: request clearing of the interrupt
 * @num_popped: number of event entries consumed
 *
 * The event bit (DB_EQ_EVNT_SHIFT) and the popped count are always part
 * of the value written.  NOTE(review): the conditions guarding the
 * REARM and CLR bits are not in this excerpt; presumably they test @arm
 * and @clear_int.
 */
96 static void be_eq_notify(struct be_ctrl_info *ctrl, u16 qid,
97 bool arm, bool clear_int, u16 num_popped)
100 val |= qid & DB_EQ_RING_ID_MASK;
102 val |= 1 << DB_EQ_REARM_SHIFT;
104 val |= 1 << DB_EQ_CLR_SHIFT;
105 val |= 1 << DB_EQ_EVNT_SHIFT;
106 val |= num_popped << DB_EQ_NUM_POPPED_SHIFT;
107 iowrite32(val, ctrl->db + DB_EQ_OFFSET);
/*
 * be_cq_notify - ring the completion queue doorbell.
 * @ctrl: control block providing the doorbell area (ctrl->db)
 * @qid: completion queue id, masked with DB_CQ_RING_ID_MASK
 * @arm: request re-arming of the CQ
 * @num_popped: number of completions consumed
 *
 * Not static: this is the only doorbell helper here with external linkage.
 * NOTE(review): the condition guarding the REARM bit is not in this
 * excerpt; presumably it tests @arm.
 */
110 void be_cq_notify(struct be_ctrl_info *ctrl, u16 qid,
111 bool arm, u16 num_popped)
114 val |= qid & DB_CQ_RING_ID_MASK;
116 val |= 1 << DB_CQ_REARM_SHIFT;
117 val |= num_popped << DB_CQ_NUM_POPPED_SHIFT;
118 iowrite32(val, ctrl->db + DB_CQ_OFFSET);
/*
 * be_mac_addr_set - change the interface MAC address.
 * @netdev: network device
 * @p: new address, interpreted as a struct sockaddr
 *
 * When the interface is running, a programmed MAC is removed with
 * be_cmd_pmac_del().  The new address is programmed with
 * be_cmd_pmac_add(), which stores the new id in adapter->pmac_id, and is
 * then copied into netdev->dev_addr.  NOTE(review): status checks and the
 * return value are not visible in this excerpt.
 */
122 static int be_mac_addr_set(struct net_device *netdev, void *p)
124 struct be_adapter *adapter = netdev_priv(netdev);
125 struct sockaddr *addr = p;
128 if (netif_running(netdev)) {
129 status = be_cmd_pmac_del(&adapter->ctrl, adapter->if_handle,
134 status = be_cmd_pmac_add(&adapter->ctrl, (u8 *)addr->sa_data,
135 adapter->if_handle, &adapter->pmac_id);
139 memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
/*
 * netdev_stats_update - refresh adapter->stats.net_stats from the hardware
 * statistics buffer (adapter->stats.cmd.va).
 *
 * Per-port counters are taken from rxf_stats->port[adapter->port_num].
 * Counters the hardware does not provide are set to 0.
 */
144 static void netdev_stats_update(struct be_adapter *adapter)
146 struct be_hw_stats *hw_stats = hw_stats_from_cmd(adapter->stats.cmd.va);
147 struct be_rxf_stats *rxf_stats = &hw_stats->rxf;
148 struct be_port_rxf_stats *port_stats =
149 &rxf_stats->port[adapter->port_num];
150 struct net_device_stats *dev_stats = &adapter->stats.net_stats;
151 struct be_erx_stats *erx_stats = &hw_stats->erx;
153 dev_stats->rx_packets = port_stats->rx_total_frames;
154 dev_stats->tx_packets = port_stats->tx_unicastframes +
155 port_stats->tx_multicastframes + port_stats->tx_broadcastframes;
156 dev_stats->rx_bytes = (u64) port_stats->rx_bytes_msd << 32 |
157 (u64) port_stats->rx_bytes_lsd;
158 dev_stats->tx_bytes = (u64) port_stats->tx_bytes_msd << 32 |
159 (u64) port_stats->tx_bytes_lsd;
161 /* bad pkts received */
162 dev_stats->rx_errors = port_stats->rx_crc_errors +
163 port_stats->rx_alignment_symbol_errors +
164 port_stats->rx_in_range_errors +
165 port_stats->rx_out_range_errors +
166 port_stats->rx_frame_too_long +
167 port_stats->rx_dropped_too_small +
168 port_stats->rx_dropped_too_short +
169 port_stats->rx_dropped_header_too_small +
170 port_stats->rx_dropped_tcp_length +
171 port_stats->rx_dropped_runt +
172 port_stats->rx_tcp_checksum_errs +
173 port_stats->rx_ip_checksum_errs +
174 port_stats->rx_udp_checksum_errs;
176 /* no space in linux buffers: best possible approximation */
177 dev_stats->rx_dropped = erx_stats->rx_drops_no_fragments[0];
179 /* detailed rx errors */
180 dev_stats->rx_length_errors = port_stats->rx_in_range_errors +
181 port_stats->rx_out_range_errors +
182 port_stats->rx_frame_too_long;
184 /* receive ring buffer overflow */
185 dev_stats->rx_over_errors = 0;
187 dev_stats->rx_crc_errors = port_stats->rx_crc_errors;
189 /* frame alignment errors */
190 dev_stats->rx_frame_errors = port_stats->rx_alignment_symbol_errors;
192 /* receiver fifo overrun */
193 /* drops_no_pbuf is not per i/f, it's per BE card */
194 dev_stats->rx_fifo_errors = port_stats->rx_fifo_overflow +
195 port_stats->rx_input_fifo_overflow +
196 rxf_stats->rx_drops_no_pbuf;
197 /* receiver missed packets */
198 dev_stats->rx_missed_errors = 0;
200 /* packet transmit problems */
201 dev_stats->tx_errors = 0;
203 /* no space available in linux */
204 dev_stats->tx_dropped = 0;
/*
 * NOTE(review): net_device_stats.multicast counts multicast packets
 * received, but it is fed from a transmit counter here; confirm whether
 * a receive-side multicast counter should be used instead.
 */
206 dev_stats->multicast = port_stats->tx_multicastframes;
207 dev_stats->collisions = 0;
209 /* detailed tx_errors */
210 dev_stats->tx_aborted_errors = 0;
211 dev_stats->tx_carrier_errors = 0;
212 dev_stats->tx_fifo_errors = 0;
213 dev_stats->tx_heartbeat_errors = 0;
214 dev_stats->tx_window_errors = 0;
/*
 * be_link_status_update - query the link and propagate up/down transitions.
 *
 * Queries the current link state with be_cmd_link_status_query() and
 * compares its speed with the cached adapter->link.  A transition is
 * recognised only when the speed changed and either the old or the new
 * speed is PHY_LINK_SPEED_ZERO.  Link down stops the TX queue and drops
 * the carrier; link up does the reverse.  Both cases are logged.
 */
217 static void be_link_status_update(struct be_adapter *adapter)
219 struct be_link_info *prev = &adapter->link;
220 struct be_link_info now = { 0 };
221 struct net_device *netdev = adapter->netdev;
223 be_cmd_link_status_query(&adapter->ctrl, &now);
225 /* If link came up or went down */
226 if (now.speed != prev->speed && (now.speed == PHY_LINK_SPEED_ZERO ||
227 prev->speed == PHY_LINK_SPEED_ZERO)) {
228 if (now.speed == PHY_LINK_SPEED_ZERO) {
229 netif_stop_queue(netdev);
230 netif_carrier_off(netdev);
231 printk(KERN_INFO "%s: Link down\n", netdev->name);
233 netif_start_queue(netdev);
234 netif_carrier_on(netdev);
235 printk(KERN_INFO "%s: Link up\n", netdev->name);
241 /* Update the EQ delay in BE based on the RX frags consumed / sec */
/*
 * Only acts when adaptive interrupt coalescing (rx_eq->enable_aic) is on.
 * A jiffies wrap-around just resets the reference timestamp.  At most once
 * per second the RX fragment rate is recomputed from the be_rx_frags
 * delta.  The new delay is derived from it (fps / 110000) and clamped to
 * [min_eqd, max_eqd].  be_cmd_modify_eqd() is issued only when the value
 * differs from cur_eqd, which is then updated.
 */
242 static void be_rx_eqd_update(struct be_adapter *adapter)
244 struct be_ctrl_info *ctrl = &adapter->ctrl;
245 struct be_eq_obj *rx_eq = &adapter->rx_eq;
246 struct be_drvr_stats *stats = &adapter->stats.drvr_stats;
250 if (!rx_eq->enable_aic)
254 if (time_before(now, stats->rx_fps_jiffies)) {
255 stats->rx_fps_jiffies = now;
259 /* Update once a second */
260 if ((now - stats->rx_fps_jiffies) < HZ)
263 stats->be_rx_fps = (stats->be_rx_frags - stats->be_prev_rx_frags) /
264 ((now - stats->rx_fps_jiffies) / HZ);
266 stats->rx_fps_jiffies = now;
267 stats->be_prev_rx_frags = stats->be_rx_frags;
268 eqd = stats->be_rx_fps / 110000;
270 if (eqd > rx_eq->max_eqd)
271 eqd = rx_eq->max_eqd;
272 if (eqd < rx_eq->min_eqd)
273 eqd = rx_eq->min_eqd;
276 if (eqd != rx_eq->cur_eqd)
277 be_cmd_modify_eqd(ctrl, rx_eq->q.id, eqd);
279 rx_eq->cur_eqd = eqd;
/*
 * be_get_stats - return the driver-maintained statistics block.
 * Returns a pointer to adapter->stats.net_stats; nothing is recomputed here.
 */
282 static struct net_device_stats *be_get_stats(struct net_device *dev)
284 struct be_adapter *adapter = netdev_priv(dev);
286 return &adapter->stats.net_stats;
289 static u32 be_calc_rate(u64 bytes, unsigned long ticks)
293 do_div(rate, ticks / HZ);
294 rate <<= 3; /* bytes/sec -> bits/sec */
295 do_div(rate, 1000000ul); /* MB/Sec */
/*
 * be_tx_rate_update - refresh the cached transmit rate (stats->be_tx_rate).
 *
 * A jiffies wrap-around only resets the reference timestamp.  Once more
 * than two seconds have passed, the rate is recomputed with be_calc_rate()
 * from the be_tx_bytes delta, and the reference timestamp and byte count
 * are advanced.
 */
300 static void be_tx_rate_update(struct be_adapter *adapter)
302 struct be_drvr_stats *stats = drvr_stats(adapter);
305 /* Wrapped around? */
306 if (time_before(now, stats->be_tx_jiffies)) {
307 stats->be_tx_jiffies = now;
311 /* Update tx rate once in two seconds */
312 if ((now - stats->be_tx_jiffies) > 2 * HZ) {
313 stats->be_tx_rate = be_calc_rate(stats->be_tx_bytes
314 - stats->be_tx_bytes_prev,
315 now - stats->be_tx_jiffies);
316 stats->be_tx_jiffies = now;
317 stats->be_tx_bytes_prev = stats->be_tx_bytes;
/*
 * be_tx_stats_update - account one transmit request in the driver stats.
 * @wrb_cnt: WRBs consumed, added to be_tx_wrbs
 * @copied: payload bytes queued, added to be_tx_bytes
 * @stopped: whether the TX queue was stopped for this request
 *
 * NOTE(review): the guard on the be_tx_stops increment is not visible in
 * this excerpt; presumably it tests @stopped.
 */
321 static void be_tx_stats_update(struct be_adapter *adapter,
322 u32 wrb_cnt, u32 copied, bool stopped)
324 struct be_drvr_stats *stats = drvr_stats(adapter);
326 stats->be_tx_wrbs += wrb_cnt;
327 stats->be_tx_bytes += copied;
329 stats->be_tx_stops++;
332 /* Determine number of WRB entries needed to xmit data in an skb */
/*
 * Starts with one WRB when the skb has linear data (len > data_len) and
 * adds one per page fragment.  Per the inline comments, a header WRB is
 * counted and a dummy is added to keep the total even; *dummy reports that
 * to the caller (those statements are not part of this excerpt).  The
 * total must not exceed BE_MAX_TX_FRAG_COUNT, otherwise BUG_ON fires.
 */
333 static u32 wrb_cnt_for_skb(struct sk_buff *skb, bool *dummy)
335 int cnt = (skb->len > skb->data_len);
337 cnt += skb_shinfo(skb)->nr_frags;
339 /* to account for hdr wrb */
342 /* add a dummy to make it an even num */
347 BUG_ON(cnt > BE_MAX_TX_FRAG_COUNT);
/*
 * wrb_fill - fill a TX fragment WRB.
 * @wrb: work request block to fill
 * @addr: 64-bit bus address of the fragment, split into hi/lo 32-bit halves
 * @len: fragment length, masked with ETH_WRB_FRAG_LEN_MASK
 */
351 static inline void wrb_fill(struct be_eth_wrb *wrb, u64 addr, int len)
353 wrb->frag_pa_hi = upper_32_bits(addr);
354 wrb->frag_pa_lo = addr & 0xFFFFFFFF;
355 wrb->frag_len = len & ETH_WRB_FRAG_LEN_MASK;
/*
 * wrb_fill_hdr - build the header WRB that precedes a packet's fragments.
 * @hdr: header WRB, zeroed first
 * @skb: packet being transmitted
 * @vlan: whether VLAN tag insertion may be requested
 * @wrb_cnt: total number of WRBs used by this request
 * @len: total packet length
 *
 * Always requests CRC, an event and a completion.  LSO (with the MSS from
 * gso_size) is requested for GSO packets with more than one segment;
 * otherwise TCP or UDP checksum offload is requested for
 * CHECKSUM_PARTIAL packets.  A VLAN tag is inserted only when @vlan is
 * set and the skb carries a tag.
 */
358 static void wrb_fill_hdr(struct be_eth_hdr_wrb *hdr, struct sk_buff *skb,
359 bool vlan, u32 wrb_cnt, u32 len)
361 memset(hdr, 0, sizeof(*hdr));
363 AMAP_SET_BITS(struct amap_eth_hdr_wrb, crc, hdr, 1);
365 if (skb_shinfo(skb)->gso_segs > 1 && skb_shinfo(skb)->gso_size) {
366 AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso, hdr, 1);
367 AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso_mss,
368 hdr, skb_shinfo(skb)->gso_size);
369 } else if (skb->ip_summed == CHECKSUM_PARTIAL) {
371 AMAP_SET_BITS(struct amap_eth_hdr_wrb, tcpcs, hdr, 1);
372 else if (is_udp_pkt(skb))
373 AMAP_SET_BITS(struct amap_eth_hdr_wrb, udpcs, hdr, 1);
376 if (vlan && vlan_tx_tag_present(skb)) {
377 AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan, hdr, 1);
378 AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan_tag,
379 hdr, vlan_tx_tag_get(skb));
382 AMAP_SET_BITS(struct amap_eth_hdr_wrb, event, hdr, 1);
383 AMAP_SET_BITS(struct amap_eth_hdr_wrb, complete, hdr, 1);
384 AMAP_SET_BITS(struct amap_eth_hdr_wrb, num_wrb, hdr, wrb_cnt);
385 AMAP_SET_BITS(struct amap_eth_hdr_wrb, len, hdr, len);
/*
 * make_tx_wrbs - place the WRBs for one skb on the TX queue.
 * @adapter: adapter owning the TX queue
 * @skb: packet to transmit
 * @wrb_cnt: number of WRBs reserved for the packet (added to txq->used)
 * @dummy_wrb: whether a padding WRB is required
 *
 * The header slot is taken first and filled last with wrb_fill_hdr(),
 * after all fragments are in place.  The linear part is mapped with
 * pci_map_single() and each page fragment with pci_map_page().  Every
 * WRB is converted to little-endian after filling.  The caller (be_xmit)
 * uses the return value as the number of bytes queued.
 * NOTE(review): no DMA-mapping error handling is visible in this excerpt.
 */
389 static int make_tx_wrbs(struct be_adapter *adapter,
390 struct sk_buff *skb, u32 wrb_cnt, bool dummy_wrb)
394 struct pci_dev *pdev = adapter->pdev;
395 struct sk_buff *first_skb = skb;
396 struct be_queue_info *txq = &adapter->tx_obj.q;
397 struct be_eth_wrb *wrb;
398 struct be_eth_hdr_wrb *hdr;
400 atomic_add(wrb_cnt, &txq->used);
401 hdr = queue_head_node(txq);
404 if (skb->len > skb->data_len) {
405 int len = skb->len - skb->data_len;
406 busaddr = pci_map_single(pdev, skb->data, len,
408 wrb = queue_head_node(txq);
409 wrb_fill(wrb, busaddr, len);
410 be_dws_cpu_to_le(wrb, sizeof(*wrb));
415 for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
416 struct skb_frag_struct *frag =
417 &skb_shinfo(skb)->frags[i];
418 busaddr = pci_map_page(pdev, frag->page,
420 frag->size, PCI_DMA_TODEVICE);
421 wrb = queue_head_node(txq);
422 wrb_fill(wrb, busaddr, frag->size);
423 be_dws_cpu_to_le(wrb, sizeof(*wrb));
425 copied += frag->size;
429 wrb = queue_head_node(txq);
431 be_dws_cpu_to_le(wrb, sizeof(*wrb));
435 wrb_fill_hdr(hdr, first_skb, adapter->vlan_grp ? true : false,
437 be_dws_cpu_to_le(hdr, sizeof(*hdr));
/*
 * be_xmit - transmit entry point for one skb.
 *
 * Computes the WRB count, builds the WRBs with make_tx_wrbs() and records
 * the skb in sent_skb_list at the queue head index sampled on entry.  That
 * slot must be empty (BUG_ON).  If fewer than BE_MAX_TX_FRAG_COUNT
 * free entries would remain, the netdev queue is stopped before the
 * doorbell is rung.  TX statistics are updated last.
 */
442 static int be_xmit(struct sk_buff *skb, struct net_device *netdev)
444 struct be_adapter *adapter = netdev_priv(netdev);
445 struct be_tx_obj *tx_obj = &adapter->tx_obj;
446 struct be_queue_info *txq = &tx_obj->q;
447 u32 wrb_cnt = 0, copied = 0;
448 u32 start = txq->head;
449 bool dummy_wrb, stopped = false;
451 wrb_cnt = wrb_cnt_for_skb(skb, &dummy_wrb);
453 copied = make_tx_wrbs(adapter, skb, wrb_cnt, dummy_wrb);
455 /* record the sent skb in the sent_skb table */
456 BUG_ON(tx_obj->sent_skb_list[start]);
457 tx_obj->sent_skb_list[start] = skb;
459 /* Ensure that txq has space for the next skb; Else stop the queue
460 * *BEFORE* ringing the tx doorbell, so that we serialze the
461 * tx compls of the current transmit which'll wake up the queue
463 if ((BE_MAX_TX_FRAG_COUNT + atomic_read(&txq->used)) >= txq->len) {
464 netif_stop_queue(netdev);
468 be_txq_notify(&adapter->ctrl, txq->id, wrb_cnt);
470 be_tx_stats_update(adapter, wrb_cnt, copied, stopped);
/*
 * be_change_mtu - validate and apply a new MTU.
 * @netdev: network device
 * @new_mtu: requested MTU; must lie in [BE_MIN_MTU, BE_MAX_JUMBO_FRAME_SIZE]
 *
 * An out-of-range request is reported via dev_info().  An accepted value
 * is logged and stored in netdev->mtu.  NOTE(review): the return
 * statements are not visible in this excerpt.
 */
474 static int be_change_mtu(struct net_device *netdev, int new_mtu)
476 struct be_adapter *adapter = netdev_priv(netdev);
477 if (new_mtu < BE_MIN_MTU ||
478 new_mtu > BE_MAX_JUMBO_FRAME_SIZE) {
479 dev_info(&adapter->pdev->dev,
480 "MTU must be between %d and %d bytes\n",
481 BE_MIN_MTU, BE_MAX_JUMBO_FRAME_SIZE);
484 dev_info(&adapter->pdev->dev, "MTU changed from %d to %d bytes\n",
485 netdev->mtu, new_mtu);
486 netdev->mtu = new_mtu;
491 * if there are BE_NUM_VLANS_SUPPORTED or lesser number of VLANS configured,
492 * program them in BE. If more than BE_NUM_VLANS_SUPPORTED are configured,
493 * set the BE in promiscuous VLAN mode.
/*
 * be_vid_config - push the VLAN filter configuration to the adapter.
 *
 * While adapter->num_vlans fits in BE_NUM_VLANS_SUPPORTED, every id
 * marked in adapter->vlan_tag[] is collected (little-endian) into a local
 * table and handed to be_cmd_vlan_config().  The second
 * be_cmd_vlan_config() call covers the other case.  The vtag[] table
 * holds only BE_NUM_VLANS_SUPPORTED entries, so num_vlans must stay
 * consistent with the marks in vlan_tag[].
 */
495 static void be_vid_config(struct net_device *netdev)
497 struct be_adapter *adapter = netdev_priv(netdev);
498 u16 vtag[BE_NUM_VLANS_SUPPORTED];
501 if (adapter->num_vlans <= BE_NUM_VLANS_SUPPORTED) {
502 /* Construct VLAN Table to give to HW */
503 for (i = 0; i < VLAN_GROUP_ARRAY_LEN; i++) {
504 if (adapter->vlan_tag[i]) {
505 vtag[ntags] = cpu_to_le16(i);
509 be_cmd_vlan_config(&adapter->ctrl, adapter->if_handle,
512 be_cmd_vlan_config(&adapter->ctrl, adapter->if_handle,
/*
 * be_vlan_register - install a new VLAN group on the adapter.
 *
 * Both event queues are notified with arm=false before adapter->vlan_grp
 * is replaced, and with arm=true afterwards.  Presumably this keeps event
 * processing from observing the pointer while it changes.
 */
517 static void be_vlan_register(struct net_device *netdev, struct vlan_group *grp)
519 struct be_adapter *adapter = netdev_priv(netdev);
520 struct be_eq_obj *rx_eq = &adapter->rx_eq;
521 struct be_eq_obj *tx_eq = &adapter->tx_eq;
522 struct be_ctrl_info *ctrl = &adapter->ctrl;
524 be_eq_notify(ctrl, rx_eq->q.id, false, false, 0);
525 be_eq_notify(ctrl, tx_eq->q.id, false, false, 0);
526 adapter->vlan_grp = grp;
527 be_eq_notify(ctrl, rx_eq->q.id, true, false, 0);
528 be_eq_notify(ctrl, tx_eq->q.id, true, false, 0);
/*
 * be_vlan_add_vid - start accepting VLAN id @vid.
 * Bumps num_vlans, marks the id in vlan_tag[] and reprograms the hardware
 * through be_vid_config().  The counter is incremented unconditionally,
 * so it is not checked here whether @vid was already marked.
 */
531 static void be_vlan_add_vid(struct net_device *netdev, u16 vid)
533 struct be_adapter *adapter = netdev_priv(netdev);
535 adapter->num_vlans++;
536 adapter->vlan_tag[vid] = 1;
538 be_vid_config(netdev);
/*
 * be_vlan_rem_vid - stop accepting VLAN id @vid.
 * Decrements num_vlans, clears the id in vlan_tag[], detaches the VLAN
 * device from the group and reprograms the hardware through
 * be_vid_config().  The counter is decremented unconditionally.
 */
541 static void be_vlan_rem_vid(struct net_device *netdev, u16 vid)
543 struct be_adapter *adapter = netdev_priv(netdev);
545 adapter->num_vlans--;
546 adapter->vlan_tag[vid] = 0;
548 vlan_group_set_device(adapter->vlan_grp, vid, NULL);
549 be_vid_config(netdev);
/*
 * be_set_multicast_filter - program the multicast MAC filter.
 *
 * With IFF_ALLMULTI set, the adapter is put in multicast-promiscuous mode
 * (NULL list, last argument true).  Otherwise addresses from
 * netdev->mc_list are copied into a local table of 32 entries and sent
 * with be_cmd_mcast_mac_set().
 * NOTE(review): the index handling that keeps `i` within the 32-entry
 * table is not part of this excerpt; verify the bound when touching the
 * loop.
 */
552 static void be_set_multicast_filter(struct net_device *netdev)
554 struct be_adapter *adapter = netdev_priv(netdev);
555 struct dev_mc_list *mc_ptr;
556 u8 mac_addr[32][ETH_ALEN];
559 if (netdev->flags & IFF_ALLMULTI) {
560 /* set BE in Multicast promiscuous */
561 be_cmd_mcast_mac_set(&adapter->ctrl,
562 adapter->if_handle, NULL, 0, true);
566 for (mc_ptr = netdev->mc_list; mc_ptr; mc_ptr = mc_ptr->next) {
567 memcpy(&mac_addr[i][0], mc_ptr->dmi_addr, ETH_ALEN);
569 be_cmd_mcast_mac_set(&adapter->ctrl,
570 adapter->if_handle, &mac_addr[0][0], i, false);
577 /* reset the promiscuous mode also. */
578 be_cmd_mcast_mac_set(&adapter->ctrl,
579 adapter->if_handle, &mac_addr[0][0], i, false);
/*
 * be_set_multicast_list - apply the netdev RX filtering flags.
 * IFF_PROMISC enables port promiscuous mode.  The other path disables it
 * and reprograms the multicast filter with be_set_multicast_filter().
 */
583 static void be_set_multicast_list(struct net_device *netdev)
585 struct be_adapter *adapter = netdev_priv(netdev);
587 if (netdev->flags & IFF_PROMISC) {
588 be_cmd_promiscuous_config(&adapter->ctrl, adapter->port_num, 1);
590 be_cmd_promiscuous_config(&adapter->ctrl, adapter->port_num, 0);
591 be_set_multicast_filter(netdev);
/*
 * be_rx_rate_update - refresh the cached receive rate (stats->be_rx_rate).
 *
 * A jiffies wrap-around only resets the reference timestamp.  Nothing is
 * recomputed until at least two seconds have passed.  Then the rate is
 * derived with be_calc_rate() from the be_rx_bytes delta, and the
 * reference values are advanced.
 */
595 static void be_rx_rate_update(struct be_adapter *adapter)
597 struct be_drvr_stats *stats = drvr_stats(adapter);
601 if (time_before(now, stats->be_rx_jiffies)) {
602 stats->be_rx_jiffies = now;
606 /* Update the rate once in two seconds */
607 if ((now - stats->be_rx_jiffies) < 2 * HZ)
610 stats->be_rx_rate = be_calc_rate(stats->be_rx_bytes
611 - stats->be_rx_bytes_prev,
612 now - stats->be_rx_jiffies);
613 stats->be_rx_jiffies = now;
614 stats->be_rx_bytes_prev = stats->be_rx_bytes;
/*
 * be_rx_stats_update - account one received completion in the driver stats.
 * @pktsize: bytes received, added to be_rx_bytes
 * @numfrags: fragments consumed, added to be_rx_frags
 */
617 static void be_rx_stats_update(struct be_adapter *adapter,
618 u32 pktsize, u16 numfrags)
620 struct be_drvr_stats *stats = drvr_stats(adapter);
622 stats->be_rx_compl++;
623 stats->be_rx_frags += numfrags;
624 stats->be_rx_bytes += pktsize;
/*
 * do_pkt_csum - decide whether the stack still has to verify checksums.
 * @rxcp: RX completion carrying the hardware checksum results
 * @cso: whether RX checksum offload is enabled
 *
 * Returns false only when offload is enabled and the completion reports
 * good L4 and IP checksums for a TCP or UDP packet with ip_version set.
 * Returns true in every other case, and the caller then marks the skb
 * CHECKSUM_NONE.
 */
627 static inline bool do_pkt_csum(struct be_eth_rx_compl *rxcp, bool cso)
629 u8 l4_cksm, ip_version, ipcksm, tcpf = 0, udpf = 0, ipv6_chk;
631 l4_cksm = AMAP_GET_BITS(struct amap_eth_rx_compl, l4_cksm, rxcp);
632 ipcksm = AMAP_GET_BITS(struct amap_eth_rx_compl, ipcksm, rxcp);
633 ip_version = AMAP_GET_BITS(struct amap_eth_rx_compl, ip_version, rxcp);
635 tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl, tcpf, rxcp);
636 udpf = AMAP_GET_BITS(struct amap_eth_rx_compl, udpf, rxcp);
638 ipv6_chk = (ip_version && (tcpf || udpf));
640 return ((l4_cksm && ipv6_chk && ipcksm) && cso) ? false : true;
/*
 * get_rx_page_info - claim the page-info entry for a consumed RX fragment.
 * @adapter: adapter owning the RX queue
 * @frag_idx: index into rx_obj.page_info_tbl
 *
 * The entry must have a page attached (BUG_ON otherwise).  When this
 * fragment is the last user of its big page, the whole page is DMA
 * unmapped.  The RX queue's used count is decremented.
 */
643 static struct be_rx_page_info *
644 get_rx_page_info(struct be_adapter *adapter, u16 frag_idx)
646 struct be_rx_page_info *rx_page_info;
647 struct be_queue_info *rxq = &adapter->rx_obj.q;
649 rx_page_info = &adapter->rx_obj.page_info_tbl[frag_idx];
650 BUG_ON(!rx_page_info->page);
652 if (rx_page_info->last_page_user)
653 pci_unmap_page(adapter->pdev, pci_unmap_addr(rx_page_info, bus),
654 adapter->big_page_size, PCI_DMA_FROMDEVICE);
656 atomic_dec(&rxq->used);
660 /* Throwaway the data in the Rx completion */
/*
 * Walks the numfrags fragments of the completion starting at fragndx.
 * For each one the page reference is dropped and the page-info entry is
 * cleared.  The index wraps at rxq->len.
 */
661 static void be_rx_compl_discard(struct be_adapter *adapter,
662 struct be_eth_rx_compl *rxcp)
664 struct be_queue_info *rxq = &adapter->rx_obj.q;
665 struct be_rx_page_info *page_info;
666 u16 rxq_idx, i, num_rcvd;
668 rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
669 num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
671 for (i = 0; i < num_rcvd; i++) {
672 page_info = get_rx_page_info(adapter, rxq_idx);
673 put_page(page_info->page);
674 memset(page_info, 0, sizeof(*page_info));
675 index_inc(&rxq_idx, rxq->len);
680 * skb_fill_rx_data forms a complete skb for an ether frame
683 static void skb_fill_rx_data(struct be_adapter *adapter,
684 struct sk_buff *skb, struct be_eth_rx_compl *rxcp)
686 struct be_queue_info *rxq = &adapter->rx_obj.q;
687 struct be_rx_page_info *page_info;
688 u16 rxq_idx, i, num_rcvd;
689 u32 pktsize, hdr_len, curr_frag_len;
692 rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
693 pktsize = AMAP_GET_BITS(struct amap_eth_rx_compl, pktsize, rxcp);
694 num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
696 page_info = get_rx_page_info(adapter, rxq_idx);
698 start = page_address(page_info->page) + page_info->page_offset;
701 /* Copy data in the first descriptor of this completion */
702 curr_frag_len = min(pktsize, rx_frag_size);
704 /* Copy the header portion into skb_data */
705 hdr_len = min((u32)BE_HDR_LEN, curr_frag_len);
706 memcpy(skb->data, start, hdr_len);
707 skb->len = curr_frag_len;
708 if (curr_frag_len <= BE_HDR_LEN) { /* tiny packet */
709 /* Complete packet has now been moved to data */
710 put_page(page_info->page);
712 skb->tail += curr_frag_len;
714 skb_shinfo(skb)->nr_frags = 1;
715 skb_shinfo(skb)->frags[0].page = page_info->page;
716 skb_shinfo(skb)->frags[0].page_offset =
717 page_info->page_offset + hdr_len;
718 skb_shinfo(skb)->frags[0].size = curr_frag_len - hdr_len;
719 skb->data_len = curr_frag_len - hdr_len;
720 skb->tail += hdr_len;
722 memset(page_info, 0, sizeof(*page_info));
724 if (pktsize <= rx_frag_size) {
725 BUG_ON(num_rcvd != 1);
729 /* More frags present for this completion */
730 pktsize -= curr_frag_len; /* account for above copied frag */
731 for (i = 1; i < num_rcvd; i++) {
732 index_inc(&rxq_idx, rxq->len);
733 page_info = get_rx_page_info(adapter, rxq_idx);
735 curr_frag_len = min(pktsize, rx_frag_size);
737 skb_shinfo(skb)->frags[i].page = page_info->page;
738 skb_shinfo(skb)->frags[i].page_offset = page_info->page_offset;
739 skb_shinfo(skb)->frags[i].size = curr_frag_len;
740 skb->len += curr_frag_len;
741 skb->data_len += curr_frag_len;
742 skb_shinfo(skb)->nr_frags++;
743 pktsize -= curr_frag_len;
745 memset(page_info, 0, sizeof(*page_info));
749 be_rx_stats_update(adapter, pktsize, num_rcvd);
753 /* Process the RX completion indicated by rxcp when LRO is disabled */
/*
 * Allocates a small skb (BE_HDR_LEN + NET_IP_ALIGN).  On allocation
 * failure a warning is logged and the completion's buffers are discarded.
 * Otherwise the skb is filled from the completion, its checksum state is
 * set from do_pkt_csum(), and truesize, protocol and dev are set.  The
 * frame is delivered through vlan_hwaccel_receive_skb() when a VLAN tag
 * is to be passed up, else through netif_receive_skb().  A VLAN group
 * with at least one configured VLAN is required for the tagged path.
 */
754 static void be_rx_compl_process(struct be_adapter *adapter,
755 struct be_eth_rx_compl *rxcp)
760 vtp = AMAP_GET_BITS(struct amap_eth_rx_compl, vtp, rxcp);
762 skb = netdev_alloc_skb(adapter->netdev, BE_HDR_LEN + NET_IP_ALIGN);
765 dev_warn(&adapter->pdev->dev, "skb alloc failed\n");
766 be_rx_compl_discard(adapter, rxcp);
770 skb_reserve(skb, NET_IP_ALIGN);
772 skb_fill_rx_data(adapter, skb, rxcp);
774 if (do_pkt_csum(rxcp, adapter->rx_csum))
775 skb->ip_summed = CHECKSUM_NONE;
777 skb->ip_summed = CHECKSUM_UNNECESSARY;
779 skb->truesize = skb->len + sizeof(struct sk_buff);
780 skb->protocol = eth_type_trans(skb, adapter->netdev);
781 skb->dev = adapter->netdev;
784 if (!adapter->vlan_grp || adapter->num_vlans == 0) {
788 vid = AMAP_GET_BITS(struct amap_eth_rx_compl, vlan_tag, rxcp);
789 vid = be16_to_cpu(vid);
790 vlan_hwaccel_receive_skb(skb, adapter->vlan_grp, vid);
792 netif_receive_skb(skb);
795 adapter->netdev->last_rx = jiffies;
800 /* Process the RX completion indicated by rxcp when LRO is enabled */
/*
 * Collects the completion's fragments into a local rx_frags[] array and
 * clears each page-info entry as it goes.  The frags are handed to the
 * LRO manager through lro_receive_frags(), or through
 * lro_vlan_hwaccel_receive_frags() for VLAN-tagged frames.  Statistics
 * are updated with the full pkt_size.
 * NOTE(review): num_rcvd comes from the completion and indexes rx_frags[]
 * (BE_MAX_FRAGS_PER_FRAME entries) with no bound check in the visible code.
 */
801 static void be_rx_compl_process_lro(struct be_adapter *adapter,
802 struct be_eth_rx_compl *rxcp)
804 struct be_rx_page_info *page_info;
805 struct skb_frag_struct rx_frags[BE_MAX_FRAGS_PER_FRAME];
806 struct be_queue_info *rxq = &adapter->rx_obj.q;
807 u32 num_rcvd, pkt_size, remaining, vlanf, curr_frag_len;
808 u16 i, rxq_idx = 0, vid;
810 num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
811 pkt_size = AMAP_GET_BITS(struct amap_eth_rx_compl, pktsize, rxcp);
812 vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl, vtp, rxcp);
813 rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
815 remaining = pkt_size;
816 for (i = 0; i < num_rcvd; i++) {
817 page_info = get_rx_page_info(adapter, rxq_idx);
819 curr_frag_len = min(remaining, rx_frag_size);
821 rx_frags[i].page = page_info->page;
822 rx_frags[i].page_offset = page_info->page_offset;
823 rx_frags[i].size = curr_frag_len;
824 remaining -= curr_frag_len;
826 index_inc(&rxq_idx, rxq->len);
828 memset(page_info, 0, sizeof(*page_info));
831 if (likely(!vlanf)) {
832 lro_receive_frags(&adapter->rx_obj.lro_mgr, rx_frags, pkt_size,
835 vid = AMAP_GET_BITS(struct amap_eth_rx_compl, vlan_tag, rxcp);
836 vid = be16_to_cpu(vid);
838 if (!adapter->vlan_grp || adapter->num_vlans == 0)
841 lro_vlan_hwaccel_receive_frags(&adapter->rx_obj.lro_mgr,
842 rx_frags, pkt_size, pkt_size, adapter->vlan_grp,
846 be_rx_stats_update(adapter, pkt_size, num_rcvd);
/*
 * be_rx_compl_get - fetch the next RX completion, if one is pending.
 *
 * Looks at the entry at the RX completion queue tail and tests the dword
 * holding the valid bit.  A pending entry is converted from little-endian
 * to CPU order and the CQ tail is advanced.  Callers treat a NULL return
 * as "no completion pending".
 */
850 static struct be_eth_rx_compl *be_rx_compl_get(struct be_adapter *adapter)
852 struct be_eth_rx_compl *rxcp = queue_tail_node(&adapter->rx_obj.cq);
854 if (rxcp->dw[offsetof(struct amap_eth_rx_compl, valid) / 32] == 0)
857 be_dws_le_to_cpu(rxcp, sizeof(*rxcp));
859 queue_tail_inc(&adapter->rx_obj.cq);
863 /* To reset the valid bit, we need to reset the whole word as
864 * when walking the queue the valid entries are little-endian
865 * and invalid entries are host endian
/*
 * be_rx_compl_reset - mark an RX completion entry as consumed by zeroing
 * the whole dword that contains its valid bit.
 */
867 static inline void be_rx_compl_reset(struct be_eth_rx_compl *rxcp)
869 rxcp->dw[offsetof(struct amap_eth_rx_compl, valid) / 32] = 0;
/*
 * be_alloc_pages - allocate pages covering at least @size bytes.
 * Uses GFP_ATOMIC and the order returned by get_order(size).
 * NOTE(review): the condition under which __GFP_COMP is added is not
 * visible in this excerpt.
 */
872 static inline struct page *be_alloc_pages(u32 size)
874 gfp_t alloc_flags = GFP_ATOMIC;
875 u32 order = get_order(size);
877 alloc_flags |= __GFP_COMP;
878 return alloc_pages(alloc_flags, order);
882 * Allocate a page, split it to fragments of size rx_frag_size and post as
883 * receive buffers to BE
/*
 * be_post_rx_frags - replenish the RX queue with receive fragments.
 *
 * Posts up to MAX_RX_POST fragments, stopping early at a slot whose
 * page-info entry is still occupied.  A big page of
 * adapter->big_page_size bytes is allocated and DMA mapped, then carved
 * into rx_frag_size pieces.  Each piece gets its own page-info entry and
 * RX descriptor.  The entry using the final piece of a page is flagged
 * last_page_user so that the mapping is released with it.  Afterwards the
 * posted count is added to rxq->used and the doorbell is rung.  If the
 * queue is completely empty instead, rx_post_starved is set so that the
 * worker retries later.  A page allocation failure bumps
 * be_ethrx_post_fail.
 */
885 static void be_post_rx_frags(struct be_adapter *adapter)
887 struct be_rx_page_info *page_info_tbl = adapter->rx_obj.page_info_tbl;
888 struct be_rx_page_info *page_info = NULL;
889 struct be_queue_info *rxq = &adapter->rx_obj.q;
890 struct page *pagep = NULL;
891 struct be_eth_rx_d *rxd;
892 u64 page_dmaaddr = 0, frag_dmaaddr;
893 u32 posted, page_offset = 0;
895 page_info = &page_info_tbl[rxq->head];
896 for (posted = 0; posted < MAX_RX_POST && !page_info->page; posted++) {
898 pagep = be_alloc_pages(adapter->big_page_size);
899 if (unlikely(!pagep)) {
900 drvr_stats(adapter)->be_ethrx_post_fail++;
903 page_dmaaddr = pci_map_page(adapter->pdev, pagep, 0,
904 adapter->big_page_size,
906 page_info->page_offset = 0;
909 page_info->page_offset = page_offset + rx_frag_size;
911 page_offset = page_info->page_offset;
912 page_info->page = pagep;
913 pci_unmap_addr_set(page_info, bus, page_dmaaddr);
914 frag_dmaaddr = page_dmaaddr + page_info->page_offset;
916 rxd = queue_head_node(rxq);
917 rxd->fragpa_lo = cpu_to_le32(frag_dmaaddr & 0xFFFFFFFF);
918 rxd->fragpa_hi = cpu_to_le32(upper_32_bits(frag_dmaaddr));
921 /* Any space left in the current big page for another frag? */
922 if ((page_offset + rx_frag_size + rx_frag_size) >
923 adapter->big_page_size) {
925 page_info->last_page_user = true;
927 page_info = &page_info_tbl[rxq->head];
930 page_info->last_page_user = true;
933 atomic_add(posted, &rxq->used);
934 be_rxq_notify(&adapter->ctrl, rxq->id, posted);
935 } else if (atomic_read(&rxq->used) == 0) {
936 /* Let be_worker replenish when memory is available */
937 adapter->rx_post_starved = true;
/*
 * be_tx_compl_get - fetch the next TX completion, if one is pending.
 *
 * Tests the dword holding the valid bit of the entry at the CQ tail.  A
 * pending entry is converted to CPU order, its valid dword is cleared so
 * that the slot reads as empty next time around, and the tail is advanced.
 */
943 static struct be_eth_tx_compl *be_tx_compl_get(struct be_queue_info *tx_cq)
945 struct be_eth_tx_compl *txcp = queue_tail_node(tx_cq);
947 if (txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] == 0)
950 be_dws_le_to_cpu(txcp, sizeof(*txcp));
952 txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] = 0;
954 queue_tail_inc(tx_cq);
/*
 * be_tx_compl_process - reclaim the WRBs of one completed transmit.
 * @adapter: adapter owning the TX queue
 * @last_index: queue index of the last WRB belonging to the request
 *
 * Takes the skb recorded at the current TX queue tail and clears its
 * slot in sent_skb_list.  It then walks the WRBs from the tail up to
 * @last_index, converting each to CPU order and unmapping its DMA
 * address.  Finally the number of WRBs processed is subtracted from
 * txq->used.
 */
958 static void be_tx_compl_process(struct be_adapter *adapter, u16 last_index)
960 struct be_queue_info *txq = &adapter->tx_obj.q;
961 struct be_eth_wrb *wrb;
962 struct sk_buff **sent_skbs = adapter->tx_obj.sent_skb_list;
963 struct sk_buff *sent_skb;
965 u16 cur_index, num_wrbs = 0;
967 cur_index = txq->tail;
968 sent_skb = sent_skbs[cur_index];
970 sent_skbs[cur_index] = NULL;
973 cur_index = txq->tail;
974 wrb = queue_tail_node(txq);
975 be_dws_le_to_cpu(wrb, sizeof(*wrb));
976 busaddr = ((u64)wrb->frag_pa_hi << 32) | (u64)wrb->frag_pa_lo;
978 pci_unmap_single(adapter->pdev, busaddr,
979 wrb->frag_len, PCI_DMA_TODEVICE);
983 } while (cur_index != last_index);
985 atomic_sub(num_wrbs, &txq->used);
/*
 * be_rx_q_clean - drop everything still held by the RX path.
 *
 * First drains pending RX completions, discarding their buffers and
 * acknowledging each one on the CQ.  It then releases the posted but
 * unused buffers, i.e. the rxq->used entries that precede the queue
 * head.  The used count must be zero afterwards (BUG_ON).
 */
990 static void be_rx_q_clean(struct be_adapter *adapter)
992 struct be_rx_page_info *page_info;
993 struct be_queue_info *rxq = &adapter->rx_obj.q;
994 struct be_queue_info *rx_cq = &adapter->rx_obj.cq;
995 struct be_eth_rx_compl *rxcp;
998 /* First cleanup pending rx completions */
999 while ((rxcp = be_rx_compl_get(adapter)) != NULL) {
1000 be_rx_compl_discard(adapter, rxcp);
1001 be_rx_compl_reset(rxcp);
1002 be_cq_notify(&adapter->ctrl, rx_cq->id, true, 1);
1005 /* Then free posted rx buffer that were not used */
1006 tail = (rxq->head + rxq->len - atomic_read(&rxq->used)) % rxq->len;
1007 for (; tail != rxq->head; index_inc(&tail, rxq->len)) {
1008 page_info = get_rx_page_info(adapter, tail);
1009 put_page(page_info->page);
1010 memset(page_info, 0, sizeof(*page_info));
1012 BUG_ON(atomic_read(&rxq->used));
/*
 * be_tx_q_clean - reclaim transmit requests that never completed.
 *
 * While WRBs are still accounted as used, takes the skb recorded at the
 * queue tail and recomputes how many WRBs it occupied, which gives the
 * index of its last WRB.  be_tx_compl_process() then reclaims the
 * request.
 */
1015 static void be_tx_q_clean(struct be_adapter *adapter)
1017 struct sk_buff **sent_skbs = adapter->tx_obj.sent_skb_list;
1018 struct sk_buff *sent_skb;
1019 struct be_queue_info *txq = &adapter->tx_obj.q;
1023 while (atomic_read(&txq->used)) {
1024 sent_skb = sent_skbs[txq->tail];
1025 last_index = txq->tail;
1026 index_adv(&last_index,
1027 wrb_cnt_for_skb(sent_skb, &dummy_wrb) - 1, txq->len);
1028 be_tx_compl_process(adapter, last_index);
/*
 * be_mcc_queues_destroy - tear down the MCC queue and then its completion
 * queue.  Each is destroyed on the adapter and its host memory freed.
 * NOTE(review): any guards around the destroy commands are not visible in
 * this excerpt.
 */
1032 static void be_mcc_queues_destroy(struct be_adapter *adapter)
1034 struct be_queue_info *q;
1035 struct be_ctrl_info *ctrl = &adapter->ctrl;
1037 q = &ctrl->mcc_obj.q;
1039 be_cmd_q_destroy(ctrl, q, QTYPE_MCCQ);
1040 be_queue_free(adapter, q);
1042 q = &ctrl->mcc_obj.cq;
1044 be_cmd_q_destroy(ctrl, q, QTYPE_CQ);
1045 be_queue_free(adapter, q);
1048 /* Must be called only after TX qs are created as MCC shares TX EQ */
/*
 * Creates the MCC completion queue, bound to the TX event queue, and then
 * the MCC queue itself.  Each is first allocated on the host and then
 * created on the adapter.  The trailing free/destroy calls unwind, in
 * reverse order, whatever had been set up when a step fails.
 */
1049 static int be_mcc_queues_create(struct be_adapter *adapter)
1051 struct be_queue_info *q, *cq;
1052 struct be_ctrl_info *ctrl = &adapter->ctrl;
1054 /* Alloc MCC compl queue */
1055 cq = &ctrl->mcc_obj.cq;
1056 if (be_queue_alloc(adapter, cq, MCC_CQ_LEN,
1057 sizeof(struct be_mcc_cq_entry)))
1060 /* Ask BE to create MCC compl queue; share TX's eq */
1061 if (be_cmd_cq_create(ctrl, cq, &adapter->tx_eq.q, false, true, 0))
1064 /* Alloc MCC queue */
1065 q = &ctrl->mcc_obj.q;
1066 if (be_queue_alloc(adapter, q, MCC_Q_LEN, sizeof(struct be_mcc_wrb)))
1067 goto mcc_cq_destroy;
1069 /* Ask BE to create MCC queue */
1070 if (be_cmd_mccq_create(ctrl, q, cq))
1076 be_queue_free(adapter, q);
1078 be_cmd_q_destroy(ctrl, cq, QTYPE_CQ);
1080 be_queue_free(adapter, cq);
/*
 * be_tx_queues_destroy - tear down the TX queue, its completion queue and
 * its event queue, in that order.  After the TX queue is destroyed on the
 * adapter, outstanding requests are reclaimed with be_tx_q_clean() before
 * the ring memory is freed.
 */
1085 static void be_tx_queues_destroy(struct be_adapter *adapter)
1087 struct be_queue_info *q;
1089 q = &adapter->tx_obj.q;
1091 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_TXQ);
1093 /* No more tx completions can be rcvd now; clean up if there
1094 * are any pending completions or pending tx requests */
1095 be_tx_q_clean(adapter);
1097 be_queue_free(adapter, q);
1099 q = &adapter->tx_obj.cq;
1101 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_CQ);
1102 be_queue_free(adapter, q);
1104 q = &adapter->tx_eq.q;
1106 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_EQ);
1107 be_queue_free(adapter, q);
/*
 * be_tx_queues_create - set up the TX event queue, completion queue and
 * TX queue, in that order.
 *
 * The TX EQ uses a fixed delay (cur_eqd = 96) with adaptive coalescing
 * disabled.  Each queue is allocated on the host and then created on the
 * adapter.  The trailing free/destroy calls unwind, in reverse order,
 * whatever had been set up when a step fails.
 */
1110 static int be_tx_queues_create(struct be_adapter *adapter)
1112 struct be_queue_info *eq, *q, *cq;
1114 adapter->tx_eq.max_eqd = 0;
1115 adapter->tx_eq.min_eqd = 0;
1116 adapter->tx_eq.cur_eqd = 96;
1117 adapter->tx_eq.enable_aic = false;
1118 /* Alloc Tx Event queue */
1119 eq = &adapter->tx_eq.q;
1120 if (be_queue_alloc(adapter, eq, EVNT_Q_LEN, sizeof(struct be_eq_entry)))
1123 /* Ask BE to create Tx Event queue */
1124 if (be_cmd_eq_create(&adapter->ctrl, eq, adapter->tx_eq.cur_eqd))
1126 /* Alloc TX eth compl queue */
1127 cq = &adapter->tx_obj.cq;
1128 if (be_queue_alloc(adapter, cq, TX_CQ_LEN,
1129 sizeof(struct be_eth_tx_compl)))
1132 /* Ask BE to create Tx eth compl queue */
1133 if (be_cmd_cq_create(&adapter->ctrl, cq, eq, false, false, 3))
1136 /* Alloc TX eth queue */
1137 q = &adapter->tx_obj.q;
1138 if (be_queue_alloc(adapter, q, TX_Q_LEN, sizeof(struct be_eth_wrb)))
1141 /* Ask BE to create Tx eth queue */
1142 if (be_cmd_txq_create(&adapter->ctrl, q, cq))
1147 be_queue_free(adapter, q);
1149 be_cmd_q_destroy(&adapter->ctrl, cq, QTYPE_CQ);
1151 be_queue_free(adapter, cq);
1153 be_cmd_q_destroy(&adapter->ctrl, eq, QTYPE_EQ);
1155 be_queue_free(adapter, eq);
/*
 * be_rx_queues_destroy - tear down the RX queue, its completion queue and
 * its event queue, in that order.  After the RX queue is destroyed on the
 * adapter, be_rx_q_clean() releases pending completions and posted
 * buffers before the ring memory is freed.
 */
1159 static void be_rx_queues_destroy(struct be_adapter *adapter)
1161 struct be_queue_info *q;
1163 q = &adapter->rx_obj.q;
1165 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_RXQ);
1166 be_rx_q_clean(adapter);
1168 be_queue_free(adapter, q);
1170 q = &adapter->rx_obj.cq;
1172 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_CQ);
1173 be_queue_free(adapter, q);
1175 q = &adapter->rx_eq.q;
1177 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_EQ);
1178 be_queue_free(adapter, q);
/*
 * be_rx_queues_create - set up the RX event queue, completion queue and
 * RX queue, in that order.
 *
 * Also derives adapter->big_page_size from rx_frag_size: the smallest
 * power-of-two number of pages that holds one fragment.  Adaptive
 * interrupt coalescing is enabled on the RX EQ with a delay range of
 * [0, BE_MAX_EQD].  Each queue is allocated on the host and then created
 * on the adapter.  The trailing free/destroy calls unwind, in reverse
 * order, whatever had been set up when a step fails.
 */
1181 static int be_rx_queues_create(struct be_adapter *adapter)
1183 struct be_queue_info *eq, *q, *cq;
1186 adapter->max_rx_coal = BE_MAX_FRAGS_PER_FRAME;
1187 adapter->big_page_size = (1 << get_order(rx_frag_size)) * PAGE_SIZE;
1188 adapter->rx_eq.max_eqd = BE_MAX_EQD;
1189 adapter->rx_eq.min_eqd = 0;
1190 adapter->rx_eq.cur_eqd = 0;
1191 adapter->rx_eq.enable_aic = true;
1193 /* Alloc Rx Event queue */
1194 eq = &adapter->rx_eq.q;
1195 rc = be_queue_alloc(adapter, eq, EVNT_Q_LEN,
1196 sizeof(struct be_eq_entry));
1200 /* Ask BE to create Rx Event queue */
1201 rc = be_cmd_eq_create(&adapter->ctrl, eq, adapter->rx_eq.cur_eqd);
1205 /* Alloc RX eth compl queue */
1206 cq = &adapter->rx_obj.cq;
1207 rc = be_queue_alloc(adapter, cq, RX_CQ_LEN,
1208 sizeof(struct be_eth_rx_compl));
1212 /* Ask BE to create Rx eth compl queue */
1213 rc = be_cmd_cq_create(&adapter->ctrl, cq, eq, false, false, 3);
1217 /* Alloc RX eth queue */
1218 q = &adapter->rx_obj.q;
1219 rc = be_queue_alloc(adapter, q, RX_Q_LEN, sizeof(struct be_eth_rx_d));
1223 /* Ask BE to create Rx eth queue */
1224 rc = be_cmd_rxq_create(&adapter->ctrl, q, cq->id, rx_frag_size,
1225 BE_MAX_JUMBO_FRAME_SIZE, adapter->if_handle, false);
1231 be_queue_free(adapter, q);
1233 be_cmd_q_destroy(&adapter->ctrl, cq, QTYPE_CQ);
1235 be_queue_free(adapter, cq);
1237 be_cmd_q_destroy(&adapter->ctrl, eq, QTYPE_EQ);
1239 be_queue_free(adapter, eq);
/*
 * Fetch one entry from the tail of the event queue of @eq_obj.
 * The evt word is converted from little-endian, the resource id is
 * extracted into *@rid using EQ_ENTRY_RES_ID_SHIFT / EQ_ENTRY_RES_ID_MASK,
 * and the queue tail is advanced.
 * NOTE(review): the "no event pending" test and the bool return values are
 * not visible here - presumably false is returned for an empty entry.
 */
1242 static bool event_get(struct be_eq_obj *eq_obj, u16 *rid)
1244 struct be_eq_entry *entry = queue_tail_node(&eq_obj->q);
1245 u32 evt = entry->evt;
1250 evt = le32_to_cpu(evt);
1251 *rid = (evt >> EQ_ENTRY_RES_ID_SHIFT) & EQ_ENTRY_RES_ID_MASK;
1253 queue_tail_inc(&eq_obj->q);
/*
 * Drain the event queue of @eq_obj by calling event_get() until it returns
 * false, report the result to the adapter with be_eq_notify() (passing
 * num) and schedule the NAPI context embedded in @eq_obj.
 * NOTE(review): the loop body that updates num and the return statement
 * are not visible here - presumably num counts the events consumed.
 */
1257 static int event_handle(struct be_ctrl_info *ctrl,
1258 struct be_eq_obj *eq_obj)
1260 u16 rid = 0, num = 0;
1262 while (event_get(eq_obj, &rid))
1265 /* We can see an interrupt and no event */
1266 be_eq_notify(ctrl, eq_obj->q.id, true, true, num);
1268 napi_schedule(&eq_obj->napi);
/*
 * INTx interrupt handler (registered with IRQF_SHARED by be_irq_register()).
 * @dev is the struct be_adapter passed to request_irq(). Runs
 * event_handle() on both the TX and the RX event queue and keeps the two
 * results in tx and rx.
 * NOTE(review): the irqreturn_t derived from tx/rx is not visible here.
 */
1273 static irqreturn_t be_intx(int irq, void *dev)
1275 struct be_adapter *adapter = dev;
1276 struct be_ctrl_info *ctrl = &adapter->ctrl;
1279 tx = event_handle(ctrl, &adapter->tx_eq);
1280 rx = event_handle(ctrl, &adapter->rx_eq);
/*
 * MSI-X handler for the RX vector: @dev is the struct be_adapter; the RX
 * event queue is processed with event_handle().
 */
1288 static irqreturn_t be_msix_rx(int irq, void *dev)
1290 struct be_adapter *adapter = dev;
1292 event_handle(&adapter->ctrl, &adapter->rx_eq);
/*
 * MSI-X handler for the TX/MCC vector: @dev is the struct be_adapter; the
 * TX event queue is processed with event_handle().
 */
1297 static irqreturn_t be_msix_tx_mcc(int irq, void *dev)
1299 struct be_adapter *adapter = dev;
1301 event_handle(&adapter->ctrl, &adapter->tx_eq);
/*
 * Decide whether the RX completion @rxcp should go through the LRO path.
 * Reads the err and tcpf bits of the completion and bumps the
 * be_rxcp_err driver statistic. The decision depends on three conditions:
 * the frame is not TCP, the completion carries an error, or
 * adapter->max_rx_coal is <= 1.
 * NOTE(review): the two arms of the conditional expression are not visible
 * here - presumably any of those conditions yields false (no LRO). The
 * guard on the statistic increment is likewise not visible.
 */
1306 static inline bool do_lro(struct be_adapter *adapter,
1307 struct be_eth_rx_compl *rxcp)
1309 int err = AMAP_GET_BITS(struct amap_eth_rx_compl, err, rxcp);
1310 int tcp_frame = AMAP_GET_BITS(struct amap_eth_rx_compl, tcpf, rxcp);
1313 drvr_stats(adapter)->be_rxcp_err++;
1315 return (!tcp_frame || err || (adapter->max_rx_coal <= 1)) ?
/*
 * NAPI poll handler for the RX event queue.
 *
 * @napi is the napi_struct embedded in adapter->rx_eq; the adapter is
 * recovered from it with container_of(). Up to @budget RX completions are
 * fetched with be_rx_compl_get(); each one is handed to
 * be_rx_compl_process_lro() or be_rx_compl_process() depending on do_lro()
 * and then reset. Afterwards pending LRO sessions are flushed and the RX
 * queue is refilled when fewer than RX_FRAGS_REFILL_WM entries are in use.
 *
 * If less than @budget was consumed, polling is completed and the CQ is
 * notified with its third argument true; otherwise the CQ is notified with
 * false and polling continues.
 * NOTE(review): the loop exit on "no completion" and the return value are
 * not visible here - presumably work_done is returned.
 */
1319 int be_poll_rx(struct napi_struct *napi, int budget)
1321 struct be_eq_obj *rx_eq = container_of(napi, struct be_eq_obj, napi);
1322 struct be_adapter *adapter =
1323 container_of(rx_eq, struct be_adapter, rx_eq);
1324 struct be_queue_info *rx_cq = &adapter->rx_obj.cq;
1325 struct be_eth_rx_compl *rxcp;
1328 for (work_done = 0; work_done < budget; work_done++) {
1329 rxcp = be_rx_compl_get(adapter);
1333 if (do_lro(adapter, rxcp))
1334 be_rx_compl_process_lro(adapter, rxcp);
1336 be_rx_compl_process(adapter, rxcp);
1338 be_rx_compl_reset(rxcp);
1341 lro_flush_all(&adapter->rx_obj.lro_mgr);
1343 /* Refill the queue */
1344 if (atomic_read(&adapter->rx_obj.q.used) < RX_FRAGS_REFILL_WM)
1345 be_post_rx_frags(adapter);
1348 if (work_done < budget) {
1349 napi_complete(napi);
1350 be_cq_notify(&adapter->ctrl, rx_cq->id, true, work_done);
1352 /* More to be consumed; continue with interrupts disabled */
1353 be_cq_notify(&adapter->ctrl, rx_cq->id, false, work_done);
/*
 * Process all pending TX completions of the adapter.
 *
 * Completions are pulled from the TX completion queue with
 * be_tx_compl_get(); for each one an end index is read from the completion
 * with AMAP_GET_BITS() and passed to be_tx_compl_process(). The CQ is then
 * notified with num_cmpl, the netdev queue is woken when it is stopped and
 * less than half of the TX queue is in use, and the be_tx_events and
 * be_tx_compl driver statistics are updated.
 * NOTE(review): how num_cmpl is accumulated and whether the notify/stats
 * step is conditional on it are not visible here - confirm.
 */
1358 void be_process_tx(struct be_adapter *adapter)
1360 struct be_queue_info *txq = &adapter->tx_obj.q;
1361 struct be_queue_info *tx_cq = &adapter->tx_obj.cq;
1362 struct be_eth_tx_compl *txcp;
1366 while ((txcp = be_tx_compl_get(tx_cq))) {
1367 end_idx = AMAP_GET_BITS(struct amap_eth_tx_compl,
1369 be_tx_compl_process(adapter, end_idx);
1374 be_cq_notify(&adapter->ctrl, tx_cq->id, true, num_cmpl);
1376 /* As Tx wrbs have been freed up, wake up netdev queue if
1377 * it was stopped due to lack of tx wrbs.
1379 if (netif_queue_stopped(adapter->netdev) &&
1380 atomic_read(&txq->used) < txq->len / 2) {
1381 netif_wake_queue(adapter->netdev);
1384 drvr_stats(adapter)->be_tx_events++;
1385 drvr_stats(adapter)->be_tx_compl += num_cmpl;
1389 /* As TX and MCC share the same EQ check for both TX and MCC completions.
1390 * For TX/MCC we don't honour budget; consume everything
/*
 * NAPI poll handler for the event queue shared by TX and MCC.
 * @napi is the napi_struct embedded in adapter->tx_eq. Polling is marked
 * complete first, then TX completions are handled by be_process_tx() and
 * MCC completions by be_process_mcc(). @budget is not consulted by the
 * visible code.
 * NOTE(review): the return value is not visible here.
 */
1392 static int be_poll_tx_mcc(struct napi_struct *napi, int budget)
1394 struct be_eq_obj *tx_eq = container_of(napi, struct be_eq_obj, napi);
1395 struct be_adapter *adapter =
1396 container_of(tx_eq, struct be_adapter, tx_eq);
1398 napi_complete(napi);
1400 be_process_tx(adapter);
1402 be_process_mcc(&adapter->ctrl);
/*
 * Periodic housekeeping, run from the delayed work item adapter->work.
 *
 * Refreshes the link status, requests statistics from the adapter with
 * be_cmd_get_stats() and folds them into the netdev stats, updates the RX
 * event-queue delay and the TX/RX rate figures, and re-posts RX fragments
 * if an earlier posting attempt left rx_post_starved set. Finally re-arms
 * itself to run again after 1000 ms.
 * NOTE(review): the check on status before netdev_stats_update() is not
 * visible here - confirm.
 */
1407 static void be_worker(struct work_struct *work)
1409 struct be_adapter *adapter =
1410 container_of(work, struct be_adapter, work.work);
1414 be_link_status_update(adapter);
1417 status = be_cmd_get_stats(&adapter->ctrl, &adapter->stats.cmd);
1419 netdev_stats_update(adapter);
1422 be_rx_eqd_update(adapter);
1424 be_tx_rate_update(adapter);
1425 be_rx_rate_update(adapter);
1427 if (adapter->rx_post_starved) {
1428 adapter->rx_post_starved = false;
1429 be_post_rx_frags(adapter);
1432 schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
/*
 * Try to switch the device to MSI-X. The BE_NUM_MSIX_VECTORS entries of
 * adapter->msix_entries are numbered 0..BE_NUM_MSIX_VECTORS-1 and handed
 * to pci_enable_msix(); adapter->msix_enabled records the outcome.
 * NOTE(review): the test on status is not visible here - presumably
 * msix_enabled is only set when pci_enable_msix() returned 0.
 */
1435 static void be_msix_enable(struct be_adapter *adapter)
1439 for (i = 0; i < BE_NUM_MSIX_VECTORS; i++)
1440 adapter->msix_entries[i].entry = i;
1442 status = pci_enable_msix(adapter->pdev, adapter->msix_entries,
1443 BE_NUM_MSIX_VECTORS);
1445 adapter->msix_enabled = true;
/*
 * Return the MSI-X vector for event queue @eq_id. The index into
 * adapter->msix_entries is eq_id - 8 * pci_func.
 * NOTE(review): presumably each PCI function owns a block of 8 EQ ids -
 * confirm; the index is not range-checked here.
 */
1449 static inline int be_msix_vec_get(struct be_adapter *adapter, u32 eq_id)
1451 return adapter->msix_entries[eq_id -
1452 8 * adapter->ctrl.pci_func].vector;
/*
 * Register the two MSI-X interrupt handlers of the adapter.
 *
 * The TX/MCC vector is requested first with handler be_msix_tx_mcc and the
 * name "<netdev>-tx", then the RX vector with handler be_msix_rx and the
 * name "<netdev>-rx". If the RX request fails, the already registered TX
 * IRQ is freed again. The failure handling warns, disables MSI-X on the
 * PCI device and clears adapter->msix_enabled.
 * NOTE(review): the jump into the failure handling and the return
 * statements are not visible here - confirm.
 */
1455 static int be_msix_register(struct be_adapter *adapter)
1457 struct net_device *netdev = adapter->netdev;
1458 struct be_eq_obj *tx_eq = &adapter->tx_eq;
1459 struct be_eq_obj *rx_eq = &adapter->rx_eq;
1462 sprintf(tx_eq->desc, "%s-tx", netdev->name);
1463 vec = be_msix_vec_get(adapter, tx_eq->q.id);
1464 status = request_irq(vec, be_msix_tx_mcc, 0, tx_eq->desc, adapter);
1468 sprintf(rx_eq->desc, "%s-rx", netdev->name);
1469 vec = be_msix_vec_get(adapter, rx_eq->q.id);
1470 status = request_irq(vec, be_msix_rx, 0, rx_eq->desc, adapter);
1471 if (status) { /* Free TX IRQ */
1472 vec = be_msix_vec_get(adapter, tx_eq->q.id);
1473 free_irq(vec, adapter);
1478 dev_warn(&adapter->pdev->dev,
1479 "MSIX Request IRQ failed - err %d\n", status);
1480 pci_disable_msix(adapter->pdev);
1481 adapter->msix_enabled = false;
/*
 * Register the adapter's interrupt handler(s).
 *
 * With MSI-X enabled, be_msix_register() is tried. The INTx path takes the
 * IRQ number from the PCI device, stores it in netdev->irq and requests it
 * as a shared IRQ with handler be_intx; a failure is logged with
 * dev_err(). adapter->isr_registered is set once registration is done.
 * NOTE(review): the status checks between the two paths are not visible
 * here - presumably INTx is the fallback when MSI-X registration fails.
 */
1485 static int be_irq_register(struct be_adapter *adapter)
1487 struct net_device *netdev = adapter->netdev;
1490 if (adapter->msix_enabled) {
1491 status = be_msix_register(adapter);
1497 netdev->irq = adapter->pdev->irq;
1498 status = request_irq(netdev->irq, be_intx, IRQF_SHARED, netdev->name,
1501 dev_err(&adapter->pdev->dev,
1502 "INTx request IRQ failed - err %d\n", status);
1506 adapter->isr_registered = true;
/*
 * Release the interrupt handler(s) registered by be_irq_register().
 * Checks adapter->isr_registered first. Without MSI-X the single INTx IRQ
 * (netdev->irq) is freed; otherwise the TX and RX MSI-X vectors are freed.
 * adapter->isr_registered is cleared at the end.
 * NOTE(review): the early exits are not visible here - confirm.
 */
1510 static void be_irq_unregister(struct be_adapter *adapter)
1512 struct net_device *netdev = adapter->netdev;
1515 if (!adapter->isr_registered)
1519 if (!adapter->msix_enabled) {
1520 free_irq(netdev->irq, adapter);
1525 vec = be_msix_vec_get(adapter, adapter->tx_eq.q.id);
1526 free_irq(vec, adapter);
1527 vec = be_msix_vec_get(adapter, adapter->rx_eq.q.id);
1528 free_irq(vec, adapter);
1530 adapter->isr_registered = false;
/*
 * ndo_open handler: bring the interface up.
 *
 * Posts the initial RX fragments, enables both NAPI contexts, registers
 * the interrupt handlers and enables host interrupts, arms the RX and TX
 * event queues and the RX completion queue, refreshes the link status and
 * starts the periodic worker 100 ms later.
 */
1534 static int be_open(struct net_device *netdev)
1536 struct be_adapter *adapter = netdev_priv(netdev);
1537 struct be_ctrl_info *ctrl = &adapter->ctrl;
1538 struct be_eq_obj *rx_eq = &adapter->rx_eq;
1539 struct be_eq_obj *tx_eq = &adapter->tx_eq;
1541 /* First time posting */
1542 be_post_rx_frags(adapter);
1544 napi_enable(&rx_eq->napi);
1545 napi_enable(&tx_eq->napi);
/*
 * NOTE(review): be_irq_register() returns an int status that is discarded
 * here; a failed IRQ registration would go unnoticed - confirm intent.
 */
1547 be_irq_register(adapter);
1549 be_intr_set(ctrl, true);
1551 /* The evt queues are created in unarmed state; arm them */
1552 be_eq_notify(ctrl, rx_eq->q.id, true, false, 0);
1553 be_eq_notify(ctrl, tx_eq->q.id, true, false, 0);
1555 /* Rx compl queue may be in unarmed state; rearm it */
1556 be_cq_notify(ctrl, adapter->rx_obj.cq.id, true, 0);
1558 be_link_status_update(adapter);
1560 schedule_delayed_work(&adapter->work, msecs_to_jiffies(100));
/*
 * Create the adapter-side objects needed before the netdev is registered.
 *
 * Creates the network interface with the flags collected in if_flags and
 * the netdev's MAC address (the handle is stored in adapter->if_handle),
 * applies the VLAN configuration, turns flow control on (both arguments
 * true), and creates the TX, RX and MCC queues in that order.
 * NOTE(review): the status checks, jump labels and return statements are
 * not visible here - confirm the unwind order against them.
 */
1564 static int be_setup(struct be_adapter *adapter)
1566 struct be_ctrl_info *ctrl = &adapter->ctrl;
1567 struct net_device *netdev = adapter->netdev;
1571 if_flags = BE_IF_FLAGS_BROADCAST | BE_IF_FLAGS_PROMISCUOUS |
1572 BE_IF_FLAGS_MCAST_PROMISCUOUS | BE_IF_FLAGS_UNTAGGED |
1573 BE_IF_FLAGS_PASS_L3L4_ERRORS;
1574 status = be_cmd_if_create(ctrl, if_flags, netdev->dev_addr,
1575 false/* pmac_invalid */, &adapter->if_handle,
1580 be_vid_config(netdev);
1582 status = be_cmd_set_flow_control(ctrl, true, true);
1586 status = be_tx_queues_create(adapter);
1590 status = be_rx_queues_create(adapter);
1594 status = be_mcc_queues_create(adapter);
/*
 * The calls below undo the steps above in reverse order (RX queues, TX
 * queues, interface) - presumably the error-unwind path.
 */
1601 be_rx_queues_destroy(adapter);
1603 be_tx_queues_destroy(adapter);
1605 be_cmd_if_destroy(ctrl, adapter->if_handle);
/*
 * Undo be_setup(): destroy the RX and TX queues, destroy the interface
 * identified by adapter->if_handle, then destroy the MCC queues.
 * NOTE(review): the return value is not visible here.
 */
1610 static int be_clear(struct be_adapter *adapter)
1612 struct be_ctrl_info *ctrl = &adapter->ctrl;
1614 be_rx_queues_destroy(adapter);
1615 be_tx_queues_destroy(adapter);
1617 be_cmd_if_destroy(ctrl, adapter->if_handle);
1619 be_mcc_queues_destroy(adapter);
/*
 * ndo_stop handler: bring the interface down.
 *
 * Cancels the periodic worker and waits for it, stops the TX queue, drops
 * the carrier and records a zero link speed, disables host interrupts,
 * waits for in-flight interrupt handlers (both MSI-X vectors, or the INTx
 * IRQ), releases the IRQs and finally disables both NAPI contexts.
 * NOTE(review): the else branch separating the MSI-X and INTx
 * synchronize_irq() calls and the return value are not visible here.
 */
1623 static int be_close(struct net_device *netdev)
1625 struct be_adapter *adapter = netdev_priv(netdev);
1626 struct be_ctrl_info *ctrl = &adapter->ctrl;
1627 struct be_eq_obj *rx_eq = &adapter->rx_eq;
1628 struct be_eq_obj *tx_eq = &adapter->tx_eq;
1631 cancel_delayed_work_sync(&adapter->work);
1633 netif_stop_queue(netdev);
1634 netif_carrier_off(netdev);
1635 adapter->link.speed = PHY_LINK_SPEED_ZERO;
1637 be_intr_set(ctrl, false);
1639 if (adapter->msix_enabled) {
1640 vec = be_msix_vec_get(adapter, tx_eq->q.id);
1641 synchronize_irq(vec);
1642 vec = be_msix_vec_get(adapter, rx_eq->q.id);
1643 synchronize_irq(vec);
1645 synchronize_irq(netdev->irq);
1647 be_irq_unregister(adapter);
1649 napi_disable(&rx_eq->napi);
1650 napi_disable(&tx_eq->napi);
/*
 * LRO get_frag_header callback (installed by be_lro_init()).
 *
 * Parses the headers at the start of the page fragment @frag: an Ethernet
 * header, optionally followed by an 802.1Q tag (ll_hlen grows by
 * VLAN_HLEN), then an IPv4 header and a TCP header. On the way
 * *@hdr_flags is set to LRO_IPV4 and, for TCP, LRO_TCP is added;
 * *@tcpudp_hdr is computed as *@ip_hdr plus the IP header length
 * (ihl * 4 bytes).
 * NOTE(review): the assignments to *mac_hdr and *ip_hdr, the initial
 * value of ll_hlen and the return statements for non-IPv4 / non-TCP
 * frames are not visible here - confirm.
 */
1655 static int be_get_frag_header(struct skb_frag_struct *frag, void **mac_hdr,
1656 void **ip_hdr, void **tcpudp_hdr,
1657 u64 *hdr_flags, void *priv)
1660 struct vlan_ethhdr *veh;
1662 u8 *va = page_address(frag->page) + frag->page_offset;
1663 unsigned long ll_hlen;
1666 eh = (struct ethhdr *)va;
1669 if (eh->h_proto != htons(ETH_P_IP)) {
1670 if (eh->h_proto == htons(ETH_P_8021Q)) {
1671 veh = (struct vlan_ethhdr *)va;
1672 if (veh->h_vlan_encapsulated_proto != htons(ETH_P_IP))
1675 ll_hlen += VLAN_HLEN;
1680 *hdr_flags = LRO_IPV4;
1681 iph = (struct iphdr *)(va + ll_hlen);
1683 if (iph->protocol != IPPROTO_TCP)
1685 *hdr_flags |= LRO_TCP;
1686 *tcpudp_hdr = (u8 *) (*ip_hdr) + (iph->ihl << 2);
/*
 * Initialise the LRO manager embedded in adapter->rx_obj for @netdev:
 * NAPI mode, CHECKSUM_UNNECESSARY for both plain and aggregated packets,
 * BE_MAX_LRO_DESCRIPTORS descriptors backed by adapter->rx_obj.lro_desc,
 * be_get_frag_header() as the header parser and an aggregation limit of
 * BE_MAX_FRAGS_PER_FRAME.
 */
1691 static void be_lro_init(struct be_adapter *adapter, struct net_device *netdev)
1693 struct net_lro_mgr *lro_mgr;
1695 lro_mgr = &adapter->rx_obj.lro_mgr;
1696 lro_mgr->dev = netdev;
1697 lro_mgr->features = LRO_F_NAPI;
1698 lro_mgr->ip_summed = CHECKSUM_UNNECESSARY;
1699 lro_mgr->ip_summed_aggr = CHECKSUM_UNNECESSARY;
1700 lro_mgr->max_desc = BE_MAX_LRO_DESCRIPTORS;
1701 lro_mgr->lro_arr = adapter->rx_obj.lro_desc;
1702 lro_mgr->get_frag_header = be_get_frag_header;
1703 lro_mgr->max_aggr = BE_MAX_FRAGS_PER_FRAME;
/*
 * net_device callbacks of the driver; installed on the netdev by
 * be_netdev_init() through BE_SET_NETDEV_OPS().
 */
1706 static struct net_device_ops be_netdev_ops = {
1707 .ndo_open = be_open,
1708 .ndo_stop = be_close,
1709 .ndo_start_xmit = be_xmit,
1710 .ndo_get_stats = be_get_stats,
1711 .ndo_set_rx_mode = be_set_multicast_list,
1712 .ndo_set_mac_address = be_mac_addr_set,
1713 .ndo_change_mtu = be_change_mtu,
1714 .ndo_validate_addr = eth_validate_addr,
1715 .ndo_vlan_rx_register = be_vlan_register,
1716 .ndo_vlan_rx_add_vid = be_vlan_add_vid,
1717 .ndo_vlan_rx_kill_vid = be_vlan_rem_vid,
/*
 * One-time software initialisation of @netdev.
 *
 * Advertises the offload features (scatter-gather, VLAN RX/TX/filter, TSO,
 * IP checksum, ...), marks the device multicast-capable, enables RX
 * checksum offload in the adapter, installs the netdev and ethtool
 * operations, initialises LRO and adds the RX and TX/MCC NAPI contexts.
 * The device starts with carrier off and the TX queue stopped.
 * NOTE(review): the remaining feature flags and the NAPI weights are not
 * visible here.
 */
1720 static void be_netdev_init(struct net_device *netdev)
1722 struct be_adapter *adapter = netdev_priv(netdev);
1724 netdev->features |= NETIF_F_SG | NETIF_F_HW_VLAN_RX | NETIF_F_TSO |
1725 NETIF_F_HW_VLAN_TX | NETIF_F_HW_VLAN_FILTER | NETIF_F_IP_CSUM |
1728 netdev->flags |= IFF_MULTICAST;
1730 adapter->rx_csum = true;
1732 BE_SET_NETDEV_OPS(netdev, &be_netdev_ops);
1734 SET_ETHTOOL_OPS(netdev, &be_ethtool_ops);
1736 be_lro_init(adapter, netdev);
1738 netif_napi_add(netdev, &adapter->rx_eq.napi, be_poll_rx,
1740 netif_napi_add(netdev, &adapter->tx_eq.napi, be_poll_tx_mcc,
1743 netif_carrier_off(netdev);
1744 netif_stop_queue(netdev);
/*
 * Release the register mappings held in adapter->ctrl.
 * NOTE(review): only the pcicfg unmap is visible here - confirm that the
 * csr and db mappings set up by be_map_pci_bars() are released as well.
 */
1747 static void be_unmap_pci_bars(struct be_adapter *adapter)
1749 struct be_ctrl_info *ctrl = &adapter->ctrl;
1755 iounmap(ctrl->pcicfg);
/*
 * Map the PCI BARs used by the driver, uncached, and store the resulting
 * addresses in adapter->ctrl: BAR 2 -> csr, BAR 4 -> db, BAR 1 -> pcicfg.
 * NOTE(review): the NULL checks on addr and the return statements are not
 * visible here - presumably a failed ioremap leads to the
 * be_unmap_pci_bars() call at the end.
 */
1758 static int be_map_pci_bars(struct be_adapter *adapter)
1762 addr = ioremap_nocache(pci_resource_start(adapter->pdev, 2),
1763 pci_resource_len(adapter->pdev, 2));
1766 adapter->ctrl.csr = addr;
1768 addr = ioremap_nocache(pci_resource_start(adapter->pdev, 4),
1772 adapter->ctrl.db = addr;
1774 addr = ioremap_nocache(pci_resource_start(adapter->pdev, 1),
1775 pci_resource_len(adapter->pdev, 1));
1778 adapter->ctrl.pcicfg = addr;
1782 be_unmap_pci_bars(adapter);
/*
 * Undo be_ctrl_init(): unmap the PCI BARs and free the DMA memory that
 * backs the mailbox (the unaligned allocation, mbox_mem_alloced).
 * NOTE(review): any guard around the free is not visible here.
 */
1787 static void be_ctrl_cleanup(struct be_adapter *adapter)
1789 struct be_dma_mem *mem = &adapter->ctrl.mbox_mem_alloced;
1791 be_unmap_pci_bars(adapter);
1794 pci_free_consistent(adapter->pdev, mem->size,
1798 /* Initialize the mbox required to send cmds to BE */
/*
 * Maps the PCI BARs, then allocates DMA memory for the mailbox with 16
 * extra bytes so that both the virtual and the bus address can be rounded
 * up to a 16-byte boundary: mbox_mem_alloced keeps the raw allocation,
 * mbox_mem the aligned view that is zeroed and used. If the allocation
 * fails the BARs are unmapped again. Also initialises the mbox, mcc and
 * mcc_cq spinlocks and reads the PCI function number from the INT_CTRL
 * register in pcicfg space.
 * NOTE(review): the status check after be_map_pci_bars() and the return
 * statements are not visible here.
 */
1799 static int be_ctrl_init(struct be_adapter *adapter)
1801 struct be_ctrl_info *ctrl = &adapter->ctrl;
1802 struct be_dma_mem *mbox_mem_alloc = &ctrl->mbox_mem_alloced;
1803 struct be_dma_mem *mbox_mem_align = &ctrl->mbox_mem;
1807 status = be_map_pci_bars(adapter);
1811 mbox_mem_alloc->size = sizeof(struct be_mcc_mailbox) + 16;
1812 mbox_mem_alloc->va = pci_alloc_consistent(adapter->pdev,
1813 mbox_mem_alloc->size, &mbox_mem_alloc->dma);
1814 if (!mbox_mem_alloc->va) {
1815 be_unmap_pci_bars(adapter);
1818 mbox_mem_align->size = sizeof(struct be_mcc_mailbox);
1819 mbox_mem_align->va = PTR_ALIGN(mbox_mem_alloc->va, 16);
1820 mbox_mem_align->dma = PTR_ALIGN(mbox_mem_alloc->dma, 16);
1821 memset(mbox_mem_align->va, 0, sizeof(struct be_mcc_mailbox));
1822 spin_lock_init(&ctrl->mbox_lock);
1823 spin_lock_init(&ctrl->mcc_lock);
1824 spin_lock_init(&ctrl->mcc_cq_lock);
1826 val = ioread32(ctrl->pcicfg + PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET);
1827 ctrl->pci_func = (val >> MEMBAR_CTRL_INT_CTRL_PFUNC_SHIFT) &
1828 MEMBAR_CTRL_INT_CTRL_PFUNC_MASK;
/*
 * Free the DMA buffer of the statistics command (adapter->stats.cmd)
 * allocated by be_stats_init().
 * NOTE(review): any guard around the free is not visible here.
 */
1832 static void be_stats_cleanup(struct be_adapter *adapter)
1834 struct be_stats_obj *stats = &adapter->stats;
1835 struct be_dma_mem *cmd = &stats->cmd;
1838 pci_free_consistent(adapter->pdev, cmd->size,
/*
 * Allocate the DMA buffer used for the get-stats command; its size is
 * sizeof(struct be_cmd_req_get_stats) and it is stored in
 * adapter->stats.cmd.
 * NOTE(review): the return values are not visible here - presumably an
 * error code is returned when the allocation fails.
 */
1842 static int be_stats_init(struct be_adapter *adapter)
1844 struct be_stats_obj *stats = &adapter->stats;
1845 struct be_dma_mem *cmd = &stats->cmd;
1847 cmd->size = sizeof(struct be_cmd_req_get_stats);
1848 cmd->va = pci_alloc_consistent(adapter->pdev, cmd->size, &cmd->dma);
1849 if (cmd->va == NULL)
/*
 * PCI remove callback: tear down everything be_probe() set up.
 *
 * Unregisters the netdev, releases the statistics buffer and the control
 * structures, disables MSI-X if it was enabled, clears the driver data and
 * releases the PCI regions and device.
 * NOTE(review): further teardown between unregister_netdev() and
 * be_stats_cleanup() may exist but is not visible here.
 */
1854 static void __devexit be_remove(struct pci_dev *pdev)
1856 struct be_adapter *adapter = pci_get_drvdata(pdev);
1860 unregister_netdev(adapter->netdev);
1864 be_stats_cleanup(adapter);
1866 be_ctrl_cleanup(adapter);
1868 if (adapter->msix_enabled) {
1869 pci_disable_msix(adapter->pdev);
1870 adapter->msix_enabled = false;
1873 pci_set_drvdata(pdev, NULL);
1874 pci_release_regions(pdev);
1875 pci_disable_device(pdev);
/* adapter is the netdev's private area (netdev_priv), so this goes last */
1877 free_netdev(adapter->netdev);
/*
 * Bring the adapter firmware to a usable state: issue the POST command,
 * read the firmware version into adapter->fw_ver and query the firmware
 * configuration to obtain adapter->port_num.
 * NOTE(review): the status checks and the return statement are not
 * visible here.
 */
1880 static int be_hw_up(struct be_adapter *adapter)
1882 struct be_ctrl_info *ctrl = &adapter->ctrl;
1885 status = be_cmd_POST(ctrl);
1889 status = be_cmd_get_fw_ver(ctrl, adapter->fw_ver);
1893 status = be_cmd_query_fw_cfg(ctrl, &adapter->port_num);
/*
 * PCI probe callback: initialise one adapter and register its netdev.
 *
 * Sequence: enable the PCI device, claim its regions and enable bus
 * mastering; allocate the etherdev with struct be_adapter as private data
 * and link adapter, pdev and netdev; try to enable MSI-X; select a 64-bit
 * DMA mask (advertising NETIF_F_HIGHDMA) with a 32-bit fallback; set up
 * the control path, the statistics buffer and the firmware; read the
 * permanent MAC address into the netdev; initialise the worker and the
 * netdev; create the adapter objects with be_setup() and register the
 * netdev.
 *
 * NOTE(review): the status checks, jump labels and return statements are
 * not visible here - confirm the unwind order against them.
 */
1897 static int __devinit be_probe(struct pci_dev *pdev,
1898 const struct pci_device_id *pdev_id)
1901 struct be_adapter *adapter;
1902 struct net_device *netdev;
1903 struct be_ctrl_info *ctrl;
1906 status = pci_enable_device(pdev);
1910 status = pci_request_regions(pdev, DRV_NAME);
1913 pci_set_master(pdev);
1915 netdev = alloc_etherdev(sizeof(struct be_adapter));
1916 if (netdev == NULL) {
1920 adapter = netdev_priv(netdev);
1921 adapter->pdev = pdev;
1922 pci_set_drvdata(pdev, adapter);
1923 adapter->netdev = netdev;
1925 be_msix_enable(adapter);
/* Try a 64-bit DMA mask, then a 32-bit one */
1927 status = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1929 netdev->features |= NETIF_F_HIGHDMA;
1931 status = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1933 dev_err(&pdev->dev, "Could not set PCI DMA Mask\n");
1938 ctrl = &adapter->ctrl;
1939 status = be_ctrl_init(adapter);
1943 status = be_stats_init(adapter);
1947 status = be_hw_up(adapter);
1951 status = be_cmd_mac_addr_query(ctrl, mac, MAC_ADDRESS_TYPE_NETWORK,
1952 true /* permanent */, 0);
1955 memcpy(netdev->dev_addr, mac, ETH_ALEN);
1957 INIT_DELAYED_WORK(&adapter->work, be_worker);
1958 be_netdev_init(netdev);
1959 SET_NETDEV_DEV(netdev, &adapter->pdev->dev);
1961 status = be_setup(adapter);
1964 status = register_netdev(netdev);
1968 dev_info(&pdev->dev, "%s port %d\n", nic_name(pdev), adapter->port_num);
/*
 * The calls below release resources in reverse order of acquisition and
 * end with an "initialization failed" message - presumably the
 * error-unwind path.
 */
1974 be_stats_cleanup(adapter);
1976 be_ctrl_cleanup(adapter);
1978 free_netdev(adapter->netdev);
1980 pci_release_regions(pdev);
1982 pci_disable_device(pdev);
1984 dev_err(&pdev->dev, "%s initialization failed\n", nic_name(pdev));
/*
 * PCI suspend callback. Detaches the netdev, does extra work when the
 * interface is running, then saves the PCI state, disables the device
 * and puts it into the power state chosen by pci_choose_state() for
 * @state.
 * NOTE(review): the body of the netif_running() branch and the return
 * value are not visible here.
 */
1988 static int be_suspend(struct pci_dev *pdev, pm_message_t state)
1990 struct be_adapter *adapter = pci_get_drvdata(pdev);
1991 struct net_device *netdev = adapter->netdev;
1993 netif_device_detach(netdev);
1994 if (netif_running(netdev)) {
2001 pci_save_state(pdev);
2002 pci_disable_device(pdev);
2003 pci_set_power_state(pdev, pci_choose_state(pdev, state));
/*
 * PCI resume callback. Re-enables the PCI device, returns it to power
 * state 0 and restores the saved PCI state, does extra work when the
 * interface is running, and finally re-attaches the netdev.
 * NOTE(review): the body of the netif_running() branch, the status check
 * and the return value are not visible here.
 */
2007 static int be_resume(struct pci_dev *pdev)
2010 struct be_adapter *adapter = pci_get_drvdata(pdev);
2011 struct net_device *netdev = adapter->netdev;
/*
 * NOTE(review): be_suspend() already detaches the netdev, so this detach
 * looks redundant - confirm whether it is intentional.
 */
2013 netif_device_detach(netdev);
2015 status = pci_enable_device(pdev);
2019 pci_set_power_state(pdev, 0);
2020 pci_restore_state(pdev);
2022 if (netif_running(netdev)) {
2028 netif_device_attach(netdev);
/*
 * PCI driver descriptor registered by be_init_module(): matches the
 * devices listed in be_dev_ids and wires up the remove and suspend
 * callbacks.
 * NOTE(review): the remaining members (name, probe, resume) are not
 * visible here.
 */
2032 static struct pci_driver be_driver = {
2034 .id_table = be_dev_ids,
2036 .remove = be_remove,
2037 .suspend = be_suspend,
/*
 * Module entry point. Validates the rx_frag_size module parameter - it
 * must be 2048, 4096 or 8192 and must equal its own SKB_DATA_ALIGN()
 * value - falling back to 2048 with a warning otherwise, then registers
 * the PCI driver and returns the result of pci_register_driver().
 */
2041 static int __init be_init_module(void)
2043 if (rx_frag_size != 8192 && rx_frag_size != 4096
2044 && rx_frag_size != 2048) {
2045 printk(KERN_WARNING DRV_NAME
2046 " : Module param rx_frag_size must be 2048/4096/8192."
2048 rx_frag_size = 2048;
2050 /* Ensure rx_frag_size is aligned to cache line */
2051 if (SKB_DATA_ALIGN(rx_frag_size) != rx_frag_size) {
2052 printk(KERN_WARNING DRV_NAME
2053 " : Bad module param rx_frag_size. Using 2048\n");
2054 rx_frag_size = 2048;
2057 return pci_register_driver(&be_driver);
2059 module_init(be_init_module);
/* Module exit point: unregister the PCI driver registered at init time. */
2061 static void __exit be_exit_module(void)
2063 pci_unregister_driver(&be_driver);
2065 module_exit(be_exit_module);