1 /**************************************************************************/
3 /* IBM eServer i/pSeries Virtual Ethernet Device Driver */
4 /* Copyright (C) 2003 IBM Corp. */
5 /* Originally written by Dave Larson (larson1@us.ibm.com) */
6 /* Maintained by Santiago Leon (santil@us.ibm.com) */
8 /* This program is free software; you can redistribute it and/or modify */
9 /* it under the terms of the GNU General Public License as published by */
10 /* the Free Software Foundation; either version 2 of the License, or */
11 /* (at your option) any later version. */
13 /* This program is distributed in the hope that it will be useful, */
14 /* but WITHOUT ANY WARRANTY; without even the implied warranty of */
15 /* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the */
16 /* GNU General Public License for more details. */
18 /* You should have received a copy of the GNU General Public License */
19 /* along with this program; if not, write to the Free Software */
20 /* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 */
23 /* This module contains the implementation of a virtual ethernet device */
24 /* for use with IBM i/pSeries LPAR Linux. It utilizes the logical LAN */
25 /* option of the RS/6000 Platform Architechture to interface with virtual */
26 /* ethernet NICs that are presented to the partition by the hypervisor. */
28 /**************************************************************************/
31 - remove frag processing code - no longer needed
32 - add support for sysfs
33 - possibly remove procfs support
36 #include <linux/module.h>
37 #include <linux/types.h>
38 #include <linux/errno.h>
39 #include <linux/ioport.h>
40 #include <linux/dma-mapping.h>
41 #include <linux/kernel.h>
42 #include <linux/netdevice.h>
43 #include <linux/etherdevice.h>
44 #include <linux/skbuff.h>
45 #include <linux/init.h>
46 #include <linux/delay.h>
48 #include <linux/ethtool.h>
49 #include <linux/proc_fs.h>
50 #include <asm/semaphore.h>
51 #include <asm/hvcall.h>
52 #include <asm/atomic.h>
54 #include <asm/uaccess.h>
55 #include <linux/seq_file.h>
61 #define ibmveth_printk(fmt, args...) \
62 printk(KERN_DEBUG "%s: " fmt, __FILE__, ## args)
64 #define ibmveth_error_printk(fmt, args...) \
65 printk(KERN_ERR "(%s:%3.3d ua:%x) ERROR: " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)
68 #define ibmveth_debug_printk_no_adapter(fmt, args...) \
69 printk(KERN_DEBUG "(%s:%3.3d): " fmt, __FILE__, __LINE__ , ## args)
70 #define ibmveth_debug_printk(fmt, args...) \
71 printk(KERN_DEBUG "(%s:%3.3d ua:%x): " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)
72 #define ibmveth_assert(expr) \
74 printk(KERN_DEBUG "assertion failed (%s:%3.3d ua:%x): %s\n", __FILE__, __LINE__, adapter->vdev->unit_address, #expr); \
78 #define ibmveth_debug_printk_no_adapter(fmt, args...)
79 #define ibmveth_debug_printk(fmt, args...)
80 #define ibmveth_assert(expr)
83 static int ibmveth_open(struct net_device *dev);
84 static int ibmveth_close(struct net_device *dev);
85 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd);
86 static int ibmveth_poll(struct napi_struct *napi, int budget);
87 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *dev);
88 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev);
89 static void ibmveth_set_multicast_list(struct net_device *dev);
90 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu);
91 static void ibmveth_proc_register_driver(void);
92 static void ibmveth_proc_unregister_driver(void);
93 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter);
94 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter);
95 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
96 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter);
97 static struct kobj_type ktype_veth_pool;
100 #define IBMVETH_PROC_DIR "net/ibmveth"
101 static struct proc_dir_entry *ibmveth_proc_dir;
104 static const char ibmveth_driver_name[] = "ibmveth";
105 static const char ibmveth_driver_string[] = "IBM i/pSeries Virtual Ethernet Driver";
106 #define ibmveth_driver_version "1.03"
108 MODULE_AUTHOR("Santiago Leon <santil@us.ibm.com>");
109 MODULE_DESCRIPTION("IBM i/pSeries Virtual Ethernet Driver");
110 MODULE_LICENSE("GPL");
111 MODULE_VERSION(ibmveth_driver_version);
113 /* simple methods of getting data from the current rxq entry */
114 static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
116 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].toggle == adapter->rx_queue.toggle);
119 static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
121 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].valid);
124 static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
126 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].offset);
129 static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
131 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
134 /* setup the initial settings for a buffer pool */
135 static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool, u32 pool_index, u32 pool_size, u32 buff_size, u32 pool_active)
137 pool->size = pool_size;
138 pool->index = pool_index;
139 pool->buff_size = buff_size;
140 pool->threshold = pool_size / 2;
141 pool->active = pool_active;
144 /* allocate and setup an buffer pool - called during open */
145 static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
149 pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL);
151 if(!pool->free_map) {
155 pool->dma_addr = kmalloc(sizeof(dma_addr_t) * pool->size, GFP_KERNEL);
156 if(!pool->dma_addr) {
157 kfree(pool->free_map);
158 pool->free_map = NULL;
162 pool->skbuff = kmalloc(sizeof(void*) * pool->size, GFP_KERNEL);
165 kfree(pool->dma_addr);
166 pool->dma_addr = NULL;
168 kfree(pool->free_map);
169 pool->free_map = NULL;
173 memset(pool->skbuff, 0, sizeof(void*) * pool->size);
174 memset(pool->dma_addr, 0, sizeof(dma_addr_t) * pool->size);
176 for(i = 0; i < pool->size; ++i) {
177 pool->free_map[i] = i;
180 atomic_set(&pool->available, 0);
181 pool->producer_index = 0;
182 pool->consumer_index = 0;
187 /* replenish the buffers for a pool. note that we don't need to
188 * skb_reserve these since they are used for incoming...
190 static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
193 u32 count = pool->size - atomic_read(&pool->available);
194 u32 buffers_added = 0;
198 for(i = 0; i < count; ++i) {
200 unsigned int free_index, index;
202 union ibmveth_buf_desc desc;
203 unsigned long lpar_rc;
206 skb = alloc_skb(pool->buff_size, GFP_ATOMIC);
209 ibmveth_debug_printk("replenish: unable to allocate skb\n");
210 adapter->replenish_no_mem++;
214 free_index = pool->consumer_index;
215 pool->consumer_index = (pool->consumer_index + 1) % pool->size;
216 index = pool->free_map[free_index];
218 ibmveth_assert(index != IBM_VETH_INVALID_MAP);
219 ibmveth_assert(pool->skbuff[index] == NULL);
221 dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
222 pool->buff_size, DMA_FROM_DEVICE);
224 pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
225 pool->dma_addr[index] = dma_addr;
226 pool->skbuff[index] = skb;
228 correlator = ((u64)pool->index << 32) | index;
229 *(u64*)skb->data = correlator;
232 desc.fields.valid = 1;
233 desc.fields.length = pool->buff_size;
234 desc.fields.address = dma_addr;
236 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
238 if(lpar_rc != H_SUCCESS) {
239 pool->free_map[free_index] = index;
240 pool->skbuff[index] = NULL;
241 if (pool->consumer_index == 0)
242 pool->consumer_index = pool->size - 1;
244 pool->consumer_index--;
245 dma_unmap_single(&adapter->vdev->dev,
246 pool->dma_addr[index], pool->buff_size,
248 dev_kfree_skb_any(skb);
249 adapter->replenish_add_buff_failure++;
253 adapter->replenish_add_buff_success++;
258 atomic_add(buffers_added, &(pool->available));
261 /* replenish routine */
262 static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
266 adapter->replenish_task_cycles++;
268 for(i = 0; i < IbmVethNumBufferPools; i++)
269 if(adapter->rx_buff_pool[i].active)
270 ibmveth_replenish_buffer_pool(adapter,
271 &adapter->rx_buff_pool[i]);
273 adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
276 /* empty and free ana buffer pool - also used to do cleanup in error paths */
277 static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
281 kfree(pool->free_map);
282 pool->free_map = NULL;
284 if(pool->skbuff && pool->dma_addr) {
285 for(i = 0; i < pool->size; ++i) {
286 struct sk_buff *skb = pool->skbuff[i];
288 dma_unmap_single(&adapter->vdev->dev,
292 dev_kfree_skb_any(skb);
293 pool->skbuff[i] = NULL;
299 kfree(pool->dma_addr);
300 pool->dma_addr = NULL;
309 /* remove a buffer from a pool */
310 static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter, u64 correlator)
312 unsigned int pool = correlator >> 32;
313 unsigned int index = correlator & 0xffffffffUL;
314 unsigned int free_index;
317 ibmveth_assert(pool < IbmVethNumBufferPools);
318 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
320 skb = adapter->rx_buff_pool[pool].skbuff[index];
322 ibmveth_assert(skb != NULL);
324 adapter->rx_buff_pool[pool].skbuff[index] = NULL;
326 dma_unmap_single(&adapter->vdev->dev,
327 adapter->rx_buff_pool[pool].dma_addr[index],
328 adapter->rx_buff_pool[pool].buff_size,
331 free_index = adapter->rx_buff_pool[pool].producer_index;
332 adapter->rx_buff_pool[pool].producer_index
333 = (adapter->rx_buff_pool[pool].producer_index + 1)
334 % adapter->rx_buff_pool[pool].size;
335 adapter->rx_buff_pool[pool].free_map[free_index] = index;
339 atomic_dec(&(adapter->rx_buff_pool[pool].available));
342 /* get the current buffer on the rx queue */
343 static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
345 u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
346 unsigned int pool = correlator >> 32;
347 unsigned int index = correlator & 0xffffffffUL;
349 ibmveth_assert(pool < IbmVethNumBufferPools);
350 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
352 return adapter->rx_buff_pool[pool].skbuff[index];
355 /* recycle the current buffer on the rx queue */
356 static void ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
358 u32 q_index = adapter->rx_queue.index;
359 u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
360 unsigned int pool = correlator >> 32;
361 unsigned int index = correlator & 0xffffffffUL;
362 union ibmveth_buf_desc desc;
363 unsigned long lpar_rc;
365 ibmveth_assert(pool < IbmVethNumBufferPools);
366 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
368 if(!adapter->rx_buff_pool[pool].active) {
369 ibmveth_rxq_harvest_buffer(adapter);
370 ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]);
375 desc.fields.valid = 1;
376 desc.fields.length = adapter->rx_buff_pool[pool].buff_size;
377 desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
379 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
381 if(lpar_rc != H_SUCCESS) {
382 ibmveth_debug_printk("h_add_logical_lan_buffer failed during recycle rc=%ld", lpar_rc);
383 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
386 if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
387 adapter->rx_queue.index = 0;
388 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
392 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
394 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
396 if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
397 adapter->rx_queue.index = 0;
398 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
402 static void ibmveth_cleanup(struct ibmveth_adapter *adapter)
406 if(adapter->buffer_list_addr != NULL) {
407 if(!dma_mapping_error(adapter->buffer_list_dma)) {
408 dma_unmap_single(&adapter->vdev->dev,
409 adapter->buffer_list_dma, 4096,
411 adapter->buffer_list_dma = DMA_ERROR_CODE;
413 free_page((unsigned long)adapter->buffer_list_addr);
414 adapter->buffer_list_addr = NULL;
417 if(adapter->filter_list_addr != NULL) {
418 if(!dma_mapping_error(adapter->filter_list_dma)) {
419 dma_unmap_single(&adapter->vdev->dev,
420 adapter->filter_list_dma, 4096,
422 adapter->filter_list_dma = DMA_ERROR_CODE;
424 free_page((unsigned long)adapter->filter_list_addr);
425 adapter->filter_list_addr = NULL;
428 if(adapter->rx_queue.queue_addr != NULL) {
429 if(!dma_mapping_error(adapter->rx_queue.queue_dma)) {
430 dma_unmap_single(&adapter->vdev->dev,
431 adapter->rx_queue.queue_dma,
432 adapter->rx_queue.queue_len,
434 adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
436 kfree(adapter->rx_queue.queue_addr);
437 adapter->rx_queue.queue_addr = NULL;
440 for(i = 0; i<IbmVethNumBufferPools; i++)
441 if (adapter->rx_buff_pool[i].active)
442 ibmveth_free_buffer_pool(adapter,
443 &adapter->rx_buff_pool[i]);
446 static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
447 union ibmveth_buf_desc rxq_desc, u64 mac_address)
449 int rc, try_again = 1;
451 /* After a kexec the adapter will still be open, so our attempt to
452 * open it will fail. So if we get a failure we free the adapter and
453 * try again, but only once. */
455 rc = h_register_logical_lan(adapter->vdev->unit_address,
456 adapter->buffer_list_dma, rxq_desc.desc,
457 adapter->filter_list_dma, mac_address);
459 if (rc != H_SUCCESS && try_again) {
461 rc = h_free_logical_lan(adapter->vdev->unit_address);
462 } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
471 static int ibmveth_open(struct net_device *netdev)
473 struct ibmveth_adapter *adapter = netdev->priv;
476 unsigned long lpar_rc;
478 union ibmveth_buf_desc rxq_desc;
481 ibmveth_debug_printk("open starting\n");
483 napi_enable(&adapter->napi);
485 for(i = 0; i<IbmVethNumBufferPools; i++)
486 rxq_entries += adapter->rx_buff_pool[i].size;
488 adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
489 adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
491 if(!adapter->buffer_list_addr || !adapter->filter_list_addr) {
492 ibmveth_error_printk("unable to allocate filter or buffer list pages\n");
493 ibmveth_cleanup(adapter);
494 napi_disable(&adapter->napi);
498 adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) * rxq_entries;
499 adapter->rx_queue.queue_addr = kmalloc(adapter->rx_queue.queue_len, GFP_KERNEL);
501 if(!adapter->rx_queue.queue_addr) {
502 ibmveth_error_printk("unable to allocate rx queue pages\n");
503 ibmveth_cleanup(adapter);
504 napi_disable(&adapter->napi);
508 adapter->buffer_list_dma = dma_map_single(&adapter->vdev->dev,
509 adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
510 adapter->filter_list_dma = dma_map_single(&adapter->vdev->dev,
511 adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
512 adapter->rx_queue.queue_dma = dma_map_single(&adapter->vdev->dev,
513 adapter->rx_queue.queue_addr,
514 adapter->rx_queue.queue_len, DMA_BIDIRECTIONAL);
516 if((dma_mapping_error(adapter->buffer_list_dma) ) ||
517 (dma_mapping_error(adapter->filter_list_dma)) ||
518 (dma_mapping_error(adapter->rx_queue.queue_dma))) {
519 ibmveth_error_printk("unable to map filter or buffer list pages\n");
520 ibmveth_cleanup(adapter);
521 napi_disable(&adapter->napi);
525 adapter->rx_queue.index = 0;
526 adapter->rx_queue.num_slots = rxq_entries;
527 adapter->rx_queue.toggle = 1;
529 memcpy(&mac_address, netdev->dev_addr, netdev->addr_len);
530 mac_address = mac_address >> 16;
533 rxq_desc.fields.valid = 1;
534 rxq_desc.fields.length = adapter->rx_queue.queue_len;
535 rxq_desc.fields.address = adapter->rx_queue.queue_dma;
537 ibmveth_debug_printk("buffer list @ 0x%p\n", adapter->buffer_list_addr);
538 ibmveth_debug_printk("filter list @ 0x%p\n", adapter->filter_list_addr);
539 ibmveth_debug_printk("receive q @ 0x%p\n", adapter->rx_queue.queue_addr);
541 h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
543 lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
545 if(lpar_rc != H_SUCCESS) {
546 ibmveth_error_printk("h_register_logical_lan failed with %ld\n", lpar_rc);
547 ibmveth_error_printk("buffer TCE:0x%lx filter TCE:0x%lx rxq desc:0x%lx MAC:0x%lx\n",
548 adapter->buffer_list_dma,
549 adapter->filter_list_dma,
552 ibmveth_cleanup(adapter);
553 napi_disable(&adapter->napi);
557 for(i = 0; i<IbmVethNumBufferPools; i++) {
558 if(!adapter->rx_buff_pool[i].active)
560 if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
561 ibmveth_error_printk("unable to alloc pool\n");
562 adapter->rx_buff_pool[i].active = 0;
563 ibmveth_cleanup(adapter);
564 napi_disable(&adapter->napi);
569 ibmveth_debug_printk("registering irq 0x%x\n", netdev->irq);
570 if((rc = request_irq(netdev->irq, &ibmveth_interrupt, 0, netdev->name, netdev)) != 0) {
571 ibmveth_error_printk("unable to request irq 0x%x, rc %d\n", netdev->irq, rc);
573 rc = h_free_logical_lan(adapter->vdev->unit_address);
574 } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
576 ibmveth_cleanup(adapter);
577 napi_disable(&adapter->napi);
581 ibmveth_debug_printk("initial replenish cycle\n");
582 ibmveth_interrupt(netdev->irq, netdev);
584 netif_start_queue(netdev);
586 ibmveth_debug_printk("open complete\n");
591 static int ibmveth_close(struct net_device *netdev)
593 struct ibmveth_adapter *adapter = netdev->priv;
596 ibmveth_debug_printk("close starting\n");
598 napi_disable(&adapter->napi);
600 if (!adapter->pool_config)
601 netif_stop_queue(netdev);
603 free_irq(netdev->irq, netdev);
606 lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
607 } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
609 if(lpar_rc != H_SUCCESS)
611 ibmveth_error_printk("h_free_logical_lan failed with %lx, continuing with close\n",
615 adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
617 ibmveth_cleanup(adapter);
619 ibmveth_debug_printk("close complete\n");
624 static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd) {
625 cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg | SUPPORTED_FIBRE);
626 cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg | ADVERTISED_FIBRE);
627 cmd->speed = SPEED_1000;
628 cmd->duplex = DUPLEX_FULL;
629 cmd->port = PORT_FIBRE;
630 cmd->phy_address = 0;
631 cmd->transceiver = XCVR_INTERNAL;
632 cmd->autoneg = AUTONEG_ENABLE;
638 static void netdev_get_drvinfo (struct net_device *dev, struct ethtool_drvinfo *info) {
639 strncpy(info->driver, ibmveth_driver_name, sizeof(info->driver) - 1);
640 strncpy(info->version, ibmveth_driver_version, sizeof(info->version) - 1);
643 static u32 netdev_get_link(struct net_device *dev) {
647 static const struct ethtool_ops netdev_ethtool_ops = {
648 .get_drvinfo = netdev_get_drvinfo,
649 .get_settings = netdev_get_settings,
650 .get_link = netdev_get_link,
651 .get_sg = ethtool_op_get_sg,
652 .get_tx_csum = ethtool_op_get_tx_csum,
655 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
660 #define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1))
662 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *netdev)
664 struct ibmveth_adapter *adapter = netdev->priv;
665 union ibmveth_buf_desc desc[IbmVethMaxSendFrags];
666 unsigned long lpar_rc;
667 int nfrags = 0, curfrag;
668 unsigned long correlator;
670 unsigned int retry_count;
671 unsigned int tx_dropped = 0;
672 unsigned int tx_bytes = 0;
673 unsigned int tx_packets = 0;
674 unsigned int tx_send_failed = 0;
675 unsigned int tx_map_failed = 0;
678 if ((skb_shinfo(skb)->nr_frags + 1) > IbmVethMaxSendFrags) {
683 memset(&desc, 0, sizeof(desc));
685 /* nfrags = number of frags after the initial fragment */
686 nfrags = skb_shinfo(skb)->nr_frags;
689 adapter->tx_multidesc_send++;
691 /* map the initial fragment */
692 desc[0].fields.length = nfrags ? skb->len - skb->data_len : skb->len;
693 desc[0].fields.address = dma_map_single(&adapter->vdev->dev, skb->data,
694 desc[0].fields.length, DMA_TO_DEVICE);
695 desc[0].fields.valid = 1;
697 if(dma_mapping_error(desc[0].fields.address)) {
698 ibmveth_error_printk("tx: unable to map initial fragment\n");
706 /* map fragments past the initial portion if there are any */
708 skb_frag_t *frag = &skb_shinfo(skb)->frags[curfrag];
709 desc[curfrag+1].fields.address
710 = dma_map_single(&adapter->vdev->dev,
711 page_address(frag->page) + frag->page_offset,
712 frag->size, DMA_TO_DEVICE);
713 desc[curfrag+1].fields.length = frag->size;
714 desc[curfrag+1].fields.valid = 1;
716 if(dma_mapping_error(desc[curfrag+1].fields.address)) {
717 ibmveth_error_printk("tx: unable to map fragment %d\n", curfrag);
720 /* Free all the mappings we just created */
721 while(curfrag < nfrags) {
722 dma_unmap_single(&adapter->vdev->dev,
723 desc[curfrag+1].fields.address,
724 desc[curfrag+1].fields.length,
732 /* send the frame. Arbitrarily set retrycount to 1024 */
736 lpar_rc = h_send_logical_lan(adapter->vdev->unit_address,
745 } while ((lpar_rc == H_BUSY) && (retry_count--));
747 if(lpar_rc != H_SUCCESS && lpar_rc != H_DROPPED) {
749 ibmveth_error_printk("tx: h_send_logical_lan failed with rc=%ld\n", lpar_rc);
750 for(i = 0; i < 6; i++) {
751 ibmveth_error_printk("tx: desc[%i] valid=%d, len=%d, address=0x%d\n", i,
752 desc[i].fields.valid, desc[i].fields.length, desc[i].fields.address);
758 tx_bytes += skb->len;
759 netdev->trans_start = jiffies;
763 dma_unmap_single(&adapter->vdev->dev,
764 desc[nfrags].fields.address,
765 desc[nfrags].fields.length, DMA_TO_DEVICE);
766 } while(--nfrags >= 0);
768 out: spin_lock_irqsave(&adapter->stats_lock, flags);
769 adapter->stats.tx_dropped += tx_dropped;
770 adapter->stats.tx_bytes += tx_bytes;
771 adapter->stats.tx_packets += tx_packets;
772 adapter->tx_send_failed += tx_send_failed;
773 adapter->tx_map_failed += tx_map_failed;
774 spin_unlock_irqrestore(&adapter->stats_lock, flags);
780 static int ibmveth_poll(struct napi_struct *napi, int budget)
782 struct ibmveth_adapter *adapter = container_of(napi, struct ibmveth_adapter, napi);
783 struct net_device *netdev = adapter->netdev;
784 int frames_processed = 0;
785 unsigned long lpar_rc;
791 if (!ibmveth_rxq_pending_buffer(adapter))
795 if (!ibmveth_rxq_buffer_valid(adapter)) {
796 wmb(); /* suggested by larson1 */
797 adapter->rx_invalid_buffer++;
798 ibmveth_debug_printk("recycling invalid buffer\n");
799 ibmveth_rxq_recycle_buffer(adapter);
801 int length = ibmveth_rxq_frame_length(adapter);
802 int offset = ibmveth_rxq_frame_offset(adapter);
803 skb = ibmveth_rxq_get_buffer(adapter);
805 ibmveth_rxq_harvest_buffer(adapter);
807 skb_reserve(skb, offset);
808 skb_put(skb, length);
809 skb->protocol = eth_type_trans(skb, netdev);
811 netif_receive_skb(skb); /* send it up */
813 adapter->stats.rx_packets++;
814 adapter->stats.rx_bytes += length;
816 netdev->last_rx = jiffies;
818 } while (frames_processed < budget);
820 ibmveth_replenish_task(adapter);
822 if (frames_processed < budget) {
823 /* We think we are done - reenable interrupts,
824 * then check once more to make sure we are done.
826 lpar_rc = h_vio_signal(adapter->vdev->unit_address,
829 ibmveth_assert(lpar_rc == H_SUCCESS);
831 netif_rx_complete(netdev, napi);
833 if (ibmveth_rxq_pending_buffer(adapter) &&
834 netif_rx_reschedule(netdev, napi)) {
835 lpar_rc = h_vio_signal(adapter->vdev->unit_address,
841 return frames_processed;
844 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
846 struct net_device *netdev = dev_instance;
847 struct ibmveth_adapter *adapter = netdev->priv;
848 unsigned long lpar_rc;
850 if (netif_rx_schedule_prep(netdev, &adapter->napi)) {
851 lpar_rc = h_vio_signal(adapter->vdev->unit_address,
853 ibmveth_assert(lpar_rc == H_SUCCESS);
854 __netif_rx_schedule(netdev, &adapter->napi);
859 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev)
861 struct ibmveth_adapter *adapter = dev->priv;
862 return &adapter->stats;
865 static void ibmveth_set_multicast_list(struct net_device *netdev)
867 struct ibmveth_adapter *adapter = netdev->priv;
868 unsigned long lpar_rc;
870 if((netdev->flags & IFF_PROMISC) || (netdev->mc_count > adapter->mcastFilterSize)) {
871 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
872 IbmVethMcastEnableRecv |
873 IbmVethMcastDisableFiltering,
875 if(lpar_rc != H_SUCCESS) {
876 ibmveth_error_printk("h_multicast_ctrl rc=%ld when entering promisc mode\n", lpar_rc);
879 struct dev_mc_list *mclist = netdev->mc_list;
881 /* clear the filter table & disable filtering */
882 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
883 IbmVethMcastEnableRecv |
884 IbmVethMcastDisableFiltering |
885 IbmVethMcastClearFilterTable,
887 if(lpar_rc != H_SUCCESS) {
888 ibmveth_error_printk("h_multicast_ctrl rc=%ld when attempting to clear filter table\n", lpar_rc);
890 /* add the addresses to the filter table */
891 for(i = 0; i < netdev->mc_count; ++i, mclist = mclist->next) {
892 // add the multicast address to the filter table
893 unsigned long mcast_addr = 0;
894 memcpy(((char *)&mcast_addr)+2, mclist->dmi_addr, 6);
895 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
896 IbmVethMcastAddFilter,
898 if(lpar_rc != H_SUCCESS) {
899 ibmveth_error_printk("h_multicast_ctrl rc=%ld when adding an entry to the filter table\n", lpar_rc);
903 /* re-enable filtering */
904 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
905 IbmVethMcastEnableFiltering,
907 if(lpar_rc != H_SUCCESS) {
908 ibmveth_error_printk("h_multicast_ctrl rc=%ld when enabling filtering\n", lpar_rc);
913 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
915 struct ibmveth_adapter *adapter = dev->priv;
916 int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
920 if (new_mtu < IBMVETH_MAX_MTU)
923 for (i = 0; i < IbmVethNumBufferPools; i++)
924 if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size)
927 if (i == IbmVethNumBufferPools)
930 /* Look for an active buffer pool that can hold the new MTU */
931 for(i = 0; i<IbmVethNumBufferPools; i++) {
932 if (!adapter->rx_buff_pool[i].active) {
933 adapter->rx_buff_pool[i].active = 1;
937 if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size) {
938 if (reinit && netif_running(adapter->netdev)) {
939 adapter->pool_config = 1;
940 ibmveth_close(adapter->netdev);
941 adapter->pool_config = 0;
943 if ((rc = ibmveth_open(adapter->netdev)))
953 #ifdef CONFIG_NET_POLL_CONTROLLER
954 static void ibmveth_poll_controller(struct net_device *dev)
956 ibmveth_replenish_task(dev->priv);
957 ibmveth_interrupt(dev->irq, dev);
961 static int __devinit ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
964 struct net_device *netdev;
965 struct ibmveth_adapter *adapter;
967 unsigned char *mac_addr_p;
968 unsigned int *mcastFilterSize_p;
971 ibmveth_debug_printk_no_adapter("entering ibmveth_probe for UA 0x%x\n",
974 mac_addr_p = (unsigned char *) vio_get_attribute(dev,
975 VETH_MAC_ADDR, NULL);
977 printk(KERN_ERR "(%s:%3.3d) ERROR: Can't find VETH_MAC_ADDR "
978 "attribute\n", __FILE__, __LINE__);
982 mcastFilterSize_p = (unsigned int *) vio_get_attribute(dev,
983 VETH_MCAST_FILTER_SIZE, NULL);
984 if(!mcastFilterSize_p) {
985 printk(KERN_ERR "(%s:%3.3d) ERROR: Can't find "
986 "VETH_MCAST_FILTER_SIZE attribute\n",
991 netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
996 SET_MODULE_OWNER(netdev);
998 adapter = netdev->priv;
999 dev->dev.driver_data = netdev;
1001 adapter->vdev = dev;
1002 adapter->netdev = netdev;
1003 adapter->mcastFilterSize= *mcastFilterSize_p;
1004 adapter->pool_config = 0;
1006 netif_napi_add(netdev, &adapter->napi, ibmveth_poll, 16);
1008 /* Some older boxes running PHYP non-natively have an OF that
1009 returns a 8-byte local-mac-address field (and the first
1010 2 bytes have to be ignored) while newer boxes' OF return
1011 a 6-byte field. Note that IEEE 1275 specifies that
1012 local-mac-address must be a 6-byte field.
1013 The RPA doc specifies that the first byte must be 10b, so
1014 we'll just look for it to solve this 8 vs. 6 byte field issue */
1016 if ((*mac_addr_p & 0x3) != 0x02)
1019 adapter->mac_addr = 0;
1020 memcpy(&adapter->mac_addr, mac_addr_p, 6);
1022 netdev->irq = dev->irq;
1023 netdev->open = ibmveth_open;
1024 netdev->stop = ibmveth_close;
1025 netdev->hard_start_xmit = ibmveth_start_xmit;
1026 netdev->get_stats = ibmveth_get_stats;
1027 netdev->set_multicast_list = ibmveth_set_multicast_list;
1028 netdev->do_ioctl = ibmveth_ioctl;
1029 netdev->ethtool_ops = &netdev_ethtool_ops;
1030 netdev->change_mtu = ibmveth_change_mtu;
1031 SET_NETDEV_DEV(netdev, &dev->dev);
1032 #ifdef CONFIG_NET_POLL_CONTROLLER
1033 netdev->poll_controller = ibmveth_poll_controller;
1035 netdev->features |= NETIF_F_LLTX;
1036 spin_lock_init(&adapter->stats_lock);
1038 memcpy(&netdev->dev_addr, &adapter->mac_addr, netdev->addr_len);
1040 for(i = 0; i<IbmVethNumBufferPools; i++) {
1041 struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
1042 ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
1043 pool_count[i], pool_size[i],
1045 kobj->parent = &dev->dev.kobj;
1046 sprintf(kobj->name, "pool%d", i);
1047 kobj->ktype = &ktype_veth_pool;
1048 kobject_register(kobj);
1051 ibmveth_debug_printk("adapter @ 0x%p\n", adapter);
1053 adapter->buffer_list_dma = DMA_ERROR_CODE;
1054 adapter->filter_list_dma = DMA_ERROR_CODE;
1055 adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
1057 ibmveth_debug_printk("registering netdev...\n");
1059 rc = register_netdev(netdev);
1062 ibmveth_debug_printk("failed to register netdev rc=%d\n", rc);
1063 free_netdev(netdev);
1067 ibmveth_debug_printk("registered\n");
1069 ibmveth_proc_register_adapter(adapter);
1074 static int __devexit ibmveth_remove(struct vio_dev *dev)
1076 struct net_device *netdev = dev->dev.driver_data;
1077 struct ibmveth_adapter *adapter = netdev->priv;
1080 for(i = 0; i<IbmVethNumBufferPools; i++)
1081 kobject_unregister(&adapter->rx_buff_pool[i].kobj);
1083 unregister_netdev(netdev);
1085 ibmveth_proc_unregister_adapter(adapter);
1087 free_netdev(netdev);
1091 #ifdef CONFIG_PROC_FS
1092 static void ibmveth_proc_register_driver(void)
1094 ibmveth_proc_dir = proc_mkdir(IBMVETH_PROC_DIR, NULL);
1095 if (ibmveth_proc_dir) {
1096 SET_MODULE_OWNER(ibmveth_proc_dir);
1100 static void ibmveth_proc_unregister_driver(void)
1102 remove_proc_entry(IBMVETH_PROC_DIR, NULL);
1105 static void *ibmveth_seq_start(struct seq_file *seq, loff_t *pos)
1114 static void *ibmveth_seq_next(struct seq_file *seq, void *v, loff_t *pos)
1120 static void ibmveth_seq_stop(struct seq_file *seq, void *v)
1124 static int ibmveth_seq_show(struct seq_file *seq, void *v)
1126 struct ibmveth_adapter *adapter = seq->private;
1127 char *current_mac = ((char*) &adapter->netdev->dev_addr);
1128 char *firmware_mac = ((char*) &adapter->mac_addr) ;
1130 seq_printf(seq, "%s %s\n\n", ibmveth_driver_string, ibmveth_driver_version);
1132 seq_printf(seq, "Unit Address: 0x%x\n", adapter->vdev->unit_address);
1133 seq_printf(seq, "Current MAC: %02X:%02X:%02X:%02X:%02X:%02X\n",
1134 current_mac[0], current_mac[1], current_mac[2],
1135 current_mac[3], current_mac[4], current_mac[5]);
1136 seq_printf(seq, "Firmware MAC: %02X:%02X:%02X:%02X:%02X:%02X\n",
1137 firmware_mac[0], firmware_mac[1], firmware_mac[2],
1138 firmware_mac[3], firmware_mac[4], firmware_mac[5]);
1140 seq_printf(seq, "\nAdapter Statistics:\n");
1141 seq_printf(seq, " TX: skbuffs linearized: %ld\n", adapter->tx_linearized);
1142 seq_printf(seq, " multi-descriptor sends: %ld\n", adapter->tx_multidesc_send);
1143 seq_printf(seq, " skb_linearize failures: %ld\n", adapter->tx_linearize_failed);
1144 seq_printf(seq, " vio_map_single failres: %ld\n", adapter->tx_map_failed);
1145 seq_printf(seq, " send failures: %ld\n", adapter->tx_send_failed);
1146 seq_printf(seq, " RX: replenish task cycles: %ld\n", adapter->replenish_task_cycles);
1147 seq_printf(seq, " alloc_skb_failures: %ld\n", adapter->replenish_no_mem);
1148 seq_printf(seq, " add buffer failures: %ld\n", adapter->replenish_add_buff_failure);
1149 seq_printf(seq, " invalid buffers: %ld\n", adapter->rx_invalid_buffer);
1150 seq_printf(seq, " no buffers: %ld\n", adapter->rx_no_buffer);
1154 static struct seq_operations ibmveth_seq_ops = {
1155 .start = ibmveth_seq_start,
1156 .next = ibmveth_seq_next,
1157 .stop = ibmveth_seq_stop,
1158 .show = ibmveth_seq_show,
1161 static int ibmveth_proc_open(struct inode *inode, struct file *file)
1163 struct seq_file *seq;
1164 struct proc_dir_entry *proc;
1167 rc = seq_open(file, &ibmveth_seq_ops);
1169 /* recover the pointer buried in proc_dir_entry data */
1170 seq = file->private_data;
1172 seq->private = proc->data;
1177 static const struct file_operations ibmveth_proc_fops = {
1178 .owner = THIS_MODULE,
1179 .open = ibmveth_proc_open,
1181 .llseek = seq_lseek,
1182 .release = seq_release,
1185 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter)
1187 struct proc_dir_entry *entry;
1188 if (ibmveth_proc_dir) {
1190 sprintf(u_addr, "%x", adapter->vdev->unit_address);
1191 entry = create_proc_entry(u_addr, S_IFREG, ibmveth_proc_dir);
1193 ibmveth_error_printk("Cannot create adapter proc entry");
1195 entry->data = (void *) adapter;
1196 entry->proc_fops = &ibmveth_proc_fops;
1197 SET_MODULE_OWNER(entry);
1203 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter)
1205 if (ibmveth_proc_dir) {
1207 sprintf(u_addr, "%x", adapter->vdev->unit_address);
1208 remove_proc_entry(u_addr, ibmveth_proc_dir);
1212 #else /* CONFIG_PROC_FS */
1213 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter)
1217 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter)
1220 static void ibmveth_proc_register_driver(void)
1224 static void ibmveth_proc_unregister_driver(void)
1227 #endif /* CONFIG_PROC_FS */
1229 static struct attribute veth_active_attr;
1230 static struct attribute veth_num_attr;
1231 static struct attribute veth_size_attr;
1233 static ssize_t veth_pool_show(struct kobject * kobj,
1234 struct attribute * attr, char * buf)
1236 struct ibmveth_buff_pool *pool = container_of(kobj,
1237 struct ibmveth_buff_pool,
1240 if (attr == &veth_active_attr)
1241 return sprintf(buf, "%d\n", pool->active);
1242 else if (attr == &veth_num_attr)
1243 return sprintf(buf, "%d\n", pool->size);
1244 else if (attr == &veth_size_attr)
1245 return sprintf(buf, "%d\n", pool->buff_size);
1249 static ssize_t veth_pool_store(struct kobject * kobj, struct attribute * attr,
1250 const char * buf, size_t count)
1252 struct ibmveth_buff_pool *pool = container_of(kobj,
1253 struct ibmveth_buff_pool,
1255 struct net_device *netdev =
1256 container_of(kobj->parent, struct device, kobj)->driver_data;
1257 struct ibmveth_adapter *adapter = netdev->priv;
1258 long value = simple_strtol(buf, NULL, 10);
1261 if (attr == &veth_active_attr) {
1262 if (value && !pool->active) {
1263 if (netif_running(netdev)) {
1264 if(ibmveth_alloc_buffer_pool(pool)) {
1265 ibmveth_error_printk("unable to alloc pool\n");
1269 adapter->pool_config = 1;
1270 ibmveth_close(netdev);
1271 adapter->pool_config = 0;
1272 if ((rc = ibmveth_open(netdev)))
1276 } else if (!value && pool->active) {
1277 int mtu = netdev->mtu + IBMVETH_BUFF_OH;
1279 /* Make sure there is a buffer pool with buffers that
1280 can hold a packet of the size of the MTU */
1281 for (i = 0; i < IbmVethNumBufferPools; i++) {
1282 if (pool == &adapter->rx_buff_pool[i])
1284 if (!adapter->rx_buff_pool[i].active)
1286 if (mtu <= adapter->rx_buff_pool[i].buff_size)
1290 if (i == IbmVethNumBufferPools) {
1291 ibmveth_error_printk("no active pool >= MTU\n");
1296 if (netif_running(netdev)) {
1297 adapter->pool_config = 1;
1298 ibmveth_close(netdev);
1299 adapter->pool_config = 0;
1300 if ((rc = ibmveth_open(netdev)))
1304 } else if (attr == &veth_num_attr) {
1305 if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT)
1308 if (netif_running(netdev)) {
1309 adapter->pool_config = 1;
1310 ibmveth_close(netdev);
1311 adapter->pool_config = 0;
1313 if ((rc = ibmveth_open(netdev)))
1318 } else if (attr == &veth_size_attr) {
1319 if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE)
1322 if (netif_running(netdev)) {
1323 adapter->pool_config = 1;
1324 ibmveth_close(netdev);
1325 adapter->pool_config = 0;
1326 pool->buff_size = value;
1327 if ((rc = ibmveth_open(netdev)))
1330 pool->buff_size = value;
1334 /* kick the interrupt handler to allocate/deallocate pools */
1335 ibmveth_interrupt(netdev->irq, netdev);
1340 #define ATTR(_name, _mode) \
1341 struct attribute veth_##_name##_attr = { \
1342 .name = __stringify(_name), .mode = _mode, \
1345 static ATTR(active, 0644);
1346 static ATTR(num, 0644);
1347 static ATTR(size, 0644);
1349 static struct attribute * veth_pool_attrs[] = {
1356 static struct sysfs_ops veth_pool_ops = {
1357 .show = veth_pool_show,
1358 .store = veth_pool_store,
1361 static struct kobj_type ktype_veth_pool = {
1363 .sysfs_ops = &veth_pool_ops,
1364 .default_attrs = veth_pool_attrs,
1368 static struct vio_device_id ibmveth_device_table[] __devinitdata= {
1369 { "network", "IBM,l-lan"},
1372 MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
1374 static struct vio_driver ibmveth_driver = {
1375 .id_table = ibmveth_device_table,
1376 .probe = ibmveth_probe,
1377 .remove = ibmveth_remove,
1379 .name = ibmveth_driver_name,
1380 .owner = THIS_MODULE,
1384 static int __init ibmveth_module_init(void)
1386 ibmveth_printk("%s: %s %s\n", ibmveth_driver_name, ibmveth_driver_string, ibmveth_driver_version);
1388 ibmveth_proc_register_driver();
1390 return vio_register_driver(&ibmveth_driver);
1393 static void __exit ibmveth_module_exit(void)
1395 vio_unregister_driver(&ibmveth_driver);
1396 ibmveth_proc_unregister_driver();
1399 module_init(ibmveth_module_init);
1400 module_exit(ibmveth_module_exit);