1 /**************************************************************************/
3 /* IBM eServer i/pSeries Virtual Ethernet Device Driver */
4 /* Copyright (C) 2003 IBM Corp. */
5 /* Originally written by Dave Larson (larson1@us.ibm.com) */
6 /* Maintained by Santiago Leon (santil@us.ibm.com) */
8 /* This program is free software; you can redistribute it and/or modify */
9 /* it under the terms of the GNU General Public License as published by */
10 /* the Free Software Foundation; either version 2 of the License, or */
11 /* (at your option) any later version. */
13 /* This program is distributed in the hope that it will be useful, */
14 /* but WITHOUT ANY WARRANTY; without even the implied warranty of */
15 /* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the */
16 /* GNU General Public License for more details. */
18 /* You should have received a copy of the GNU General Public License */
19 /* along with this program; if not, write to the Free Software */
20 /* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 */
23 /* This module contains the implementation of a virtual ethernet device */
24 /* for use with IBM i/pSeries LPAR Linux. It utilizes the logical LAN */
25 /* option of the RS/6000 Platform Architechture to interface with virtual */
26 /* ethernet NICs that are presented to the partition by the hypervisor. */
28 /**************************************************************************/
31 - remove frag processing code - no longer needed
32 - add support for sysfs
33 - possibly remove procfs support
36 #include <linux/module.h>
37 #include <linux/types.h>
38 #include <linux/errno.h>
39 #include <linux/ioport.h>
40 #include <linux/dma-mapping.h>
41 #include <linux/kernel.h>
42 #include <linux/netdevice.h>
43 #include <linux/etherdevice.h>
44 #include <linux/skbuff.h>
45 #include <linux/init.h>
46 #include <linux/delay.h>
48 #include <linux/ethtool.h>
49 #include <linux/proc_fs.h>
50 #include <asm/semaphore.h>
51 #include <asm/hvcall.h>
52 #include <asm/atomic.h>
54 #include <asm/uaccess.h>
55 #include <linux/seq_file.h>
/*
 * Logging and assertion helper macros built on printk().
 * The variants whose format contains "ua:%x" expand to a reference to
 * adapter->vdev->unit_address, so they can only be used where a variable
 * named adapter is in scope; the _no_adapter variant has no such need.
 * NOTE(review): ibmveth_debug_printk_no_adapter, ibmveth_debug_printk and
 * ibmveth_assert each appear twice below (once with a body, once empty);
 * presumably a preprocessor conditional selects between them, but that
 * conditional is not visible in this listing -- confirm against the file.
 */
61 #define ibmveth_printk(fmt, args...) \
62 printk(KERN_DEBUG "%s: " fmt, __FILE__, ## args)
64 #define ibmveth_error_printk(fmt, args...) \
65 printk(KERN_ERR "(%s:%3.3d ua:%x) ERROR: " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)
68 #define ibmveth_debug_printk_no_adapter(fmt, args...) \
69 printk(KERN_DEBUG "(%s:%3.3d): " fmt, __FILE__, __LINE__ , ## args)
70 #define ibmveth_debug_printk(fmt, args...) \
71 printk(KERN_DEBUG "(%s:%3.3d ua:%x): " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)
72 #define ibmveth_assert(expr) \
74 printk(KERN_DEBUG "assertion failed (%s:%3.3d ua:%x): %s\n", __FILE__, __LINE__, adapter->vdev->unit_address, #expr); \
78 #define ibmveth_debug_printk_no_adapter(fmt, args...)
79 #define ibmveth_debug_printk(fmt, args...)
80 #define ibmveth_assert(expr)
/*
 * Forward declarations for the net_device callbacks, the /proc helpers,
 * the interrupt handler and the rx queue harvest helper defined in this
 * file, plus the kobj_type used for the per-pool kobjects.
 */
83 static int ibmveth_open(struct net_device *dev);
84 static int ibmveth_close(struct net_device *dev);
85 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd);
86 static int ibmveth_poll(struct net_device *dev, int *budget);
87 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *dev);
88 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev);
89 static void ibmveth_set_multicast_list(struct net_device *dev);
90 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu);
91 static void ibmveth_proc_register_driver(void);
92 static void ibmveth_proc_unregister_driver(void);
93 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter);
94 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter);
95 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
96 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter);
97 static struct kobj_type ktype_veth_pool;
/* Path (relative to the proc root) and handle of the driver's proc directory. */
100 #define IBMVETH_PROC_DIR "net/ibmveth"
101 static struct proc_dir_entry *ibmveth_proc_dir;
/* Driver identity strings; the version is also exported via MODULE_VERSION. */
104 static const char ibmveth_driver_name[] = "ibmveth";
105 static const char ibmveth_driver_string[] = "IBM i/pSeries Virtual Ethernet Driver";
106 #define ibmveth_driver_version "1.03"
108 MODULE_AUTHOR("Santiago Leon <santil@us.ibm.com>");
109 MODULE_DESCRIPTION("IBM i/pSeries Virtual Ethernet Driver");
110 MODULE_LICENSE("GPL");
111 MODULE_VERSION(ibmveth_driver_version);
113 /* simple methods of getting data from the current rxq entry */
/*
 * Returns non-zero when the toggle field of the rx queue entry at
 * adapter->rx_queue.index equals the queue's current toggle value.
 */
114 static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
116 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].toggle == adapter->rx_queue.toggle);
/* Returns the valid field of the rx queue entry at the current queue index. */
119 static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
121 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].valid);
/* Returns the offset field of the rx queue entry at the current queue index. */
124 static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
126 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].offset);
/* Returns the length field of the rx queue entry at the current queue index. */
129 static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
131 return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
134 /* setup the initial settings for a buffer pool */
/*
 * Copies the pool's size, index, per-buffer size and active flag from the
 * arguments into *pool.  The threshold is set to half of pool_size
 * (integer division).  The visible lines allocate nothing.
 */
135 static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool, u32 pool_index, u32 pool_size, u32 buff_size, u32 pool_active)
137 pool->size = pool_size;
138 pool->index = pool_index;
139 pool->buff_size = buff_size;
140 pool->threshold = pool_size / 2;
141 pool->active = pool_active;
144 /* allocate and set up a buffer pool - called during open */
/*
 * Allocates three arrays of pool->size elements with kmalloc(GFP_KERNEL):
 * free_map (u16), dma_addr (dma_addr_t) and skbuff (pointers).  When a
 * later allocation fails, the arrays already allocated are freed and their
 * pointers reset to NULL.  On success skbuff and dma_addr are zeroed,
 * free_map[i] is set to i, the available count is set to 0 and the
 * producer/consumer indices are reset to 0.
 * NOTE(review): the return statements are not visible in this listing;
 * ibmveth_open treats a non-zero return as failure.
 */
145 static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
149 pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL);
151 if(!pool->free_map) {
155 pool->dma_addr = kmalloc(sizeof(dma_addr_t) * pool->size, GFP_KERNEL);
156 if(!pool->dma_addr) {
157 kfree(pool->free_map);
158 pool->free_map = NULL;
162 pool->skbuff = kmalloc(sizeof(void*) * pool->size, GFP_KERNEL);
165 kfree(pool->dma_addr);
166 pool->dma_addr = NULL;
168 kfree(pool->free_map);
169 pool->free_map = NULL;
173 memset(pool->skbuff, 0, sizeof(void*) * pool->size);
174 memset(pool->dma_addr, 0, sizeof(dma_addr_t) * pool->size);
/* every slot starts out free: free_map holds the identity mapping */
176 for(i = 0; i < pool->size; ++i) {
177 pool->free_map[i] = i;
180 atomic_set(&pool->available, 0);
181 pool->producer_index = 0;
182 pool->consumer_index = 0;
/*
 * Tops a pool up towards pool->size buffers.  For each of the
 * (size - available) missing buffers the visible lines: allocate an skb of
 * pool->buff_size with GFP_ATOMIC (a failure is counted in
 * replenish_no_mem); take the next slot number from free_map at
 * consumer_index and advance consumer_index modulo pool->size; DMA-map the
 * skb data for DMA_FROM_DEVICE; record the mapping and skb in the slot and
 * mark the free_map entry IBM_VETH_INVALID_MAP; store a correlator
 * ((pool index << 32) | slot) in the first 8 bytes of the skb data; and
 * hand a descriptor to the hypervisor with h_add_logical_lan_buffer().
 * If that call does not return H_SUCCESS the slot bookkeeping is rolled
 * back (free_map entry restored, skbuff slot cleared, consumer_index
 * stepped back with wrap-around), the buffer is unmapped and freed, and
 * replenish_add_buff_failure is incremented.  Finally buffers_added is
 * added to pool->available.
 * NOTE(review): the lines that increment buffers_added and that leave the
 * loop on failure are not visible in this listing.
 */
187 /* replenish the buffers for a pool. note that we don't need to
188 * skb_reserve these since they are used for incoming...
190 static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
193 u32 count = pool->size - atomic_read(&pool->available);
194 u32 buffers_added = 0;
198 for(i = 0; i < count; ++i) {
200 unsigned int free_index, index;
202 union ibmveth_buf_desc desc;
203 unsigned long lpar_rc;
206 skb = alloc_skb(pool->buff_size, GFP_ATOMIC);
209 ibmveth_debug_printk("replenish: unable to allocate skb\n");
210 adapter->replenish_no_mem++;
214 free_index = pool->consumer_index;
215 pool->consumer_index = (pool->consumer_index + 1) % pool->size;
216 index = pool->free_map[free_index];
218 ibmveth_assert(index != IBM_VETH_INVALID_MAP);
219 ibmveth_assert(pool->skbuff[index] == NULL);
221 dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
222 pool->buff_size, DMA_FROM_DEVICE);
224 pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
225 pool->dma_addr[index] = dma_addr;
226 pool->skbuff[index] = skb;
228 correlator = ((u64)pool->index << 32) | index;
229 *(u64*)skb->data = correlator;
232 desc.fields.valid = 1;
233 desc.fields.length = pool->buff_size;
234 desc.fields.address = dma_addr;
236 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
238 if(lpar_rc != H_SUCCESS) {
239 pool->free_map[free_index] = index;
240 pool->skbuff[index] = NULL;
241 if (pool->consumer_index == 0)
242 pool->consumer_index = pool->size - 1;
244 pool->consumer_index--;
245 dma_unmap_single(&adapter->vdev->dev,
246 pool->dma_addr[index], pool->buff_size,
248 dev_kfree_skb_any(skb);
249 adapter->replenish_add_buff_failure++;
253 adapter->replenish_add_buff_success++;
258 atomic_add(buffers_added, &(pool->available));
261 /* replenish routine */
/*
 * Counts one replenish cycle, replenishes every active rx buffer pool, then
 * refreshes adapter->rx_no_buffer from the last 8 bytes of the 4096-byte
 * buffer list page.
 */
262 static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
266 adapter->replenish_task_cycles++;
268 for(i = 0; i < IbmVethNumBufferPools; i++)
269 if(adapter->rx_buff_pool[i].active)
270 ibmveth_replenish_buffer_pool(adapter,
271 &adapter->rx_buff_pool[i]);
/* the u64 at offset 4096 - 8 of the buffer list page is copied as the counter */
273 adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
276 /* empty and free a buffer pool - also used to do cleanup in error paths */
/*
 * Frees free_map, then (when both skbuff and dma_addr exist) walks every
 * slot, unmapping and freeing the skb stored there and clearing the slot,
 * and finally frees dma_addr.  Freed pointers are reset to NULL.
 * NOTE(review): the per-slot NULL check and the release of the skbuff
 * array itself are not visible in this listing.
 */
277 static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
281 kfree(pool->free_map);
282 pool->free_map = NULL;
284 if(pool->skbuff && pool->dma_addr) {
285 for(i = 0; i < pool->size; ++i) {
286 struct sk_buff *skb = pool->skbuff[i];
288 dma_unmap_single(&adapter->vdev->dev,
292 dev_kfree_skb_any(skb);
293 pool->skbuff[i] = NULL;
299 kfree(pool->dma_addr);
300 pool->dma_addr = NULL;
309 /* remove a buffer from a pool */
/*
 * The correlator encodes the pool number in its upper 32 bits and the slot
 * index in its lower 32 bits.  The slot's skb pointer is cleared, its DMA
 * mapping is released, the slot index is written into free_map at
 * producer_index (which then advances modulo the pool size), and the
 * pool's available count is decremented.  The skb itself is not freed by
 * the visible lines.
 */
310 static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter, u64 correlator)
312 unsigned int pool = correlator >> 32;
313 unsigned int index = correlator & 0xffffffffUL;
314 unsigned int free_index;
317 ibmveth_assert(pool < IbmVethNumBufferPools);
318 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
320 skb = adapter->rx_buff_pool[pool].skbuff[index];
322 ibmveth_assert(skb != NULL);
324 adapter->rx_buff_pool[pool].skbuff[index] = NULL;
326 dma_unmap_single(&adapter->vdev->dev,
327 adapter->rx_buff_pool[pool].dma_addr[index],
328 adapter->rx_buff_pool[pool].buff_size,
/* return the slot to the free map at the producer position */
331 free_index = adapter->rx_buff_pool[pool].producer_index;
332 adapter->rx_buff_pool[pool].producer_index
333 = (adapter->rx_buff_pool[pool].producer_index + 1)
334 % adapter->rx_buff_pool[pool].size;
335 adapter->rx_buff_pool[pool].free_map[free_index] = index;
339 atomic_dec(&(adapter->rx_buff_pool[pool].available));
342 /* get the current buffer on the rx queue */
/*
 * Decodes the correlator of the current rx queue entry (pool number in the
 * upper 32 bits, slot index in the lower 32 bits) and returns the skb
 * stored in that pool slot.  The slot is left untouched.
 */
343 static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
345 u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
346 unsigned int pool = correlator >> 32;
347 unsigned int index = correlator & 0xffffffffUL;
349 ibmveth_assert(pool < IbmVethNumBufferPools);
350 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
352 return adapter->rx_buff_pool[pool].skbuff[index];
355 /* recycle the current buffer on the rx queue */
/*
 * Gives the buffer named by the current rx queue entry back to the
 * hypervisor without passing it up the stack.  If the owning pool is no
 * longer active, the buffer is harvested and the whole pool is freed
 * instead.  Otherwise a descriptor for the existing DMA mapping is
 * re-added with h_add_logical_lan_buffer(); if that fails the buffer is
 * removed from the pool.  The queue index then advances, wrapping to 0 and
 * flipping the toggle when it reaches num_slots.
 * NOTE(review): how control leaves the inactive-pool branch is not visible
 * in this listing.
 */
356 static void ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
358 u32 q_index = adapter->rx_queue.index;
359 u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
360 unsigned int pool = correlator >> 32;
361 unsigned int index = correlator & 0xffffffffUL;
362 union ibmveth_buf_desc desc;
363 unsigned long lpar_rc;
365 ibmveth_assert(pool < IbmVethNumBufferPools);
366 ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
368 if(!adapter->rx_buff_pool[pool].active) {
369 ibmveth_rxq_harvest_buffer(adapter);
370 ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]);
375 desc.fields.valid = 1;
376 desc.fields.length = adapter->rx_buff_pool[pool].buff_size;
377 desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
379 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
381 if(lpar_rc != H_SUCCESS) {
382 ibmveth_debug_printk("h_add_logical_lan_buffer failed during recycle rc=%ld", lpar_rc);
383 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
386 if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
387 adapter->rx_queue.index = 0;
388 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
/*
 * Removes the buffer named by the current rx queue entry from its pool and
 * advances the queue index, wrapping to 0 and flipping the toggle when the
 * index reaches num_slots.
 */
392 static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
394 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
396 if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
397 adapter->rx_queue.index = 0;
398 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
/*
 * Releases the adapter's buffer list page, filter list page and rx queue
 * memory.  For each one that is allocated: the DMA mapping is released if
 * dma_mapping_error() says it is valid and the handle is reset to
 * DMA_ERROR_CODE, then the memory is freed (free_page for the two list
 * pages, kfree for the rx queue) and the pointer reset to NULL.  Finally
 * every buffer pool still marked active is freed.  Because each step is
 * guarded, the function is called from the partially-initialised error
 * paths of ibmveth_open as well as from ibmveth_close.
 */
402 static void ibmveth_cleanup(struct ibmveth_adapter *adapter)
406 if(adapter->buffer_list_addr != NULL) {
407 if(!dma_mapping_error(adapter->buffer_list_dma)) {
408 dma_unmap_single(&adapter->vdev->dev,
409 adapter->buffer_list_dma, 4096,
411 adapter->buffer_list_dma = DMA_ERROR_CODE;
413 free_page((unsigned long)adapter->buffer_list_addr);
414 adapter->buffer_list_addr = NULL;
417 if(adapter->filter_list_addr != NULL) {
418 if(!dma_mapping_error(adapter->filter_list_dma)) {
419 dma_unmap_single(&adapter->vdev->dev,
420 adapter->filter_list_dma, 4096,
422 adapter->filter_list_dma = DMA_ERROR_CODE;
424 free_page((unsigned long)adapter->filter_list_addr);
425 adapter->filter_list_addr = NULL;
428 if(adapter->rx_queue.queue_addr != NULL) {
429 if(!dma_mapping_error(adapter->rx_queue.queue_dma)) {
430 dma_unmap_single(&adapter->vdev->dev,
431 adapter->rx_queue.queue_dma,
432 adapter->rx_queue.queue_len,
434 adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
436 kfree(adapter->rx_queue.queue_addr);
437 adapter->rx_queue.queue_addr = NULL;
/* only pools still flagged active are torn down here */
440 for(i = 0; i<IbmVethNumBufferPools; i++)
441 if (adapter->rx_buff_pool[i].active)
442 ibmveth_free_buffer_pool(adapter,
443 &adapter->rx_buff_pool[i]);
/*
 * Registers the adapter's buffer list, rx queue descriptor, filter list and
 * MAC address with the hypervisor via h_register_logical_lan().  When the
 * call fails and try_again is still set, the logical LAN is released with
 * h_free_logical_lan(), repeating that call while it reports a busy status.
 * NOTE(review): the retry of the registration and the return statement are
 * not visible in this listing; ibmveth_open compares the result with
 * H_SUCCESS.
 */
446 static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
447 union ibmveth_buf_desc rxq_desc, u64 mac_address)
449 int rc, try_again = 1;
451 /* After a kexec the adapter will still be open, so our attempt to
452 * open it will fail. So if we get a failure we free the adapter and
453 * try again, but only once. */
455 rc = h_register_logical_lan(adapter->vdev->unit_address,
456 adapter->buffer_list_dma, rxq_desc.desc,
457 adapter->filter_list_dma, mac_address);
459 if (rc != H_SUCCESS && try_again) {
461 rc = h_free_logical_lan(adapter->vdev->unit_address);
462 } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
/*
 * net_device open callback.  Visible steps, in order:
 *  - add every pool's size into rxq_entries;
 *  - allocate one zeroed page each for the buffer list and filter list and
 *    kmalloc the rx queue (sizeof(struct ibmveth_rx_q_entry) * rxq_entries);
 *  - DMA-map all three regions as DMA_BIDIRECTIONAL;
 *  - start the rx queue at index 0 with toggle 1;
 *  - build the MAC address value and the rx queue descriptor;
 *  - disable the VIO interrupt and register with the hypervisor;
 *  - allocate the buffer pools that are marked active;
 *  - request the IRQ, call the interrupt handler once by hand to kick off
 *    the first replenish cycle, and start the transmit queue.
 * Every visible failure path logs an error and calls ibmveth_cleanup(); a
 * request_irq() failure additionally releases the logical LAN first.
 * NOTE(review): the return values of the individual paths are not visible
 * in this listing.
 */
471 static int ibmveth_open(struct net_device *netdev)
473 struct ibmveth_adapter *adapter = netdev->priv;
476 unsigned long lpar_rc;
478 union ibmveth_buf_desc rxq_desc;
481 ibmveth_debug_printk("open starting\n");
483 for(i = 0; i<IbmVethNumBufferPools; i++)
484 rxq_entries += adapter->rx_buff_pool[i].size;
486 adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
487 adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
489 if(!adapter->buffer_list_addr || !adapter->filter_list_addr) {
490 ibmveth_error_printk("unable to allocate filter or buffer list pages\n");
491 ibmveth_cleanup(adapter);
495 adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) * rxq_entries;
496 adapter->rx_queue.queue_addr = kmalloc(adapter->rx_queue.queue_len, GFP_KERNEL);
498 if(!adapter->rx_queue.queue_addr) {
499 ibmveth_error_printk("unable to allocate rx queue pages\n");
500 ibmveth_cleanup(adapter);
504 adapter->buffer_list_dma = dma_map_single(&adapter->vdev->dev,
505 adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
506 adapter->filter_list_dma = dma_map_single(&adapter->vdev->dev,
507 adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
508 adapter->rx_queue.queue_dma = dma_map_single(&adapter->vdev->dev,
509 adapter->rx_queue.queue_addr,
510 adapter->rx_queue.queue_len, DMA_BIDIRECTIONAL);
512 if((dma_mapping_error(adapter->buffer_list_dma) ) ||
513 (dma_mapping_error(adapter->filter_list_dma)) ||
514 (dma_mapping_error(adapter->rx_queue.queue_dma))) {
515 ibmveth_error_printk("unable to map filter or buffer list pages\n");
516 ibmveth_cleanup(adapter);
520 adapter->rx_queue.index = 0;
521 adapter->rx_queue.num_slots = rxq_entries;
522 adapter->rx_queue.toggle = 1;
/* copy addr_len bytes of the device address, then shift the value right by 16 bits */
524 memcpy(&mac_address, netdev->dev_addr, netdev->addr_len);
525 mac_address = mac_address >> 16;
528 rxq_desc.fields.valid = 1;
529 rxq_desc.fields.length = adapter->rx_queue.queue_len;
530 rxq_desc.fields.address = adapter->rx_queue.queue_dma;
532 ibmveth_debug_printk("buffer list @ 0x%p\n", adapter->buffer_list_addr);
533 ibmveth_debug_printk("filter list @ 0x%p\n", adapter->filter_list_addr);
534 ibmveth_debug_printk("receive q @ 0x%p\n", adapter->rx_queue.queue_addr);
536 h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
538 lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
540 if(lpar_rc != H_SUCCESS) {
541 ibmveth_error_printk("h_register_logical_lan failed with %ld\n", lpar_rc);
542 ibmveth_error_printk("buffer TCE:0x%lx filter TCE:0x%lx rxq desc:0x%lx MAC:0x%lx\n",
543 adapter->buffer_list_dma,
544 adapter->filter_list_dma,
547 ibmveth_cleanup(adapter);
551 for(i = 0; i<IbmVethNumBufferPools; i++) {
552 if(!adapter->rx_buff_pool[i].active)
554 if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
555 ibmveth_error_printk("unable to alloc pool\n");
/* mark the pool inactive before cleanup runs over the pools */
556 adapter->rx_buff_pool[i].active = 0;
557 ibmveth_cleanup(adapter);
562 ibmveth_debug_printk("registering irq 0x%x\n", netdev->irq);
563 if((rc = request_irq(netdev->irq, &ibmveth_interrupt, 0, netdev->name, netdev)) != 0) {
564 ibmveth_error_printk("unable to request irq 0x%x, rc %d\n", netdev->irq, rc);
566 rc = h_free_logical_lan(adapter->vdev->unit_address);
567 } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
569 ibmveth_cleanup(adapter);
573 ibmveth_debug_printk("initial replenish cycle\n");
574 ibmveth_interrupt(netdev->irq, netdev);
576 netif_start_queue(netdev);
578 ibmveth_debug_printk("open complete\n");
/*
 * net_device stop callback.  Stops the transmit queue (skipped while
 * adapter->pool_config is set, as ibmveth_change_mtu does around its
 * close/open cycle), frees the IRQ, releases the logical LAN (repeating
 * h_free_logical_lan() while it reports busy) and logs a failure without
 * aborting.  rx_no_buffer is refreshed from the last 8 bytes of the buffer
 * list page before ibmveth_cleanup() frees that page.
 */
583 static int ibmveth_close(struct net_device *netdev)
585 struct ibmveth_adapter *adapter = netdev->priv;
588 ibmveth_debug_printk("close starting\n");
590 if (!adapter->pool_config)
591 netif_stop_queue(netdev);
593 free_irq(netdev->irq, netdev);
596 lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
597 } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
599 if(lpar_rc != H_SUCCESS)
601 ibmveth_error_printk("h_free_logical_lan failed with %lx, continuing with close\n",
605 adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
607 ibmveth_cleanup(adapter);
609 ibmveth_debug_printk("close complete\n");
/*
 * ethtool get_settings handler.  Fills *cmd with fixed values that do not
 * depend on dev: 1000 Mb/s, full duplex, fibre port, internal transceiver,
 * autonegotiation enabled, PHY address 0.
 */
614 static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd) {
615 cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg | SUPPORTED_FIBRE);
616 cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg | ADVERTISED_FIBRE);
617 cmd->speed = SPEED_1000;
618 cmd->duplex = DUPLEX_FULL;
619 cmd->port = PORT_FIBRE;
620 cmd->phy_address = 0;
621 cmd->transceiver = XCVR_INTERNAL;
622 cmd->autoneg = AUTONEG_ENABLE;
/*
 * ethtool get_drvinfo handler.  Copies the driver name and version string
 * into *info, copying at most one byte less than each destination field.
 * NOTE(review): strncpy() does not itself write a terminator when the
 * source fills the limit; this presumably relies on the caller having
 * zeroed *info -- confirm.
 */
628 static void netdev_get_drvinfo (struct net_device *dev, struct ethtool_drvinfo *info) {
629 strncpy(info->driver, ibmveth_driver_name, sizeof(info->driver) - 1);
630 strncpy(info->version, ibmveth_driver_version, sizeof(info->version) - 1);
633 static u32 netdev_get_link(struct net_device *dev) {
/*
 * ethtool operations table: the three handlers defined in this file plus
 * the generic ethtool_op_get_sg and ethtool_op_get_tx_csum helpers.
 */
637 static const struct ethtool_ops netdev_ethtool_ops = {
638 .get_drvinfo = netdev_get_drvinfo,
639 .get_settings = netdev_get_settings,
640 .get_link = netdev_get_link,
641 .get_sg = ethtool_op_get_sg,
642 .get_tx_csum = ethtool_op_get_tx_csum,
645 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
/* Low 12 bits of v, i.e. its offset within a 4096-byte region. */
650 #define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1))
/*
 * hard_start_xmit callback.  Builds up to IbmVethMaxSendFrags buffer
 * descriptors for the skb: desc[0] covers the linear part (skb->len minus
 * skb->data_len when there are page fragments, otherwise skb->len) and
 * desc[1..] cover the page fragments, each DMA-mapped DMA_TO_DEVICE.  If a
 * fragment mapping fails, the mappings made so far are released.  The
 * frame is sent with h_send_logical_lan(), retried while the hypervisor
 * reports H_BUSY and the retry counter lasts.  A result other than
 * H_SUCCESS or H_DROPPED is logged together with a dump of the
 * descriptors.  All mappings are released afterwards, and the per-call
 * counters are folded into the adapter statistics under stats_lock.
 * NOTE(review): several short lines (counter updates, gotos, loop headers,
 * the return) are not visible in this listing.
 */
652 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *netdev)
654 struct ibmveth_adapter *adapter = netdev->priv;
655 union ibmveth_buf_desc desc[IbmVethMaxSendFrags];
656 unsigned long lpar_rc;
657 int nfrags = 0, curfrag;
658 unsigned long correlator;
660 unsigned int retry_count;
661 unsigned int tx_dropped = 0;
662 unsigned int tx_bytes = 0;
663 unsigned int tx_packets = 0;
664 unsigned int tx_send_failed = 0;
665 unsigned int tx_map_failed = 0;
/* the linear part plus the page fragments must fit in the descriptor array */
668 if ((skb_shinfo(skb)->nr_frags + 1) > IbmVethMaxSendFrags) {
673 memset(&desc, 0, sizeof(desc));
675 /* nfrags = number of frags after the initial fragment */
676 nfrags = skb_shinfo(skb)->nr_frags;
679 adapter->tx_multidesc_send++;
681 /* map the initial fragment */
682 desc[0].fields.length = nfrags ? skb->len - skb->data_len : skb->len;
683 desc[0].fields.address = dma_map_single(&adapter->vdev->dev, skb->data,
684 desc[0].fields.length, DMA_TO_DEVICE);
685 desc[0].fields.valid = 1;
687 if(dma_mapping_error(desc[0].fields.address)) {
688 ibmveth_error_printk("tx: unable to map initial fragment\n");
696 /* map fragments past the initial portion if there are any */
698 skb_frag_t *frag = &skb_shinfo(skb)->frags[curfrag];
699 desc[curfrag+1].fields.address
700 = dma_map_single(&adapter->vdev->dev,
701 page_address(frag->page) + frag->page_offset,
702 frag->size, DMA_TO_DEVICE);
703 desc[curfrag+1].fields.length = frag->size;
704 desc[curfrag+1].fields.valid = 1;
706 if(dma_mapping_error(desc[curfrag+1].fields.address)) {
707 ibmveth_error_printk("tx: unable to map fragment %d\n", curfrag);
710 /* Free all the mappings we just created */
711 while(curfrag < nfrags) {
712 dma_unmap_single(&adapter->vdev->dev,
713 desc[curfrag+1].fields.address,
714 desc[curfrag+1].fields.length,
722 /* send the frame. Arbitrarily set retrycount to 1024 */
726 lpar_rc = h_send_logical_lan(adapter->vdev->unit_address,
735 } while ((lpar_rc == H_BUSY) && (retry_count--));
737 if(lpar_rc != H_SUCCESS && lpar_rc != H_DROPPED) {
739 ibmveth_error_printk("tx: h_send_logical_lan failed with rc=%ld\n", lpar_rc);
740 for(i = 0; i < 6; i++) {
/* the address is printed in hex so that it matches its "0x" prefix */
741 ibmveth_error_printk("tx: desc[%i] valid=%d, len=%d, address=0x%08x\n", i,
742 desc[i].fields.valid, desc[i].fields.length, desc[i].fields.address);
748 tx_bytes += skb->len;
749 netdev->trans_start = jiffies;
/* release every mapping, from desc[nfrags] down to desc[0] */
753 dma_unmap_single(&adapter->vdev->dev,
754 desc[nfrags].fields.address,
755 desc[nfrags].fields.length, DMA_TO_DEVICE);
756 } while(--nfrags >= 0);
758 out: spin_lock_irqsave(&adapter->stats_lock, flags);
759 adapter->stats.tx_dropped += tx_dropped;
760 adapter->stats.tx_bytes += tx_bytes;
761 adapter->stats.tx_packets += tx_packets;
762 adapter->tx_send_failed += tx_send_failed;
763 adapter->tx_map_failed += tx_map_failed;
764 spin_unlock_irqrestore(&adapter->stats_lock, flags);
/*
 * Receive poll callback.  Processes pending rx queue entries until there is
 * no more work or netdev->quota frames have been handled.  An entry whose
 * buffer is not valid is counted in rx_invalid_buffer and recycled.  A
 * valid one is harvested from its pool, trimmed to the frame with
 * skb_reserve(offset) and skb_put(length), and passed up with
 * netif_receive_skb().  The buffer pools are then replenished.  If work
 * remains, quota and *budget are reduced and polling continues.  Otherwise
 * the VIO interrupt is re-enabled, polling is completed, and the queue is
 * checked once more: if a buffer has arrived in the meantime and
 * netif_rx_reschedule() succeeds, the interrupt is disabled again.
 * NOTE(review): the loop header, counter updates and return statements are
 * not visible in this listing.
 */
770 static int ibmveth_poll(struct net_device *netdev, int *budget)
772 struct ibmveth_adapter *adapter = netdev->priv;
773 int max_frames_to_process = netdev->quota;
774 int frames_processed = 0;
776 unsigned long lpar_rc;
780 struct net_device *netdev = adapter->netdev;
782 if(ibmveth_rxq_pending_buffer(adapter)) {
787 if(!ibmveth_rxq_buffer_valid(adapter)) {
788 wmb(); /* suggested by larson1 */
789 adapter->rx_invalid_buffer++;
790 ibmveth_debug_printk("recycling invalid buffer\n");
791 ibmveth_rxq_recycle_buffer(adapter);
/* length, offset and skb are read before harvesting advances the queue index */
793 int length = ibmveth_rxq_frame_length(adapter);
794 int offset = ibmveth_rxq_frame_offset(adapter);
795 skb = ibmveth_rxq_get_buffer(adapter);
797 ibmveth_rxq_harvest_buffer(adapter);
799 skb_reserve(skb, offset);
800 skb_put(skb, length);
801 skb->protocol = eth_type_trans(skb, netdev);
803 netif_receive_skb(skb); /* send it up */
805 adapter->stats.rx_packets++;
806 adapter->stats.rx_bytes += length;
808 netdev->last_rx = jiffies;
813 } while(more_work && (frames_processed < max_frames_to_process));
815 ibmveth_replenish_task(adapter);
818 /* more work to do - return that we are not done yet */
819 netdev->quota -= frames_processed;
820 *budget -= frames_processed;
824 /* we think we are done - reenable interrupts, then check once more to make sure we are done */
825 lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_ENABLE);
827 ibmveth_assert(lpar_rc == H_SUCCESS);
829 netif_rx_complete(netdev);
831 if(ibmveth_rxq_pending_buffer(adapter) && netif_rx_reschedule(netdev, frames_processed))
833 lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
834 ibmveth_assert(lpar_rc == H_SUCCESS);
839 netdev->quota -= frames_processed;
840 *budget -= frames_processed;
842 /* we really are done */
/*
 * Interrupt handler; dev_instance is the net_device.  When
 * netif_rx_schedule_prep() allows it, the VIO interrupt is disabled and the
 * device is scheduled for polling.  The irq argument is not used by the
 * visible lines.
 * NOTE(review): the return statement is not visible in this listing.
 */
846 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
848 struct net_device *netdev = dev_instance;
849 struct ibmveth_adapter *adapter = netdev->priv;
850 unsigned long lpar_rc;
852 if(netif_rx_schedule_prep(netdev)) {
853 lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
854 ibmveth_assert(lpar_rc == H_SUCCESS);
855 __netif_rx_schedule(netdev);
/* get_stats callback: returns the statistics block embedded in the adapter. */
860 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev)
862 struct ibmveth_adapter *adapter = dev->priv;
863 return &adapter->stats;
/*
 * set_multicast_list callback.  When the interface is promiscuous or has
 * more multicast addresses than adapter->mcastFilterSize, multicast
 * reception is enabled with filtering disabled.  Otherwise the filter
 * table is cleared with filtering disabled, each address on
 * netdev->mc_list is added to it, and filtering is enabled again.  Each
 * failed h_multicast_ctrl() call is logged.
 * NOTE(review): whether processing continues after a failed call is not
 * visible in this listing.
 */
866 static void ibmveth_set_multicast_list(struct net_device *netdev)
868 struct ibmveth_adapter *adapter = netdev->priv;
869 unsigned long lpar_rc;
871 if((netdev->flags & IFF_PROMISC) || (netdev->mc_count > adapter->mcastFilterSize)) {
872 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
873 IbmVethMcastEnableRecv |
874 IbmVethMcastDisableFiltering,
876 if(lpar_rc != H_SUCCESS) {
877 ibmveth_error_printk("h_multicast_ctrl rc=%ld when entering promisc mode\n", lpar_rc);
880 struct dev_mc_list *mclist = netdev->mc_list;
882 /* clear the filter table & disable filtering */
883 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
884 IbmVethMcastEnableRecv |
885 IbmVethMcastDisableFiltering |
886 IbmVethMcastClearFilterTable,
888 if(lpar_rc != H_SUCCESS) {
889 ibmveth_error_printk("h_multicast_ctrl rc=%ld when attempting to clear filter table\n", lpar_rc);
891 /* add the addresses to the filter table */
892 for(i = 0; i < netdev->mc_count; ++i, mclist = mclist->next) {
893 // add the multicast address to the filter table
/* the 6 address bytes are copied to byte offset 2 of a zeroed unsigned long */
894 unsigned long mcast_addr = 0;
895 memcpy(((char *)&mcast_addr)+2, mclist->dmi_addr, 6);
896 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
897 IbmVethMcastAddFilter,
899 if(lpar_rc != H_SUCCESS) {
900 ibmveth_error_printk("h_multicast_ctrl rc=%ld when adding an entry to the filter table\n", lpar_rc);
904 /* re-enable filtering */
905 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
906 IbmVethMcastEnableFiltering,
908 if(lpar_rc != H_SUCCESS) {
909 ibmveth_error_printk("h_multicast_ctrl rc=%ld when enabling filtering\n", lpar_rc);
/*
 * change_mtu callback.  Works with new_mtu plus IBMVETH_BUFF_OH.  It first
 * looks for a pool whose buff_size exceeds that value, then walks the
 * pools again, activating inactive ones, until it reaches one large
 * enough.  If pools had to be activated (reinit) and the interface is
 * running, the device is closed and reopened with adapter->pool_config set
 * around the close, so that ibmveth_close leaves the transmit queue
 * running.
 * NOTE(review): IBMVETH_MAX_MTU is used below as a threshold that new_mtu
 * is tested to be *less than*, which reads as a lower bound despite the
 * name; its definition and the statement taken on that branch are not
 * visible in this listing -- confirm.  The return values and the
 * assignment of dev->mtu are not visible here either.
 */
914 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
916 struct ibmveth_adapter *adapter = dev->priv;
917 int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
921 if (new_mtu < IBMVETH_MAX_MTU)
924 for (i = 0; i < IbmVethNumBufferPools; i++)
925 if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size)
928 if (i == IbmVethNumBufferPools)
931 /* Look for an active buffer pool that can hold the new MTU */
932 for(i = 0; i<IbmVethNumBufferPools; i++) {
933 if (!adapter->rx_buff_pool[i].active) {
934 adapter->rx_buff_pool[i].active = 1;
938 if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size) {
939 if (reinit && netif_running(adapter->netdev)) {
940 adapter->pool_config = 1;
941 ibmveth_close(adapter->netdev);
942 adapter->pool_config = 0;
944 if ((rc = ibmveth_open(adapter->netdev)))
/*
 * poll_controller hook, built only when CONFIG_NET_POLL_CONTROLLER is
 * defined.  Replenishes the rx buffer pools and then calls the interrupt
 * handler directly.
 */
954 #ifdef CONFIG_NET_POLL_CONTROLLER
955 static void ibmveth_poll_controller(struct net_device *dev)
957 ibmveth_replenish_task(dev->priv);
958 ibmveth_interrupt(dev->irq, dev);
/*
 * VIO bus probe callback.  Reads the VETH_MAC_ADDR and
 * VETH_MCAST_FILTER_SIZE attributes of the device (logging an error when
 * either is missing), allocates an Ethernet net_device whose private area
 * is a struct ibmveth_adapter, fills in the adapter and the net_device
 * callbacks, initialises and registers a kobject for every rx buffer pool,
 * marks the three DMA handles invalid (DMA_ERROR_CODE), registers the
 * net_device and adds the adapter's /proc entry.  If register_netdev()
 * fails, the net_device is freed.
 * NOTE(review): return values and several short statements are not visible
 * in this listing.
 */
962 static int __devinit ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
965 struct net_device *netdev;
966 struct ibmveth_adapter *adapter = NULL;
968 unsigned char *mac_addr_p;
969 unsigned int *mcastFilterSize_p;
972 ibmveth_debug_printk_no_adapter("entering ibmveth_probe for UA 0x%x\n",
975 mac_addr_p = (unsigned char *) vio_get_attribute(dev,
976 VETH_MAC_ADDR, NULL);
978 printk(KERN_ERR "(%s:%3.3d) ERROR: Can't find VETH_MAC_ADDR "
979 "attribute\n", __FILE__, __LINE__);
983 mcastFilterSize_p = (unsigned int *) vio_get_attribute(dev,
984 VETH_MCAST_FILTER_SIZE, NULL);
985 if(!mcastFilterSize_p) {
986 printk(KERN_ERR "(%s:%3.3d) ERROR: Can't find "
987 "VETH_MCAST_FILTER_SIZE attribute\n",
992 netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
997 SET_MODULE_OWNER(netdev);
999 adapter = netdev->priv;
/* clear the whole adapter structure: sizeof(*adapter), not the pointer size */
1000 memset(adapter, 0, sizeof(*adapter));
1001 dev->dev.driver_data = netdev;
1003 adapter->vdev = dev;
1004 adapter->netdev = netdev;
1005 adapter->mcastFilterSize= *mcastFilterSize_p;
1006 adapter->pool_config = 0;
1008 /* Some older boxes running PHYP non-natively have an OF that
1009 returns a 8-byte local-mac-address field (and the first
1010 2 bytes have to be ignored) while newer boxes' OF return
1011 a 6-byte field. Note that IEEE 1275 specifies that
1012 local-mac-address must be a 6-byte field.
1013 The RPA doc specifies that the first byte must be 10b, so
1014 we'll just look for it to solve this 8 vs. 6 byte field issue */
1016 if ((*mac_addr_p & 0x3) != 0x02)
1019 adapter->mac_addr = 0;
1020 memcpy(&adapter->mac_addr, mac_addr_p, 6);
1022 netdev->irq = dev->irq;
1023 netdev->open = ibmveth_open;
1024 netdev->poll = ibmveth_poll;
1025 netdev->weight = 16;
1026 netdev->stop = ibmveth_close;
1027 netdev->hard_start_xmit = ibmveth_start_xmit;
1028 netdev->get_stats = ibmveth_get_stats;
1029 netdev->set_multicast_list = ibmveth_set_multicast_list;
1030 netdev->do_ioctl = ibmveth_ioctl;
1031 netdev->ethtool_ops = &netdev_ethtool_ops;
1032 netdev->change_mtu = ibmveth_change_mtu;
1033 SET_NETDEV_DEV(netdev, &dev->dev);
1034 #ifdef CONFIG_NET_POLL_CONTROLLER
1035 netdev->poll_controller = ibmveth_poll_controller;
1037 netdev->features |= NETIF_F_LLTX;
1038 spin_lock_init(&adapter->stats_lock);
1040 memcpy(&netdev->dev_addr, &adapter->mac_addr, netdev->addr_len);
/* set up each rx buffer pool and register its kobject, named "pool<i>", under the device */
1042 for(i = 0; i<IbmVethNumBufferPools; i++) {
1043 struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
1044 ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
1045 pool_count[i], pool_size[i],
1047 kobj->parent = &dev->dev.kobj;
1048 sprintf(kobj->name, "pool%d", i);
1049 kobj->ktype = &ktype_veth_pool;
1050 kobject_register(kobj);
1053 ibmveth_debug_printk("adapter @ 0x%p\n", adapter);
/* nothing is mapped yet; ibmveth_cleanup only unmaps handles that pass dma_mapping_error */
1055 adapter->buffer_list_dma = DMA_ERROR_CODE;
1056 adapter->filter_list_dma = DMA_ERROR_CODE;
1057 adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
1059 ibmveth_debug_printk("registering netdev...\n");
1061 rc = register_netdev(netdev);
1064 ibmveth_debug_printk("failed to register netdev rc=%d\n", rc);
1065 free_netdev(netdev);
1069 ibmveth_debug_printk("registered\n");
1071 ibmveth_proc_register_adapter(adapter);
/*
 * VIO bus remove callback.  Undoes ibmveth_probe: unregisters the per-pool
 * kobjects, unregisters the net_device, removes the adapter's /proc entry
 * and frees the net_device (whose private area holds the adapter).
 */
1076 static int __devexit ibmveth_remove(struct vio_dev *dev)
1078 struct net_device *netdev = dev->dev.driver_data;
1079 struct ibmveth_adapter *adapter = netdev->priv;
1082 for(i = 0; i<IbmVethNumBufferPools; i++)
1083 kobject_unregister(&adapter->rx_buff_pool[i].kobj);
1085 unregister_netdev(netdev);
1087 ibmveth_proc_unregister_adapter(adapter);
1089 free_netdev(netdev);
/*
 * Creates the driver's proc directory (IBMVETH_PROC_DIR) and, when that
 * succeeds, sets its module owner.  The handle is kept in ibmveth_proc_dir
 * and stays NULL on failure; the per-adapter helpers check for that.
 */
1093 #ifdef CONFIG_PROC_FS
1094 static void ibmveth_proc_register_driver(void)
1096 ibmveth_proc_dir = proc_mkdir(IBMVETH_PROC_DIR, NULL);
1097 if (ibmveth_proc_dir) {
1098 SET_MODULE_OWNER(ibmveth_proc_dir);
/* Removes the driver's proc directory (IBMVETH_PROC_DIR). */
1102 static void ibmveth_proc_unregister_driver(void)
1104 remove_proc_entry(IBMVETH_PROC_DIR, NULL);
1107 static void *ibmveth_seq_start(struct seq_file *seq, loff_t *pos)
1116 static void *ibmveth_seq_next(struct seq_file *seq, void *v, loff_t *pos)
1122 static void ibmveth_seq_stop(struct seq_file *seq, void *v)
/*
 * seq_file show handler for an adapter's proc entry; seq->private is the
 * adapter.  Prints the driver string and version, the unit address, the
 * current MAC (netdev->dev_addr) and the firmware MAC (adapter->mac_addr),
 * followed by the adapter's TX and RX counters.
 * NOTE(review): the MAC bytes are read through plain char pointers and
 * printed with %02X; where char is signed, bytes >= 0x80 would be
 * sign-extended in the output -- confirm the target ABI.
 */
1126 static int ibmveth_seq_show(struct seq_file *seq, void *v)
1128 struct ibmveth_adapter *adapter = seq->private;
1129 char *current_mac = ((char*) &adapter->netdev->dev_addr);
1130 char *firmware_mac = ((char*) &adapter->mac_addr) ;
1132 seq_printf(seq, "%s %s\n\n", ibmveth_driver_string, ibmveth_driver_version);
1134 seq_printf(seq, "Unit Address: 0x%x\n", adapter->vdev->unit_address);
1135 seq_printf(seq, "Current MAC: %02X:%02X:%02X:%02X:%02X:%02X\n",
1136 current_mac[0], current_mac[1], current_mac[2],
1137 current_mac[3], current_mac[4], current_mac[5]);
1138 seq_printf(seq, "Firmware MAC: %02X:%02X:%02X:%02X:%02X:%02X\n",
1139 firmware_mac[0], firmware_mac[1], firmware_mac[2],
1140 firmware_mac[3], firmware_mac[4], firmware_mac[5]);
1142 seq_printf(seq, "\nAdapter Statistics:\n");
1143 seq_printf(seq, " TX: skbuffs linearized: %ld\n", adapter->tx_linearized);
1144 seq_printf(seq, " multi-descriptor sends: %ld\n", adapter->tx_multidesc_send);
1145 seq_printf(seq, " skb_linearize failures: %ld\n", adapter->tx_linearize_failed);
1146 seq_printf(seq, " vio_map_single failres: %ld\n", adapter->tx_map_failed);
1147 seq_printf(seq, " send failures: %ld\n", adapter->tx_send_failed);
1148 seq_printf(seq, " RX: replenish task cycles: %ld\n", adapter->replenish_task_cycles);
1149 seq_printf(seq, " alloc_skb_failures: %ld\n", adapter->replenish_no_mem);
1150 seq_printf(seq, " add buffer failures: %ld\n", adapter->replenish_add_buff_failure);
1151 seq_printf(seq, " invalid buffers: %ld\n", adapter->rx_invalid_buffer);
1152 seq_printf(seq, " no buffers: %ld\n", adapter->rx_no_buffer);
/*
 * seq_file iterator operations for the per-adapter proc file; handed to
 * seq_open() in ibmveth_proc_open().
 */
1156 static struct seq_operations ibmveth_seq_ops = {
1157 .start = ibmveth_seq_start,
1158 .next = ibmveth_seq_next,
1159 .stop = ibmveth_seq_stop,
1160 .show = ibmveth_seq_show,
/*
 * ibmveth_proc_open - .open handler of ibmveth_proc_fops.
 *
 * Opens a seq_file on top of ibmveth_seq_ops and copies the proc entry's
 * data pointer into seq->private. ibmveth_proc_register_adapter() stores
 * the adapter in entry->data, which is what ibmveth_seq_show() later reads
 * back from seq->private.
 */
1163 static int ibmveth_proc_open(struct inode *inode, struct file *file)
1165 struct seq_file *seq;
1166 struct proc_dir_entry *proc;
1169 rc = seq_open(file, &ibmveth_seq_ops);
1171 /* recover the pointer buried in proc_dir_entry data */
/* file->private_data is read as the struct seq_file created by seq_open() */
1172 seq = file->private_data;
/* NOTE(review): confirm proc is looked up from inode before this use */
1174 seq->private = proc->data;
/*
 * File operations for the per-adapter proc entry: a custom open that binds
 * the adapter to the seq_file, with seek and release delegated to the
 * generic seq_file helpers.
 */
1179 static const struct file_operations ibmveth_proc_fops = {
1180 .owner = THIS_MODULE,
1181 .open = ibmveth_proc_open,
1183 .llseek = seq_lseek,
1184 .release = seq_release,
/*
 * ibmveth_proc_register_adapter - create the proc file for one adapter.
 *
 * Does nothing unless the driver proc directory exists. The entry is named
 * after the adapter's unit address printed in hex ("%x") and is created as
 * a regular file under ibmveth_proc_dir. On success the adapter pointer is
 * stored in entry->data (picked up again by ibmveth_proc_open()) and the
 * entry is bound to ibmveth_proc_fops; on failure an error is logged.
 */
1187 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter)
1189 struct proc_dir_entry *entry;
1190 if (ibmveth_proc_dir) {
/* entry name = unit address in hex; must match the name used on removal */
1192 sprintf(u_addr, "%x", adapter->vdev->unit_address);
1193 entry = create_proc_entry(u_addr, S_IFREG, ibmveth_proc_dir);
1195 ibmveth_error_printk("Cannot create adapter proc entry");
1197 entry->data = (void *) adapter;
1198 entry->proc_fops = &ibmveth_proc_fops;
1199 SET_MODULE_OWNER(entry);
/*
 * ibmveth_proc_unregister_adapter - remove the proc file of one adapter.
 *
 * Rebuilds the entry name from the unit address with the same "%x" format
 * used at registration and removes it from ibmveth_proc_dir. No-op when the
 * driver proc directory was never created.
 */
1205 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter)
1207 if (ibmveth_proc_dir) {
1209 sprintf(u_addr, "%x", adapter->vdev->unit_address);
1210 remove_proc_entry(u_addr, ibmveth_proc_dir);
1214 #else /* CONFIG_PROC_FS */
/*
 * Fallback definitions of the four proc helpers for builds without
 * CONFIG_PROC_FS, so that probe/remove and module init/exit can call them
 * without any #ifdef of their own.
 */
1215 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter)
1219 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter)
1222 static void ibmveth_proc_register_driver(void)
1226 static void ibmveth_proc_unregister_driver(void)
1229 #endif /* CONFIG_PROC_FS */
/*
 * Forward declarations of the three per-pool sysfs attributes. The
 * show/store handlers below identify the attribute being accessed by
 * comparing its address against these objects, which are defined later via
 * the ATTR() macro.
 */
1231 static struct attribute veth_active_attr;
1232 static struct attribute veth_num_attr;
1233 static struct attribute veth_size_attr;
/*
 * veth_pool_show - sysfs .show handler for a buffer pool kobject.
 *
 * Recovers the ibmveth_buff_pool that embeds @kobj and prints one decimal
 * value followed by a newline into @buf, selected by @attr:
 *   veth_active_attr -> pool->active
 *   veth_num_attr    -> pool->size
 *   veth_size_attr   -> pool->buff_size
 * For these attributes the return value is the character count reported by
 * sprintf().
 */
1235 static ssize_t veth_pool_show(struct kobject * kobj,
1236 struct attribute * attr, char * buf)
1238 struct ibmveth_buff_pool *pool = container_of(kobj,
1239 struct ibmveth_buff_pool,
/* dispatch on attribute identity (pointer comparison, not name) */
1242 if (attr == &veth_active_attr)
1243 return sprintf(buf, "%d\n", pool->active);
1244 else if (attr == &veth_num_attr)
1245 return sprintf(buf, "%d\n", pool->size);
1246 else if (attr == &veth_size_attr)
1247 return sprintf(buf, "%d\n", pool->buff_size);
/*
 * veth_pool_store - sysfs .store handler for a buffer pool kobject.
 *
 * @buf is parsed as a base-10 long and applied according to @attr:
 *   veth_active_attr - activate (non-zero) or deactivate (zero) the pool
 *   veth_num_attr    - change the pool's buffer count, bounded by
 *                      IBMVETH_MAX_POOL_COUNT
 *   veth_size_attr   - change the pool's buffer size, which must be above
 *                      IBMVETH_BUFF_OH and at most IBMVETH_MAX_BUF_SIZE
 * When the interface is running, a change is applied by closing and
 * reopening the device with adapter->pool_config set around the close.
 * Afterwards the interrupt handler is invoked directly so pools get
 * allocated or released.
 */
1251 static ssize_t veth_pool_store(struct kobject * kobj, struct attribute * attr,
1252 const char * buf, size_t count)
1254 struct ibmveth_buff_pool *pool = container_of(kobj,
1255 struct ibmveth_buff_pool,
/* the pool kobject's parent is the device kobject; its driver_data is the netdev */
1257 struct net_device *netdev =
1258 container_of(kobj->parent, struct device, kobj)->driver_data;
1259 struct ibmveth_adapter *adapter = netdev->priv;
/*
 * NOTE(review): the end pointer is NULL, so trailing garbage and
 * non-numeric input (parsed as 0) are not detected here.
 */
1260 long value = simple_strtol(buf, NULL, 10);
1263 if (attr == &veth_active_attr) {
/* activation request for a pool that is currently inactive */
1264 if (value && !pool->active) {
1265 if (netif_running(netdev)) {
1266 if(ibmveth_alloc_buffer_pool(pool)) {
1267 ibmveth_error_printk("unable to alloc pool\n");
/* pool_config is raised only for the duration of ibmveth_close() */
1271 adapter->pool_config = 1;
1272 ibmveth_close(netdev);
1273 adapter->pool_config = 0;
1274 if ((rc = ibmveth_open(netdev)))
/* deactivation request for a pool that is currently active */
1278 } else if (!value && pool->active) {
1279 int mtu = netdev->mtu + IBMVETH_BUFF_OH;
1281 /* Make sure there is a buffer pool with buffers that
1282 can hold a packet of the size of the MTU */
/*
 * NOTE(review): the comparison below is strict (mtu < buff_size) while the
 * error text further down says ">= MTU" - confirm which is intended.
 */
1283 for(i = 0; i<IbmVethNumBufferPools; i++) {
1284 if (pool == &adapter->rx_buff_pool[i])
1286 if (!adapter->rx_buff_pool[i].active)
1288 if (mtu < adapter->rx_buff_pool[i].buff_size) {
1290 h_free_logical_lan_buffer(adapter->
1298 ibmveth_error_printk("no active pool >= MTU\n");
1302 } else if (attr == &veth_num_attr) {
/* range check on the requested buffer count */
1303 if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT)
1306 if (netif_running(netdev)) {
1307 adapter->pool_config = 1;
1308 ibmveth_close(netdev);
1309 adapter->pool_config = 0;
1311 if ((rc = ibmveth_open(netdev)))
1316 } else if (attr == &veth_size_attr) {
/* range check on the requested buffer size */
1317 if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE)
1320 if (netif_running(netdev)) {
1321 adapter->pool_config = 1;
1322 ibmveth_close(netdev);
1323 adapter->pool_config = 0;
/* new size is stored between close and open so the reopen sees it */
1324 pool->buff_size = value;
1325 if ((rc = ibmveth_open(netdev)))
1328 pool->buff_size = value;
1332 /* kick the interrupt handler to allocate/deallocate pools */
1333 ibmveth_interrupt(netdev->irq, netdev);
/*
 * ATTR(_name, _mode) expands to the definition of a struct attribute called
 * veth_<_name>_attr whose .name is the stringified _name, whose .mode is
 * _mode and whose .owner is THIS_MODULE. The three uses below define the
 * "active", "num" and "size" pool attributes with mode 0644, completing the
 * forward declarations made before veth_pool_show().
 */
1338 #define ATTR(_name, _mode) \
1339 struct attribute veth_##_name##_attr = { \
1340 .name = __stringify(_name), .mode = _mode, .owner = THIS_MODULE \
1343 static ATTR(active, 0644);
1344 static ATTR(num, 0644);
1345 static ATTR(size, 0644);
/* Attribute list installed as .default_attrs of ktype_veth_pool. */
1347 static struct attribute * veth_pool_attrs[] = {
/*
 * sysfs read/write entry points shared by all pool attributes; the handlers
 * tell the attributes apart by address.
 */
1354 static struct sysfs_ops veth_pool_ops = {
1355 .show = veth_pool_show,
1356 .store = veth_pool_store,
/*
 * kobject type for rx buffer pool kobjects: ties them to veth_pool_ops and
 * to the default attribute list veth_pool_attrs.
 */
1359 static struct kobj_type ktype_veth_pool = {
1361 .sysfs_ops = &veth_pool_ops,
1362 .default_attrs = veth_pool_attrs,
/*
 * vio device id table for this driver, exported with MODULE_DEVICE_TABLE
 * and used as .id_table of ibmveth_driver. The entry shown pairs the
 * strings "network" and "IBM,l-lan".
 */
1366 static struct vio_device_id ibmveth_device_table[] __devinitdata= {
1367 { "network", "IBM,l-lan"},
1370 MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
/*
 * vio driver descriptor: binds the id table and the probe/remove callbacks;
 * registered in ibmveth_module_init() and unregistered in
 * ibmveth_module_exit().
 */
1372 static struct vio_driver ibmveth_driver = {
1373 .id_table = ibmveth_device_table,
1374 .probe = ibmveth_probe,
1375 .remove = ibmveth_remove,
1377 .name = ibmveth_driver_name,
1378 .owner = THIS_MODULE,
1382 static int __init ibmveth_module_init(void)
1384 ibmveth_printk("%s: %s %s\n", ibmveth_driver_name, ibmveth_driver_string, ibmveth_driver_version);
1386 ibmveth_proc_register_driver();
1388 return vio_register_driver(&ibmveth_driver);
/*
 * ibmveth_module_exit - module exit point.
 *
 * Undoes ibmveth_module_init() in reverse order: the vio driver is
 * unregistered first, then the driver's proc directory is removed.
 */
1391 static void __exit ibmveth_module_exit(void)
1393 vio_unregister_driver(&ibmveth_driver);
1394 ibmveth_proc_unregister_driver();
/* Register the module's load and unload entry points. */
1397 module_init(ibmveth_module_init);
1398 module_exit(ibmveth_module_exit);