2 Madge Ambassador ATM Adapter driver.
3 Copyright (C) 1995-1999 Madge Networks Ltd.
5 This program is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 2 of the License, or
8 (at your option) any later version.
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 The GNU GPL is contained in /usr/doc/copyright/GPL on a Debian
20 system and in the file COPYING in the Linux kernel source.
23 /* * dedicated to the memory of Graham Gordon 1971-1998 * */
25 #include <linux/module.h>
26 #include <linux/types.h>
27 #include <linux/pci.h>
28 #include <linux/kernel.h>
29 #include <linux/init.h>
30 #include <linux/ioport.h>
31 #include <linux/atmdev.h>
32 #include <linux/delay.h>
33 #include <linux/interrupt.h>
34 #include <linux/poison.h>
36 #include <asm/atomic.h>
38 #include <asm/byteorder.h>
40 #include "ambassador.h"
/* Driver identification strings: maintainer contact, human-readable
   description and version number. */
42 #define maintainer_string "Giuliano Procida at Madge Networks <gprocida@madge.com>"
43 #define description_string "Madge ATM Ambassador driver"
44 #define version_string "1.2.4"
/* Log the driver description and version string through printk.
   Marked __init. */
46 static inline void __init show_version (void) {
47 printk ("%s version %s\n", description_string, version_string);
54 I Hardware, detection, initialisation and shutdown.
58 This driver is for the PCI ATMizer-based Ambassador card (except
59 very early versions). It is not suitable for the similar EISA "TR7"
60 card. Commercially, both cards are known as Collage Server ATM
63 The loader supports image transfer to the card, image start and a few
64 other miscellaneous commands.
66 Only AAL5 is supported with vpi = 0 and vci in the range 0 to 1023.
68 The cards are big-endian.
72 Standard PCI stuff, the early cards are detected and rejected.
76 The cards are reset and the self-test results are checked. The
77 microcode image is then transferred and started. This waits for a
78 pointer to a descriptor containing details of the host-based queues
79 and buffers and various parameters etc. Once they are processed
80 normal operations may begin. The BIA is read using a microcode
85 This may be accomplished either by a card reset or via the microcode
86 shutdown command. Further investigation required.
90 The card reset does not affect PCI configuration (good) or the
91 contents of several other "shared run-time registers" (bad) which
92 include doorbell and interrupt control as well as EEPROM and PCI
93 control. The driver must be careful when modifying these registers
94 not to touch bits it does not use and to undo any changes at exit.
100 The adapter is quite intelligent (fast) and has a simple interface
101 (few features). VPI is always zero, 1024 VCIs are supported. There
102 is limited cell rate support. UBR channels can be capped and ABR
103 (explicit rate, but not EFCI) is supported. There is no CBR or VBR
106 1. Driver <-> Adapter Communication
108 Apart from the basic loader commands, the driver communicates
109 through three entities: the command queue (CQ), the transmit queue
110 pair (TXQ) and the receive queue pairs (RXQ). These three entities
111 are set up by the host and passed to the microcode just after it has
114 All queues are host-based circular queues. They are contiguous and
115 (due to hardware limitations) have some restrictions as to their
116 locations in (bus) memory. They are of the "full means the same as
117 empty so don't do that" variety since the adapter uses pointers
120 The queue pairs work as follows: one queue is for supply to the
121 adapter, items in it are pending and are owned by the adapter; the
122 other is the queue for return from the adapter, items in it have
123 been dealt with by the adapter. The host adds items to the supply
124 (TX descriptors and free RX buffer descriptors) and removes items
125 from the return (TX and RX completions). The adapter deals with out
126 of order completions.
128 Interrupts (card to host) and the doorbell (host to card) are used
133 This is to communicate "open VC", "close VC", "get stats" etc. to
134 the adapter. At most one command is retired every millisecond by the
135 card. There is no out of order completion or notification. The
136 driver needs to check the return code of the command, waiting as
141 TX supply items are of variable length (scatter gather support) and
142 so the queue items are (more or less) pointers to the real thing.
143 Each TX supply item contains a unique, host-supplied handle (the skb
144 bus address seems most sensible as this works for Alphas as well,
145 there is no need to do any endian conversions on the handles).
147 TX return items consist of just the handles above.
149 3. RXQ (up to 4 of these with different lengths and buffer sizes)
151 RX supply items consist of a unique, host-supplied handle (the skb
152 bus address again) and a pointer to the buffer data area.
154 RX return items consist of the handle above, the VC, length and a
155 status word. This just screams "oh so easy" doesn't it?
157 Note on RX pool sizes:
159 Each pool should have enough buffers to handle a back-to-back stream
160 of minimum sized frames on a single VC. For example:
162 frame spacing = 3us (about right)
164 delay = IRQ lat + RX handling + RX buffer replenish = 20 (us) (a guess)
166 min number of buffers for one VC = 1 + delay/spacing (buffers)
168 delay/spacing = latency = (20+2)/3 = 7 (buffers) (rounding up)
170 The 20us delay assumes that there is no need to sleep; if we need to
171 sleep to get buffers we are going to drop frames anyway.
173 In fact, each pool should have enough buffers to support the
174 simultaneous reassembly of a separate frame on each VC and cope with
175 the case in which frames complete in round robin cell fashion on
178 Only one frame can complete at each cell arrival, so if "n" VCs are
179 open, the worst case is to have them all complete frames together
180 followed by all starting new frames together.
182 desired number of buffers = n + delay/spacing
184 These are the extreme requirements, however, they are "n+k" for some
185 "k" so we have only the constant to choose. This is the argument
186 rx_lats which currently defaults to 7.
188 Actually, "n ? n+k : 0" is better and this is what is implemented,
189 subject to the limit given by the pool size.
193 Simple spinlocks are used around the TX and RX queue mechanisms.
194 Anyone with a faster, working method is welcome to implement it.
196 The adapter command queue is protected with a spinlock. We always
197 wait for commands to complete.
199 A more complex form of locking is used around parts of the VC open
200 and close functions. There are three reasons for a lock: 1. we need
201 to do atomic rate reservation and release (not used yet), 2. Opening
202 sometimes involves two adapter commands which must not be separated
203 by another command on the same VC, 3. the changes to RX pool size
204 must be atomic. The lock needs to work over context switches, so we
207 III Hardware Features and Microcode Bugs
211 *%^"$&%^$*&^"$(%^$#&^%$(&#%$*(&^#%!"!"!*!
215 All structures that are not accessed using DMA must be 4-byte
216 aligned (not a problem) and must not cross 4MB boundaries.
218 There is a DMA memory hole at E0000000-E00000FF (groan).
220 TX fragments (DMA read) must not cross 4MB boundaries (would be 16MB
221 but for a hardware bug).
223 RX buffers (DMA write) must not cross 16MB boundaries and must
224 include spare trailing bytes up to the next 4-byte boundary; they
225 will be written with rubbish.
227 The PLX likes to prefetch; if reading up to 4 u32 past the end of
228 each TX fragment is not a problem, then TX can be made to go a
229 little faster by passing a flag at init that disables a prefetch
230 workaround. We do not pass this flag. (new microcode only)
233 . Note that alloc_skb rounds up size to a 16-byte boundary.
234 . Ensure all areas do not traverse 4MB boundaries.
235 . Ensure all areas do not start at a E00000xx bus address.
236 (I cannot be certain, but this may always hold with Linux)
237 . Make all failures cause a loud message.
238 . Discard non-conforming SKBs (causes TX failure or RX fill delay).
239 . Discard non-conforming TX fragment descriptors (the TX fails).
240 In the future we could:
241 . Allow RX areas that traverse 4MB (but not 16MB) boundaries.
242 . Segment TX areas into some/more fragments, when necessary.
243 . Relax checks for non-DMA items (ignore hole).
244 . Give scatter-gather (iovec) requirements using ???. (?)
246 3. VC close is broken (only for new microcode)
248 The VC close adapter microcode command fails to do anything if any
249 frames have been received on the VC but none have been transmitted.
250 Frames continue to be reassembled and passed (with IRQ) to the
257 . Timer code may be broken.
259 . Deal with buggy VC close (somehow) in microcode 12.
261 . Handle interrupted and/or non-blocking writes - is this a job for
264 . Add code to break up TX fragments when they span 4MB boundaries.
266 . Add SUNI phy layer (need to know where SUNI lives on card).
268 . Implement a tx_alloc fn to (a) satisfy TX alignment etc. and (b)
269 leave extra headroom space for Ambassador TX descriptors.
271 . Understand these elements of struct atm_vcc: recvq (proto?),
272 sleep, callback, listenq, backlog_quota, reply and user_back.
274 . Adjust TX/RX skb allocation to favour IP with LANE/CLIP (configurable).
276 . Impose a TX-pending limit (2?) on each VC, help avoid TX q overflow.
278 . Decide whether RX buffer recycling is or can be made completely safe;
279 turn it back on. It looks like Werner is going to axe this.
281 . Implement QoS changes on open VCs (involves extracting parts of VC open
282 and close into separate functions and using them to make changes).
284 . Hack on command queue so that someone can issue multiple commands and wait
285 on the last one (OR only "no-op" or "wait" commands are waited for).
287 . Eliminate need for while-schedule around do_command.
291 /********** microcode **********/
/* Microcode image selection: UCODE(x) resolves (through UCODE2, which
   is not defined in this view) to a file of the atmsar12 set when
   AMB_NEW_MICROCODE is defined; the atmsar11 form is the alternative
   definition. */
293 #ifdef AMB_NEW_MICROCODE
294 #define UCODE(x) UCODE2(atmsar12.x)
296 #define UCODE(x) UCODE2(atmsar11.x)
// initialised from the included UCODE(start) file
300 static u32 __devinitdata ucode_start =
301 #include UCODE(start)
// table of "region" entries, initialised from the included UCODE(regions) file
304 static region __devinitdata ucode_regions[] = {
305 #include UCODE(regions)
// array of u32 words; its initialiser is not visible in this view
309 static u32 __devinitdata ucode_data[] = {
// forward declaration; the definition is not in this view
314 static void do_housekeeping (unsigned long arg);
315 /********** globals **********/
// debug mask, tested against DBG_* bits (e.g. "debug & DBG_REGS" in dump_registers)
317 static unsigned short debug = 0;
// NOTE(review): cmds/txs/rxs look like queue lengths for the command,
// TX and per-pool RX queues - their use is not visible here, confirm
318 static unsigned int cmds = 8;
319 static unsigned int txs = 32;
320 static unsigned int rxs[NUM_RX_POOLS] = { 64, 64, 64, 64 };
// NOTE(review): presumably the buffer size for each RX pool - confirm
321 static unsigned int rxs_bs[NUM_RX_POOLS] = { 4080, 12240, 36720, 65535 };
// the constant "k" of the "n ? n+k : 0" RX pool sizing rule described in
// the header notes; amb_open seeds buffers_wanted with it
322 static unsigned int rx_lats = 7;
323 static unsigned char pci_lat = 0;
// NOTE(review): "-1 << 30" left-shifts a negative int, which ISO C leaves
// undefined; the intent appears to be a mask with bit 30 and above set
325 static const unsigned long onegigmask = -1 << 30;
327 /********** access to adapter **********/
/* Write the 32-bit value "data" to the adapter at byte offset "addr"
   with no byte-order conversion.
   Two access forms appear below: a store through dev->membase (indexed
   in u32 units) and an outl to dev->iobase + addr.
   NOTE(review): these are presumably alternatives selected by a
   preprocessor conditional that is not visible in this view - confirm. */
329 static inline void wr_plain (const amb_dev * dev, size_t addr, u32 data) {
330 PRINTD (DBG_FLOW|DBG_REGS, "wr: %08zx <- %08x", addr, data);
332 dev->membase[addr / sizeof(u32)] = data;
334 outl (data, dev->iobase + addr);
/* Read a 32-bit value from the adapter at byte offset "addr" with no
   byte-order conversion, and trace it through PRINTD.
   Two access forms appear below: a load through dev->membase (indexed
   in u32 units) and an inl from dev->iobase + addr.
   NOTE(review): presumably alternatives under a preprocessor conditional
   not visible here; the return statement is also outside this view. */
338 static inline u32 rd_plain (const amb_dev * dev, size_t addr) {
340 u32 data = dev->membase[addr / sizeof(u32)];
342 u32 data = inl (dev->iobase + addr);
344 PRINTD (DBG_FLOW|DBG_REGS, "rd: %08zx -> %08x", addr, data);
/* Write "data" to the adapter at byte offset "addr" after converting it
   from CPU byte order to big-endian (the header notes state that the
   cards are big-endian). The trace line shows both the CPU-order value
   and the converted one.
   NOTE(review): the membase store and the outl are presumably
   alternatives under a preprocessor conditional not visible here. */
348 static inline void wr_mem (const amb_dev * dev, size_t addr, u32 data) {
349 __be32 be = cpu_to_be32 (data);
350 PRINTD (DBG_FLOW|DBG_REGS, "wr: %08zx <- %08x b[%08x]", addr, data, be);
352 dev->membase[addr / sizeof(u32)] = be;
354 outl (be, dev->iobase + addr);
/* Read a big-endian 32-bit value from the adapter at byte offset "addr"
   and convert it to CPU byte order with be32_to_cpu. The trace line
   shows both the converted value and the raw one.
   NOTE(review): the membase load and the inl are presumably
   alternatives under a preprocessor conditional not visible here; the
   return statement is also outside this view. */
358 static inline u32 rd_mem (const amb_dev * dev, size_t addr) {
360 __be32 be = dev->membase[addr / sizeof(u32)];
362 __be32 be = inl (dev->iobase + addr);
364 u32 data = be32_to_cpu (be);
365 PRINTD (DBG_FLOW|DBG_REGS, "rd: %08zx -> %08x b[%08x]", addr, data, be);
369 /********** dump routines **********/
/* Debug aid: when built with DEBUG_AMBASSADOR and the DBG_REGS bit is
   set in "debug", walk three ranges of adapter register offsets in
   u32-sized steps: 0x00-0x2f (labelled "PLX control"), 0x40-0x5f
   ("mailboxes") and 0x60-0x6f ("doorb irqev irqen reset").
   The loop bodies are not visible in this view. */
371 static inline void dump_registers (const amb_dev * dev) {
372 #ifdef DEBUG_AMBASSADOR
373 if (debug & DBG_REGS) {
375 PRINTD (DBG_REGS, "reading PLX control: ");
376 for (i = 0x00; i < 0x30; i += sizeof(u32))
378 PRINTD (DBG_REGS, "reading mailboxes: ");
379 for (i = 0x40; i < 0x60; i += sizeof(u32))
381 PRINTD (DBG_REGS, "reading doorb irqev irqen reset:");
382 for (i = 0x60; i < 0x70; i += sizeof(u32))
/* Debug aid (DEBUG_AMBASSADOR builds): print a loader block - its
   address, result, command, each of the MAX_COMMAND_DATA payload words
   and the valid word. Every field is converted with be32_to_cpu before
   printing. */
391 static inline void dump_loader_block (volatile loader_block * lb) {
392 #ifdef DEBUG_AMBASSADOR
394 PRINTDB (DBG_LOAD, "lb @ %p; res: %d, cmd: %d, pay:",
395 lb, be32_to_cpu (lb->result), be32_to_cpu (lb->command));
396 for (i = 0; i < MAX_COMMAND_DATA; ++i)
397 PRINTDM (DBG_LOAD, " %08x", be32_to_cpu (lb->payload.data[i]));
398 PRINTDE (DBG_LOAD, ", vld: %08x", be32_to_cpu (lb->valid));
/* Debug aid (DEBUG_AMBASSADOR builds): print a command's address, its
   request word and its first three parameter words. The values are
   printed as stored; the be32_to_cpu conversions are commented out. */
405 static inline void dump_command (command * cmd) {
406 #ifdef DEBUG_AMBASSADOR
408 PRINTDB (DBG_CMD, "cmd @ %p, req: %08x, pars:",
409 cmd, /*be32_to_cpu*/ (cmd->request));
410 for (i = 0; i < 3; ++i)
411 PRINTDM (DBG_CMD, " %08x", /*be32_to_cpu*/ (cmd->args.par[i]));
412 PRINTDE (DBG_CMD, "");
/* Debug aid (DEBUG_AMBASSADOR builds): hex-dump the start of an skb's
   data, preceded by "prefix" and the VC number. At most the first 256
   bytes (or skb->len, if smaller) are printed. */
419 static inline void dump_skb (char * prefix, unsigned int vc, struct sk_buff * skb) {
420 #ifdef DEBUG_AMBASSADOR
422 unsigned char * data = skb->data;
423 PRINTDB (DBG_DATA, "%s(%u) ", prefix, vc);
424 for (i=0; i<skb->len && i < 256;i++)
425 PRINTDM (DBG_DATA, "%02x ", data[i]);
426 PRINTDE (DBG_DATA,"");
435 /********** check memory areas for use by Ambassador **********/
437 /* see limitations under Hardware Features */
/* Check that the memory area [start, start+length-1], expressed as bus
   addresses, respects two of the adapter limitations listed in the
   header notes:
     - it must not cross a 4MB boundary (start and last address must
       agree in every bit from bit 22 upward);
     - it must not start inside the hole 0xE0000000-0xE00000FF.
   A violation is logged at KERN_ERR.
   The bus address is held in a u32. The return statements are not
   visible in this view; callers treat a non-zero result as failure. */
439 static inline int check_area (void * start, size_t length) {
440 // assumes length > 0
// NOTE(review): "-1 << n" left-shifts a negative int (undefined in ISO C)
441 const u32 fourmegmask = -1 << 22;
442 const u32 twofivesixmask = -1 << 8;
443 const u32 starthole = 0xE0000000;
444 u32 startaddress = virt_to_bus (start);
445 u32 lastaddress = startaddress+length-1;
446 if ((startaddress ^ lastaddress) & fourmegmask ||
447 (startaddress & twofivesixmask) == starthole) {
448 PRINTK (KERN_ERR, "check_area failure: [%x,%x] - mail maintainer!",
449 startaddress, lastaddress);
456 /********** free an skb (as per ATM device driver documentation) **********/
/* Release an skb that belongs to an ATM VCC: when the owning vcc has a
   "pop" callback the skb is handed to it.
   NOTE(review): dev_kfree_skb_any is presumably the else branch (the
   "else" line is not visible in this view) - confirm. */
458 static inline void amb_kfree_skb (struct sk_buff * skb) {
459 if (ATM_SKB(skb)->vcc->pop) {
460 ATM_SKB(skb)->vcc->pop (ATM_SKB(skb)->vcc, skb);
462 dev_kfree_skb_any (skb);
466 /********** TX completion **********/
/* Handle one TX return-queue entry: the handle is converted back from a
   bus address to the host tx_simple descriptor, from which the skb is
   recovered; the owning vcc's tx statistic is incremented.
   The remaining steps (freeing the descriptor and the skb) are not
   visible in this view. */
468 static inline void tx_complete (amb_dev * dev, tx_out * tx) {
469 tx_simple * tx_descr = bus_to_virt (tx->handle);
470 struct sk_buff * skb = tx_descr->skb;
472 PRINTD (DBG_FLOW|DBG_TX, "tx_complete %p %p", dev, tx);
475 atomic_inc(&ATM_SKB(skb)->vcc->stats->tx);
477 // free the descriptor
487 /********** RX completion **********/
/* Handle one RX return-queue entry.
   The handle is the bus address of the skb supplied earlier (see
   fill_rx_pool); vc, status and length are big-endian 16-bit fields.
   Visible paths:
     - frame accepted: length within the vcc's rxtp.max_sdu and
       atm_charge succeeds -> the skb is tagged with the vcc, extended
       to rx_len, counted, timestamped and pushed to the vcc;
     - refused by atm_charge, over-size, or no receiver on the VC -> a
       message is printed (rx_drop is bumped for the over-size case);
     - error status -> the per-device error counters matching the
       status bits are incremented.
   NOTE(review): several conditions and else lines are missing from this
   view, so exactly which paths reach the final dev_kfree_skb_any cannot
   be confirmed from here. */
489 static void rx_complete (amb_dev * dev, rx_out * rx) {
490 struct sk_buff * skb = bus_to_virt (rx->handle);
491 u16 vc = be16_to_cpu (rx->vc);
492 // unused: u16 lec_id = be16_to_cpu (rx->lec_id);
493 u16 status = be16_to_cpu (rx->status);
494 u16 rx_len = be16_to_cpu (rx->length);
496 PRINTD (DBG_FLOW|DBG_RX, "rx_complete %p %p (len=%hu)", dev, rx, rx_len);
498 // XXX move this in and add to VC stats ???
// receiver registered for this VC (set by amb_open)
500 struct atm_vcc * atm_vcc = dev->rxer[vc];
505 if (rx_len <= atm_vcc->qos.rxtp.max_sdu) {
507 if (atm_charge (atm_vcc, skb->truesize)) {
509 // prepare socket buffer
510 ATM_SKB(skb)->vcc = atm_vcc;
511 skb_put (skb, rx_len);
513 dump_skb ("<<<", vc, skb);
516 atomic_inc(&atm_vcc->stats->rx);
517 __net_timestamp(skb);
518 // end of our responsibility
519 atm_vcc->push (atm_vcc, skb);
523 // someone fix this (message), please!
524 PRINTD (DBG_INFO|DBG_RX, "dropped thanks to atm_charge (vc %hu, truesize %u)", vc, skb->truesize);
525 // drop stats incremented in atm_charge
529 PRINTK (KERN_INFO, "dropped over-size frame");
530 // should we count this?
531 atomic_inc(&atm_vcc->stats->rx_drop);
535 PRINTD (DBG_WARN|DBG_RX, "got frame but RX closed for channel %hu", vc);
536 // this is an adapter bug, only in new version of microcode
540 dev->stats.rx.error++;
541 if (status & CRC_ERR)
542 dev->stats.rx.badcrc++;
543 if (status & LEN_ERR)
544 dev->stats.rx.toolong++;
545 if (status & ABORT_ERR)
546 dev->stats.rx.aborted++;
547 if (status & UNUSED_ERR)
548 dev->stats.rx.unused++;
551 dev_kfree_skb_any (skb);
557 Note on queue handling.
559 Here "give" and "take" refer to queue entries and a queue (pair)
560 rather than frames to or from the host or adapter. Empty frame
561 buffers are given to the RX queue pair and returned unused or
562 containing RX frames. TX frames (well, pointers to TX fragment
563 lists) are given to the TX queue pair, completions are returned.
567 /********** command queue **********/
569 // I really don't like this, but it's the best I can do at the moment
571 // also, the callers are responsible for byte order as the microcode
572 // sometimes does 16-bit accesses (yuk yuk yuk)
/* Submit one command to the adapter command queue and wait for it to
   complete.
   Visible sequence:
     1. under cq->lock, and only if cq->pending < cq->maximum, the "in"
        pointer is advanced with NEXTQ and its bus address is written to
        mb.adapter.cmd_address; the high-water mark cq->high is updated;
     2. the caller waits until ptrs->out reaches its own slot, then
        until that slot's request word reads SRB_COMPLETE (big-endian);
     3. under cq->lock again, the "out" pointer is advanced.
   If the queue is full the lock is simply dropped (last line below).
   Callers in this file retry while the result is non-zero; the return
   statements, the copy of *cmd into the slot and the sleeps inside the
   wait loops are not visible in this view.
   The lock is taken with plain spin_lock, not the irqsave form. */
574 static int command_do (amb_dev * dev, command * cmd) {
575 amb_cq * cq = &dev->cq;
576 volatile amb_cq_ptrs * ptrs = &cq->ptrs;
579 PRINTD (DBG_FLOW|DBG_CMD, "command_do %p", dev);
581 if (test_bit (dead, &dev->flags))
584 spin_lock (&cq->lock);
587 if (cq->pending < cq->maximum) {
588 // remember my slot for later
590 PRINTD (DBG_CMD, "command in slot %p", my_slot);
597 ptrs->in = NEXTQ (ptrs->in, ptrs->start, ptrs->limit);
600 wr_mem (dev, offsetof(amb_mem, mb.adapter.cmd_address), virt_to_bus (ptrs->in));
602 if (cq->pending > cq->high)
603 cq->high = cq->pending;
604 spin_unlock (&cq->lock);
606 // these comments were in a while-loop before, msleep removes the loop
608 // PRINTD (DBG_CMD, "wait: sleeping %lu for command", timeout);
611 // wait for my slot to be reached (all waiters are here or above, until...)
612 while (ptrs->out != my_slot) {
613 PRINTD (DBG_CMD, "wait: command slot (now at %p)", ptrs->out);
614 set_current_state(TASK_UNINTERRUPTIBLE);
618 // wait on my slot (... one gets to its slot, and... )
619 while (ptrs->out->request != cpu_to_be32 (SRB_COMPLETE)) {
620 PRINTD (DBG_CMD, "wait: command slot completion");
621 set_current_state(TASK_UNINTERRUPTIBLE);
625 PRINTD (DBG_CMD, "command complete");
626 // update queue (... moves the queue along to the next slot)
627 spin_lock (&cq->lock);
631 ptrs->out = NEXTQ (ptrs->out, ptrs->start, ptrs->limit);
632 spin_unlock (&cq->lock);
637 spin_unlock (&cq->lock);
643 /********** TX queue pair **********/
/* Give one TX supply entry to the adapter.
   Under txq->lock (interrupts saved/disabled), and only if
   txq->pending < txq->maximum: the "in" pointer is advanced with NEXTQ,
   its bus address is written to mb.adapter.tx_address, the doorbell is
   rung with TX_FRAME and the high-water mark txq->high is updated.
   Otherwise the lock is released without queueing.
   The copy of *tx into the slot, the pending count update and the
   return statements are not visible in this view. */
645 static inline int tx_give (amb_dev * dev, tx_in * tx) {
646 amb_txq * txq = &dev->txq;
649 PRINTD (DBG_FLOW|DBG_TX, "tx_give %p", dev);
651 if (test_bit (dead, &dev->flags))
654 spin_lock_irqsave (&txq->lock, flags);
656 if (txq->pending < txq->maximum) {
657 PRINTD (DBG_TX, "TX in slot %p", txq->in.ptr);
661 txq->in.ptr = NEXTQ (txq->in.ptr, txq->in.start, txq->in.limit);
662 // hand over the TX and ring the bell
663 wr_mem (dev, offsetof(amb_mem, mb.adapter.tx_address), virt_to_bus (txq->in.ptr));
664 wr_mem (dev, offsetof(amb_mem, doorbell), TX_FRAME);
666 if (txq->pending > txq->high)
667 txq->high = txq->pending;
668 spin_unlock_irqrestore (&txq->lock, flags);
672 spin_unlock_irqrestore (&txq->lock, flags);
/* Take one TX completion from the return queue, if there is one.
   Under txq->lock: an entry counts as completed when something is
   pending and the handle at the "out" pointer is non-zero. It is passed
   to tx_complete, its handle is cleared so the slot reads as empty
   again, and the "out" pointer is advanced with NEXTQ.
   The interrupt handler loops while this returns zero; the return
   statements themselves are not visible in this view. */
677 static inline int tx_take (amb_dev * dev) {
678 amb_txq * txq = &dev->txq;
681 PRINTD (DBG_FLOW|DBG_TX, "tx_take %p", dev);
683 spin_lock_irqsave (&txq->lock, flags);
685 if (txq->pending && txq->out.ptr->handle) {
686 // deal with TX completion
687 tx_complete (dev, txq->out.ptr);
689 txq->out.ptr->handle = 0;
692 txq->out.ptr = NEXTQ (txq->out.ptr, txq->out.start, txq->out.limit);
694 spin_unlock_irqrestore (&txq->lock, flags);
698 spin_unlock_irqrestore (&txq->lock, flags);
703 /********** RX queue pairs **********/
/* Give one free RX buffer descriptor to the adapter for the given pool.
   Under rxq->lock, and only if rxq->pending < rxq->maximum: the "in"
   pointer is advanced with NEXTQ and its bus address is written to
   mb.adapter.rx_address[pool]. No doorbell write is visible here,
   unlike tx_give.
   The copy of *rx into the slot, the pending count update and the
   return statements are not visible in this view; fill_rx_pool frees
   the skb when the result is non-zero. */
705 static inline int rx_give (amb_dev * dev, rx_in * rx, unsigned char pool) {
706 amb_rxq * rxq = &dev->rxq[pool];
709 PRINTD (DBG_FLOW|DBG_RX, "rx_give %p[%hu]", dev, pool);
711 spin_lock_irqsave (&rxq->lock, flags);
713 if (rxq->pending < rxq->maximum) {
714 PRINTD (DBG_RX, "RX in slot %p", rxq->in.ptr);
718 rxq->in.ptr = NEXTQ (rxq->in.ptr, rxq->in.start, rxq->in.limit);
719 // hand over the RX buffer
720 wr_mem (dev, offsetof(amb_mem, mb.adapter.rx_address[pool]), virt_to_bus (rxq->in.ptr));
722 spin_unlock_irqrestore (&rxq->lock, flags);
725 spin_unlock_irqrestore (&rxq->lock, flags);
/* Take one RX completion from the given pool's return queue, if there
   is one.
   Under rxq->lock: an entry counts as completed when something is
   pending and either its status or its length is non-zero. It is passed
   to rx_complete, both fields are cleared so the slot reads as empty
   again, the "out" pointer is advanced with NEXTQ and the low-water
   mark rxq->low is updated.
   The interrupt handler loops while this returns zero; the return
   statements and the action taken for "!pending && buffers_wanted" are
   not visible in this view. */
730 static inline int rx_take (amb_dev * dev, unsigned char pool) {
731 amb_rxq * rxq = &dev->rxq[pool];
734 PRINTD (DBG_FLOW|DBG_RX, "rx_take %p[%hu]", dev, pool);
736 spin_lock_irqsave (&rxq->lock, flags);
738 if (rxq->pending && (rxq->out.ptr->status || rxq->out.ptr->length)) {
739 // deal with RX completion
740 rx_complete (dev, rxq->out.ptr);
742 rxq->out.ptr->status = 0;
743 rxq->out.ptr->length = 0;
746 rxq->out.ptr = NEXTQ (rxq->out.ptr, rxq->out.start, rxq->out.limit);
748 if (rxq->pending < rxq->low)
749 rxq->low = rxq->pending;
750 spin_unlock_irqrestore (&rxq->lock, flags);
753 if (!rxq->pending && rxq->buffers_wanted)
755 spin_unlock_irqrestore (&rxq->lock, flags);
760 /********** RX Pool handling **********/
/* Flush the adapter's buffers for one RX pool.
   When more buffers are pending than wanted, an SRB_FLUSH_BUFFER_Q
   command carrying the pool number (shifted by SRB_POOL_SHIFT) is
   issued, retrying while command_do returns non-zero; rx_take is then
   called repeatedly while pending still exceeds buffers_wanted.
   The action taken when the device is flagged dead, and the bodies of
   the retry/wait loops, are not visible in this view. */
762 /* pre: buffers_wanted = 0, post: pending = 0 */
763 static inline void drain_rx_pool (amb_dev * dev, unsigned char pool) {
764 amb_rxq * rxq = &dev->rxq[pool];
766 PRINTD (DBG_FLOW|DBG_POOL, "drain_rx_pool %p %hu", dev, pool);
768 if (test_bit (dead, &dev->flags))
771 /* we are not quite like the fill pool routines as we cannot just
772 remove one buffer, we have to remove all of them, but we might as
774 if (rxq->pending > rxq->buffers_wanted) {
776 cmd.request = cpu_to_be32 (SRB_FLUSH_BUFFER_Q);
777 cmd.args.flush.flags = cpu_to_be32 (pool << SRB_POOL_SHIFT);
778 while (command_do (dev, &cmd))
780 /* the pool may also be emptied via the interrupt handler */
781 while (rxq->pending > rxq->buffers_wanted)
782 if (rx_take (dev, pool))
/* Call drain_rx_pool for every RX pool, 0 to NUM_RX_POOLS-1. */
789 static void drain_rx_pools (amb_dev * dev) {
792 PRINTD (DBG_FLOW|DBG_POOL, "drain_rx_pools %p", dev);
794 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
795 drain_rx_pool (dev, pool);
/* Top up one RX pool with fresh buffers.
   While the pool holds fewer buffers than both its maximum and
   buffers_wanted, an skb of rxq->buffer_size bytes is allocated with
   the given allocation priority, checked with check_area (skb->data for
   skb->truesize bytes) and offered to the adapter through rx_give.
   The handle is the skb's bus address stored without byte swapping; the
   buffer address is stored big-endian. An skb is freed if it fails
   check_area or if rx_give refuses it.
   The remaining parameter(s), the allocation-failure test and the loop
   exits are not visible in this view. */
798 static inline void fill_rx_pool (amb_dev * dev, unsigned char pool,
804 PRINTD (DBG_FLOW|DBG_POOL, "fill_rx_pool %p %hu %x", dev, pool, priority);
806 if (test_bit (dead, &dev->flags))
809 rxq = &dev->rxq[pool];
810 while (rxq->pending < rxq->maximum && rxq->pending < rxq->buffers_wanted) {
812 struct sk_buff * skb = alloc_skb (rxq->buffer_size, priority);
814 PRINTD (DBG_SKB|DBG_POOL, "failed to allocate skb for RX pool %hu", pool);
817 if (check_area (skb->data, skb->truesize)) {
818 dev_kfree_skb_any (skb);
821 // cast needed as there is no %? for pointer differences
822 PRINTD (DBG_SKB, "allocated skb at %p, head %p, area %li",
823 skb, skb->head, (long) (skb->end - skb->head));
824 rx.handle = virt_to_bus (skb);
825 rx.host_address = cpu_to_be32 (virt_to_bus (skb->data));
826 if (rx_give (dev, &rx, pool))
827 dev_kfree_skb_any (skb);
// Calls fill_rx_pool for every pool, 0 to NUM_RX_POOLS-1, always with
// GFP_ATOMIC allocations.
834 // top up all RX pools (can also be called as a bottom half)
835 static void fill_rx_pools (amb_dev * dev) {
838 PRINTD (DBG_FLOW|DBG_POOL, "fill_rx_pools %p", dev);
840 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
841 fill_rx_pool (dev, pool, GFP_ATOMIC);
846 /********** enable host interrupts **********/
/* Set AMB_INTERRUPT_BITS in the interrupt_control register with a
   read-modify-write, so the register's other bits keep their current
   values (the header notes ask the driver not to touch bits it does
   not use). */
848 static inline void interrupts_on (amb_dev * dev) {
849 wr_plain (dev, offsetof(amb_mem, interrupt_control),
850 rd_plain (dev, offsetof(amb_mem, interrupt_control))
851 | AMB_INTERRUPT_BITS);
854 /********** disable host interrupts **********/
/* Clear AMB_INTERRUPT_BITS in the interrupt_control register with a
   read-modify-write, so the register's other bits keep their current
   values. */
856 static inline void interrupts_off (amb_dev * dev) {
857 wr_plain (dev, offsetof(amb_mem, interrupt_control),
858 rd_plain (dev, offsetof(amb_mem, interrupt_control))
859 &~ AMB_INTERRUPT_BITS);
862 /********** interrupt handling **********/
/* Interrupt service routine; dev_id is the amb_dev it was registered
   with.
   Visible sequence: read the adapter's "interrupt" register, write -1
   back to the same register, then drain every RX pool with rx_take and
   the TX return queue with tx_take, looping while each returns zero.
   With FILL_RX_POOLS_IN_BH defined, dev->bh is scheduled as deferred
   work.
   NOTE(review): the write of -1 presumably acknowledges the pending
   interrupt bits - confirm against the hardware documentation.
   The NULL / not-for-us tests, the irq_work accounting and the return
   statements are not visible in this view. */
864 static irqreturn_t interrupt_handler(int irq, void *dev_id,
865 struct pt_regs *pt_regs) {
866 amb_dev * dev = (amb_dev *) dev_id;
869 PRINTD (DBG_IRQ|DBG_FLOW, "interrupt_handler: %p", dev_id);
872 PRINTD (DBG_IRQ|DBG_ERR, "irq with NULL dev_id: %d", irq);
877 u32 interrupt = rd_plain (dev, offsetof(amb_mem, interrupt));
879 // for us or someone else sharing the same interrupt
881 PRINTD (DBG_IRQ, "irq not for me: %d", irq);
886 PRINTD (DBG_IRQ, "FYI: interrupt was %08x", interrupt);
887 wr_plain (dev, offsetof(amb_mem, interrupt), -1);
891 unsigned int irq_work = 0;
893 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
894 while (!rx_take (dev, pool))
896 while (!tx_take (dev))
900 #ifdef FILL_RX_POOLS_IN_BH
901 schedule_work (&dev->bh);
906 PRINTD (DBG_IRQ, "work done: %u", irq_work);
908 PRINTD (DBG_IRQ|DBG_WARN, "no work done");
912 PRINTD (DBG_IRQ|DBG_FLOW, "interrupt_handler done: %p", dev_id);
916 /********** make rate (not quite as much fun as Horizon) **********/
/* Convert a cell rate (cells per second) into the adapter's 16-bit
   floating-point rate encoding.
     rate   - requested rate
     r      - rounding direction (round_down and round_nearest are
              visible below)
     bits   - receives (exp << 9) | man; bit 14 is deliberately left
              clear (see the "ucode bug" note below)
     actual - receives the rate that the chosen exp/man represents
   amb_open stores the result in its "error" variable and passes NULL
   for "actual".
   NOTE(review): the NULL checks guarding the *bits and *actual stores,
   the round_up case and the return statements are not visible in this
   view - confirm.
   NOTE(review): "1<<31" shifts into the sign bit of int. */
918 static unsigned int make_rate (unsigned int rate, rounding r,
919 u16 * bits, unsigned int * actual) {
920 unsigned char exp = -1; // hush gcc
921 unsigned int man = -1; // hush gcc
923 PRINTD (DBG_FLOW|DBG_QOS, "make_rate %u", rate);
925 // rates in cells per second, ITU format (nasty 16-bit floating-point)
926 // given 5-bit e and 9-bit m:
927 // rate = EITHER (1+m/2^9)*2^e OR 0
928 // bits = EITHER 1<<14 | e<<9 | m OR 0
929 // (bit 15 is "reserved", bit 14 "non-zero")
930 // smallest rate is 0 (special representation)
931 // largest rate is (1+511/512)*2^31 = 4290772992 (< 2^32-1)
932 // smallest non-zero rate is (1+0/512)*2^0 = 1 (> 0)
934 // find position of top bit, this gives e
935 // remove top bit and shift (rounding if feeling clever) by 9-e
937 // ucode bug: please don't set bit 14! so 0 rate not representable
939 if (rate > 0xffc00000U) {
940 // larger than largest representable rate
950 // representable rate
955 // invariant: rate = man*2^(exp-31)
956 while (!(man & (1<<31))) {
961 // man has top bit set
962 // rate = (2^31+(man-2^31))*2^(exp-31)
963 // rate = (1+(man-2^31)/2^31)*2^exp
965 man &= 0xffffffffU; // a nop on 32-bit systems
966 // rate = (1+man/2^32)*2^exp
968 // exp is in the range 0 to 31, man is in the range 0 to 2^32-1
969 // time to lose significance... we want m in the range 0 to 2^9-1
970 // rounding presents a minor problem... we first decide which way
971 // we are rounding (based on given rounding direction and possibly
972 // the bits of the mantissa that are to be discarded).
981 // check all bits that we are discarding
983 man = (man>>(32-9)) + 1;
985 // no need to check for round up outside of range
994 case round_nearest: {
995 // check msb that we are discarding
996 if (man & (1<<(32-9-1))) {
997 man = (man>>(32-9)) + 1;
999 // no need to check for round up outside of range
1004 man = (man>>(32-9));
1011 // zero rate - not representable
1013 if (r == round_down) {
1022 PRINTD (DBG_QOS, "rate: man=%u, exp=%hu", man, exp);
1025 *bits = /* (1<<14) | */ (exp<<9) | man;
// reconstruct the encoded rate: 2^exp plus the mantissa scaled to exp
// (shifted left when exp >= 9, otherwise shifted right with rounding)
1028 *actual = (exp >= 9)
1029 ? (1 << exp) + (man << (exp-9))
1030 : (1 << exp) + ((man + (1<<(9-exp-1))) >> (9-exp));
1035 /********** Linux ATM Operations **********/
1037 // some are not yet implemented while others do not make sense for
1040 /********** Open a VC **********/
/* Open a VC on the adapter for the given atm_vcc.
   Visible steps:
     1. reject unspecified or out-of-range VPI/VCI and any AAL other
        than AAL5;
     2. TX side: derive tx_vc_bits / tx_frame_bits (uncapped UBR, or
        capped UBR with rate bits from make_rate); other traffic
        classes are refused;
     3. RX side: pick the first pool whose buffer_size can hold
        rxtp->max_sdu; fail if none is large enough;
     4. allocate the per-VC amb_vcc and attach it as atm_vcc->dev_data;
     5. under dev->vcc_sf, issue the adapter commands: a TX opener
        either modifies rate and flags of a VC that already has a
        receiver, or opens the VC; an RX opener grows the pool's
        buffers_wanted, refills the pool, then either switches the VC
        to the chosen pool (transmitter present) or opens it, and
        finally records itself in dev->rxer[vci];
     6. set ATM_VF_READY.
   Each command is retried while command_do returns non-zero.
   The error returns, the matching up() calls and several case labels
   are not visible in this view. */
1042 static int amb_open (struct atm_vcc * atm_vcc)
1046 struct atm_qos * qos;
1047 struct atm_trafprm * txtp;
1048 struct atm_trafprm * rxtp;
1050 u16 tx_vc_bits = -1; // hush gcc
1051 u16 tx_frame_bits = -1; // hush gcc
1053 amb_dev * dev = AMB_DEV(atm_vcc->dev);
1055 unsigned char pool = -1; // hush gcc
1056 short vpi = atm_vcc->vpi;
1057 int vci = atm_vcc->vci;
1059 PRINTD (DBG_FLOW|DBG_VCC, "amb_open %x %x", vpi, vci);
1061 #ifdef ATM_VPI_UNSPEC
1062 // UNSPEC is deprecated, remove this code eventually
1063 if (vpi == ATM_VPI_UNSPEC || vci == ATM_VCI_UNSPEC) {
1064 PRINTK (KERN_WARNING, "rejecting open with unspecified VPI/VCI (deprecated)");
1069 if (!(0 <= vpi && vpi < (1<<NUM_VPI_BITS) &&
1070 0 <= vci && vci < (1<<NUM_VCI_BITS))) {
1071 PRINTD (DBG_WARN|DBG_VCC, "VPI/VCI out of range: %hd/%d", vpi, vci);
1075 qos = &atm_vcc->qos;
1077 if (qos->aal != ATM_AAL5) {
1078 PRINTD (DBG_QOS, "AAL not supported");
1082 // traffic parameters
1084 PRINTD (DBG_QOS, "TX:");
1086 if (txtp->traffic_class != ATM_NONE) {
1087 switch (txtp->traffic_class) {
1089 // we take "the PCR" as a rate-cap
1090 int pcr = atm_pcr_goal (txtp);
1094 tx_vc_bits = TX_UBR;
1095 tx_frame_bits = TX_FRAME_NOTCAP;
1104 error = make_rate (pcr, r, &tx_rate_bits, NULL);
1105 tx_vc_bits = TX_UBR_CAPPED;
1106 tx_frame_bits = TX_FRAME_CAPPED;
1112 pcr = atm_pcr_goal (txtp);
1113 PRINTD (DBG_QOS, "pcr goal = %d", pcr);
1118 // PRINTD (DBG_QOS, "request for non-UBR/ABR denied");
1119 PRINTD (DBG_QOS, "request for non-UBR denied");
1123 PRINTD (DBG_QOS, "tx_rate_bits=%hx, tx_vc_bits=%hx",
1124 tx_rate_bits, tx_vc_bits);
1127 PRINTD (DBG_QOS, "RX:");
1129 if (rxtp->traffic_class == ATM_NONE) {
1132 // choose an RX pool (arranged in increasing size)
1133 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
1134 if ((unsigned int) rxtp->max_sdu <= dev->rxq[pool].buffer_size) {
1135 PRINTD (DBG_VCC|DBG_QOS|DBG_POOL, "chose pool %hu (max_sdu %u <= %u)",
1136 pool, rxtp->max_sdu, dev->rxq[pool].buffer_size);
1139 if (pool == NUM_RX_POOLS) {
1140 PRINTD (DBG_WARN|DBG_VCC|DBG_QOS|DBG_POOL,
1141 "no pool suitable for VC (RX max_sdu %d is too large)",
1146 switch (rxtp->traffic_class) {
1152 pcr = atm_pcr_goal (rxtp);
1153 PRINTD (DBG_QOS, "pcr goal = %d", pcr);
1158 // PRINTD (DBG_QOS, "request for non-UBR/ABR denied");
1159 PRINTD (DBG_QOS, "request for non-UBR denied");
1165 // get space for our vcc stuff
1166 vcc = kmalloc (sizeof(amb_vcc), GFP_KERNEL);
1168 PRINTK (KERN_ERR, "out of memory!");
1171 atm_vcc->dev_data = (void *) vcc;
1173 // no failures beyond this point
1175 // we are not really "immediately before allocating the connection
1176 // identifier in hardware", but it will just have to do!
1177 set_bit(ATM_VF_ADDR,&atm_vcc->flags);
1179 if (txtp->traffic_class != ATM_NONE) {
1182 vcc->tx_frame_bits = tx_frame_bits;
1184 down (&dev->vcc_sf);
1185 if (dev->rxer[vci]) {
1186 // RXer on the channel already, just modify rate...
1187 cmd.request = cpu_to_be32 (SRB_MODIFY_VC_RATE);
1188 cmd.args.modify_rate.vc = cpu_to_be32 (vci); // vpi 0
1189 cmd.args.modify_rate.rate = cpu_to_be32 (tx_rate_bits << SRB_RATE_SHIFT);
1190 while (command_do (dev, &cmd))
1192 // ... and TX flags, preserving the RX pool
1193 cmd.request = cpu_to_be32 (SRB_MODIFY_VC_FLAGS);
1194 cmd.args.modify_flags.vc = cpu_to_be32 (vci); // vpi 0
1195 cmd.args.modify_flags.flags = cpu_to_be32
1196 ( (AMB_VCC(dev->rxer[vci])->rx_info.pool << SRB_POOL_SHIFT)
1197 | (tx_vc_bits << SRB_FLAGS_SHIFT) );
1198 while (command_do (dev, &cmd))
1201 // no RXer on the channel, just open (with pool zero)
1202 cmd.request = cpu_to_be32 (SRB_OPEN_VC);
1203 cmd.args.open.vc = cpu_to_be32 (vci); // vpi 0
1204 cmd.args.open.flags = cpu_to_be32 (tx_vc_bits << SRB_FLAGS_SHIFT);
1205 cmd.args.open.rate = cpu_to_be32 (tx_rate_bits << SRB_RATE_SHIFT);
1206 while (command_do (dev, &cmd))
// record the transmitter so a later RX open/close on this VCI can see it
1209 dev->txer[vci].tx_present = 1;
1213 if (rxtp->traffic_class != ATM_NONE) {
1216 vcc->rx_info.pool = pool;
1218 down (&dev->vcc_sf);
1219 /* grow RX buffer pool */
// first receiver on the pool starts from rx_lats, giving the
// "n ? n+k : 0" sizing described in the header notes
1220 if (!dev->rxq[pool].buffers_wanted)
1221 dev->rxq[pool].buffers_wanted = rx_lats;
1222 dev->rxq[pool].buffers_wanted += 1;
1223 fill_rx_pool (dev, pool, GFP_KERNEL);
1225 if (dev->txer[vci].tx_present) {
1226 // TXer on the channel already
1227 // switch (from pool zero) to this pool, preserving the TX bits
1228 cmd.request = cpu_to_be32 (SRB_MODIFY_VC_FLAGS);
1229 cmd.args.modify_flags.vc = cpu_to_be32 (vci); // vpi 0
1230 cmd.args.modify_flags.flags = cpu_to_be32
1231 ( (pool << SRB_POOL_SHIFT)
1232 | (dev->txer[vci].tx_vc_bits << SRB_FLAGS_SHIFT) );
1234 // no TXer on the channel, open the VC (with no rate info)
1235 cmd.request = cpu_to_be32 (SRB_OPEN_VC);
1236 cmd.args.open.vc = cpu_to_be32 (vci); // vpi 0
1237 cmd.args.open.flags = cpu_to_be32 (pool << SRB_POOL_SHIFT);
1238 cmd.args.open.rate = cpu_to_be32 (0);
1240 while (command_do (dev, &cmd))
1242 // this link allows RX frames through
1243 dev->rxer[vci] = atm_vcc;
1247 // indicate readiness
1248 set_bit(ATM_VF_READY,&atm_vcc->flags);
1253 /********** Close a VC **********/
// Close a VC: mark it not ready, shut down whichever of the TX and RX
// directions this VCC had open, then mark its VPI/VCI as free again.
1255 static void amb_close (struct atm_vcc * atm_vcc) {
1256 amb_dev * dev = AMB_DEV (atm_vcc->dev);
1257 amb_vcc * vcc = AMB_VCC (atm_vcc);
1258 u16 vci = atm_vcc->vci;
1260 PRINTD (DBG_VCC|DBG_FLOW, "amb_close");
1262 // indicate unreadiness
1263 clear_bit(ATM_VF_READY,&atm_vcc->flags);
// --- TX direction: only if the VCC was opened with a TX traffic class ---
1266 if (atm_vcc->qos.txtp.traffic_class != ATM_NONE) {
// take the semaphore that serialises txer/rxer modifications
1269 down (&dev->vcc_sf);
1270 if (dev->rxer[vci]) {
1271 // RXer still on the channel, just modify rate... XXX not really needed
1272 cmd.request = cpu_to_be32 (SRB_MODIFY_VC_RATE);
1273 cmd.args.modify_rate.vc = cpu_to_be32 (vci); // vpi 0
1274 cmd.args.modify_rate.rate = cpu_to_be32 (0);
1275 // ... and clear TX rate flags (XXX to stop RM cell output?), preserving RX pool
1277 // no RXer on the channel, close channel
1278 cmd.request = cpu_to_be32 (SRB_CLOSE_VC);
1279 cmd.args.close.vc = cpu_to_be32 (vci); // vpi 0
// record that nothing transmits on this VCI any more, then issue the
// command, retrying for as long as command_do returns non-zero
1281 dev->txer[vci].tx_present = 0;
1282 while (command_do (dev, &cmd))
// --- RX direction: only if the VCC was opened with an RX traffic class ---
1288 if (atm_vcc->qos.rxtp.traffic_class != ATM_NONE) {
1291 // this is (the?) one reason why we need the amb_vcc struct
1292 unsigned char pool = vcc->rx_info.pool;
1294 down (&dev->vcc_sf);
1295 if (dev->txer[vci].tx_present) {
1296 // TXer still on the channel, just go to pool zero XXX not really needed
1297 cmd.request = cpu_to_be32 (SRB_MODIFY_VC_FLAGS);
1298 cmd.args.modify_flags.vc = cpu_to_be32 (vci); // vpi 0
// only the TX bits are written, so the pool field of the flags is zero
1299 cmd.args.modify_flags.flags = cpu_to_be32
1300 (dev->txer[vci].tx_vc_bits << SRB_FLAGS_SHIFT);
1302 // no TXer on the channel, close the VC
1303 cmd.request = cpu_to_be32 (SRB_CLOSE_VC);
1304 cmd.args.close.vc = cpu_to_be32 (vci); // vpi 0
1306 // forget the rxer - no more skbs will be pushed
// sanity check: the registered receiver for this VCI should be this VCC
1307 if (atm_vcc != dev->rxer[vci])
1308 PRINTK (KERN_ERR, "%s vcc=%p rxer[vci]=%p",
1309 "arghhh! we're going to die!",
1310 vcc, dev->rxer[vci]);
1311 dev->rxer[vci] = NULL;
1312 while (command_do (dev, &cmd))
1315 /* shrink RX buffer pool */
// one buffer fewer is wanted for this pool; once the count is back down
// to the rx_lats baseline the pool is unused, so zero it and drain it
1316 dev->rxq[pool].buffers_wanted -= 1;
1317 if (dev->rxq[pool].buffers_wanted == rx_lats) {
1318 dev->rxq[pool].buffers_wanted = 0;
1319 drain_rx_pool (dev, pool);
1324 // free our structure
1327 // say the VPI/VCI is free again
1328 clear_bit(ATM_VF_ADDR,&atm_vcc->flags);
1333 /********** Get socket options for a VC **********/
1335 // int amb_getsockopt (struct atm_vcc * atm_vcc, int level, int optname, void * optval, int optlen);
1337 /********** Set socket options for a VC **********/
1339 // int amb_setsockopt (struct atm_vcc * atm_vcc, int level, int optname, void * optval, int optlen);
1341 /********** Send **********/
// Transmit one skb on a VC: validate the request, build a single-fragment
// TX descriptor that points at the skb data, and hand it to the adapter's
// TX queue.
1343 static int amb_send (struct atm_vcc * atm_vcc, struct sk_buff * skb) {
1344 amb_dev * dev = AMB_DEV(atm_vcc->dev);
1345 amb_vcc * vcc = AMB_VCC(atm_vcc);
1346 u16 vc = atm_vcc->vci;
1347 unsigned int tx_len = skb->len;
1348 unsigned char * tx_data = skb->data;
1349 tx_simple * tx_descr;
// device has been flagged dead: do not attempt to transmit
1352 if (test_bit (dead, &dev->flags))
1355 PRINTD (DBG_FLOW|DBG_TX, "amb_send vc %x data %p len %u",
1356 vc, tx_data, tx_len);
1358 dump_skb (">>>", vc, skb);
// sending requires the TX side of this VCI to have been opened
1360 if (!dev->txer[vc].tx_present) {
1361 PRINTK (KERN_ERR, "attempt to send on RX-only VC %x", vc);
1365 // this is a driver private field so we have to set it ourselves,
1366 // despite the fact that we are _required_ to use it to check for a
1368 ATM_SKB(skb)->vcc = atm_vcc;
// enforce the max_sdu recorded in the VCC's TX QoS
1370 if (skb->len > (size_t) atm_vcc->qos.txtp.max_sdu) {
1371 PRINTK (KERN_ERR, "sk_buff length greater than agreed max_sdu, dropping...");
// NOTE(review): check_area presumably rejects memory the adapter cannot
// address - confirm against its definition; failure counts as a TX error
1375 if (check_area (skb->data, skb->len)) {
1376 atomic_inc(&atm_vcc->stats->tx_err);
1377 return -ENOMEM; // ?
1380 // allocate memory for fragments
1381 tx_descr = kmalloc (sizeof(tx_simple), GFP_KERNEL);
1383 PRINTK (KERN_ERR, "could not allocate TX descriptor");
1386 if (check_area (tx_descr, sizeof(tx_simple))) {
1390 PRINTD (DBG_TX, "fragment list allocated at %p", tx_descr);
// remember the skb in the descriptor
1392 tx_descr->skb = skb;
// the single data fragment: length and bus address, both big-endian
1394 tx_descr->tx_frag.bytes = cpu_to_be32 (tx_len);
1395 tx_descr->tx_frag.address = cpu_to_be32 (virt_to_bus (tx_data));
// end-of-list marker; its handle is the bus address of this descriptor
1397 tx_descr->tx_frag_end.handle = virt_to_bus (tx_descr);
1398 tx_descr->tx_frag_end.vc = 0;
1399 tx_descr->tx_frag_end.next_descriptor_length = 0;
1400 tx_descr->tx_frag_end.next_descriptor = 0;
1401 #ifdef AMB_NEW_MICROCODE
1402 tx_descr->tx_frag_end.cpcs_uu = 0;
1403 tx_descr->tx_frag_end.cpi = 0;
1404 tx_descr->tx_frag_end.pad = 0;
// TX queue entry: per-VCC frame bits OR-ed with the VCI, plus the
// length and bus address of the descriptor built above
1407 tx.vc = cpu_to_be16 (vcc->tx_frame_bits | vc);
1408 tx.tx_descr_length = cpu_to_be16 (sizeof(tx_frag)+sizeof(tx_frag_end));
1409 tx.tx_descr_addr = cpu_to_be32 (virt_to_bus (&tx_descr->tx_frag));
// retry for as long as tx_give returns non-zero
1411 while (tx_give (dev, &tx))
1416 /********** Change QoS on a VC **********/
1418 // int amb_change_qos (struct atm_vcc * atm_vcc, struct atm_qos * qos, int flags);
1420 /********** Free RX Socket Buffer **********/
// Dispose of a received skb: try to recycle it straight back into the RX
// pool of its VCC; the skb is freed on the other visible path.
1423 static void amb_free_rx_skb (struct atm_vcc * atm_vcc, struct sk_buff * skb) {
1424 amb_dev * dev = AMB_DEV (atm_vcc->dev);
1425 amb_vcc * vcc = AMB_VCC (atm_vcc);
1426 unsigned char pool = vcc->rx_info.pool;
1429 // This may be unsafe for various reasons that I cannot really guess
1430 // at. However, I note that the ATM layer calls kfree_skb rather
1431 // than dev_kfree_skb at this point so we are at least covered as far
1432 // as buffer locking goes. There may be bugs if pcap clones RX skbs.
1434 PRINTD (DBG_FLOW|DBG_SKB, "amb_rx_free skb %p (atm_vcc %p, vcc %p)",
// RX descriptor: the handle is the bus address of the skb itself, the
// host address is the (big-endian) bus address of its data area
1437 rx.handle = virt_to_bus (skb);
1438 rx.host_address = cpu_to_be32 (virt_to_bus (skb->data));
// reset the skb to empty (data and tail back at head)
1440 skb->data = skb->head;
1441 skb->tail = skb->head;
// rx_give returning zero means the buffer was accepted by the pool
1444 if (!rx_give (dev, &rx, pool)) {
1446 PRINTD (DBG_SKB|DBG_POOL, "recycled skb for pool %hu", pool);
1450 // just do what the ATM layer would have done
1451 dev_kfree_skb_any (skb);
1457 /********** Proc File Output **********/
// /proc read hook for the ATM device. Each visible branch formats one
// line of statistics into page with sprintf.
// NOTE(review): the branch selection (presumably driven by *pos) is not
// shown here - confirm how lines are stepped through.
1459 static int amb_proc_read (struct atm_dev * atm_dev, loff_t * pos, char * page) {
1460 amb_dev * dev = AMB_DEV (atm_dev);
1464 PRINTD (DBG_FLOW, "amb_proc_read");
1466 /* more diagnostics here? */
// frame counters from dev->stats
1469 amb_stats * s = &dev->stats;
1470 return sprintf (page,
1471 "frames: TX OK %lu, RX OK %lu, RX bad %lu "
1472 "(CRC %lu, long %lu, aborted %lu, unused %lu).\n",
1473 s->tx_ok, s->rx.ok, s->rx.error,
1474 s->rx.badcrc, s->rx.toolong,
1475 s->rx.aborted, s->rx.unused);
// command queue occupancy
1479 amb_cq * c = &dev->cq;
1480 return sprintf (page, "cmd queue [cur/hi/max]: %u/%u/%u. ",
1481 c->pending, c->high, c->maximum);
// TX queue occupancy
1485 amb_txq * t = &dev->txq;
1486 return sprintf (page, "TX queue [cur/max high full]: %u/%u %u %u.\n",
1487 t->pending, t->maximum, t->high, t->filled);
// one entry per RX pool, accumulated into a single line
1491 unsigned int count = sprintf (page, "RX queues [cur/max/req low empty]:");
1492 for (pool = 0; pool < NUM_RX_POOLS; ++pool) {
1493 amb_rxq * r = &dev->rxq[pool];
1494 count += sprintf (page+count, " %u/%u/%u %u %u",
1495 r->pending, r->maximum, r->buffers_wanted, r->low, r->emptied);
1497 count += sprintf (page+count, ".\n");
// configured buffer size of each RX pool
1502 unsigned int count = sprintf (page, "RX buffer sizes:");
1503 for (pool = 0; pool < NUM_RX_POOLS; ++pool) {
1504 amb_rxq * r = &dev->rxq[pool];
1505 count += sprintf (page+count, " %u", r->buffer_size);
1507 count += sprintf (page+count, ".\n");
1520 /********** Operation Structure **********/
// ATM device operations table passed to atm_dev_register in amb_probe;
// the entries visible here are the /proc read hook and the owning module.
1522 static const struct atmdev_ops amb_ops = {
1526 .proc_read = amb_proc_read,
1527 .owner = THIS_MODULE,
1530 /********** housekeeping **********/
1531 static void do_housekeeping (unsigned long arg) {
1532 amb_dev * dev = (amb_dev *) arg;
1534 // could collect device-specific (not driver/atm-linux) stats here
1536 // last resort refill once every ten seconds
1537 fill_rx_pools (dev);
1538 mod_timer(&dev->housekeeping, jiffies + 10*HZ);
1543 /********** creation of communication queues **********/
// Allocate a single block of memory for all host/adapter queues and carve
// it up in order: command queue, TX in/out queues, then an in/out queue
// pair for every RX pool.
//   cmds            - number of command queue entries
//   txs             - number of TX queue entries
//   rxs             - per-pool number of RX queue entries
//   rx_buffer_sizes - per-pool RX buffer size, recorded in each rxq
1545 static int __devinit create_queues (amb_dev * dev, unsigned int cmds,
1546 unsigned int txs, unsigned int * rxs,
1547 unsigned int * rx_buffer_sizes) {
1553 PRINTD (DBG_FLOW, "create_queues %p", dev);
// total up the bytes needed by every queue
1555 total += cmds * sizeof(command);
1557 total += txs * (sizeof(tx_in) + sizeof(tx_out));
1559 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
1560 total += rxs[pool] * (sizeof(rx_in) + sizeof(rx_out));
1562 memory = kmalloc (total, GFP_KERNEL);
1564 PRINTK (KERN_ERR, "could not allocate queues");
1567 if (check_area (memory, total)) {
1568 PRINTK (KERN_ERR, "queues allocated in nasty area");
// limit marks the end of the block; used for the final consistency check
1573 limit = memory + total;
1574 PRINTD (DBG_INIT, "queues from %p to %p", memory, limit);
1576 PRINTD (DBG_CMD, "command queue at %p", memory);
// command queue sits at the very start of the block
1579 command * cmd = memory;
1580 amb_cq * cq = &dev->cq;
1584 cq->maximum = cmds - 1;
1586 cq->ptrs.start = cmd;
1589 cq->ptrs.limit = cmd + cmds;
// advance past the command queue
1591 memory = cq->ptrs.limit;
1594 PRINTD (DBG_TX, "TX queue pair at %p", memory);
1597 tx_in * in = memory;
1599 amb_txq * txq = &dev->txq;
1604 txq->maximum = txs - 1;
1608 txq->in.limit = in + txs;
1610 memory = txq->in.limit;
1613 txq->out.start = out;
1615 txq->out.limit = out + txs;
1617 memory = txq->out.limit;
1620 PRINTD (DBG_RX, "RX queue pairs at %p", memory);
1622 for (pool = 0; pool < NUM_RX_POOLS; ++pool) {
1623 rx_in * in = memory;
1625 amb_rxq * rxq = &dev->rxq[pool];
1627 rxq->buffer_size = rx_buffer_sizes[pool];
// no buffers are wanted until a VC opens on this pool
1628 rxq->buffers_wanted = 0;
1631 rxq->low = rxs[pool] - 1;
1633 rxq->maximum = rxs[pool] - 1;
1637 rxq->in.limit = in + rxs[pool];
1639 memory = rxq->in.limit;
1642 rxq->out.start = out;
1644 rxq->out.limit = out + rxs[pool];
1646 memory = rxq->out.limit;
// after carving, the running pointer must land exactly on the end of the
// block; anything else means the size calculation and the layout disagree
1649 if (memory == limit) {
1652 PRINTK (KERN_ERR, "bad queue alloc %p != %p (tell maintainer)", memory, limit);
// limit - total recovers the original allocation address
1653 kfree (limit - total);
1659 /********** destruction of communication queues **********/
// Release the queue memory set up by create_queues. The command queue
// start pointer doubles as the address of the whole block.
1661 static void destroy_queues (amb_dev * dev) {
1662 // all queues assumed empty
1663 void * memory = dev->cq.ptrs.start;
1664 // includes txq.in, txq.out, rxq[].in and rxq[].out
1666 PRINTD (DBG_FLOW, "destroy_queues %p", dev);
1668 PRINTD (DBG_INIT, "freeing queues at %p", memory);
1674 /********** basic loader commands and error handling **********/
1675 // centisecond timeouts - guessing away here
1676 static unsigned int command_timeouts [] = {
1677 [host_memory_test] = 15,
1678 [read_adapter_memory] = 2,
1679 [write_adapter_memory] = 2,
1680 [adapter_start] = 50,
1681 [get_version_number] = 10,
1682 [interrupt_host] = 1,
1683 [flash_erase_sector] = 1,
1684 [adap_download_block] = 1,
1685 [adap_erase_flash] = 1,
1686 [adap_run_in_iram] = 1,
1687 [adap_end_download] = 1
1691 static unsigned int command_successes [] = {
1692 [host_memory_test] = COMMAND_PASSED_TEST,
1693 [read_adapter_memory] = COMMAND_READ_DATA_OK,
1694 [write_adapter_memory] = COMMAND_WRITE_DATA_OK,
1695 [adapter_start] = COMMAND_COMPLETE,
1696 [get_version_number] = COMMAND_COMPLETE,
1697 [interrupt_host] = COMMAND_COMPLETE,
1698 [flash_erase_sector] = COMMAND_COMPLETE,
1699 [adap_download_block] = COMMAND_COMPLETE,
1700 [adap_erase_flash] = COMMAND_COMPLETE,
1701 [adap_run_in_iram] = COMMAND_COMPLETE,
1702 [adap_end_download] = COMMAND_COMPLETE
// Interpret the result code the loader returned for cmd. A result equal
// to the command's entry in command_successes is the success case; any
// other code is mapped to a message that is logged with PRINTK.
1705 static int decode_loader_result (loader_command cmd, u32 result)
// success: the result is the one expected for this particular command
1710 if (result == command_successes[cmd])
// otherwise pick a human-readable message for the result code
1716 msg = "bad command";
1718 case COMMAND_IN_PROGRESS:
1720 msg = "command in progress";
1722 case COMMAND_PASSED_TEST:
1724 msg = "command passed test";
1726 case COMMAND_FAILED_TEST:
1728 msg = "command failed test";
1730 case COMMAND_READ_DATA_OK:
1732 msg = "command read data ok";
1734 case COMMAND_READ_BAD_ADDRESS:
1736 msg = "command read bad address";
1738 case COMMAND_WRITE_DATA_OK:
1740 msg = "command write data ok";
1742 case COMMAND_WRITE_BAD_ADDRESS:
1744 msg = "command write bad address";
1746 case COMMAND_WRITE_FLASH_FAILURE:
1748 msg = "command write flash failure";
1750 case COMMAND_COMPLETE:
1752 msg = "command complete";
1754 case COMMAND_FLASH_ERASE_FAILURE:
1756 msg = "command flash erase failure";
1758 case COMMAND_WRITE_BAD_DATA:
1760 msg = "command write bad data";
// unrecognised code: log the raw value as well (debug builds)
1764 msg = "unknown error";
1765 PRINTD (DBG_LOAD|DBG_ERR,
1766 "decode_loader_result got %d=%x !",
1771 PRINTK (KERN_ERR, "%s", msg);
// Issue one loader command through the loader block lb and wait for the
// adapter to finish it. The outcome is decoded by decode_loader_result.
//   lb  - loader block shared with the adapter (payload already filled in)
//   dev - the adapter
//   cmd - loader command to execute
1775 static int __devinit do_loader_command (volatile loader_block * lb,
1776 const amb_dev * dev, loader_command cmd) {
1778 unsigned long timeout;
1780 PRINTD (DBG_FLOW|DBG_LOAD, "do_loader_command");
1784 Set the return value to zero, set the command type and set the
1785 valid entry to the right magic value. The payload is already
1786 correctly byte-ordered so we leave it alone. Hit the doorbell
1787 with the bus address of this structure.
1792 lb->command = cpu_to_be32 (cmd);
1793 lb->valid = cpu_to_be32 (DMA_VALID);
1794 // dump_registers (dev);
1795 // dump_loader_block (lb);
// ring the doorbell with the block's bus address, onegigmask bits cleared
1796 wr_mem (dev, offsetof(amb_mem, doorbell), virt_to_bus (lb) & ~onegigmask);
// table entries are centiseconds; x10 gives the milliseconds slept below
1798 timeout = command_timeouts[cmd] * 10;
// poll until the adapter writes a result other than "in progress"
1800 while (!lb->result || lb->result == cpu_to_be32 (COMMAND_IN_PROGRESS))
// msleep_interruptible returns the time left, so timeout counts down
1802 timeout = msleep_interruptible(timeout);
1804 PRINTD (DBG_LOAD|DBG_ERR, "command %d timed out", cmd);
1805 dump_registers (dev);
1806 dump_loader_block (lb);
1810 if (cmd == adapter_start) {
1811 // wait for start command to acknowledge...
// the doorbell register reads back non-zero until the start is acknowledged
1813 while (rd_plain (dev, offsetof(amb_mem, doorbell)))
1815 timeout = msleep_interruptible(timeout);
1817 PRINTD (DBG_LOAD|DBG_ERR, "start command did not clear doorbell, res=%08x",
1818 be32_to_cpu (lb->result));
1819 dump_registers (dev);
1824 return decode_loader_result (cmd, be32_to_cpu (lb->result));
1829 /* loader: determine loader version */
// Ask the loader for its version number. The value is read from the
// loader block payload and converted from big-endian into *version.
1831 static int __devinit get_loader_version (loader_block * lb,
1832 const amb_dev * dev, u32 * version) {
1835 PRINTD (DBG_FLOW|DBG_LOAD, "get_loader_version");
1837 res = do_loader_command (lb, dev, get_version_number);
1841 *version = be32_to_cpu (lb->payload.version);
1845 /* loader: write memory data blocks */
// Write count 32-bit words from data to adapter memory at address, using
// the loader block's transfer payload. Words are converted to big-endian
// as they are copied into the payload.
1847 static int __devinit loader_write (loader_block * lb,
1848 const amb_dev * dev, const u32 * data,
1849 u32 address, unsigned int count) {
1851 transfer_block * tb = &lb->payload.transfer;
1853 PRINTD (DBG_FLOW|DBG_LOAD, "loader_write");
// a single transfer block holds at most MAX_TRANSFER_DATA words
1855 if (count > MAX_TRANSFER_DATA)
1857 tb->address = cpu_to_be32 (address);
1858 tb->count = cpu_to_be32 (count);
1859 for (i = 0; i < count; ++i)
1860 tb->data[i] = cpu_to_be32 (data[i]);
1861 return do_loader_command (lb, dev, write_adapter_memory);
1864 /* loader: verify memory data blocks */
// Read count 32-bit words back from adapter memory at address and compare
// them, word by word, with the expected contents in data.
1866 static int __devinit loader_verify (loader_block * lb,
1867 const amb_dev * dev, const u32 * data,
1868 u32 address, unsigned int count) {
1870 transfer_block * tb = &lb->payload.transfer;
1873 PRINTD (DBG_FLOW|DBG_LOAD, "loader_verify");
// a single transfer block holds at most MAX_TRANSFER_DATA words
1875 if (count > MAX_TRANSFER_DATA)
1877 tb->address = cpu_to_be32 (address);
1878 tb->count = cpu_to_be32 (count);
1879 res = do_loader_command (lb, dev, read_adapter_memory);
// the payload is big-endian, so compare against the converted host words
1881 for (i = 0; i < count; ++i)
1882 if (tb->data[i] != cpu_to_be32 (data[i])) {
1889 /* loader: start microcode */
1891 static int __devinit loader_start (loader_block * lb,
1892 const amb_dev * dev, u32 address) {
1893 PRINTD (DBG_FLOW|DBG_LOAD, "loader_start");
1895 lb->payload.start = cpu_to_be32 (address);
1896 return do_loader_command (lb, dev, adapter_start);
1899 /********** reset card **********/
1901 static inline void sf (const char * msg)
1903 PRINTK (KERN_ERR, "self-test failed: %s", msg);
// Reset the card. The visible sequence asserts the reset bits, puts the
// interrupt registers into a known state, clears the loader "ready" flag
// and releases reset; it then waits for the card to report ready and
// decodes the self-test result word.
// NOTE(review): the diags argument presumably gates the wait/self-test
// part - the controlling condition is not shown here, confirm.
1906 static int amb_reset (amb_dev * dev, int diags) {
1909 PRINTD (DBG_FLOW|DBG_LOAD, "amb_reset");
// read-modify-write so that only the reset bits change
1911 word = rd_plain (dev, offsetof(amb_mem, reset_control));
1912 // put card into reset state
1913 wr_plain (dev, offsetof(amb_mem, reset_control), word | AMB_RESET_BITS);
1914 // wait a short while
1917 // put card into known good state
1918 wr_plain (dev, offsetof(amb_mem, interrupt_control), AMB_DOORBELL_BITS);
1919 // clear all interrupts just in case
1920 wr_plain (dev, offsetof(amb_mem, interrupt), -1);
1922 // clear self-test done flag
1923 wr_plain (dev, offsetof(amb_mem, mb.loader.ready), 0);
1924 // take card out of reset state
1925 wr_plain (dev, offsetof(amb_mem, reset_control), word &~ AMB_RESET_BITS);
1928 unsigned long timeout;
1931 // half second time-out
// poll the ready flag that was cleared above
1933 while (!rd_plain (dev, offsetof(amb_mem, mb.loader.ready)))
1935 timeout = msleep_interruptible(timeout);
1937 PRINTD (DBG_LOAD|DBG_ERR, "reset timed out");
1941 // get results of self-test
1942 // XXX double check byte-order
1943 word = rd_mem (dev, offsetof(amb_mem, mb.loader.result));
// on failure, report every failed component whose bit is set
1944 if (word & SELF_TEST_FAILURE) {
1945 if (word & GPINT_TST_FAILURE)
1947 if (word & SUNI_DATA_PATTERN_FAILURE)
1948 sf ("SUNI data pattern");
1949 if (word & SUNI_DATA_BITS_FAILURE)
1950 sf ("SUNI data bits");
1951 if (word & SUNI_UTOPIA_FAILURE)
1952 sf ("SUNI UTOPIA interface");
1953 if (word & SUNI_FIFO_FAILURE)
1954 sf ("SUNI cell buffer FIFO");
1955 if (word & SRAM_FAILURE)
1957 // better return value?
1965 /********** transfer and start the microcode **********/
// Download the microcode image to the card and start it. The image data
// (ucode_data) is walked region by region as described by ucode_regions;
// each chunk is written and then verified through the loader.
1967 static int __devinit ucode_init (loader_block * lb, amb_dev * dev) {
1969 unsigned int total = 0;
1970 const u32 * pointer = ucode_data;
1975 PRINTD (DBG_FLOW|DBG_LOAD, "ucode_init");
// the region list ends at the first entry with a zero count (comma
// operator: address is loaded, count decides whether to continue)
1977 while (address = ucode_regions[i].start,
1978 count = ucode_regions[i].count) {
1979 PRINTD (DBG_LOAD, "starting region (%x, %u)", address, count);
// transfer at most MAX_TRANSFER_DATA words per loader command
1982 if (count <= MAX_TRANSFER_DATA)
1985 words = MAX_TRANSFER_DATA;
1987 res = loader_write (lb, dev, pointer, address, words);
1990 res = loader_verify (lb, dev, pointer, address, words);
// address advances in bytes, one u32 per word transferred
1994 address += sizeof(u32) * words;
// the word following the last region must be the ATM_POISON marker;
// only then is the microcode started
1999 if (*pointer == ATM_POISON) {
2000 return loader_start (lb, dev, ucode_start);
2002 // cast needed as there is no %? for pointer differences
2003 PRINTD (DBG_LOAD|DBG_ERR,
2004 "offset=%li, *pointer=%x, address=%x, total=%u",
2005 (long) (pointer - ucode_data), *pointer, address, total);
2006 PRINTK (KERN_ERR, "incorrect microcode data");
2011 /********** give adapter parameters **********/
2013 static inline __be32 bus_addr(void * addr) {
2014 return cpu_to_be32 (virt_to_bus (addr));
// Give the adapter its parameters: fill in a structure with the bus
// addresses of every queue created by create_queues, pass that structure
// through the doorbell, and wait for the adapter to clear the doorbell.
2017 static int __devinit amb_talk (amb_dev * dev) {
2020 unsigned long timeout;
2022 PRINTD (DBG_FLOW, "amb_talk %p", dev);
// command queue and TX in/out queue bounds (bus addresses, big-endian)
2024 a.command_start = bus_addr (dev->cq.ptrs.start);
2025 a.command_end = bus_addr (dev->cq.ptrs.limit);
2026 a.tx_start = bus_addr (dev->txq.in.start);
2027 a.tx_end = bus_addr (dev->txq.in.limit);
2028 a.txcom_start = bus_addr (dev->txq.out.start);
2029 a.txcom_end = bus_addr (dev->txq.out.limit);
// per-pool RX queue bounds and buffer size
2031 for (pool = 0; pool < NUM_RX_POOLS; ++pool) {
2032 // the other "a" items are set up by the adapter
2033 a.rec_struct[pool].buffer_start = bus_addr (dev->rxq[pool].in.start);
2034 a.rec_struct[pool].buffer_end = bus_addr (dev->rxq[pool].in.limit);
2035 a.rec_struct[pool].rx_start = bus_addr (dev->rxq[pool].out.start);
2036 a.rec_struct[pool].rx_end = bus_addr (dev->rxq[pool].out.limit);
2037 a.rec_struct[pool].buffer_size = cpu_to_be32 (dev->rxq[pool].buffer_size);
2040 #ifdef AMB_NEW_MICROCODE
2041 // disable fast PLX prefetching
2045 // pass the structure
2046 wr_mem (dev, offsetof(amb_mem, doorbell), virt_to_bus (&a));
2048 // 2.2 second wait (must not touch doorbell during 2 second DMA test)
2050 // give the adapter another half second?
// the doorbell reads back non-zero until the adapter has taken the block
2052 while (rd_plain (dev, offsetof(amb_mem, doorbell)))
2054 timeout = msleep_interruptible(timeout);
2056 PRINTD (DBG_INIT|DBG_ERR, "adapter init timed out");
2063 // get microcode version
// Query the running microcode for its version with an SRB_GET_VERSION
// command and log it as major.minor.
2064 static void __devinit amb_ucode_version (amb_dev * dev) {
2068 cmd.request = cpu_to_be32 (SRB_GET_VERSION);
// retry for as long as command_do returns non-zero
2069 while (command_do (dev, &cmd)) {
2070 set_current_state(TASK_UNINTERRUPTIBLE);
// the reply fields are big-endian
2073 major = be32_to_cpu (cmd.args.version.major);
2074 minor = be32_to_cpu (cmd.args.version.minor);
2075 PRINTK (KERN_INFO, "microcode version is %u.%u", major, minor);
2078 // swap bits within byte to get Ethernet ordering
/*
 * Reverse the order of the eight bits in byte (bit 0 <-> bit 7, ...).
 *
 * Works a nibble at a time: each 4-bit half is bit-reversed through the
 * lookup table and the two halves swap places.  The table is static
 * const so it is not rebuilt on the stack at every call.
 */
static u8 bit_swap (u8 byte)
{
  // swap[n] is the 4-bit value n with its bits in reverse order
  static const u8 swap[] = {
    0x0, 0x8, 0x4, 0xc,
    0x2, 0xa, 0x6, 0xe,
    0x1, 0x9, 0x5, 0xd,
    0x3, 0xb, 0x7, 0xf
  };

  return ((swap[byte & 0xf]<<4) | swap[byte>>4]);
}
2090 // get end station address
// Fetch the adapter's address with an SRB_GET_BIA command and, when esi
// is supplied, store it there as ESI_LEN bytes with the bits of every
// byte reversed by bit_swap.
2091 static void __devinit amb_esi (amb_dev * dev, u8 * esi) {
2096 cmd.request = cpu_to_be32 (SRB_GET_BIA);
// retry for as long as command_do returns non-zero
2097 while (command_do (dev, &cmd)) {
2098 set_current_state(TASK_UNINTERRUPTIBLE);
// the reply arrives as a 32-bit and a 16-bit big-endian part
2101 lower4 = be32_to_cpu (cmd.args.bia.lower4);
2102 upper2 = be32_to_cpu (cmd.args.bia.upper2);
2103 PRINTD (DBG_LOAD, "BIA: lower4: %08x, upper2 %04x", lower4, upper2);
2108 PRINTDB (DBG_INIT, "ESI:");
2109 for (i = 0; i < ESI_LEN; ++i) {
// bytes 0..3 come from lower4, the rest from upper2, low byte first
2111 esi[i] = bit_swap (lower4>>(8*i));
2113 esi[i] = bit_swap (upper2>>(8*(i-4)));
2114 PRINTDM (DBG_INIT, " %02x", esi[i]);
2117 PRINTDE (DBG_INIT, "");
// Point the PLX-mapped window at the region containing the loader block:
// the onegigmask bits of the mapping register (stuff[10]) are replaced by
// the corresponding bits of the loader block's bus address.
2123 static void fixup_plx_window (amb_dev *dev, loader_block *lb)
2125 // fix up the PLX-mapped window base address to match the block
2128 blb = virt_to_bus(lb);
2129 // the kernel stack had better not ever cross a 1Gb boundary!
2130 mapreg = rd_plain (dev, offsetof(amb_mem, stuff[10]));
2131 mapreg &= ~onegigmask;
2132 mapreg |= blb & onegigmask;
2133 wr_plain (dev, offsetof(amb_mem, stuff[10]), mapreg);
// Bring the adapter up. The stages appear in this order: reset with
// self-test, PLX window fix-up, loader version query, microcode download,
// queue creation, handing the queues to the adapter, and finally a
// microcode version query. Queues are destroyed again on the failure
// path after create_queues.
2137 static int __devinit amb_init (amb_dev * dev)
2143 if (amb_reset (dev, 1)) {
2144 PRINTK (KERN_ERR, "card reset failed!");
// lb is a local loader block, so the window must cover its address
2146 fixup_plx_window (dev, &lb);
2148 if (get_loader_version (&lb, dev, &version)) {
2149 PRINTK (KERN_INFO, "failed to get loader version");
2151 PRINTK (KERN_INFO, "loader version is %08x", version);
2153 if (ucode_init (&lb, dev)) {
2154 PRINTK (KERN_ERR, "microcode failure");
2155 } else if (create_queues (dev, cmds, txs, rxs, rxs_bs)) {
2156 PRINTK (KERN_ERR, "failed to get memory for queues");
2159 if (amb_talk (dev)) {
2160 PRINTK (KERN_ERR, "adapter did not accept queues");
2163 amb_ucode_version (dev);
2168 destroy_queues (dev);
2169 } /* create_queues, ucode_init */
2172 } /* get_loader_version */
// Initialise a freshly allocated amb_dev: zero it, record the PCI
// resources, set the available cell rates and initialise the semaphore
// and the per-queue spinlocks.
2179 static void setup_dev(amb_dev *dev, struct pci_dev *pci_dev)
2182 memset (dev, 0, sizeof(amb_dev));
2184 // set up known dev items straight away
2185 dev->pci_dev = pci_dev;
// lets amb_remove_one find the amb_dev again from the pci_dev
2186 pci_set_drvdata(pci_dev, dev);
// BAR 1 is the I/O base, BAR 0 the memory base
2188 dev->iobase = pci_resource_start (pci_dev, 1);
2189 dev->irq = pci_dev->irq;
2190 dev->membase = bus_to_virt(pci_resource_start(pci_dev, 0));
2192 // flags (currently only dead)
2195 // Allocate cell rates (fibre)
2196 // ATM_OC3_PCR = 1555200000/8/270*260/53 - 29/53
2197 // to be really pedantic, this should be ATM_OC3c_PCR
2198 dev->tx_avail = ATM_OC3_PCR;
2199 dev->rx_avail = ATM_OC3_PCR;
2201 #ifdef FILL_RX_POOLS_IN_BH
2202 // initialise bottom half
2203 INIT_WORK(&dev->bh, (void (*)(void *)) fill_rx_pools, dev);
2206 // semaphore for txer/rxer modifications - we cannot use a
2207 // spinlock as the critical region needs to switch processes
2208 init_MUTEX (&dev->vcc_sf);
2209 // queue manipulation spinlocks; we want atomic reads and
2210 // writes to the queue descriptors (handles IRQ and SMP)
2211 // consider replacing "int pending" -> "atomic_t available"
2212 // => problem related to who gets to move queue pointers
2213 spin_lock_init (&dev->cq.lock);
2214 spin_lock_init (&dev->txq.lock);
2215 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
2216 spin_lock_init (&dev->rxq[pool].lock);
// PCI-level setup: enable bus mastering and make sure the latency timer
// is at least MIN_PCI_LATENCY. The chosen value ends up in the pci_lat
// module parameter variable.
2219 static void setup_pci_dev(struct pci_dev *pci_dev)
2223 // enable bus master accesses
2224 pci_set_master(pci_dev);
2226 // frobnicate latency (upwards, usually)
2227 pci_read_config_byte (pci_dev, PCI_LATENCY_TIMER, &lat);
// never go below the minimum; otherwise keep what the device reports
2230 pci_lat = (lat < MIN_PCI_LATENCY) ? MIN_PCI_LATENCY : lat;
// only write the register when the value actually changes
2232 if (lat != pci_lat) {
2233 PRINTK (KERN_INFO, "Changing PCI latency timer from %hu to %hu",
2235 pci_write_config_byte(pci_dev, PCI_LATENCY_TIMER, pci_lat);
// PCI probe: enable the device, claim its I/O region, allocate and
// initialise the amb_dev, bring the adapter up, hook the (shared) IRQ,
// register with the ATM layer, start the housekeeping timer and enable
// host interrupts. The tail of the function releases the I/O region and
// disables the PCI device.
2239 static int __devinit amb_probe(struct pci_dev *pci_dev, const struct pci_device_id *pci_ent)
2245 err = pci_enable_device(pci_dev);
// NOTE(review): this is the same "PLX rev 2" text used for the bad
// device ID below; if it is reached when pci_enable_device fails the
// message is misleading - confirm and reword.
2247 PRINTK (KERN_ERR, "skipped broken (PLX rev 2) card");
2251 // read resources from PCI configuration space
// the _BAD device ID is in the ID table only so it can be rejected here
2254 if (pci_dev->device == PCI_DEVICE_ID_MADGE_AMBASSADOR_BAD) {
2255 PRINTK (KERN_ERR, "skipped broken (PLX rev 2) card");
2260 PRINTD (DBG_INFO, "found Madge ATM adapter (amb) at"
2261 " IO %llx, IRQ %u, MEM %p",
2262 (unsigned long long)pci_resource_start(pci_dev, 1),
2263 irq, bus_to_virt(pci_resource_start(pci_dev, 0)));
// claim BAR 1 (the I/O range)
2266 err = pci_request_region(pci_dev, 1, DEV_LABEL);
2268 PRINTK (KERN_ERR, "IO range already in use!");
2272 dev = kmalloc (sizeof(amb_dev), GFP_KERNEL);
2274 PRINTK (KERN_ERR, "out of memory!");
2279 setup_dev(dev, pci_dev);
2281 err = amb_init(dev);
2283 PRINTK (KERN_ERR, "adapter initialisation failure");
2287 setup_pci_dev(pci_dev);
2289 // grab (but share) IRQ and install handler
2290 err = request_irq(irq, interrupt_handler, IRQF_SHARED, DEV_LABEL, dev);
2292 PRINTK (KERN_ERR, "request IRQ failed!");
2296 dev->atm_dev = atm_dev_register (DEV_LABEL, &amb_ops, -1, NULL);
2297 if (!dev->atm_dev) {
2298 PRINTD (DBG_ERR, "failed to register Madge ATM adapter");
2303 PRINTD (DBG_INFO, "registered Madge ATM adapter (no. %d) (%p) at %p",
2304 dev->atm_dev->number, dev, dev->atm_dev);
// back-pointer from the ATM device to our private structure
2305 dev->atm_dev->dev_data = (void *) dev;
2307 // register our address
2308 amb_esi (dev, dev->atm_dev->esi);
2310 // 0 bits for vpi, 10 bits for vci
2311 dev->atm_dev->ci_range.vpi_bits = NUM_VPI_BITS;
2312 dev->atm_dev->ci_range.vci_bits = NUM_VCI_BITS;
// housekeeping timer: first run as soon as possible, re-armed by the
// callback itself
2314 init_timer(&dev->housekeeping);
2315 dev->housekeeping.function = do_housekeeping;
2316 dev->housekeeping.data = (unsigned long) dev;
2317 mod_timer(&dev->housekeeping, jiffies);
2319 // enable host interrupts
2320 interrupts_on (dev);
// release the resources claimed earlier in the function
2332 pci_release_region(pci_dev, 1);
2334 pci_disable_device(pci_dev);
// PCI remove: stop the housekeeping timer, drain the RX pools, turn
// interrupts off, then release the IRQ, the PCI device, the queues, the
// ATM device registration and the I/O region.
2339 static void __devexit amb_remove_one(struct pci_dev *pci_dev)
2341 struct amb_dev *dev;
// the amb_dev was stored as driver data by setup_dev
2343 dev = pci_get_drvdata(pci_dev);
2345 PRINTD(DBG_INFO|DBG_INIT, "closing %p (atm_dev = %p)", dev, dev->atm_dev);
// the timer re-arms itself, so wait for any running callback to finish
2346 del_timer_sync(&dev->housekeeping);
2347 // the drain should not be necessary
2348 drain_rx_pools(dev);
2349 interrupts_off(dev);
2351 free_irq(dev->irq, dev);
2352 pci_disable_device(pci_dev);
2353 destroy_queues(dev);
2354 atm_dev_deregister(dev->atm_dev);
2356 pci_release_region(pci_dev, 1);
// Sanity-check the module parameters at load time. Values below their
// minimum are raised and a notice is logged; note that the corrective
// assignments sit inside the PRINTK argument lists.
2359 static void __init amb_check_args (void) {
2361 unsigned int max_rx_size;
2363 #ifdef DEBUG_AMBASSADOR
// the debug bitmap is masked with DBG_MASK as a side effect of logging it
2364 PRINTK (KERN_NOTICE, "debug bitmap is %hx", debug &= DBG_MASK);
2367 PRINTK (KERN_NOTICE, "no debugging support");
2370 if (cmds < MIN_QUEUE_SIZE)
2371 PRINTK (KERN_NOTICE, "cmds has been raised to %u",
2372 cmds = MIN_QUEUE_SIZE);
2374 if (txs < MIN_QUEUE_SIZE)
2375 PRINTK (KERN_NOTICE, "txs has been raised to %u",
2376 txs = MIN_QUEUE_SIZE);
2378 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
2379 if (rxs[pool] < MIN_QUEUE_SIZE)
2380 PRINTK (KERN_NOTICE, "rxs[%hu] has been raised to %u",
2381 pool, rxs[pool] = MIN_QUEUE_SIZE);
2383 // buffers sizes should be greater than zero and strictly increasing
// a pool no larger than the largest size seen so far is only reported,
// not corrected
2385 for (pool = 0; pool < NUM_RX_POOLS; ++pool)
2386 if (rxs_bs[pool] <= max_rx_size)
2387 PRINTK (KERN_NOTICE, "useless pool (rxs_bs[%hu] = %u)",
2388 pool, rxs_bs[pool]);
2390 max_rx_size = rxs_bs[pool];
2392 if (rx_lats < MIN_RX_BUFFERS)
2393 PRINTK (KERN_NOTICE, "rx_lats has been raised to %u",
2394 rx_lats = MIN_RX_BUFFERS);
2399 /********** module stuff **********/
2401 MODULE_AUTHOR(maintainer_string);
2402 MODULE_DESCRIPTION(description_string);
2403 MODULE_LICENSE("GPL");
2404 module_param(debug, ushort, 0644);
2405 module_param(cmds, uint, 0);
2406 module_param(txs, uint, 0);
2407 module_param_array(rxs, uint, NULL, 0);
2408 module_param_array(rxs_bs, uint, NULL, 0);
2409 module_param(rx_lats, uint, 0);
2410 module_param(pci_lat, byte, 0);
2411 MODULE_PARM_DESC(debug, "debug bitmap, see .h file");
2412 MODULE_PARM_DESC(cmds, "number of command queue entries");
2413 MODULE_PARM_DESC(txs, "number of TX queue entries");
2414 MODULE_PARM_DESC(rxs, "number of RX queue entries [" __MODULE_STRING(NUM_RX_POOLS) "]");
2415 MODULE_PARM_DESC(rxs_bs, "size of RX buffers [" __MODULE_STRING(NUM_RX_POOLS) "]");
2416 MODULE_PARM_DESC(rx_lats, "number of extra buffers to cope with RX latencies");
2417 MODULE_PARM_DESC(pci_lat, "PCI latency in bus cycles");
2419 /********** module entry **********/
// PCI IDs claimed by this driver. The _BAD device ID is listed as well;
// amb_probe rejects such cards with a "skipped broken (PLX rev 2) card"
// message.
2421 static struct pci_device_id amb_pci_tbl[] = {
2422 { PCI_VENDOR_ID_MADGE, PCI_DEVICE_ID_MADGE_AMBASSADOR, PCI_ANY_ID, PCI_ANY_ID,
2424 { PCI_VENDOR_ID_MADGE, PCI_DEVICE_ID_MADGE_AMBASSADOR_BAD, PCI_ANY_ID, PCI_ANY_ID,
// export the table so the module is matched to these devices
2429 MODULE_DEVICE_TABLE(pci, amb_pci_tbl);
// PCI driver descriptor registered in amb_module_init; the entries
// visible here are the remove hook and the device ID table.
2431 static struct pci_driver amb_driver = {
2434 .remove = __devexit_p(amb_remove_one),
2435 .id_table = amb_pci_tbl,
// Module entry point: check that amb_mem has the expected size, then
// register the PCI driver and return the result of that registration.
2438 static int __init amb_module_init (void)
2440 PRINTD (DBG_FLOW|DBG_INIT, "init_module");
2442 // sanity check - cast needed as printk does not support %Zu
// amb_mem must be exactly 4*16 + 4*12 bytes
// NOTE(review): the message says "words" but sizeof yields bytes
2443 if (sizeof(amb_mem) != 4*16 + 4*12) {
2444 PRINTK (KERN_ERR, "Fix amb_mem (is %lu words).",
2445 (unsigned long) sizeof(amb_mem));
2454 return pci_register_driver(&amb_driver);
2457 /********** module exit **********/
2459 static void __exit amb_module_exit (void)
2461 PRINTD (DBG_FLOW|DBG_INIT, "cleanup_module");
2463 return pci_unregister_driver(&amb_driver);
// register the module's load and unload entry points
2466 module_init(amb_module_init);
2467 module_exit(amb_module_exit);