2 * Copyright (c) 2005 Ammasso, Inc. All rights reserved.
3 * Copyright (c) 2005 Open Grid Computing, Inc. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
37 #include <linux/netdevice.h>
38 #include <linux/spinlock.h>
39 #include <linux/kernel.h>
40 #include <linux/pci.h>
41 #include <linux/dma-mapping.h>
42 #include <linux/idr.h>
44 #include "c2_provider.h"
46 #include "c2_status.h"
49 #define DRV_VERSION "1.1"
50 #define PFX DRV_NAME ": "
56 #define RX_BUF_SIZE (1536 + 8)
57 #define ETH_JUMBO_MTU 9000
58 #define C2_MAGIC "CEPHEUS"
60 #define C2_IVN (18 & 0x7fffffff)
62 #define C2_REG0_SIZE (16 * 1024)
63 #define C2_REG2_SIZE (2 * 1024 * 1024)
64 #define C2_REG4_SIZE (256 * 1024 * 1024)
65 #define C2_NUM_TX_DESC 341
66 #define C2_NUM_RX_DESC 256
67 #define C2_PCI_REGS_OFFSET (0x10000)
68 #define C2_RXP_HRXDQ_OFFSET (((C2_REG4_SIZE)/2))
69 #define C2_RXP_HRXDQ_SIZE (4096)
70 #define C2_TXP_HTXDQ_OFFSET (((C2_REG4_SIZE)/2) + C2_RXP_HRXDQ_SIZE)
71 #define C2_TXP_HTXDQ_SIZE (4096)
72 #define C2_TX_TIMEOUT (6*HZ)
75 static const u8 c2_magic[] = {
76 0x43, 0x45, 0x50, 0x48, 0x45, 0x55, 0x53
79 enum adapter_pci_regs {
80 C2_REGS_MAGIC = 0x0000,
81 C2_REGS_VERS = 0x0008,
83 C2_REGS_PCI_WINSIZE = 0x0010,
84 C2_REGS_Q0_QSIZE = 0x0014,
85 C2_REGS_Q0_MSGSIZE = 0x0018,
86 C2_REGS_Q0_POOLSTART = 0x001C,
87 C2_REGS_Q0_SHARED = 0x0020,
88 C2_REGS_Q1_QSIZE = 0x0024,
89 C2_REGS_Q1_MSGSIZE = 0x0028,
90 C2_REGS_Q1_SHARED = 0x0030,
91 C2_REGS_Q2_QSIZE = 0x0034,
92 C2_REGS_Q2_MSGSIZE = 0x0038,
93 C2_REGS_Q2_SHARED = 0x0040,
94 C2_REGS_ENADDR = 0x004C,
95 C2_REGS_RDMA_ENADDR = 0x0054,
96 C2_REGS_HRX_CUR = 0x006C,
99 struct c2_adapter_pci_regs {
140 C2_PCI_HRX_INT = 1 << 8,
141 C2_PCI_HTX_INT = 1 << 17,
142 C2_PCI_HRX_QUI = 1 << 31,
146 * Cepheus registers in BAR0.
163 TXP_HTXD_READY = 1 << 0,
164 TXP_HTXD_UNINIT = 1 << 1,
170 RXP_HRXD_READY = 1 << 0,
171 RXP_HRXD_DONE = 1 << 1,
177 RXP_HRXD_OK = 1 << 0,
178 RXP_HRXD_BUF_OV = 1 << 1,
181 /* TXP descriptor fields */
183 C2_TXP_FLAGS = 0x0000,
185 C2_TXP_ADDR = 0x0004,
188 /* RXP descriptor fields */
190 C2_RXP_FLAGS = 0x0000,
191 C2_RXP_STATUS = 0x0002,
192 C2_RXP_COUNT = 0x0004,
194 C2_RXP_ADDR = 0x0008,
201 } __attribute__ ((packed));
209 } __attribute__ ((packed));
216 } __attribute__ ((packed));
221 dma_addr_t next_offset;
227 dma_addr_t next_offset;
234 unsigned long *table;
245 * The MQ shared pointer pool is organized as a linked list of
246 * chunks. Each chunk contains a linked list of free shared pointers
247 * that can be allocated to a given user mode client.
251 struct sp_chunk *next;
253 DECLARE_PCI_UNMAP_ADDR(mapping);
262 unsigned long *table;
272 struct c2_element *next;
273 void *ht_desc; /* host descriptor */
274 void __iomem *hw_desc; /* hardware descriptor */
281 struct c2_element *to_clean;
282 struct c2_element *to_use;
283 struct c2_element *start;
288 struct ib_device ibdev;
290 void __iomem *mmio_txp_ring; /* remapped adapter memory for hw rings */
291 void __iomem *mmio_rxp_ring;
293 struct pci_dev *pcidev;
294 struct net_device *netdev;
295 struct net_device *pseudo_netdev;
299 int device_cap_flags;
300 void __iomem *kva; /* KVA device memory */
301 unsigned long pa; /* PA device memory */
304 struct kmem_cache *host_msg_cache;
306 struct list_head cca_link; /* adapter list */
307 struct list_head eh_wakeup_list; /* event wakeup list */
308 wait_queue_head_t req_vq_wo;
310 /* Cached RNIC properties */
311 struct ib_device_attr props;
313 struct c2_pd_table pd_table;
314 struct c2_qp_table qp_table;
315 int ports; /* num of GigE ports */
317 spinlock_t vqlock; /* sync vbs req MQ */
320 struct c2_mq req_vq; /* Verbs Request MQ */
321 struct c2_mq rep_vq; /* Verbs Reply MQ */
322 struct c2_mq aeq; /* Async Events MQ */
324 /* Kernel client MQs */
325 struct sp_chunk *kern_mqsp_pool;
327 /* Device updates these values when posting messages to a host
335 * Shared host target pages for user-accessible MQs.
337 int hthead; /* index of first free entry */
338 void *htpages; /* kernel vaddr */
339 int htlen; /* length of htpages memory */
340 void *htuva; /* user mapped vaddr */
341 spinlock_t htlock; /* serialize allocation */
343 u64 adapter_hint_uva; /* access to the activity FIFO */
345 // spinlock_t aeq_lock;
346 // spinlock_t rnic_lock;
349 dma_addr_t hint_count_dma;
352 int init; /* TRUE if it's ready */
353 char ae_cache_name[16];
354 char vq_cache_name[16];
359 struct c2_dev *c2dev;
360 struct net_device *netdev;
364 struct c2_ring tx_ring;
365 struct c2_ring rx_ring;
367 void *mem; /* PCI memory for host rings */
369 unsigned long mem_size;
375 * Activity FIFO registers in BAR0.
377 #define PCI_BAR0_HOST_HINT 0x100
378 #define PCI_BAR0_ADAPTER_HINT 0x2000
381 * Ammasso PCI vendor id and Cepheus PCI device id.
383 #define CQ_ARMED 0x01
384 #define CQ_WAIT_FOR_DMA 0x80
/*
 * The format of a hint is as follows:
 *   - The lower 16 bits are the count of hints for the queue.
 *   - The next 15 bits are the qp_index.
 *   - The uppermost bit depends on who reads it:
 *       If read by the producer, it means Full (1) or Not-Full (0).
 *       If read by the consumer, it means Empty (1) or Not-Empty (0).
 */
/*
 * Pack a queue index and a hint count into a single hint word: the
 * index is shifted up by 16 bits and the count is OR-ed into the low
 * bits.  Both arguments are parenthesized so that expression arguments
 * (for example a conditional) expand with the intended precedence.
 */
#define C2_HINT_MAKE(q_index, hint_count) (((q_index) << 16) | (hint_count))

/* Extract the 15-bit queue index held in bits 16..30 of a hint word. */
#define C2_HINT_GET_INDEX(hint) (((hint) & 0x7FFF0000) >> 16)

/* Extract the 16-bit hint count held in bits 0..15 of a hint word. */
#define C2_HINT_GET_COUNT(hint) ((hint) & 0x0000FFFF)
400 * The following defines the offset in SDRAM for the c2_adapter_pci_regs_t
403 #define C2_ADAPTER_PCI_REGS_OFFSET 0x10000
406 static inline u64 readq(const void __iomem * addr)
408 u64 ret = readl(addr + 4);
417 static inline void __raw_writeq(u64 val, void __iomem * addr)
419 __raw_writel((u32) (val), addr);
420 __raw_writel((u32) (val >> 32), (addr + 4));
/*
 * Store cur_rx, converted to big-endian, as a 32-bit value at byte
 * offset 4092 of the device's mmio_txp_ring mapping.
 * The c2dev argument is parenthesized so that pointer expressions
 * (e.g. "devs + 1") expand correctly.
 * NOTE(review): the store uses __raw_writel() while the load below
 * uses readl(); confirm that this asymmetry is intended.
 */
#define C2_SET_CUR_RX(c2dev, cur_rx) \
	__raw_writel((__force u32) cpu_to_be32(cur_rx), \
		     (c2dev)->mmio_txp_ring + 4092)

/*
 * Load the 32-bit value at byte offset 4092 of the device's
 * mmio_txp_ring mapping and convert it from big-endian to CPU order.
 */
#define C2_GET_CUR_RX(c2dev) \
	be32_to_cpu((__force __be32) readl((c2dev)->mmio_txp_ring + 4092))
430 static inline struct c2_dev *to_c2dev(struct ib_device *ibdev)
432 return container_of(ibdev, struct c2_dev, ibdev);
435 static inline int c2_errno(void *reply)
437 switch (c2_wr_get_result(reply)) {
441 case CCERR_INSUFFICIENT_RESOURCES:
442 case CCERR_ZERO_RDMA_READ_RESOURCES:
444 case CCERR_MR_IN_USE:
445 case CCERR_QP_IN_USE:
447 case CCERR_ADDR_IN_USE:
449 case CCERR_ADDR_NOT_AVAIL:
450 return -EADDRNOTAVAIL;
451 case CCERR_CONN_RESET:
453 case CCERR_NOT_IMPLEMENTED:
454 case CCERR_INVALID_WQE:
456 case CCERR_QP_NOT_PRIVILEGED:
458 case CCERR_STACK_ERROR:
460 case CCERR_ACCESS_VIOLATION:
461 case CCERR_BASE_AND_BOUNDS_VIOLATION:
463 case CCERR_STAG_STATE_NOT_INVALID:
464 case CCERR_INVALID_ADDRESS:
465 case CCERR_INVALID_CQ:
466 case CCERR_INVALID_EP:
467 case CCERR_INVALID_MODIFIER:
468 case CCERR_INVALID_MTU:
469 case CCERR_INVALID_PD_ID:
470 case CCERR_INVALID_QP:
471 case CCERR_INVALID_RNIC:
472 case CCERR_INVALID_STAG:
480 extern int c2_register_device(struct c2_dev *c2dev);
481 extern void c2_unregister_device(struct c2_dev *c2dev);
482 extern int c2_rnic_init(struct c2_dev *c2dev);
483 extern void c2_rnic_term(struct c2_dev *c2dev);
484 extern void c2_rnic_interrupt(struct c2_dev *c2dev);
485 extern int c2_del_addr(struct c2_dev *c2dev, __be32 inaddr, __be32 inmask);
486 extern int c2_add_addr(struct c2_dev *c2dev, __be32 inaddr, __be32 inmask);
489 extern int c2_alloc_qp(struct c2_dev *c2dev, struct c2_pd *pd,
490 struct ib_qp_init_attr *qp_attrs, struct c2_qp *qp);
491 extern void c2_free_qp(struct c2_dev *c2dev, struct c2_qp *qp);
492 extern struct ib_qp *c2_get_qp(struct ib_device *device, int qpn);
493 extern int c2_qp_modify(struct c2_dev *c2dev, struct c2_qp *qp,
494 struct ib_qp_attr *attr, int attr_mask);
495 extern int c2_qp_set_read_limits(struct c2_dev *c2dev, struct c2_qp *qp,
497 extern int c2_post_send(struct ib_qp *ibqp, struct ib_send_wr *ib_wr,
498 struct ib_send_wr **bad_wr);
499 extern int c2_post_receive(struct ib_qp *ibqp, struct ib_recv_wr *ib_wr,
500 struct ib_recv_wr **bad_wr);
501 extern void __devinit c2_init_qp_table(struct c2_dev *c2dev);
502 extern void __devexit c2_cleanup_qp_table(struct c2_dev *c2dev);
503 extern void c2_set_qp_state(struct c2_qp *, int);
504 extern struct c2_qp *c2_find_qpn(struct c2_dev *c2dev, int qpn);
507 extern int c2_pd_alloc(struct c2_dev *c2dev, int privileged, struct c2_pd *pd);
508 extern void c2_pd_free(struct c2_dev *c2dev, struct c2_pd *pd);
509 extern int __devinit c2_init_pd_table(struct c2_dev *c2dev);
510 extern void __devexit c2_cleanup_pd_table(struct c2_dev *c2dev);
513 extern int c2_init_cq(struct c2_dev *c2dev, int entries,
514 struct c2_ucontext *ctx, struct c2_cq *cq);
515 extern void c2_free_cq(struct c2_dev *c2dev, struct c2_cq *cq);
516 extern void c2_cq_event(struct c2_dev *c2dev, u32 mq_index);
517 extern void c2_cq_clean(struct c2_dev *c2dev, struct c2_qp *qp, u32 mq_index);
518 extern int c2_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *entry);
519 extern int c2_arm_cq(struct ib_cq *ibcq, enum ib_cq_notify_flags flags);
522 extern int c2_llp_connect(struct iw_cm_id *cm_id,
523 struct iw_cm_conn_param *iw_param);
524 extern int c2_llp_accept(struct iw_cm_id *cm_id,
525 struct iw_cm_conn_param *iw_param);
526 extern int c2_llp_reject(struct iw_cm_id *cm_id, const void *pdata,
528 extern int c2_llp_service_create(struct iw_cm_id *cm_id, int backlog);
529 extern int c2_llp_service_destroy(struct iw_cm_id *cm_id);
532 extern int c2_nsmr_register_phys_kern(struct c2_dev *c2dev, u64 *addr_list,
533 int page_size, int pbl_depth, u32 length,
534 u32 off, u64 *va, enum c2_acf acf,
536 extern int c2_stag_dealloc(struct c2_dev *c2dev, u32 stag_index);
539 extern void c2_ae_event(struct c2_dev *c2dev, u32 mq_index);
542 extern int c2_init_mqsp_pool(struct c2_dev *c2dev, gfp_t gfp_mask,
543 struct sp_chunk **root);
544 extern void c2_free_mqsp_pool(struct c2_dev *c2dev, struct sp_chunk *root);
545 extern __be16 *c2_alloc_mqsp(struct c2_dev *c2dev, struct sp_chunk *head,
546 dma_addr_t *dma_addr, gfp_t gfp_mask);
547 extern void c2_free_mqsp(__be16* mqsp);