2  * Copyright (c) 2005 Ammasso, Inc. All rights reserved.
 
   3  * Copyright (c) 2005 Open Grid Computing, Inc. All rights reserved.
 
   5  * This software is available to you under a choice of one of two
 
   6  * licenses.  You may choose to be licensed under the terms of the GNU
 
   7  * General Public License (GPL) Version 2, available from the file
 
   8  * COPYING in the main directory of this source tree, or the
 
   9  * OpenIB.org BSD license below:
 
  11  *     Redistribution and use in source and binary forms, with or
 
  12  *     without modification, are permitted provided that the following
 
  15  *      - Redistributions of source code must retain the above
 
  16  *        copyright notice, this list of conditions and the following
 
  19  *      - Redistributions in binary form must reproduce the above
 
  20  *        copyright notice, this list of conditions and the following
 
  21  *        disclaimer in the documentation and/or other materials
 
  22  *        provided with the distribution.
 
  24  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 
  25  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 
  26  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 
  27  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 
  28  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 
  29  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 
  30  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 
  36 #include <linux/module.h>
 
  37 #include <linux/moduleparam.h>
 
  38 #include <linux/pci.h>
 
  39 #include <linux/netdevice.h>
 
  40 #include <linux/etherdevice.h>
 
  41 #include <linux/delay.h>
 
  42 #include <linux/ethtool.h>
 
  43 #include <linux/mii.h>
 
  44 #include <linux/if_vlan.h>
 
  45 #include <linux/crc32.h>
 
  48 #include <linux/tcp.h>
 
  49 #include <linux/init.h>
 
  50 #include <linux/dma-mapping.h>
 
  52 #include <linux/inet.h>
 
  53 #include <linux/vmalloc.h>
 
  55 #include <linux/route.h>
 
  59 #include <asm/byteorder.h>
 
  60 #include <rdma/ib_smi.h>
 
  64 /* Device capabilities: fixed limits compiled into this file */

  /* Smallest page size; c2_rnic_query() reports page_size_cap as ~(C2_MIN_PAGESIZE-1). */
  65 #define C2_MIN_PAGESIZE  1024

  67 #define C2_MAX_MRS       32768

  68 #define C2_MAX_QPS       16000

  /* Work-queue-element size in bytes; divisor for C2_MAX_QP_WR below. */
  69 #define C2_MAX_WQE_SZ    256

  /* 128 KiB of queue space divided by the WQE size: (128*1024)/256 = 512. */
  70 #define C2_MAX_QP_WR     ((128*1024)/C2_MAX_WQE_SZ)

  /* Reported to callers as props->max_sge_rd by c2_rnic_query(). */
  72 #define C2_MAX_SGE_RD    1

  /* Also used as the number of slots in c2dev->qptr_array (see c2_rnic_init()). */
  73 #define C2_MAX_CQS       32768

  74 #define C2_MAX_CQES      4096

  75 #define C2_MAX_PDS       16384
 
  78  * Send the adapter INIT message to the amso1100
 
  /*
   * Build a zeroed CCWR_INIT work request carrying the host DMA addresses of
   * the hint counter and of the Q0/Q1/Q2 shared pointers and message pools,
   * then post it with vq_send_wr().
   *
   * NOTE(review): the declaration of 'err' and the return statement are not
   * visible in this excerpt; presumably the vq_send_wr() result is returned.
   */
  80 static int c2_adapter_init(struct c2_dev *c2dev)

  82         struct c2wr_init_req wr;

  85         memset(&wr, 0, sizeof(wr));

  86         c2_wr_set_id(&wr, CCWR_INIT);

             /* All addresses are written as 64-bit big-endian values. */
  88         wr.hint_count = cpu_to_be64(c2dev->hint_count_dma);

  89         wr.q0_host_shared = cpu_to_be64(c2dev->req_vq.shared_dma);

  90         wr.q1_host_shared = cpu_to_be64(c2dev->rep_vq.shared_dma);

  91         wr.q1_host_msg_pool = cpu_to_be64(c2dev->rep_vq.host_dma);

  92         wr.q2_host_shared = cpu_to_be64(c2dev->aeq.shared_dma);

  93         wr.q2_host_msg_pool = cpu_to_be64(c2dev->aeq.host_dma);

  95         /* Post the init message */

  96         err = vq_send_wr(c2dev, (union c2wr *) & wr);
 
 102  * Send the adapter TERM message to the amso1100
 
 /*
  * Build a zeroed work request tagged CCWR_TERM and post it with
  * vq_send_wr(). The send result is ignored (the function returns void).
  *
  * NOTE(review): the request is declared as struct c2wr_init_req even though
  * the message id is CCWR_TERM; only the id is set in the visible lines.
  * Confirm that this struct is the intended carrier for TERM.
  */
 104 static void c2_adapter_term(struct c2_dev *c2dev)

 106         struct c2wr_init_req wr;

 108         memset(&wr, 0, sizeof(wr));

 109         c2_wr_set_id(&wr, CCWR_TERM);

 112         /* Post the TERM message */

 113         vq_send_wr(c2dev, (union c2wr *) & wr);
 
 /*
  * Query the adapter for its limits and fill in *props.
  *
  * Visible flow: allocate a verbs request, build a CCWR_RNIC_QUERY work
  * request whose hdr.context is the vq_req pointer, take a reference with
  * vq_req_get(), post it, wait for the reply, convert the reply status with
  * c2_errno(), copy the big-endian reply fields into *props, then release the
  * reply buffer and the verbs request.
  *
  * NOTE(review): the error checks, goto labels and the return statement are
  * not visible in this excerpt; the vq_req_put() below is presumably on the
  * send-failure path only.
  */
 122 static int c2_rnic_query(struct c2_dev *c2dev, struct ib_device_attr *props)

 124         struct c2_vq_req *vq_req;

 125         struct c2wr_rnic_query_req wr;

 126         struct c2wr_rnic_query_rep *reply;

 129         vq_req = vq_req_alloc(c2dev);

 133         c2_wr_set_id(&wr, CCWR_RNIC_QUERY);

 134         wr.hdr.context = (unsigned long) vq_req;

 135         wr.rnic_handle = c2dev->adapter_handle;

 137         vq_req_get(c2dev, vq_req);

 139         err = vq_send_wr(c2dev, (union c2wr *) &wr);

 141                 vq_req_put(c2dev, vq_req);

 145         err = vq_wait_for_reply(c2dev, vq_req);

 150             (struct c2wr_rnic_query_rep *) (unsigned long) (vq_req->reply_msg);

 154         err = c2_errno(reply);

             /*
              * Pack the firmware version as major (bits 63..32), minor
              * (bits 31..16) and patch (bits 15..0). The masks must be
              * bitwise '&': the previous logical '&&' reduced minor and
              * patch to 0 or 1.
              */
 159                 ((u64)be32_to_cpu(reply->fw_ver_major) << 32) |

 160                 ((be32_to_cpu(reply->fw_ver_minor) & 0xFFFF) << 16) |

 161                 (be32_to_cpu(reply->fw_ver_patch) & 0xFFFF);

             /* Only the first 6 bytes of sys_image_guid are written, from the netdev address. */
 162         memcpy(&props->sys_image_guid, c2dev->netdev->dev_addr, 6);

 163         props->max_mr_size         = 0xFFFFFFFF;

 164         props->page_size_cap       = ~(C2_MIN_PAGESIZE-1);

 165         props->vendor_id           = be32_to_cpu(reply->vendor_id);

 166         props->vendor_part_id      = be32_to_cpu(reply->part_number);

 167         props->hw_ver              = be32_to_cpu(reply->hw_version);

 168         props->max_qp              = be32_to_cpu(reply->max_qps);

 169         props->max_qp_wr           = be32_to_cpu(reply->max_qp_depth);

 170         props->device_cap_flags    = c2dev->device_cap_flags;

 171         props->max_sge             = C2_MAX_SGES;

 172         props->max_sge_rd          = C2_MAX_SGE_RD;

 173         props->max_cq              = be32_to_cpu(reply->max_cqs);

 174         props->max_cqe             = be32_to_cpu(reply->max_cq_depth);

 175         props->max_mr              = be32_to_cpu(reply->max_mrs);

 176         props->max_pd              = be32_to_cpu(reply->max_pds);

 177         props->max_qp_rd_atom      = be32_to_cpu(reply->max_qp_ird);

 178         props->max_ee_rd_atom      = 0;

 179         props->max_res_rd_atom     = be32_to_cpu(reply->max_global_ird);

 180         props->max_qp_init_rd_atom = be32_to_cpu(reply->max_qp_ord);

 181         props->max_ee_init_rd_atom = 0;

 182         props->atomic_cap          = IB_ATOMIC_NONE;

 185         props->max_mw              = be32_to_cpu(reply->max_mws);

 186         props->max_raw_ipv6_qp     = 0;

 187         props->max_raw_ethy_qp     = 0;

 188         props->max_mcast_grp       = 0;

 189         props->max_mcast_qp_attach = 0;

 190         props->max_total_mcast_qp_attach = 0;

 193         props->max_map_per_fmr     = 0;

 195         props->max_srq_wr          = 0;

 196         props->max_srq_sge         = 0;

 197         props->max_pkeys           = 0;

 198         props->local_ca_ack_delay  = 0;

 201         vq_repbuf_free(c2dev, reply);

 204         vq_req_free(c2dev, vq_req);
 
 209  * Add an IP address to the RNIC interface
 
 /*
  * Send a CCWR_RNIC_SETCONFIG request with option C2_CFG_ADD_ADDR whose data
  * payload is a struct c2_netaddr holding inaddr/inmask, then wait for the
  * reply and convert its status with c2_errno().
  *
  * inaddr and inmask are stored in the payload exactly as passed; no byte
  * swapping is applied in the visible lines.
  *
  * NOTE(review): the allocation checks, error labels, the release of 'wr'
  * and the return statement are not visible in this excerpt.
  */
 211 int c2_add_addr(struct c2_dev *c2dev, u32 inaddr, u32 inmask)

 213         struct c2_vq_req *vq_req;

 214         struct c2wr_rnic_setconfig_req *wr;

 215         struct c2wr_rnic_setconfig_rep *reply;

 216         struct c2_netaddr netaddr;

 219         vq_req = vq_req_alloc(c2dev);

 223         len = sizeof(struct c2_netaddr);

             /* The request buffer is sized to one full request-queue message. */
 224         wr = kmalloc(c2dev->req_vq.msg_size, GFP_KERNEL);

 230         c2_wr_set_id(wr, CCWR_RNIC_SETCONFIG);

 231         wr->hdr.context = (unsigned long) vq_req;

 232         wr->rnic_handle = c2dev->adapter_handle;

 233         wr->option = cpu_to_be32(C2_CFG_ADD_ADDR);

 235         netaddr.ip_addr = inaddr;

 236         netaddr.netmask = inmask;

 239         memcpy(wr->data, &netaddr, len);

 241         vq_req_get(c2dev, vq_req);

 243         err = vq_send_wr(c2dev, (union c2wr *) wr);

             /* NOTE(review): presumably executed only when the send failed; the guarding 'if' is not visible. */
 245                 vq_req_put(c2dev, vq_req);

 249         err = vq_wait_for_reply(c2dev, vq_req);

 254             (struct c2wr_rnic_setconfig_rep *) (unsigned long) (vq_req->reply_msg);

 260         err = c2_errno(reply);

 261         vq_repbuf_free(c2dev, reply);

 266         vq_req_free(c2dev, vq_req);
 
 271  * Delete an IP address from the RNIC interface
 
 /*
  * Send a CCWR_RNIC_SETCONFIG request with option C2_CFG_DEL_ADDR whose data
  * payload is a struct c2_netaddr holding inaddr/inmask, then wait for the
  * reply and convert its status with c2_errno().
  *
  * The visible lines are the same as c2_add_addr() except for the option
  * value.
  *
  * NOTE(review): the allocation checks, error labels, the release of 'wr'
  * and the return statement are not visible in this excerpt.
  */
 273 int c2_del_addr(struct c2_dev *c2dev, u32 inaddr, u32 inmask)

 275         struct c2_vq_req *vq_req;

 276         struct c2wr_rnic_setconfig_req *wr;

 277         struct c2wr_rnic_setconfig_rep *reply;

 278         struct c2_netaddr netaddr;

 281         vq_req = vq_req_alloc(c2dev);

 285         len = sizeof(struct c2_netaddr);

             /* The request buffer is sized to one full request-queue message. */
 286         wr = kmalloc(c2dev->req_vq.msg_size, GFP_KERNEL);

 292         c2_wr_set_id(wr, CCWR_RNIC_SETCONFIG);

 293         wr->hdr.context = (unsigned long) vq_req;

 294         wr->rnic_handle = c2dev->adapter_handle;

 295         wr->option = cpu_to_be32(C2_CFG_DEL_ADDR);

 297         netaddr.ip_addr = inaddr;

 298         netaddr.netmask = inmask;

 301         memcpy(wr->data, &netaddr, len);

 303         vq_req_get(c2dev, vq_req);

 305         err = vq_send_wr(c2dev, (union c2wr *) wr);

             /* NOTE(review): presumably executed only when the send failed; the guarding 'if' is not visible. */
 307                 vq_req_put(c2dev, vq_req);

 311         err = vq_wait_for_reply(c2dev, vq_req);

 316             (struct c2wr_rnic_setconfig_rep *) (unsigned long) (vq_req->reply_msg);

 322         err = c2_errno(reply);

 323         vq_repbuf_free(c2dev, reply);

 328         vq_req_free(c2dev, vq_req);
 
 333  * Open a single RNIC instance to use with all
 
 334  * low level openib calls
 
 /*
  * Post a CCWR_RNIC_OPEN request (flags RNIC_PRIV_MODE, port 0, user_context
  * set to the c2dev pointer), wait for the reply, and on a zero c2_errno()
  * status store reply->rnic_handle in c2dev->adapter_handle.
  *
  * NOTE(review): the declaration of 'wr', the bodies of the error branches
  * and the return statement are not visible in this excerpt.
  */
 336 static int c2_rnic_open(struct c2_dev *c2dev)

 338         struct c2_vq_req *vq_req;

 340         struct c2wr_rnic_open_rep *reply;

 343         vq_req = vq_req_alloc(c2dev);

 344         if (vq_req == NULL) {

 348         memset(&wr, 0, sizeof(wr));

 349         c2_wr_set_id(&wr, CCWR_RNIC_OPEN);

             /* The request pointer is stored in hdr.context as an integer. */
 350         wr.rnic_open.req.hdr.context = (unsigned long) (vq_req);

 351         wr.rnic_open.req.flags = cpu_to_be16(RNIC_PRIV_MODE);

 352         wr.rnic_open.req.port_num = cpu_to_be16(0);

 353         wr.rnic_open.req.user_context = (unsigned long) c2dev;

 355         vq_req_get(c2dev, vq_req);

 357         err = vq_send_wr(c2dev, &wr);

             /* NOTE(review): presumably executed only when the send failed; the guarding 'if' is not visible. */
 359                 vq_req_put(c2dev, vq_req);

 363         err = vq_wait_for_reply(c2dev, vq_req);

 368         reply = (struct c2wr_rnic_open_rep *) (unsigned long) (vq_req->reply_msg);

 374         if ((err = c2_errno(reply)) != 0) {

             /* The handle is stored as received; no byte-order conversion is applied here. */
 378         c2dev->adapter_handle = reply->rnic_handle;

 381         vq_repbuf_free(c2dev, reply);

 383         vq_req_free(c2dev, vq_req);
 
 388  * Close the RNIC instance
 
 /*
  * Post a CCWR_RNIC_CLOSE request for c2dev->adapter_handle, wait for the
  * reply, and on a zero c2_errno() status reset c2dev->adapter_handle to 0.
  *
  * NOTE(review): the declaration of 'wr', the bodies of the error branches
  * and the return statement are not visible in this excerpt.
  */
 390 static int c2_rnic_close(struct c2_dev *c2dev)

 392         struct c2_vq_req *vq_req;

 394         struct c2wr_rnic_close_rep *reply;

 397         vq_req = vq_req_alloc(c2dev);

 398         if (vq_req == NULL) {

 402         memset(&wr, 0, sizeof(wr));

 403         c2_wr_set_id(&wr, CCWR_RNIC_CLOSE);

             /* The request pointer is stored in hdr.context as an integer. */
 404         wr.rnic_close.req.hdr.context = (unsigned long) vq_req;

 405         wr.rnic_close.req.rnic_handle = c2dev->adapter_handle;

 407         vq_req_get(c2dev, vq_req);

 409         err = vq_send_wr(c2dev, &wr);

             /* NOTE(review): presumably executed only when the send failed; the guarding 'if' is not visible. */
 411                 vq_req_put(c2dev, vq_req);

 415         err = vq_wait_for_reply(c2dev, vq_req);

 420         reply = (struct c2wr_rnic_close_rep *) (unsigned long) (vq_req->reply_msg);

 426         if ((err = c2_errno(reply)) != 0) {

 430         c2dev->adapter_handle = 0;

 433         vq_repbuf_free(c2dev, reply);

 435         vq_req_free(c2dev, vq_req);
 
 440  * Called by c2_probe to initialize the RNIC. This principally
 
 441  * involves initializing the various limits and resource pools that
 
 442  * comprise the RNIC instance.
 
 /*
  * Bring up the RNIC. Visible steps, in order:
  *   - set c2dev->device_cap_flags;
  *   - allocate and zero qptr_array, with slots 0..2 pointing at req_vq,
  *     rep_vq and aeq;
  *   - initialise the wait queue and spinlocks;
  *   - create the kernel MQ shared-pointer pool and allocate the hint counter
  *     plus one shared pointer per queue from it;
  *   - set up the verbs request queue (Q0) from adapter registers;
  *   - allocate and DMA-map host message pools for the verbs reply queue (Q1)
  *     and the asynchronous event queue (Q2);
  *   - vq_init(), enable interrupts, c2_adapter_init(), c2_rnic_open(),
  *     c2_rnic_query(), then the PD and QP tables.
  * The trailing calls (c2_rnic_close, dma_unmap_single x2, c2_free_mqsp_pool,
  * vfree) undo these steps in reverse order.
  *
  * NOTE(review): local declarations, error checks, goto labels and the return
  * statements are not visible in this excerpt; the trailing calls are
  * presumably the error-unwind path.
  */
 444 int c2_rnic_init(struct c2_dev *c2dev)

 450         void __iomem *mmio_regs;

 452         /* Device capabilities */

 453         c2dev->device_cap_flags =

 454             (IB_DEVICE_RESIZE_MAX_WR |

 455              IB_DEVICE_CURR_QP_STATE_MOD |

 456              IB_DEVICE_SYS_IMAGE_GUID |

 457              IB_DEVICE_ZERO_STAG |

 458              IB_DEVICE_SEND_W_INV | IB_DEVICE_MEM_WINDOW);

 460         /* Allocate the qptr_array */

 461         c2dev->qptr_array = vmalloc(C2_MAX_CQS * sizeof(void *));

 462         if (!c2dev->qptr_array) {

 466         /* Initialize the qptr_array */

 467         memset(c2dev->qptr_array, 0, C2_MAX_CQS * sizeof(void *));

 468         c2dev->qptr_array[0] = (void *) &c2dev->req_vq;

 469         c2dev->qptr_array[1] = (void *) &c2dev->rep_vq;

 470         c2dev->qptr_array[2] = (void *) &c2dev->aeq;

 472         /* Initialize data structures */

 473         init_waitqueue_head(&c2dev->req_vq_wo);

 474         spin_lock_init(&c2dev->vqlock);

 475         spin_lock_init(&c2dev->lock);

 477         /* Allocate MQ shared pointer pool for kernel clients. User

 478          * mode client pools are hung off the user context

 480         err = c2_init_mqsp_pool(c2dev, GFP_KERNEL, &c2dev->kern_mqsp_pool);

 485         /* Allocate shared pointers for Q0, Q1, and Q2 from

 486          * the shared pointer pool.

 489         c2dev->hint_count = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,

 490                                              &c2dev->hint_count_dma,

 492         c2dev->req_vq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,

 493                                              &c2dev->req_vq.shared_dma,

 495         c2dev->rep_vq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,

 496                                              &c2dev->rep_vq.shared_dma,

 498         c2dev->aeq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,

 499                                           &c2dev->aeq.shared_dma, GFP_KERNEL);

 500         if (!c2dev->hint_count || !c2dev->req_vq.shared ||

 501             !c2dev->rep_vq.shared || !c2dev->aeq.shared) {

 506         mmio_regs = c2dev->kva;

 507         /* Initialize the Verbs Request Queue */

 508         c2_mq_req_init(&c2dev->req_vq, 0,

 509                        be32_to_cpu(readl(mmio_regs + C2_REGS_Q0_QSIZE)),

 510                        be32_to_cpu(readl(mmio_regs + C2_REGS_Q0_MSGSIZE)),

 512                        be32_to_cpu(readl(mmio_regs + C2_REGS_Q0_POOLSTART)),

 514                        be32_to_cpu(readl(mmio_regs + C2_REGS_Q0_SHARED)),

 515                        C2_MQ_ADAPTER_TARGET);

 517         /* Initialize the Verbs Reply Queue */

 518         qsize = be32_to_cpu(readl(mmio_regs + C2_REGS_Q1_QSIZE));

 519         msgsize = be32_to_cpu(readl(mmio_regs + C2_REGS_Q1_MSGSIZE));

 520         q1_pages = kmalloc(qsize * msgsize, GFP_KERNEL);

 525         c2dev->rep_vq.host_dma = dma_map_single(c2dev->ibdev.dma_device,

 526                                                 (void *)q1_pages, qsize * msgsize,

             /* Remember the mapping so it can be passed to dma_unmap_single() later. */
 528         pci_unmap_addr_set(&c2dev->rep_vq, mapping, c2dev->rep_vq.host_dma);

 529         pr_debug("%s rep_vq va %p dma %llx\n", __FUNCTION__, q1_pages,

 530                  (u64)c2dev->rep_vq.host_dma);

 531         c2_mq_rep_init(&c2dev->rep_vq,

 537                    be32_to_cpu(readl(mmio_regs + C2_REGS_Q1_SHARED)),

 540         /* Initialize the Asynchronous Event Queue */

 541         qsize = be32_to_cpu(readl(mmio_regs + C2_REGS_Q2_QSIZE));

 542         msgsize = be32_to_cpu(readl(mmio_regs + C2_REGS_Q2_MSGSIZE));

 543         q2_pages = kmalloc(qsize * msgsize, GFP_KERNEL);

 548         c2dev->aeq.host_dma = dma_map_single(c2dev->ibdev.dma_device,

 549                                                 (void *)q2_pages, qsize * msgsize,

 551         pci_unmap_addr_set(&c2dev->aeq, mapping, c2dev->aeq.host_dma);

             /* Log the AEQ's own buffer and mapping (previously printed the reply queue's values). */
 552         pr_debug("%s aeq va %p dma %llx\n", __FUNCTION__, q2_pages,

 553                  (u64)c2dev->aeq.host_dma);

 554         c2_mq_rep_init(&c2dev->aeq,

 560                        be32_to_cpu(readl(mmio_regs + C2_REGS_Q2_SHARED)),

 563         /* Initialize the verbs request allocator */

 564         err = vq_init(c2dev);

 568         /* Enable interrupts on the adapter */

 569         writel(0, c2dev->regs + C2_IDIS);

 571         /* create the WR init message */

 572         err = c2_adapter_init(c2dev);

 577         /* open an adapter instance */

 578         err = c2_rnic_open(c2dev);

 582         /* Initialize the cached adapter limits */

 583         if (c2_rnic_query(c2dev, &c2dev->props))

 586         /* Initialize the PD pool */

 587         err = c2_init_pd_table(c2dev);

 591         /* Initialize the QP pool */

 592         c2_init_qp_table(c2dev);

 596         c2_rnic_close(c2dev);

 600         dma_unmap_single(c2dev->ibdev.dma_device,

 601                          pci_unmap_addr(&c2dev->aeq, mapping),

 602                          c2dev->aeq.q_size * c2dev->aeq.msg_size,

 606         dma_unmap_single(c2dev->ibdev.dma_device,

 607                          pci_unmap_addr(&c2dev->rep_vq, mapping),

 608                          c2dev->rep_vq.q_size * c2dev->rep_vq.msg_size,

 612         c2_free_mqsp_pool(c2dev, c2dev->kern_mqsp_pool);

 614         vfree(c2dev->qptr_array);
 
 620  * Called by c2_remove to cleanup the RNIC resources.
 
 /*
  * Tear down the RNIC: close the adapter instance, send TERM, disable
  * interrupts, release the QP and PD tables, unmap and free the AEQ and
  * reply-queue message pools, free the shared-pointer pool and finally the
  * qptr_array.
  *
  * The return value of c2_rnic_close() is ignored here.
  */
 622 void c2_rnic_term(struct c2_dev *c2dev)

 625         /* Close the open adapter instance */

 626         c2_rnic_close(c2dev);

 628         /* Send the TERM message to the adapter */

 629         c2_adapter_term(c2dev);

 631         /* Disable interrupts on the adapter */

 632         writel(1, c2dev->regs + C2_IDIS);

 634         /* Free the QP pool */

 635         c2_cleanup_qp_table(c2dev);

 637         /* Free the PD pool */

 638         c2_cleanup_pd_table(c2dev);

             /* NOTE(review): the call that follows this comment is not visible in this excerpt. */
 640         /* Free the verbs request allocator */

 643         /* Unmap and free the asynchronous event queue */

 644         dma_unmap_single(c2dev->ibdev.dma_device,

 645                          pci_unmap_addr(&c2dev->aeq, mapping),

 646                          c2dev->aeq.q_size * c2dev->aeq.msg_size,

 648         kfree(c2dev->aeq.msg_pool.host);

 650         /* Unmap and free the verbs reply queue */

 651         dma_unmap_single(c2dev->ibdev.dma_device,

 652                          pci_unmap_addr(&c2dev->rep_vq, mapping),

 653                          c2dev->rep_vq.q_size * c2dev->rep_vq.msg_size,

 655         kfree(c2dev->rep_vq.msg_pool.host);

 657         /* Free the MQ shared pointer pool */

 658         c2_free_mqsp_pool(c2dev, c2dev->kern_mqsp_pool);

 660         /* Free the qptr_array */

 661         vfree(c2dev->qptr_array);