RDMA/nes: Enhanced PFT management scheme
[linux-2.6] / drivers / infiniband / hw / ehca / ehca_main.c
1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  module start stop, hca detection
5  *
6  *  Authors: Heiko J Schick <schickhj@de.ibm.com>
7  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
8  *           Joachim Fenkes <fenkes@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42
43 #ifdef CONFIG_PPC_64K_PAGES
44 #include <linux/slab.h>
45 #endif
46
47 #include "ehca_classes.h"
48 #include "ehca_iverbs.h"
49 #include "ehca_mrmw.h"
50 #include "ehca_tools.h"
51 #include "hcp_if.h"
52
53 #define HCAD_VERSION "0026"
54
55 MODULE_LICENSE("Dual BSD/GPL");
56 MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
57 MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
58 MODULE_VERSION(HCAD_VERSION);
59
60 static int ehca_open_aqp1     = 0;
61 static int ehca_hw_level      = 0;
62 static int ehca_poll_all_eqs  = 1;
63
64 int ehca_debug_level   = 0;
65 int ehca_nr_ports      = 2;
66 int ehca_use_hp_mr     = 0;
67 int ehca_port_act_time = 30;
68 int ehca_static_rate   = -1;
69 int ehca_scaling_code  = 0;
70 int ehca_lock_hcalls   = -1;
71 int ehca_max_cq        = -1;
72 int ehca_max_qp        = -1;
73
74 module_param_named(open_aqp1,     ehca_open_aqp1,     bool, S_IRUGO);
75 module_param_named(debug_level,   ehca_debug_level,   int,  S_IRUGO);
76 module_param_named(hw_level,      ehca_hw_level,      int,  S_IRUGO);
77 module_param_named(nr_ports,      ehca_nr_ports,      int,  S_IRUGO);
78 module_param_named(use_hp_mr,     ehca_use_hp_mr,     bool, S_IRUGO);
79 module_param_named(port_act_time, ehca_port_act_time, int,  S_IRUGO);
80 module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  bool, S_IRUGO);
81 module_param_named(static_rate,   ehca_static_rate,   int,  S_IRUGO);
82 module_param_named(scaling_code,  ehca_scaling_code,  bool, S_IRUGO);
83 module_param_named(lock_hcalls,   ehca_lock_hcalls,   bool, S_IRUGO);
84 module_param_named(number_of_cqs, ehca_max_cq,        int,  S_IRUGO);
85 module_param_named(number_of_qps, ehca_max_qp,        int,  S_IRUGO);
86
87 MODULE_PARM_DESC(open_aqp1,
88                  "Open AQP1 on startup (default: no)");
89 MODULE_PARM_DESC(debug_level,
90                  "Amount of debug output (0: none (default), 1: traces, "
91                  "2: some dumps, 3: lots)");
92 MODULE_PARM_DESC(hw_level,
93                  "Hardware level (0: autosensing (default), "
94                  "0x10..0x14: eHCA, 0x20..0x23: eHCA2)");
95 MODULE_PARM_DESC(nr_ports,
96                  "number of connected ports (-1: autodetect, 1: port one only, "
97                  "2: two ports (default)");
98 MODULE_PARM_DESC(use_hp_mr,
99                  "Use high performance MRs (default: no)");
100 MODULE_PARM_DESC(port_act_time,
101                  "Time to wait for port activation (default: 30 sec)");
102 MODULE_PARM_DESC(poll_all_eqs,
103                  "Poll all event queues periodically (default: yes)");
104 MODULE_PARM_DESC(static_rate,
105                  "Set permanent static rate (default: no static rate)");
106 MODULE_PARM_DESC(scaling_code,
107                  "Enable scaling code (default: no)");
108 MODULE_PARM_DESC(lock_hcalls,
109                  "Serialize all hCalls made by the driver "
110                  "(default: autodetect)");
111 MODULE_PARM_DESC(number_of_cqs,
112                 "Max number of CQs which can be allocated "
113                 "(default: autodetect)");
114 MODULE_PARM_DESC(number_of_qps,
115                 "Max number of QPs which can be allocated "
116                 "(default: autodetect)");
117
118 DEFINE_RWLOCK(ehca_qp_idr_lock);
119 DEFINE_RWLOCK(ehca_cq_idr_lock);
120 DEFINE_IDR(ehca_qp_idr);
121 DEFINE_IDR(ehca_cq_idr);
122
123 static LIST_HEAD(shca_list); /* list of all registered ehcas */
124 static DEFINE_SPINLOCK(shca_list_lock);
125
126 static struct timer_list poll_eqs_timer;
127
128 #ifdef CONFIG_PPC_64K_PAGES
129 static struct kmem_cache *ctblk_cache;
130
131 void *ehca_alloc_fw_ctrlblock(gfp_t flags)
132 {
133         void *ret = kmem_cache_zalloc(ctblk_cache, flags);
134         if (!ret)
135                 ehca_gen_err("Out of memory for ctblk");
136         return ret;
137 }
138
139 void ehca_free_fw_ctrlblock(void *ptr)
140 {
141         if (ptr)
142                 kmem_cache_free(ctblk_cache, ptr);
143
144 }
145 #endif
146
147 int ehca2ib_return_code(u64 ehca_rc)
148 {
149         switch (ehca_rc) {
150         case H_SUCCESS:
151                 return 0;
152         case H_RESOURCE:             /* Resource in use */
153         case H_BUSY:
154                 return -EBUSY;
155         case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
156         case H_CONSTRAINED:          /* resource constraint */
157         case H_NO_MEM:
158                 return -ENOMEM;
159         default:
160                 return -EINVAL;
161         }
162 }
163
/*
 * Create all slab caches used by the driver: PD, CQ, QP, AV, MR/MW, small
 * queue and (on 64K-page kernels) the firmware control block cache.
 *
 * On any failure the caches created so far are torn down again in reverse
 * order.
 *
 * Returns 0 on success, the error code of the failing init helper, or
 * -ENOMEM when the control block cache cannot be created.
 */
static int ehca_create_slab_caches(void)
{
        int ret;

        ret = ehca_init_pd_cache();
        if (ret) {
                ehca_gen_err("Cannot create PD SLAB cache.");
                return ret;
        }

        ret = ehca_init_cq_cache();
        if (ret) {
                ehca_gen_err("Cannot create CQ SLAB cache.");
                goto create_slab_caches2;
        }

        ret = ehca_init_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create QP SLAB cache.");
                goto create_slab_caches3;
        }

        ret = ehca_init_av_cache();
        if (ret) {
                ehca_gen_err("Cannot create AV SLAB cache.");
                goto create_slab_caches4;
        }

        ret = ehca_init_mrmw_cache();
        if (ret) {
                ehca_gen_err("Cannot create MR&MW SLAB cache.");
                goto create_slab_caches5;
        }

        ret = ehca_init_small_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create small queue SLAB cache.");
                goto create_slab_caches6;
        }

#ifdef CONFIG_PPC_64K_PAGES
        ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
                                        EHCA_PAGESIZE, H_CB_ALIGNMENT,
                                        SLAB_HWCACHE_ALIGN,
                                        NULL);
        if (!ctblk_cache) {
                ehca_gen_err("Cannot create ctblk SLAB cache.");
                ehca_cleanup_small_qp_cache();
                /*
                 * ret still holds 0 from the previous successful step;
                 * without an explicit error code the caller would be told
                 * that everything is fine although all caches are gone.
                 */
                ret = -ENOMEM;
                goto create_slab_caches6;
        }
#endif
        return 0;

create_slab_caches6:
        ehca_cleanup_mrmw_cache();

create_slab_caches5:
        ehca_cleanup_av_cache();

create_slab_caches4:
        ehca_cleanup_qp_cache();

create_slab_caches3:
        ehca_cleanup_cq_cache();

create_slab_caches2:
        ehca_cleanup_pd_cache();

        return ret;
}
234
/*
 * Tear down every slab cache set up by ehca_create_slab_caches().
 * The control block cache only exists on 64K-page kernels and is destroyed
 * only if it was actually created.
 */
static void ehca_destroy_slab_caches(void)
{
        ehca_cleanup_small_qp_cache();
        ehca_cleanup_mrmw_cache();
        ehca_cleanup_av_cache();
        ehca_cleanup_qp_cache();
        ehca_cleanup_cq_cache();
        ehca_cleanup_pd_cache();

#ifdef CONFIG_PPC_64K_PAGES
        if (ctblk_cache) {
                kmem_cache_destroy(ctblk_cache);
        }
#endif
}
248
249 #define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
250 #define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
251
252 static struct cap_descr {
253         u64 mask;
254         char *descr;
255 } hca_cap_descr[] = {
256         { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
257         { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
258         { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
259         { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
260         { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
261         { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
262         { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
263         { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
264         { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
265         { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
266         { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
267         { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
268         { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
269         { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
270         { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
271         { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
272         { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
273         { HCA_CAP_H_ALLOC_RES_SYNC, "HCA_CAP_H_ALLOC_RES_SYNC" },
274 };
275
276 static int ehca_sense_attributes(struct ehca_shca *shca)
277 {
278         int i, ret = 0;
279         u64 h_ret;
280         struct hipz_query_hca *rblock;
281         struct hipz_query_port *port;
282         const char *loc_code;
283
284         static const u32 pgsize_map[] = {
285                 HCA_CAP_MR_PGSIZE_4K,  0x1000,
286                 HCA_CAP_MR_PGSIZE_64K, 0x10000,
287                 HCA_CAP_MR_PGSIZE_1M,  0x100000,
288                 HCA_CAP_MR_PGSIZE_16M, 0x1000000,
289         };
290
291         ehca_gen_dbg("Probing adapter %s...",
292                      shca->ofdev->node->full_name);
293         loc_code = of_get_property(shca->ofdev->node, "ibm,loc-code", NULL);
294         if (loc_code)
295                 ehca_gen_dbg(" ... location lode=%s", loc_code);
296
297         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
298         if (!rblock) {
299                 ehca_gen_err("Cannot allocate rblock memory.");
300                 return -ENOMEM;
301         }
302
303         h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
304         if (h_ret != H_SUCCESS) {
305                 ehca_gen_err("Cannot query device properties. h_ret=%li",
306                              h_ret);
307                 ret = -EPERM;
308                 goto sense_attributes1;
309         }
310
311         if (ehca_nr_ports == 1)
312                 shca->num_ports = 1;
313         else
314                 shca->num_ports = (u8)rblock->num_ports;
315
316         ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
317
318         if (ehca_hw_level == 0) {
319                 u32 hcaaver;
320                 u32 revid;
321
322                 hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
323                 revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
324
325                 ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
326
327                 if (hcaaver == 1) {
328                         if (revid <= 3)
329                                 shca->hw_level = 0x10 | (revid + 1);
330                         else
331                                 shca->hw_level = 0x14;
332                 } else if (hcaaver == 2) {
333                         if (revid == 0)
334                                 shca->hw_level = 0x21;
335                         else if (revid == 0x10)
336                                 shca->hw_level = 0x22;
337                         else if (revid == 0x20 || revid == 0x21)
338                                 shca->hw_level = 0x23;
339                 }
340
341                 if (!shca->hw_level) {
342                         ehca_gen_warn("unknown hardware version"
343                                       " - assuming default level");
344                         shca->hw_level = 0x22;
345                 }
346         } else
347                 shca->hw_level = ehca_hw_level;
348         ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
349
350         shca->hca_cap = rblock->hca_cap_indicators;
351         ehca_gen_dbg(" ... HCA capabilities:");
352         for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
353                 if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
354                         ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
355
356         /* Autodetect hCall locking -- the "H_ALLOC_RESOURCE synced" flag is
357          * a firmware property, so it's valid across all adapters
358          */
359         if (ehca_lock_hcalls == -1)
360                 ehca_lock_hcalls = !(shca->hca_cap & HCA_CAP_H_ALLOC_RES_SYNC);
361
362         /* translate supported MR page sizes; always support 4K */
363         shca->hca_cap_mr_pgsize = EHCA_PAGESIZE;
364         for (i = 0; i < ARRAY_SIZE(pgsize_map); i += 2)
365                 if (rblock->memory_page_size_supported & pgsize_map[i])
366                         shca->hca_cap_mr_pgsize |= pgsize_map[i + 1];
367
368         /* Set maximum number of CQs and QPs to calculate EQ size */
369         if (ehca_max_qp == -1)
370                 ehca_max_qp = min_t(int, rblock->max_qp, EHCA_MAX_NUM_QUEUES);
371         else if (ehca_max_qp < 1 || ehca_max_qp > rblock->max_qp) {
372                 ehca_gen_err("Requested number of QPs is out of range (1 - %i) "
373                         "specified by HW", rblock->max_qp);
374                 ret = -EINVAL;
375                 goto sense_attributes1;
376         }
377
378         if (ehca_max_cq == -1)
379                 ehca_max_cq = min_t(int, rblock->max_cq, EHCA_MAX_NUM_QUEUES);
380         else if (ehca_max_cq < 1 || ehca_max_cq > rblock->max_cq) {
381                 ehca_gen_err("Requested number of CQs is out of range (1 - %i) "
382                         "specified by HW", rblock->max_cq);
383                 ret = -EINVAL;
384                 goto sense_attributes1;
385         }
386
387         /* query max MTU from first port -- it's the same for all ports */
388         port = (struct hipz_query_port *)rblock;
389         h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
390         if (h_ret != H_SUCCESS) {
391                 ehca_gen_err("Cannot query port properties. h_ret=%li",
392                              h_ret);
393                 ret = -EPERM;
394                 goto sense_attributes1;
395         }
396
397         shca->max_mtu = port->max_mtu;
398
399 sense_attributes1:
400         ehca_free_fw_ctrlblock(rblock);
401         return ret;
402 }
403
404 static int init_node_guid(struct ehca_shca *shca)
405 {
406         int ret = 0;
407         struct hipz_query_hca *rblock;
408
409         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
410         if (!rblock) {
411                 ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
412                 return -ENOMEM;
413         }
414
415         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
416                 ehca_err(&shca->ib_device, "Can't query device properties");
417                 ret = -EINVAL;
418                 goto init_node_guid1;
419         }
420
421         memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
422
423 init_node_guid1:
424         ehca_free_fw_ctrlblock(rblock);
425         return ret;
426 }
427
428 static int ehca_init_device(struct ehca_shca *shca)
429 {
430         int ret;
431
432         ret = init_node_guid(shca);
433         if (ret)
434                 return ret;
435
436         strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
437         shca->ib_device.owner               = THIS_MODULE;
438
439         shca->ib_device.uverbs_abi_ver      = 8;
440         shca->ib_device.uverbs_cmd_mask     =
441                 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
442                 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
443                 (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
444                 (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
445                 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
446                 (1ull << IB_USER_VERBS_CMD_REG_MR)              |
447                 (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
448                 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
449                 (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
450                 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
451                 (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
452                 (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
453                 (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
454                 (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
455                 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
456                 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
457
458         shca->ib_device.node_type           = RDMA_NODE_IB_CA;
459         shca->ib_device.phys_port_cnt       = shca->num_ports;
460         shca->ib_device.num_comp_vectors    = 1;
461         shca->ib_device.dma_device          = &shca->ofdev->dev;
462         shca->ib_device.query_device        = ehca_query_device;
463         shca->ib_device.query_port          = ehca_query_port;
464         shca->ib_device.query_gid           = ehca_query_gid;
465         shca->ib_device.query_pkey          = ehca_query_pkey;
466         /* shca->in_device.modify_device    = ehca_modify_device    */
467         shca->ib_device.modify_port         = ehca_modify_port;
468         shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
469         shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
470         shca->ib_device.alloc_pd            = ehca_alloc_pd;
471         shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
472         shca->ib_device.create_ah           = ehca_create_ah;
473         /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
474         shca->ib_device.query_ah            = ehca_query_ah;
475         shca->ib_device.destroy_ah          = ehca_destroy_ah;
476         shca->ib_device.create_qp           = ehca_create_qp;
477         shca->ib_device.modify_qp           = ehca_modify_qp;
478         shca->ib_device.query_qp            = ehca_query_qp;
479         shca->ib_device.destroy_qp          = ehca_destroy_qp;
480         shca->ib_device.post_send           = ehca_post_send;
481         shca->ib_device.post_recv           = ehca_post_recv;
482         shca->ib_device.create_cq           = ehca_create_cq;
483         shca->ib_device.destroy_cq          = ehca_destroy_cq;
484         shca->ib_device.resize_cq           = ehca_resize_cq;
485         shca->ib_device.poll_cq             = ehca_poll_cq;
486         /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
487         shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
488         /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
489         shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
490         shca->ib_device.reg_phys_mr         = ehca_reg_phys_mr;
491         shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
492         shca->ib_device.query_mr            = ehca_query_mr;
493         shca->ib_device.dereg_mr            = ehca_dereg_mr;
494         shca->ib_device.rereg_phys_mr       = ehca_rereg_phys_mr;
495         shca->ib_device.alloc_mw            = ehca_alloc_mw;
496         shca->ib_device.bind_mw             = ehca_bind_mw;
497         shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
498         shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
499         shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
500         shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
501         shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
502         shca->ib_device.attach_mcast        = ehca_attach_mcast;
503         shca->ib_device.detach_mcast        = ehca_detach_mcast;
504         shca->ib_device.process_mad         = ehca_process_mad;
505         shca->ib_device.mmap                = ehca_mmap;
506
507         if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
508                 shca->ib_device.uverbs_cmd_mask |=
509                         (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
510                         (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
511                         (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
512                         (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
513
514                 shca->ib_device.create_srq          = ehca_create_srq;
515                 shca->ib_device.modify_srq          = ehca_modify_srq;
516                 shca->ib_device.query_srq           = ehca_query_srq;
517                 shca->ib_device.destroy_srq         = ehca_destroy_srq;
518                 shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
519         }
520
521         return ret;
522 }
523
524 static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
525 {
526         struct ehca_sport *sport = &shca->sport[port - 1];
527         struct ib_cq *ibcq;
528         struct ib_qp *ibqp;
529         struct ib_qp_init_attr qp_init_attr;
530         int ret;
531
532         if (sport->ibcq_aqp1) {
533                 ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
534                 return -EPERM;
535         }
536
537         ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1), 10, 0);
538         if (IS_ERR(ibcq)) {
539                 ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
540                 return PTR_ERR(ibcq);
541         }
542         sport->ibcq_aqp1 = ibcq;
543
544         if (sport->ibqp_sqp[IB_QPT_GSI]) {
545                 ehca_err(&shca->ib_device, "AQP1 QP is already created.");
546                 ret = -EPERM;
547                 goto create_aqp1;
548         }
549
550         memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
551         qp_init_attr.send_cq          = ibcq;
552         qp_init_attr.recv_cq          = ibcq;
553         qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
554         qp_init_attr.cap.max_send_wr  = 100;
555         qp_init_attr.cap.max_recv_wr  = 100;
556         qp_init_attr.cap.max_send_sge = 2;
557         qp_init_attr.cap.max_recv_sge = 1;
558         qp_init_attr.qp_type          = IB_QPT_GSI;
559         qp_init_attr.port_num         = port;
560         qp_init_attr.qp_context       = NULL;
561         qp_init_attr.event_handler    = NULL;
562         qp_init_attr.srq              = NULL;
563
564         ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
565         if (IS_ERR(ibqp)) {
566                 ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
567                 ret = PTR_ERR(ibqp);
568                 goto create_aqp1;
569         }
570         sport->ibqp_sqp[IB_QPT_GSI] = ibqp;
571
572         return 0;
573
574 create_aqp1:
575         ib_destroy_cq(sport->ibcq_aqp1);
576         return ret;
577 }
578
579 static int ehca_destroy_aqp1(struct ehca_sport *sport)
580 {
581         int ret;
582
583         ret = ib_destroy_qp(sport->ibqp_sqp[IB_QPT_GSI]);
584         if (ret) {
585                 ehca_gen_err("Cannot destroy AQP1 QP. ret=%i", ret);
586                 return ret;
587         }
588
589         ret = ib_destroy_cq(sport->ibcq_aqp1);
590         if (ret)
591                 ehca_gen_err("Cannot destroy AQP1 CQ. ret=%i", ret);
592
593         return ret;
594 }
595
596 static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
597 {
598         return snprintf(buf, PAGE_SIZE, "%d\n", ehca_debug_level);
599 }
600
601 static ssize_t ehca_store_debug_level(struct device_driver *ddp,
602                                       const char *buf, size_t count)
603 {
604         int value = (*buf) - '0';
605         if (value >= 0 && value <= 9)
606                 ehca_debug_level = value;
607         return 1;
608 }
609
610 static DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
611                    ehca_show_debug_level, ehca_store_debug_level);
612
613 static struct attribute *ehca_drv_attrs[] = {
614         &driver_attr_debug_level.attr,
615         NULL
616 };
617
618 static struct attribute_group ehca_drv_attr_grp = {
619         .attrs = ehca_drv_attrs
620 };
621
622 static struct attribute_group *ehca_drv_attr_groups[] = {
623         &ehca_drv_attr_grp,
624         NULL,
625 };
626
627 #define EHCA_RESOURCE_ATTR(name)                                           \
628 static ssize_t  ehca_show_##name(struct device *dev,                       \
629                                  struct device_attribute *attr,            \
630                                  char *buf)                                \
631 {                                                                          \
632         struct ehca_shca *shca;                                            \
633         struct hipz_query_hca *rblock;                                     \
634         int data;                                                          \
635                                                                            \
636         shca = dev->driver_data;                                           \
637                                                                            \
638         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
639         if (!rblock) {                                                     \
640                 dev_err(dev, "Can't allocate rblock memory.\n");           \
641                 return 0;                                                  \
642         }                                                                  \
643                                                                            \
644         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
645                 dev_err(dev, "Can't query device properties\n");           \
646                 ehca_free_fw_ctrlblock(rblock);                            \
647                 return 0;                                                  \
648         }                                                                  \
649                                                                            \
650         data = rblock->name;                                               \
651         ehca_free_fw_ctrlblock(rblock);                                    \
652                                                                            \
653         if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
654                 return snprintf(buf, 256, "1\n");                          \
655         else                                                               \
656                 return snprintf(buf, 256, "%d\n", data);                   \
657                                                                            \
658 }                                                                          \
659 static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);
660
661 EHCA_RESOURCE_ATTR(num_ports);
662 EHCA_RESOURCE_ATTR(hw_ver);
663 EHCA_RESOURCE_ATTR(max_eq);
664 EHCA_RESOURCE_ATTR(cur_eq);
665 EHCA_RESOURCE_ATTR(max_cq);
666 EHCA_RESOURCE_ATTR(cur_cq);
667 EHCA_RESOURCE_ATTR(max_qp);
668 EHCA_RESOURCE_ATTR(cur_qp);
669 EHCA_RESOURCE_ATTR(max_mr);
670 EHCA_RESOURCE_ATTR(cur_mr);
671 EHCA_RESOURCE_ATTR(max_mw);
672 EHCA_RESOURCE_ATTR(cur_mw);
673 EHCA_RESOURCE_ATTR(max_pd);
674 EHCA_RESOURCE_ATTR(max_ah);
675
676 static ssize_t ehca_show_adapter_handle(struct device *dev,
677                                         struct device_attribute *attr,
678                                         char *buf)
679 {
680         struct ehca_shca *shca = dev->driver_data;
681
682         return sprintf(buf, "%lx\n", shca->ipz_hca_handle.handle);
683
684 }
685 static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
686
687 static struct attribute *ehca_dev_attrs[] = {
688         &dev_attr_adapter_handle.attr,
689         &dev_attr_num_ports.attr,
690         &dev_attr_hw_ver.attr,
691         &dev_attr_max_eq.attr,
692         &dev_attr_cur_eq.attr,
693         &dev_attr_max_cq.attr,
694         &dev_attr_cur_cq.attr,
695         &dev_attr_max_qp.attr,
696         &dev_attr_cur_qp.attr,
697         &dev_attr_max_mr.attr,
698         &dev_attr_cur_mr.attr,
699         &dev_attr_max_mw.attr,
700         &dev_attr_cur_mw.attr,
701         &dev_attr_max_pd.attr,
702         &dev_attr_max_ah.attr,
703         NULL
704 };
705
706 static struct attribute_group ehca_dev_attr_grp = {
707         .attrs = ehca_dev_attrs
708 };
709
710 static int __devinit ehca_probe(struct of_device *dev,
711                                 const struct of_device_id *id)
712 {
713         struct ehca_shca *shca;
714         const u64 *handle;
715         struct ib_pd *ibpd;
716         int ret, i, eq_size;
717
718         handle = of_get_property(dev->node, "ibm,hca-handle", NULL);
719         if (!handle) {
720                 ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
721                              dev->node->full_name);
722                 return -ENODEV;
723         }
724
725         if (!(*handle)) {
726                 ehca_gen_err("Wrong eHCA handle for adapter: %s.",
727                              dev->node->full_name);
728                 return -ENODEV;
729         }
730
731         shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
732         if (!shca) {
733                 ehca_gen_err("Cannot allocate shca memory.");
734                 return -ENOMEM;
735         }
736         mutex_init(&shca->modify_mutex);
737         atomic_set(&shca->num_cqs, 0);
738         atomic_set(&shca->num_qps, 0);
739         for (i = 0; i < ARRAY_SIZE(shca->sport); i++)
740                 spin_lock_init(&shca->sport[i].mod_sqp_lock);
741
742         shca->ofdev = dev;
743         shca->ipz_hca_handle.handle = *handle;
744         dev->dev.driver_data = shca;
745
746         ret = ehca_sense_attributes(shca);
747         if (ret < 0) {
748                 ehca_gen_err("Cannot sense eHCA attributes.");
749                 goto probe1;
750         }
751
752         ret = ehca_init_device(shca);
753         if (ret) {
754                 ehca_gen_err("Cannot init ehca  device struct");
755                 goto probe1;
756         }
757
758         eq_size = 2 * ehca_max_cq + 4 * ehca_max_qp;
759         /* create event queues */
760         ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, eq_size);
761         if (ret) {
762                 ehca_err(&shca->ib_device, "Cannot create EQ.");
763                 goto probe1;
764         }
765
766         ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
767         if (ret) {
768                 ehca_err(&shca->ib_device, "Cannot create NEQ.");
769                 goto probe3;
770         }
771
772         /* create internal protection domain */
773         ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
774         if (IS_ERR(ibpd)) {
775                 ehca_err(&shca->ib_device, "Cannot create internal PD.");
776                 ret = PTR_ERR(ibpd);
777                 goto probe4;
778         }
779
780         shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
781         shca->pd->ib_pd.device = &shca->ib_device;
782
783         /* create internal max MR */
784         ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
785
786         if (ret) {
787                 ehca_err(&shca->ib_device, "Cannot create internal MR ret=%i",
788                          ret);
789                 goto probe5;
790         }
791
792         ret = ib_register_device(&shca->ib_device);
793         if (ret) {
794                 ehca_err(&shca->ib_device,
795                          "ib_register_device() failed ret=%i", ret);
796                 goto probe6;
797         }
798
799         /* create AQP1 for port 1 */
800         if (ehca_open_aqp1 == 1) {
801                 shca->sport[0].port_state = IB_PORT_DOWN;
802                 ret = ehca_create_aqp1(shca, 1);
803                 if (ret) {
804                         ehca_err(&shca->ib_device,
805                                  "Cannot create AQP1 for port 1.");
806                         goto probe7;
807                 }
808         }
809
810         /* create AQP1 for port 2 */
811         if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
812                 shca->sport[1].port_state = IB_PORT_DOWN;
813                 ret = ehca_create_aqp1(shca, 2);
814                 if (ret) {
815                         ehca_err(&shca->ib_device,
816                                  "Cannot create AQP1 for port 2.");
817                         goto probe8;
818                 }
819         }
820
821         ret = sysfs_create_group(&dev->dev.kobj, &ehca_dev_attr_grp);
822         if (ret) /* only complain; we can live without attributes */
823                 ehca_err(&shca->ib_device,
824                          "Cannot create device attributes  ret=%d", ret);
825
826         spin_lock(&shca_list_lock);
827         list_add(&shca->shca_list, &shca_list);
828         spin_unlock(&shca_list_lock);
829
830         return 0;
831
832 probe8:
833         ret = ehca_destroy_aqp1(&shca->sport[0]);
834         if (ret)
835                 ehca_err(&shca->ib_device,
836                          "Cannot destroy AQP1 for port 1. ret=%i", ret);
837
838 probe7:
839         ib_unregister_device(&shca->ib_device);
840
841 probe6:
842         ret = ehca_dereg_internal_maxmr(shca);
843         if (ret)
844                 ehca_err(&shca->ib_device,
845                          "Cannot destroy internal MR. ret=%x", ret);
846
847 probe5:
848         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
849         if (ret)
850                 ehca_err(&shca->ib_device,
851                          "Cannot destroy internal PD. ret=%x", ret);
852
853 probe4:
854         ret = ehca_destroy_eq(shca, &shca->neq);
855         if (ret)
856                 ehca_err(&shca->ib_device,
857                          "Cannot destroy NEQ. ret=%x", ret);
858
859 probe3:
860         ret = ehca_destroy_eq(shca, &shca->eq);
861         if (ret)
862                 ehca_err(&shca->ib_device,
863                          "Cannot destroy EQ. ret=%x", ret);
864
865 probe1:
866         ib_dealloc_device(&shca->ib_device);
867
868         return -EINVAL;
869 }
870
871 static int __devexit ehca_remove(struct of_device *dev)
872 {
873         struct ehca_shca *shca = dev->dev.driver_data;
874         int ret;
875
876         sysfs_remove_group(&dev->dev.kobj, &ehca_dev_attr_grp);
877
878         if (ehca_open_aqp1 == 1) {
879                 int i;
880                 for (i = 0; i < shca->num_ports; i++) {
881                         ret = ehca_destroy_aqp1(&shca->sport[i]);
882                         if (ret)
883                                 ehca_err(&shca->ib_device,
884                                          "Cannot destroy AQP1 for port %x "
885                                          "ret=%i", ret, i);
886                 }
887         }
888
889         ib_unregister_device(&shca->ib_device);
890
891         ret = ehca_dereg_internal_maxmr(shca);
892         if (ret)
893                 ehca_err(&shca->ib_device,
894                          "Cannot destroy internal MR. ret=%i", ret);
895
896         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
897         if (ret)
898                 ehca_err(&shca->ib_device,
899                          "Cannot destroy internal PD. ret=%i", ret);
900
901         ret = ehca_destroy_eq(shca, &shca->eq);
902         if (ret)
903                 ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%i", ret);
904
905         ret = ehca_destroy_eq(shca, &shca->neq);
906         if (ret)
907                 ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%i", ret);
908
909         ib_dealloc_device(&shca->ib_device);
910
911         spin_lock(&shca_list_lock);
912         list_del(&shca->shca_list);
913         spin_unlock(&shca_list_lock);
914
915         return ret;
916 }
917
918 static struct of_device_id ehca_device_table[] =
919 {
920         {
921                 .name       = "lhca",
922                 .compatible = "IBM,lhca",
923         },
924         {},
925 };
926 MODULE_DEVICE_TABLE(of, ehca_device_table);
927
928 static struct of_platform_driver ehca_driver = {
929         .name        = "ehca",
930         .match_table = ehca_device_table,
931         .probe       = ehca_probe,
932         .remove      = ehca_remove,
933         .driver      = {
934                 .groups = ehca_drv_attr_groups,
935         },
936 };
937
938 void ehca_poll_eqs(unsigned long data)
939 {
940         struct ehca_shca *shca;
941
942         spin_lock(&shca_list_lock);
943         list_for_each_entry(shca, &shca_list, shca_list) {
944                 if (shca->eq.is_initialized) {
945                         /* call deadman proc only if eq ptr does not change */
946                         struct ehca_eq *eq = &shca->eq;
947                         int max = 3;
948                         volatile u64 q_ofs, q_ofs2;
949                         u64 flags;
950                         spin_lock_irqsave(&eq->spinlock, flags);
951                         q_ofs = eq->ipz_queue.current_q_offset;
952                         spin_unlock_irqrestore(&eq->spinlock, flags);
953                         do {
954                                 spin_lock_irqsave(&eq->spinlock, flags);
955                                 q_ofs2 = eq->ipz_queue.current_q_offset;
956                                 spin_unlock_irqrestore(&eq->spinlock, flags);
957                                 max--;
958                         } while (q_ofs == q_ofs2 && max > 0);
959                         if (q_ofs == q_ofs2)
960                                 ehca_process_eq(shca, 0);
961                 }
962         }
963         mod_timer(&poll_eqs_timer, round_jiffies(jiffies + HZ));
964         spin_unlock(&shca_list_lock);
965 }
966
967 static int __init ehca_module_init(void)
968 {
969         int ret;
970
971         printk(KERN_INFO "eHCA Infiniband Device Driver "
972                "(Version " HCAD_VERSION ")\n");
973
974         ret = ehca_create_comp_pool();
975         if (ret) {
976                 ehca_gen_err("Cannot create comp pool.");
977                 return ret;
978         }
979
980         ret = ehca_create_slab_caches();
981         if (ret) {
982                 ehca_gen_err("Cannot create SLAB caches");
983                 ret = -ENOMEM;
984                 goto module_init1;
985         }
986
987         ret = ibmebus_register_driver(&ehca_driver);
988         if (ret) {
989                 ehca_gen_err("Cannot register eHCA device driver");
990                 ret = -EINVAL;
991                 goto module_init2;
992         }
993
994         if (ehca_poll_all_eqs != 1) {
995                 ehca_gen_err("WARNING!!!");
996                 ehca_gen_err("It is possible to lose interrupts.");
997         } else {
998                 init_timer(&poll_eqs_timer);
999                 poll_eqs_timer.function = ehca_poll_eqs;
1000                 poll_eqs_timer.expires = jiffies + HZ;
1001                 add_timer(&poll_eqs_timer);
1002         }
1003
1004         return 0;
1005
1006 module_init2:
1007         ehca_destroy_slab_caches();
1008
1009 module_init1:
1010         ehca_destroy_comp_pool();
1011         return ret;
1012 };
1013
1014 static void __exit ehca_module_exit(void)
1015 {
1016         if (ehca_poll_all_eqs == 1)
1017                 del_timer_sync(&poll_eqs_timer);
1018
1019         ibmebus_unregister_driver(&ehca_driver);
1020
1021         ehca_destroy_slab_caches();
1022
1023         ehca_destroy_comp_pool();
1024
1025         idr_destroy(&ehca_cq_idr);
1026         idr_destroy(&ehca_qp_idr);
1027 };
1028
1029 module_init(ehca_module_init);
1030 module_exit(ehca_module_exit);