2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
 
   6  *  Authors: Dietmar Decker <ddecker@de.ibm.com>
 
   7  *           Christoph Raisch <raisch@de.ibm.com>
 
   8  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
 
  10  *  Copyright (c) 2005 IBM Corporation
 
  12  *  All rights reserved.
 
  14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
 
  19  * Redistribution and use in source and binary forms, with or without
 
  20  * modification, are permitted provided that the following conditions are met:
 
  22  * Redistributions of source code must retain the above copyright notice, this
 
  23  * list of conditions and the following disclaimer.
 
  25  * Redistributions in binary form must reproduce the above copyright notice,
 
  26  * this list of conditions and the following disclaimer in the documentation
 
  27  * and/or other materials
 
  28  * provided with the distribution.
 
  30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 
  31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 
  32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 
  33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 
  34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 
  35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 
  36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
 
  37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
 
  38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 
  39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 
  40  * POSSIBILITY OF SUCH DAMAGE.
 
  43 #include <asm/current.h>
 
  45 #include <rdma/ib_umem.h>
 
  47 #include "ehca_iverbs.h"
 
  48 #include "ehca_mrmw.h"
 
  52 #define NUM_CHUNKS(length, chunk_size) \
 
  53         (((length) + (chunk_size - 1)) / (chunk_size))
 
  54 /* max number of rpages (per hcall register_rpages) */
 
  55 #define MAX_RPAGES 512
 
  57 static struct kmem_cache *mr_cache;
 
  58 static struct kmem_cache *mw_cache;
 
  61         EHCA_MR_PGSIZE4K  = 0x1000L,
 
  62         EHCA_MR_PGSIZE64K = 0x10000L,
 
  63         EHCA_MR_PGSIZE1M  = 0x100000L,
 
  64         EHCA_MR_PGSIZE16M = 0x1000000L
 
  67 static u32 ehca_encode_hwpage_size(u32 pgsize)
 
  72          * map mr page size into hw code:
 
  73          * 0, 1, 2, 3 for 4K, 64K, 1M, 16M
 
  75         while (!(pgsize & 1)) {
 
  82 static u64 ehca_get_max_hwpage_size(struct ehca_shca *shca)
 
  84         if (shca->hca_cap_mr_pgsize & HCA_CAP_MR_PGSIZE_16M)
 
  85                 return EHCA_MR_PGSIZE16M;
 
  86         return EHCA_MR_PGSIZE4K;
 
  89 static struct ehca_mr *ehca_mr_new(void)
 
  93         me = kmem_cache_zalloc(mr_cache, GFP_KERNEL);
 
  95                 spin_lock_init(&me->mrlock);
 
  97                 ehca_gen_err("alloc failed");
 
 102 static void ehca_mr_delete(struct ehca_mr *me)
 
 104         kmem_cache_free(mr_cache, me);
 
 107 static struct ehca_mw *ehca_mw_new(void)
 
 111         me = kmem_cache_zalloc(mw_cache, GFP_KERNEL);
 
 113                 spin_lock_init(&me->mwlock);
 
 115                 ehca_gen_err("alloc failed");
 
 120 static void ehca_mw_delete(struct ehca_mw *me)
 
 122         kmem_cache_free(mw_cache, me);
 
 125 /*----------------------------------------------------------------------*/
 
 127 struct ib_mr *ehca_get_dma_mr(struct ib_pd *pd, int mr_access_flags)
 
 131         struct ehca_mr *e_maxmr;
 
 132         struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 133         struct ehca_shca *shca =
 
 134                 container_of(pd->device, struct ehca_shca, ib_device);
 
 137                 e_maxmr = ehca_mr_new();
 
 139                         ehca_err(&shca->ib_device, "out of memory");
 
 140                         ib_mr = ERR_PTR(-ENOMEM);
 
 141                         goto get_dma_mr_exit0;
 
 144                 ret = ehca_reg_maxmr(shca, e_maxmr, (u64 *)KERNELBASE,
 
 145                                      mr_access_flags, e_pd,
 
 146                                      &e_maxmr->ib.ib_mr.lkey,
 
 147                                      &e_maxmr->ib.ib_mr.rkey);
 
 149                         ehca_mr_delete(e_maxmr);
 
 150                         ib_mr = ERR_PTR(ret);
 
 151                         goto get_dma_mr_exit0;
 
 153                 ib_mr = &e_maxmr->ib.ib_mr;
 
 155                 ehca_err(&shca->ib_device, "no internal max-MR exist!");
 
 156                 ib_mr = ERR_PTR(-EINVAL);
 
 157                 goto get_dma_mr_exit0;
 
 162                 ehca_err(&shca->ib_device, "rc=%lx pd=%p mr_access_flags=%x ",
 
 163                          PTR_ERR(ib_mr), pd, mr_access_flags);
 
 165 } /* end ehca_get_dma_mr() */
 
 167 /*----------------------------------------------------------------------*/
 
 169 struct ib_mr *ehca_reg_phys_mr(struct ib_pd *pd,
 
 170                                struct ib_phys_buf *phys_buf_array,
 
 177         struct ehca_mr *e_mr;
 
 178         struct ehca_shca *shca =
 
 179                 container_of(pd->device, struct ehca_shca, ib_device);
 
 180         struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 184         if ((num_phys_buf <= 0) || !phys_buf_array) {
 
 185                 ehca_err(pd->device, "bad input values: num_phys_buf=%x "
 
 186                          "phys_buf_array=%p", num_phys_buf, phys_buf_array);
 
 187                 ib_mr = ERR_PTR(-EINVAL);
 
 188                 goto reg_phys_mr_exit0;
 
 190         if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
 
 191              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
 
 192             ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
 
 193              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
 
 195                  * Remote Write Access requires Local Write Access
 
 196                  * Remote Atomic Access requires Local Write Access
 
 198                 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
 
 200                 ib_mr = ERR_PTR(-EINVAL);
 
 201                 goto reg_phys_mr_exit0;
 
 204         /* check physical buffer list and calculate size */
 
 205         ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array, num_phys_buf,
 
 208                 ib_mr = ERR_PTR(ret);
 
 209                 goto reg_phys_mr_exit0;
 
 212             (((u64)iova_start + size) < (u64)iova_start)) {
 
 213                 ehca_err(pd->device, "bad input values: size=%lx iova_start=%p",
 
 215                 ib_mr = ERR_PTR(-EINVAL);
 
 216                 goto reg_phys_mr_exit0;
 
 219         e_mr = ehca_mr_new();
 
 221                 ehca_err(pd->device, "out of memory");
 
 222                 ib_mr = ERR_PTR(-ENOMEM);
 
 223                 goto reg_phys_mr_exit0;
 
 226         /* register MR on HCA */
 
 227         if (ehca_mr_is_maxmr(size, iova_start)) {
 
 228                 e_mr->flags |= EHCA_MR_FLAG_MAXMR;
 
 229                 ret = ehca_reg_maxmr(shca, e_mr, iova_start, mr_access_flags,
 
 230                                      e_pd, &e_mr->ib.ib_mr.lkey,
 
 231                                      &e_mr->ib.ib_mr.rkey);
 
 233                         ib_mr = ERR_PTR(ret);
 
 234                         goto reg_phys_mr_exit1;
 
 237                 struct ehca_mr_pginfo pginfo;
 
 242                 num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size,
 
 244                 /* for kernel space we try the largest possible pgsize */
 
 245                 hw_pgsize = ehca_get_max_hwpage_size(shca);
 
 246                 num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size,
 
 248                 memset(&pginfo, 0, sizeof(pginfo));
 
 249                 pginfo.type = EHCA_MR_PGI_PHYS;
 
 250                 pginfo.num_kpages = num_kpages;
 
 251                 pginfo.hwpage_size = hw_pgsize;
 
 252                 pginfo.num_hwpages = num_hwpages;
 
 253                 pginfo.u.phy.num_phys_buf = num_phys_buf;
 
 254                 pginfo.u.phy.phys_buf_array = phys_buf_array;
 
 256                         ((u64)iova_start & ~(hw_pgsize - 1)) / hw_pgsize;
 
 258                 ret = ehca_reg_mr(shca, e_mr, iova_start, size, mr_access_flags,
 
 259                                   e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
 
 260                                   &e_mr->ib.ib_mr.rkey);
 
 262                         ib_mr = ERR_PTR(ret);
 
 263                         goto reg_phys_mr_exit1;
 
 267         /* successful registration of all pages */
 
 268         return &e_mr->ib.ib_mr;
 
 271         ehca_mr_delete(e_mr);
 
 274                 ehca_err(pd->device, "rc=%lx pd=%p phys_buf_array=%p "
 
 275                          "num_phys_buf=%x mr_access_flags=%x iova_start=%p",
 
 276                          PTR_ERR(ib_mr), pd, phys_buf_array,
 
 277                          num_phys_buf, mr_access_flags, iova_start);
 
 279 } /* end ehca_reg_phys_mr() */
 
 281 /*----------------------------------------------------------------------*/
 
 283 struct ib_mr *ehca_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
 
 284                                u64 virt, int mr_access_flags,
 
 285                                struct ib_udata *udata)
 
 288         struct ehca_mr *e_mr;
 
 289         struct ehca_shca *shca =
 
 290                 container_of(pd->device, struct ehca_shca, ib_device);
 
 291         struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 292         struct ehca_mr_pginfo pginfo;
 
 299                 ehca_gen_err("bad pd=%p", pd);
 
 300                 return ERR_PTR(-EFAULT);
 
 303         if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
 
 304              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
 
 305             ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
 
 306              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
 
 308                  * Remote Write Access requires Local Write Access
 
 309                  * Remote Atomic Access requires Local Write Access
 
 311                 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
 
 313                 ib_mr = ERR_PTR(-EINVAL);
 
 314                 goto reg_user_mr_exit0;
 
 317         if (length == 0 || virt + length < virt) {
 
 318                 ehca_err(pd->device, "bad input values: length=%lx "
 
 319                          "virt_base=%lx", length, virt);
 
 320                 ib_mr = ERR_PTR(-EINVAL);
 
 321                 goto reg_user_mr_exit0;
 
 324         e_mr = ehca_mr_new();
 
 326                 ehca_err(pd->device, "out of memory");
 
 327                 ib_mr = ERR_PTR(-ENOMEM);
 
 328                 goto reg_user_mr_exit0;
 
 331         e_mr->umem = ib_umem_get(pd->uobject->context, start, length,
 
 333         if (IS_ERR(e_mr->umem)) {
 
 334                 ib_mr = (void *)e_mr->umem;
 
 335                 goto reg_user_mr_exit1;
 
 338         if (e_mr->umem->page_size != PAGE_SIZE) {
 
 339                 ehca_err(pd->device, "page size not supported, "
 
 340                          "e_mr->umem->page_size=%x", e_mr->umem->page_size);
 
 341                 ib_mr = ERR_PTR(-EINVAL);
 
 342                 goto reg_user_mr_exit2;
 
 345         /* determine number of MR pages */
 
 346         num_kpages = NUM_CHUNKS((virt % PAGE_SIZE) + length, PAGE_SIZE);
 
 347         /* select proper hw_pgsize */
 
 348         if (ehca_mr_largepage &&
 
 349             (shca->hca_cap_mr_pgsize & HCA_CAP_MR_PGSIZE_16M)) {
 
 350                 if (length <= EHCA_MR_PGSIZE4K
 
 351                     && PAGE_SIZE == EHCA_MR_PGSIZE4K)
 
 352                         hwpage_size = EHCA_MR_PGSIZE4K;
 
 353                 else if (length <= EHCA_MR_PGSIZE64K)
 
 354                         hwpage_size = EHCA_MR_PGSIZE64K;
 
 355                 else if (length <= EHCA_MR_PGSIZE1M)
 
 356                         hwpage_size = EHCA_MR_PGSIZE1M;
 
 358                         hwpage_size = EHCA_MR_PGSIZE16M;
 
 360                 hwpage_size = EHCA_MR_PGSIZE4K;
 
 361         ehca_dbg(pd->device, "hwpage_size=%lx", hwpage_size);
 
 363 reg_user_mr_fallback:
 
 364         num_hwpages = NUM_CHUNKS((virt % hwpage_size) + length, hwpage_size);
 
 365         /* register MR on HCA */
 
 366         memset(&pginfo, 0, sizeof(pginfo));
 
 367         pginfo.type = EHCA_MR_PGI_USER;
 
 368         pginfo.hwpage_size = hwpage_size;
 
 369         pginfo.num_kpages = num_kpages;
 
 370         pginfo.num_hwpages = num_hwpages;
 
 371         pginfo.u.usr.region = e_mr->umem;
 
 372         pginfo.next_hwpage = e_mr->umem->offset / hwpage_size;
 
 373         pginfo.u.usr.next_chunk = list_prepare_entry(pginfo.u.usr.next_chunk,
 
 374                                                      (&e_mr->umem->chunk_list),
 
 377         ret = ehca_reg_mr(shca, e_mr, (u64 *)virt, length, mr_access_flags,
 
 378                           e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
 
 379                           &e_mr->ib.ib_mr.rkey);
 
 380         if (ret == -EINVAL && pginfo.hwpage_size > PAGE_SIZE) {
 
 381                 ehca_warn(pd->device, "failed to register mr "
 
 382                           "with hwpage_size=%lx", hwpage_size);
 
 383                 ehca_info(pd->device, "try to register mr with "
 
 384                           "kpage_size=%lx", PAGE_SIZE);
 
 386                  * this means kpages are not contiguous for a hw page
 
 387                  * try kernel page size as fallback solution
 
 389                 hwpage_size = PAGE_SIZE;
 
 390                 goto reg_user_mr_fallback;
 
 393                 ib_mr = ERR_PTR(ret);
 
 394                 goto reg_user_mr_exit2;
 
 397         /* successful registration of all pages */
 
 398         return &e_mr->ib.ib_mr;
 
 401         ib_umem_release(e_mr->umem);
 
 403         ehca_mr_delete(e_mr);
 
 406                 ehca_err(pd->device, "rc=%lx pd=%p mr_access_flags=%x"
 
 408                          PTR_ERR(ib_mr), pd, mr_access_flags, udata);
 
 410 } /* end ehca_reg_user_mr() */
 
 412 /*----------------------------------------------------------------------*/
 
 414 int ehca_rereg_phys_mr(struct ib_mr *mr,
 
 417                        struct ib_phys_buf *phys_buf_array,
 
 424         struct ehca_shca *shca =
 
 425                 container_of(mr->device, struct ehca_shca, ib_device);
 
 426         struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
 
 427         struct ehca_pd *my_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
 
 431         struct ehca_pd *new_pd;
 
 432         u32 tmp_lkey, tmp_rkey;
 
 433         unsigned long sl_flags;
 
 436         struct ehca_mr_pginfo pginfo;
 
 437         u32 cur_pid = current->tgid;
 
 439         if (my_pd->ib_pd.uobject && my_pd->ib_pd.uobject->context &&
 
 440             (my_pd->ownpid != cur_pid)) {
 
 441                 ehca_err(mr->device, "Invalid caller pid=%x ownpid=%x",
 
 442                          cur_pid, my_pd->ownpid);
 
 444                 goto rereg_phys_mr_exit0;
 
 447         if (!(mr_rereg_mask & IB_MR_REREG_TRANS)) {
 
 448                 /* TODO not supported, because PHYP rereg hCall needs pages */
 
 449                 ehca_err(mr->device, "rereg without IB_MR_REREG_TRANS not "
 
 450                          "supported yet, mr_rereg_mask=%x", mr_rereg_mask);
 
 452                 goto rereg_phys_mr_exit0;
 
 455         if (mr_rereg_mask & IB_MR_REREG_PD) {
 
 457                         ehca_err(mr->device, "rereg with bad pd, pd=%p "
 
 458                                  "mr_rereg_mask=%x", pd, mr_rereg_mask);
 
 460                         goto rereg_phys_mr_exit0;
 
 465              ~(IB_MR_REREG_TRANS | IB_MR_REREG_PD | IB_MR_REREG_ACCESS)) ||
 
 466             (mr_rereg_mask == 0)) {
 
 468                 goto rereg_phys_mr_exit0;
 
 471         /* check other parameters */
 
 472         if (e_mr == shca->maxmr) {
 
 473                 /* should be impossible, however reject to be sure */
 
 474                 ehca_err(mr->device, "rereg internal max-MR impossible, mr=%p "
 
 475                          "shca->maxmr=%p mr->lkey=%x",
 
 476                          mr, shca->maxmr, mr->lkey);
 
 478                 goto rereg_phys_mr_exit0;
 
 480         if (mr_rereg_mask & IB_MR_REREG_TRANS) { /* transl., i.e. addr/size */
 
 481                 if (e_mr->flags & EHCA_MR_FLAG_FMR) {
 
 482                         ehca_err(mr->device, "not supported for FMR, mr=%p "
 
 483                                  "flags=%x", mr, e_mr->flags);
 
 485                         goto rereg_phys_mr_exit0;
 
 487                 if (!phys_buf_array || num_phys_buf <= 0) {
 
 488                         ehca_err(mr->device, "bad input values mr_rereg_mask=%x"
 
 489                                  " phys_buf_array=%p num_phys_buf=%x",
 
 490                                  mr_rereg_mask, phys_buf_array, num_phys_buf);
 
 492                         goto rereg_phys_mr_exit0;
 
 495         if ((mr_rereg_mask & IB_MR_REREG_ACCESS) &&     /* change ACL */
 
 496             (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
 
 497               !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
 
 498              ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
 
 499               !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)))) {
 
 501                  * Remote Write Access requires Local Write Access
 
 502                  * Remote Atomic Access requires Local Write Access
 
 504                 ehca_err(mr->device, "bad input values: mr_rereg_mask=%x "
 
 505                          "mr_access_flags=%x", mr_rereg_mask, mr_access_flags);
 
 507                 goto rereg_phys_mr_exit0;
 
 510         /* set requested values dependent on rereg request */
 
 511         spin_lock_irqsave(&e_mr->mrlock, sl_flags);
 
 512         new_start = e_mr->start;
 
 513         new_size = e_mr->size;
 
 515         new_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
 
 517         if (mr_rereg_mask & IB_MR_REREG_TRANS) {
 
 518                 u64 hw_pgsize = ehca_get_max_hwpage_size(shca);
 
 520                 new_start = iova_start; /* change address */
 
 521                 /* check physical buffer list and calculate size */
 
 522                 ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array,
 
 523                                                     num_phys_buf, iova_start,
 
 526                         goto rereg_phys_mr_exit1;
 
 527                 if ((new_size == 0) ||
 
 528                     (((u64)iova_start + new_size) < (u64)iova_start)) {
 
 529                         ehca_err(mr->device, "bad input values: new_size=%lx "
 
 530                                  "iova_start=%p", new_size, iova_start);
 
 532                         goto rereg_phys_mr_exit1;
 
 534                 num_kpages = NUM_CHUNKS(((u64)new_start % PAGE_SIZE) +
 
 535                                         new_size, PAGE_SIZE);
 
 536                 num_hwpages = NUM_CHUNKS(((u64)new_start % hw_pgsize) +
 
 537                                          new_size, hw_pgsize);
 
 538                 memset(&pginfo, 0, sizeof(pginfo));
 
 539                 pginfo.type = EHCA_MR_PGI_PHYS;
 
 540                 pginfo.num_kpages = num_kpages;
 
 541                 pginfo.hwpage_size = hw_pgsize;
 
 542                 pginfo.num_hwpages = num_hwpages;
 
 543                 pginfo.u.phy.num_phys_buf = num_phys_buf;
 
 544                 pginfo.u.phy.phys_buf_array = phys_buf_array;
 
 546                         ((u64)iova_start & ~(hw_pgsize - 1)) / hw_pgsize;
 
 548         if (mr_rereg_mask & IB_MR_REREG_ACCESS)
 
 549                 new_acl = mr_access_flags;
 
 550         if (mr_rereg_mask & IB_MR_REREG_PD)
 
 551                 new_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 553         ret = ehca_rereg_mr(shca, e_mr, new_start, new_size, new_acl,
 
 554                             new_pd, &pginfo, &tmp_lkey, &tmp_rkey);
 
 556                 goto rereg_phys_mr_exit1;
 
 558         /* successful reregistration */
 
 559         if (mr_rereg_mask & IB_MR_REREG_PD)
 
 565         spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
 
 568                 ehca_err(mr->device, "ret=%x mr=%p mr_rereg_mask=%x pd=%p "
 
 569                          "phys_buf_array=%p num_phys_buf=%x mr_access_flags=%x "
 
 571                          ret, mr, mr_rereg_mask, pd, phys_buf_array,
 
 572                          num_phys_buf, mr_access_flags, iova_start);
 
 574 } /* end ehca_rereg_phys_mr() */
 
 576 /*----------------------------------------------------------------------*/
 
 578 int ehca_query_mr(struct ib_mr *mr, struct ib_mr_attr *mr_attr)
 
 582         struct ehca_shca *shca =
 
 583                 container_of(mr->device, struct ehca_shca, ib_device);
 
 584         struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
 
 585         struct ehca_pd *my_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
 
 586         u32 cur_pid = current->tgid;
 
 587         unsigned long sl_flags;
 
 588         struct ehca_mr_hipzout_parms hipzout;
 
 590         if (my_pd->ib_pd.uobject && my_pd->ib_pd.uobject->context &&
 
 591             (my_pd->ownpid != cur_pid)) {
 
 592                 ehca_err(mr->device, "Invalid caller pid=%x ownpid=%x",
 
 593                          cur_pid, my_pd->ownpid);
 
 598         if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
 
 599                 ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
 
 600                          "e_mr->flags=%x", mr, e_mr, e_mr->flags);
 
 605         memset(mr_attr, 0, sizeof(struct ib_mr_attr));
 
 606         spin_lock_irqsave(&e_mr->mrlock, sl_flags);
 
 608         h_ret = hipz_h_query_mr(shca->ipz_hca_handle, e_mr, &hipzout);
 
 609         if (h_ret != H_SUCCESS) {
 
 610                 ehca_err(mr->device, "hipz_mr_query failed, h_ret=%lx mr=%p "
 
 611                          "hca_hndl=%lx mr_hndl=%lx lkey=%x",
 
 612                          h_ret, mr, shca->ipz_hca_handle.handle,
 
 613                          e_mr->ipz_mr_handle.handle, mr->lkey);
 
 614                 ret = ehca2ib_return_code(h_ret);
 
 617         mr_attr->pd = mr->pd;
 
 618         mr_attr->device_virt_addr = hipzout.vaddr;
 
 619         mr_attr->size = hipzout.len;
 
 620         mr_attr->lkey = hipzout.lkey;
 
 621         mr_attr->rkey = hipzout.rkey;
 
 622         ehca_mrmw_reverse_map_acl(&hipzout.acl, &mr_attr->mr_access_flags);
 
 625         spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
 
 628                 ehca_err(mr->device, "ret=%x mr=%p mr_attr=%p",
 
 631 } /* end ehca_query_mr() */
 
 633 /*----------------------------------------------------------------------*/
 
 635 int ehca_dereg_mr(struct ib_mr *mr)
 
 639         struct ehca_shca *shca =
 
 640                 container_of(mr->device, struct ehca_shca, ib_device);
 
 641         struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
 
 642         struct ehca_pd *my_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
 
 643         u32 cur_pid = current->tgid;
 
 645         if (my_pd->ib_pd.uobject && my_pd->ib_pd.uobject->context &&
 
 646             (my_pd->ownpid != cur_pid)) {
 
 647                 ehca_err(mr->device, "Invalid caller pid=%x ownpid=%x",
 
 648                          cur_pid, my_pd->ownpid);
 
 653         if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
 
 654                 ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
 
 655                          "e_mr->flags=%x", mr, e_mr, e_mr->flags);
 
 658         } else if (e_mr == shca->maxmr) {
 
 659                 /* should be impossible, however reject to be sure */
 
 660                 ehca_err(mr->device, "dereg internal max-MR impossible, mr=%p "
 
 661                          "shca->maxmr=%p mr->lkey=%x",
 
 662                          mr, shca->maxmr, mr->lkey);
 
 667         /* TODO: BUSY: MR still has bound window(s) */
 
 668         h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
 
 669         if (h_ret != H_SUCCESS) {
 
 670                 ehca_err(mr->device, "hipz_free_mr failed, h_ret=%lx shca=%p "
 
 671                          "e_mr=%p hca_hndl=%lx mr_hndl=%lx mr->lkey=%x",
 
 672                          h_ret, shca, e_mr, shca->ipz_hca_handle.handle,
 
 673                          e_mr->ipz_mr_handle.handle, mr->lkey);
 
 674                 ret = ehca2ib_return_code(h_ret);
 
 679                 ib_umem_release(e_mr->umem);
 
 681         /* successful deregistration */
 
 682         ehca_mr_delete(e_mr);
 
 686                 ehca_err(mr->device, "ret=%x mr=%p", ret, mr);
 
 688 } /* end ehca_dereg_mr() */
 
 690 /*----------------------------------------------------------------------*/
 
 692 struct ib_mw *ehca_alloc_mw(struct ib_pd *pd)
 
 696         struct ehca_mw *e_mw;
 
 697         struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 698         struct ehca_shca *shca =
 
 699                 container_of(pd->device, struct ehca_shca, ib_device);
 
 700         struct ehca_mw_hipzout_parms hipzout;
 
 702         e_mw = ehca_mw_new();
 
 704                 ib_mw = ERR_PTR(-ENOMEM);
 
 708         h_ret = hipz_h_alloc_resource_mw(shca->ipz_hca_handle, e_mw,
 
 709                                          e_pd->fw_pd, &hipzout);
 
 710         if (h_ret != H_SUCCESS) {
 
 711                 ehca_err(pd->device, "hipz_mw_allocate failed, h_ret=%lx "
 
 712                          "shca=%p hca_hndl=%lx mw=%p",
 
 713                          h_ret, shca, shca->ipz_hca_handle.handle, e_mw);
 
 714                 ib_mw = ERR_PTR(ehca2ib_return_code(h_ret));
 
 717         /* successful MW allocation */
 
 718         e_mw->ipz_mw_handle = hipzout.handle;
 
 719         e_mw->ib_mw.rkey    = hipzout.rkey;
 
 723         ehca_mw_delete(e_mw);
 
 726                 ehca_err(pd->device, "rc=%lx pd=%p", PTR_ERR(ib_mw), pd);
 
 728 } /* end ehca_alloc_mw() */
 
 730 /*----------------------------------------------------------------------*/
 
 732 int ehca_bind_mw(struct ib_qp *qp,
 
 734                  struct ib_mw_bind *mw_bind)
 
 736         /* TODO: not supported up to now */
 
 737         ehca_gen_err("bind MW currently not supported by HCAD");
 
 740 } /* end ehca_bind_mw() */
 
 742 /*----------------------------------------------------------------------*/
 
 744 int ehca_dealloc_mw(struct ib_mw *mw)
 
 747         struct ehca_shca *shca =
 
 748                 container_of(mw->device, struct ehca_shca, ib_device);
 
 749         struct ehca_mw *e_mw = container_of(mw, struct ehca_mw, ib_mw);
 
 751         h_ret = hipz_h_free_resource_mw(shca->ipz_hca_handle, e_mw);
 
 752         if (h_ret != H_SUCCESS) {
 
 753                 ehca_err(mw->device, "hipz_free_mw failed, h_ret=%lx shca=%p "
 
 754                          "mw=%p rkey=%x hca_hndl=%lx mw_hndl=%lx",
 
 755                          h_ret, shca, mw, mw->rkey, shca->ipz_hca_handle.handle,
 
 756                          e_mw->ipz_mw_handle.handle);
 
 757                 return ehca2ib_return_code(h_ret);
 
 759         /* successful deallocation */
 
 760         ehca_mw_delete(e_mw);
 
 762 } /* end ehca_dealloc_mw() */
 
 764 /*----------------------------------------------------------------------*/
 
 766 struct ib_fmr *ehca_alloc_fmr(struct ib_pd *pd,
 
 768                               struct ib_fmr_attr *fmr_attr)
 
 770         struct ib_fmr *ib_fmr;
 
 771         struct ehca_shca *shca =
 
 772                 container_of(pd->device, struct ehca_shca, ib_device);
 
 773         struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
 
 774         struct ehca_mr *e_fmr;
 
 776         u32 tmp_lkey, tmp_rkey;
 
 777         struct ehca_mr_pginfo pginfo;
 
 780         /* check other parameters */
 
 781         if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
 
 782              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
 
 783             ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
 
 784              !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
 
 786                  * Remote Write Access requires Local Write Access
 
 787                  * Remote Atomic Access requires Local Write Access
 
 789                 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
 
 791                 ib_fmr = ERR_PTR(-EINVAL);
 
 792                 goto alloc_fmr_exit0;
 
 794         if (mr_access_flags & IB_ACCESS_MW_BIND) {
 
 795                 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
 
 797                 ib_fmr = ERR_PTR(-EINVAL);
 
 798                 goto alloc_fmr_exit0;
 
 800         if ((fmr_attr->max_pages == 0) || (fmr_attr->max_maps == 0)) {
 
 801                 ehca_err(pd->device, "bad input values: fmr_attr->max_pages=%x "
 
 802                          "fmr_attr->max_maps=%x fmr_attr->page_shift=%x",
 
 803                          fmr_attr->max_pages, fmr_attr->max_maps,
 
 804                          fmr_attr->page_shift);
 
 805                 ib_fmr = ERR_PTR(-EINVAL);
 
 806                 goto alloc_fmr_exit0;
 
 808         hw_pgsize = ehca_get_max_hwpage_size(shca);
 
 809         if ((1 << fmr_attr->page_shift) != hw_pgsize) {
 
 810                 ehca_err(pd->device, "unsupported fmr_attr->page_shift=%x",
 
 811                          fmr_attr->page_shift);
 
 812                 ib_fmr = ERR_PTR(-EINVAL);
 
 813                 goto alloc_fmr_exit0;
 
 816         e_fmr = ehca_mr_new();
 
 818                 ib_fmr = ERR_PTR(-ENOMEM);
 
 819                 goto alloc_fmr_exit0;
 
 821         e_fmr->flags |= EHCA_MR_FLAG_FMR;
 
 823         /* register MR on HCA */
 
 824         memset(&pginfo, 0, sizeof(pginfo));
 
 826          * pginfo.num_hwpages==0, ie register_rpages() will not be called
 
 827          * but deferred to map_phys_fmr()
 
 829         ret = ehca_reg_mr(shca, e_fmr, NULL,
 
 830                           fmr_attr->max_pages * (1 << fmr_attr->page_shift),
 
 831                           mr_access_flags, e_pd, &pginfo,
 
 832                           &tmp_lkey, &tmp_rkey);
 
 834                 ib_fmr = ERR_PTR(ret);
 
 835                 goto alloc_fmr_exit1;
 
 839         e_fmr->hwpage_size = hw_pgsize;
 
 840         e_fmr->fmr_page_size = 1 << fmr_attr->page_shift;
 
 841         e_fmr->fmr_max_pages = fmr_attr->max_pages;
 
 842         e_fmr->fmr_max_maps = fmr_attr->max_maps;
 
 843         e_fmr->fmr_map_cnt = 0;
 
 844         return &e_fmr->ib.ib_fmr;
 
 847         ehca_mr_delete(e_fmr);
 
 850                 ehca_err(pd->device, "rc=%lx pd=%p mr_access_flags=%x "
 
 851                          "fmr_attr=%p", PTR_ERR(ib_fmr), pd,
 
 852                          mr_access_flags, fmr_attr);
 
 854 } /* end ehca_alloc_fmr() */
 
 856 /*----------------------------------------------------------------------*/
 
 /*
  * ehca_map_phys_fmr() - map a list of pages onto an FMR at address iova.
  *
  * Checks that the MR really is an FMR, validates the page list with
  * ehca_fmr_check_page_list(), and rejects an iova that is not a multiple
  * of the FMR page size. It then fills an ehca_mr_pginfo of type
  * EHCA_MR_PGI_FMR and re-registers the MR through ehca_rereg_mr().
  * On success the map counter is incremented and the new lkey/rkey are
  * stored in the ib_fmr.
  *
  * NOTE(review): this listing omits several original lines (remaining
  * parameters, local declarations, error-code assignments, exit label and
  * return); confirm them against the full source.
  */
 858 int ehca_map_phys_fmr(struct ib_fmr *fmr,
 
 864         struct ehca_shca *shca =
 
 865                 container_of(fmr->device, struct ehca_shca, ib_device);
 
 866         struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
 
 867         struct ehca_pd *e_pd = container_of(fmr->pd, struct ehca_pd, ib_pd);
 
 868         struct ehca_mr_pginfo pginfo;
 
 869         u32 tmp_lkey, tmp_rkey;
 
 871         if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
 
 872                 ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
 
 873                          e_fmr, e_fmr->flags);
 
 875                 goto map_phys_fmr_exit0;
 
 877         ret = ehca_fmr_check_page_list(e_fmr, page_list, list_len);
 
 879                 goto map_phys_fmr_exit0;
 
 880         if (iova % e_fmr->fmr_page_size) {
 
 881                 /* only whole-numbered pages */
 
 882                 ehca_err(fmr->device, "bad iova, iova=%lx fmr_page_size=%x",
 
 883                          iova, e_fmr->fmr_page_size);
 
 885                 goto map_phys_fmr_exit0;
 
             /* reaching fmr_max_maps is only traced; no goto is visible here */
 887         if (e_fmr->fmr_map_cnt >= e_fmr->fmr_max_maps) {
 
 888                 /* HCAD does not limit the maps, however trace this anyway */
 
 889                 ehca_info(fmr->device, "map limit exceeded, fmr=%p "
 
 890                           "e_fmr->fmr_map_cnt=%x e_fmr->fmr_max_maps=%x",
 
 891                           fmr, e_fmr->fmr_map_cnt, e_fmr->fmr_max_maps);
 
             /* describe the pages to register: FMR type, list_len kernel pages */
 894         memset(&pginfo, 0, sizeof(pginfo));
 
 895         pginfo.type = EHCA_MR_PGI_FMR;
 
 896         pginfo.num_kpages = list_len;
 
 897         pginfo.hwpage_size = e_fmr->hwpage_size;
 
 899                 list_len * e_fmr->fmr_page_size / pginfo.hwpage_size;
 
 900         pginfo.u.fmr.page_list = page_list;
 
 902                 (iova & (e_fmr->fmr_page_size-1)) / pginfo.hwpage_size;
 
 903         pginfo.u.fmr.fmr_pgsize = e_fmr->fmr_page_size;
 
             /* re-register with the access flags already stored in the FMR */
 905         ret = ehca_rereg_mr(shca, e_fmr, (u64 *)iova,
 
 906                             list_len * e_fmr->fmr_page_size,
 
 907                             e_fmr->acl, e_pd, &pginfo, &tmp_lkey, &tmp_rkey);
 
 909                 goto map_phys_fmr_exit0;
 
 911         /* successful reregistration */
 
 912         e_fmr->fmr_map_cnt++;
 
 913         e_fmr->ib.ib_fmr.lkey = tmp_lkey;
 
 914         e_fmr->ib.ib_fmr.rkey = tmp_rkey;
 
 919                 ehca_err(fmr->device, "ret=%x fmr=%p page_list=%p list_len=%x "
 
 920                          "iova=%lx", ret, fmr, page_list, list_len, iova);
 
 922 } /* end ehca_map_phys_fmr() */
 
 924 /*----------------------------------------------------------------------*/
 
 /*
  * ehca_unmap_fmr() - unmap every FMR linked on fmr_list.
  *
  * Works in two passes over the list. The first pass only validates: all
  * entries must belong to the same SHCA and must carry EHCA_MR_FLAG_FMR.
  * The second pass calls ehca_unmap_one_fmr() for each entry and stops at
  * the first failure, leaving the remaining FMRs untouched.
  *
  * NOTE(review): the listing omits some lines (e.g. declarations of ret and
  * num_fmr, counter updates, the exit label and the return statement).
  */
 926 int ehca_unmap_fmr(struct list_head *fmr_list)
 
 929         struct ib_fmr *ib_fmr;
 
 930         struct ehca_shca *shca = NULL;
 
 931         struct ehca_shca *prev_shca;
 
 932         struct ehca_mr *e_fmr;
 
 934         u32 unmap_fmr_cnt = 0;
 
 936         /* check all FMR belong to same SHCA, and check internal flag */
 
 937         list_for_each_entry(ib_fmr, fmr_list, list) {
 
 940                         ehca_gen_err("bad fmr=%p in list", ib_fmr);
 
 942                         goto unmap_fmr_exit0;
 
 944                 shca = container_of(ib_fmr->device, struct ehca_shca,
 
 946                 e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
 
                     /* a mismatch only counts once a previous SHCA has been seen */
 947                 if ((shca != prev_shca) && prev_shca) {
 
 948                         ehca_err(&shca->ib_device, "SHCA mismatch, shca=%p "
 
 949                                  "prev_shca=%p e_fmr=%p",
 
 950                                  shca, prev_shca, e_fmr);
 
 952                         goto unmap_fmr_exit0;
 
 954                 if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
 
 955                         ehca_err(&shca->ib_device, "not a FMR, e_fmr=%p "
 
 956                                  "e_fmr->flags=%x", e_fmr, e_fmr->flags);
 
 958                         goto unmap_fmr_exit0;
 
 963         /* loop over all FMRs to unmap */
 
 964         list_for_each_entry(ib_fmr, fmr_list, list) {
 
 966                 e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
 
 967                 shca = container_of(ib_fmr->device, struct ehca_shca,
 
 969                 ret = ehca_unmap_one_fmr(shca, e_fmr);
 
 971                         /* unmap failed, stop unmapping of rest of FMRs */
 
 972                         ehca_err(&shca->ib_device, "unmap of one FMR failed, "
 
 973                                  "stop rest, e_fmr=%p num_fmr=%x "
 
 974                                  "unmap_fmr_cnt=%x lkey=%x", e_fmr, num_fmr,
 
 975                                  unmap_fmr_cnt, e_fmr->ib.ib_fmr.lkey);
 
 976                         goto unmap_fmr_exit0;
 
 982                 ehca_gen_err("ret=%x fmr_list=%p num_fmr=%x unmap_fmr_cnt=%x",
 
 983                              ret, fmr_list, num_fmr, unmap_fmr_cnt);
 
 985 } /* end ehca_unmap_fmr() */
 
 987 /*----------------------------------------------------------------------*/
 
 /*
  * ehca_dealloc_fmr() - release an FMR.
  *
  * Verifies the MR carries EHCA_MR_FLAG_FMR, frees the HCA resource with
  * hipz_h_free_resource_mr() and, only if that hcall reports H_SUCCESS,
  * deletes the ehca_mr object with ehca_mr_delete(). An hcall failure is
  * translated through ehca2ib_return_code() and the object is kept.
  *
  * NOTE(review): declarations of ret/h_ret, the exit label and the return
  * statement are not visible in this listing.
  */
 989 int ehca_dealloc_fmr(struct ib_fmr *fmr)
 
 993         struct ehca_shca *shca =
 
 994                 container_of(fmr->device, struct ehca_shca, ib_device);
 
 995         struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
 
 997         if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
 
 998                 ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
 
 999                          e_fmr, e_fmr->flags);
 
1001                 goto free_fmr_exit0;
 
1004         h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
 
1005         if (h_ret != H_SUCCESS) {
 
1006                 ehca_err(fmr->device, "hipz_free_mr failed, h_ret=%lx e_fmr=%p "
 
1007                          "hca_hndl=%lx fmr_hndl=%lx fmr->lkey=%x",
 
1008                          h_ret, e_fmr, shca->ipz_hca_handle.handle,
 
1009                          e_fmr->ipz_mr_handle.handle, fmr->lkey);
 
1010                 ret = ehca2ib_return_code(h_ret);
 
1011                 goto free_fmr_exit0;
 
1013         /* successful deregistration */
 
1014         ehca_mr_delete(e_fmr);
 
1019                 ehca_err(&shca->ib_device, "ret=%x fmr=%p", ret, fmr);
 
1021 } /* end ehca_dealloc_fmr() */
 
1023 /*----------------------------------------------------------------------*/
 
/*
 * ehca_reg_mr() - allocate an MR on the HCA and register its pages.
 *
 * Maps the IB access flags to the hipz ACL, allocates the MR resource with
 * hipz_h_alloc_resource_mr() and registers the pages described by pginfo
 * through ehca_reg_mr_rpages(). On success the page counts, hardware page
 * size and start address are recorded in e_mr and the keys returned by the
 * hcall are written to *lkey and *rkey. If page registration fails the code
 * jumps to ehca_reg_mr_exit1; the hipz_h_free_resource_mr() call below
 * presumably belongs to that label (the label line is not visible).
 *
 * NOTE(review): the listing omits some parameters, local declarations,
 * labels and the return statement.
 */
1025 int ehca_reg_mr(struct ehca_shca *shca,
 
1026                 struct ehca_mr *e_mr,
 
1030                 struct ehca_pd *e_pd,
 
1031                 struct ehca_mr_pginfo *pginfo,
 
1038         struct ehca_mr_hipzout_parms hipzout;
 
1040         ehca_mrmw_map_acl(acl, &hipz_acl);
 
1041         ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
 
             /* sets the lowest ACL bit when ehca_use_hp_mr is 1; the bit's
              * meaning is not visible here - TODO confirm */
1042         if (ehca_use_hp_mr == 1)
 
1043                 hipz_acl |= 0x00000001;
 
1045         h_ret = hipz_h_alloc_resource_mr(shca->ipz_hca_handle, e_mr,
 
1046                                          (u64)iova_start, size, hipz_acl,
 
1047                                          e_pd->fw_pd, &hipzout);
 
1048         if (h_ret != H_SUCCESS) {
 
1049                 ehca_err(&shca->ib_device, "hipz_alloc_mr failed, h_ret=%lx "
 
1050                          "hca_hndl=%lx", h_ret, shca->ipz_hca_handle.handle);
 
1051                 ret = ehca2ib_return_code(h_ret);
 
1052                 goto ehca_reg_mr_exit0;
 
             /* the handle must be stored before pages can be registered on it */
1055         e_mr->ipz_mr_handle = hipzout.handle;
 
1057         ret = ehca_reg_mr_rpages(shca, e_mr, pginfo);
 
1059                 goto ehca_reg_mr_exit1;
 
1061         /* successful registration */
 
1062         e_mr->num_kpages = pginfo->num_kpages;
 
1063         e_mr->num_hwpages = pginfo->num_hwpages;
 
1064         e_mr->hwpage_size = pginfo->hwpage_size;
 
1065         e_mr->start = iova_start;
 
1068         *lkey = hipzout.lkey;
 
1069         *rkey = hipzout.rkey;
 
             /* cleanup: give the just-allocated MR resource back to the HCA */
1073         h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
 
1074         if (h_ret != H_SUCCESS) {
 
1075                 ehca_err(&shca->ib_device, "h_ret=%lx shca=%p e_mr=%p "
 
1076                          "iova_start=%p size=%lx acl=%x e_pd=%p lkey=%x "
 
1077                          "pginfo=%p num_kpages=%lx num_hwpages=%lx ret=%x",
 
1078                          h_ret, shca, e_mr, iova_start, size, acl, e_pd,
 
1079                          hipzout.lkey, pginfo, pginfo->num_kpages,
 
1080                          pginfo->num_hwpages, ret);
 
1081                 ehca_err(&shca->ib_device, "internal error in ehca_reg_mr, "
 
1086                 ehca_err(&shca->ib_device, "ret=%x shca=%p e_mr=%p "
 
1087                          "iova_start=%p size=%lx acl=%x e_pd=%p pginfo=%p "
 
1088                          "num_kpages=%lx num_hwpages=%lx",
 
1089                          ret, shca, e_mr, iova_start, size, acl, e_pd, pginfo,
 
1090                          pginfo->num_kpages, pginfo->num_hwpages);
 
1092 } /* end ehca_reg_mr() */
 
1094 /*----------------------------------------------------------------------*/
 
/*
 * ehca_reg_mr_rpages() - register the hardware pages of an MR with the HCA.
 *
 * Pages are handed over in chunks of at most MAX_RPAGES per
 * hipz_h_register_rpage_mr() call. A firmware control block (kpage) is
 * allocated as the buffer that ehca_set_pagebuf() fills with page
 * addresses for each chunk; it is freed at ehca_reg_mr_rpages_exit1.
 * The last chunk must return H_SUCCESS, every earlier chunk must return
 * H_PAGE_REGISTERED; anything else is converted by ehca2ib_return_code().
 * When pginfo->num_hwpages is 0 (FMR case) the function presumably returns
 * early - the statement following the check is not visible in this listing.
 *
 * NOTE(review): local declarations, several conditions and the return
 * statement are missing from the listing.
 */
1096 int ehca_reg_mr_rpages(struct ehca_shca *shca,
 
1097                        struct ehca_mr *e_mr,
 
1098                        struct ehca_mr_pginfo *pginfo)
 
1107         if (!pginfo->num_hwpages) /* in case of fmr */
 
1110         kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
 
1112                 ehca_err(&shca->ib_device, "kpage alloc failed");
 
1114                 goto ehca_reg_mr_rpages_exit0;
 
1117         /* max MAX_RPAGES ehca mr pages per register call */
 
1118         for (i = 0; i < NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES); i++) {
 
                     /* final chunk: carries the remainder, or a full MAX_RPAGES */
1120                 if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
 
1121                         rnum = pginfo->num_hwpages % MAX_RPAGES; /* last shot */
 
1123                                 rnum = MAX_RPAGES;      /* last shot is full */
 
1127                 ret = ehca_set_pagebuf(pginfo, rnum, kpage);
 
1129                         ehca_err(&shca->ib_device, "ehca_set_pagebuf "
 
1130                                  "bad rc, ret=%x rnum=%x kpage=%p",
 
1132                         goto ehca_reg_mr_rpages_exit1;
 
1136                         rpage = virt_to_abs(kpage);
 
1138                                 ehca_err(&shca->ib_device, "kpage=%p i=%x",
 
1141                                 goto ehca_reg_mr_rpages_exit1;
 
1146                 h_ret = hipz_h_register_rpage_mr(
 
1147                         shca->ipz_hca_handle, e_mr,
 
1148                         ehca_encode_hwpage_size(pginfo->hwpage_size),
 
1151                 if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
 
1153                          * check for 'registration complete'==H_SUCCESS
 
1154                          * and for 'page registered'==H_PAGE_REGISTERED
 
1156                         if (h_ret != H_SUCCESS) {
 
1157                                 ehca_err(&shca->ib_device, "last "
 
1158                                          "hipz_reg_rpage_mr failed, h_ret=%lx "
 
1159                                          "e_mr=%p i=%x hca_hndl=%lx mr_hndl=%lx"
 
1160                                          " lkey=%x", h_ret, e_mr, i,
 
1161                                          shca->ipz_hca_handle.handle,
 
1162                                          e_mr->ipz_mr_handle.handle,
 
1163                                          e_mr->ib.ib_mr.lkey);
 
1164                                 ret = ehca2ib_return_code(h_ret);
 
1168                 } else if (h_ret != H_PAGE_REGISTERED) {
 
1169                         ehca_err(&shca->ib_device, "hipz_reg_rpage_mr failed, "
 
1170                                  "h_ret=%lx e_mr=%p i=%x lkey=%x hca_hndl=%lx "
 
1171                                  "mr_hndl=%lx", h_ret, e_mr, i,
 
1172                                  e_mr->ib.ib_mr.lkey,
 
1173                                  shca->ipz_hca_handle.handle,
 
1174                                  e_mr->ipz_mr_handle.handle);
 
1175                         ret = ehca2ib_return_code(h_ret);
 
1182 ehca_reg_mr_rpages_exit1:
 
1183         ehca_free_fw_ctrlblock(kpage);
 
1184 ehca_reg_mr_rpages_exit0:
 
1186                 ehca_err(&shca->ib_device, "ret=%x shca=%p e_mr=%p pginfo=%p "
 
1187                          "num_kpages=%lx num_hwpages=%lx", ret, shca, e_mr,
 
1188                          pginfo, pginfo->num_kpages, pginfo->num_hwpages);
 
1190 } /* end ehca_reg_mr_rpages() */
 
1192 /*----------------------------------------------------------------------*/
 
/*
 * ehca_rereg_mr_rereg1() - re-register an MR with one hipz_h_reregister_pmr()
 * hcall.
 *
 * All hardware pages are placed into a single firmware control block via
 * ehca_set_pagebuf() and passed to the hcall. Because ehca_set_pagebuf()
 * receives pginfo by pointer, a copy (pginfo_save) is taken first and
 * restored if the hcall fails, so the caller can retry with the 3-hcall
 * sequence. A returned vaddr that differs from iova_start is reported as an
 * error. On success the MR bookkeeping is updated and the new keys are
 * written to *lkey / *rkey. The trace at the exit label is suppressed for
 * -EAGAIN.
 *
 * NOTE(review): some parameters, local declarations, the ret assignments
 * and the return statement are not visible in this listing.
 */
1194 inline int ehca_rereg_mr_rereg1(struct ehca_shca *shca,
 
1195                                 struct ehca_mr *e_mr,
 
1199                                 struct ehca_pd *e_pd,
 
1200                                 struct ehca_mr_pginfo *pginfo,
 
1209         struct ehca_mr_pginfo pginfo_save;
 
1210         struct ehca_mr_hipzout_parms hipzout;
 
1212         ehca_mrmw_map_acl(acl, &hipz_acl);
 
1213         ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
 
1215         kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
 
1217                 ehca_err(&shca->ib_device, "kpage alloc failed");
 
1219                 goto ehca_rereg_mr_rereg1_exit0;
 
             /* keep a pristine copy so a failed hcall can be retried by the caller */
1222         pginfo_save = *pginfo;
 
1223         ret = ehca_set_pagebuf(pginfo, pginfo->num_hwpages, kpage);
 
1225                 ehca_err(&shca->ib_device, "set pagebuf failed, e_mr=%p "
 
1226                          "pginfo=%p type=%x num_kpages=%lx num_hwpages=%lx "
 
1227                          "kpage=%p", e_mr, pginfo, pginfo->type,
 
1228                          pginfo->num_kpages, pginfo->num_hwpages, kpage);
 
1229                 goto ehca_rereg_mr_rereg1_exit1;
 
1231         rpage = virt_to_abs(kpage);
 
1233                 ehca_err(&shca->ib_device, "kpage=%p", kpage);
 
1235                 goto ehca_rereg_mr_rereg1_exit1;
 
1237         h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_mr,
 
1238                                       (u64)iova_start, size, hipz_acl,
 
1239                                       e_pd->fw_pd, rpage, &hipzout);
 
1240         if (h_ret != H_SUCCESS) {
 
1242                  * reregistration unsuccessful, try it again with the 3 hCalls,
 
1243                  * e.g. this is required in case H_MR_CONDITION
 
1244                  * (MW bound or MR is shared)
 
1246                 ehca_warn(&shca->ib_device, "hipz_h_reregister_pmr failed "
 
1247                           "(Rereg1), h_ret=%lx e_mr=%p", h_ret, e_mr);
 
1248                 *pginfo = pginfo_save;
 
1250         } else if ((u64 *)hipzout.vaddr != iova_start) {
 
1251                 ehca_err(&shca->ib_device, "PHYP changed iova_start in "
 
1252                          "rereg_pmr, iova_start=%p iova_start_out=%lx e_mr=%p "
 
1253                          "mr_handle=%lx lkey=%x lkey_out=%x", iova_start,
 
1254                          hipzout.vaddr, e_mr, e_mr->ipz_mr_handle.handle,
 
1255                          e_mr->ib.ib_mr.lkey, hipzout.lkey);
 
1259                  * successful reregistration
 
1260                  * note: start and start_out are identical for eServer HCAs
 
1262                 e_mr->num_kpages = pginfo->num_kpages;
 
1263                 e_mr->num_hwpages = pginfo->num_hwpages;
 
1264                 e_mr->hwpage_size = pginfo->hwpage_size;
 
1265                 e_mr->start = iova_start;
 
1268                 *lkey = hipzout.lkey;
 
1269                 *rkey = hipzout.rkey;
 
1272 ehca_rereg_mr_rereg1_exit1:
 
1273         ehca_free_fw_ctrlblock(kpage);
 
1274 ehca_rereg_mr_rereg1_exit0:
 
             /* -EAGAIN is not traced as an error here */
1275         if ( ret && (ret != -EAGAIN) )
 
1276                 ehca_err(&shca->ib_device, "ret=%x lkey=%x rkey=%x "
 
1277                          "pginfo=%p num_kpages=%lx num_hwpages=%lx",
 
1278                          ret, *lkey, *rkey, pginfo, pginfo->num_kpages,
 
1279                          pginfo->num_hwpages);
 
1281 } /* end ehca_rereg_mr_rereg1() */
 
1283 /*----------------------------------------------------------------------*/
 
/*
 * ehca_rereg_mr() - re-register an existing MR with new attributes.
 *
 * Two strategies exist, selected by the local flags rereg_1_hcall and
 * rereg_3_hcall:
 *  - one hcall via ehca_rereg_mr_rereg1();
 *  - the "3 hcall" sequence: free the old MR on the HCA, reset the ehca_mr
 *    with ehca_mr_deletenew() while carrying over flags/page-size/FMR
 *    fields from a saved copy, then register from scratch with
 *    ehca_reg_mr(). If that registration fails, everything from the flags
 *    member to the end of struct ehca_mr is restored from the saved copy.
 * The "Rereg3 case" is traced when either page count exceeds MAX_RPAGES or
 * the new page count is larger than the old one. A max-MR has its
 * EHCA_MR_FLAG_MAXMR flag cleared and the event is logged.
 *
 * NOTE(review): the lines that actually switch the two flags, the copy into
 * save_mr, some parameters and the return statement are not visible in this
 * listing - confirm against the full source.
 */
1285 int ehca_rereg_mr(struct ehca_shca *shca,
 
1286                   struct ehca_mr *e_mr,
 
1290                   struct ehca_pd *e_pd,
 
1291                   struct ehca_mr_pginfo *pginfo,
 
1297         int rereg_1_hcall = 1; /* 1: use hipz_h_reregister_pmr directly */
 
1298         int rereg_3_hcall = 0; /* 1: use 3 hipz calls for reregistration */
 
1300         /* first determine reregistration hCall(s) */
 
1301         if ((pginfo->num_hwpages > MAX_RPAGES) ||
 
1302             (e_mr->num_hwpages > MAX_RPAGES) ||
 
1303             (pginfo->num_hwpages > e_mr->num_hwpages)) {
 
1304                 ehca_dbg(&shca->ib_device, "Rereg3 case, "
 
1305                          "pginfo->num_hwpages=%lx e_mr->num_hwpages=%x",
 
1306                          pginfo->num_hwpages, e_mr->num_hwpages);
 
1311         if (e_mr->flags & EHCA_MR_FLAG_MAXMR) { /* check for max-MR */
 
1314                 e_mr->flags &= ~EHCA_MR_FLAG_MAXMR;
 
1315                 ehca_err(&shca->ib_device, "Rereg MR for max-MR! e_mr=%p",
 
1319         if (rereg_1_hcall) {
 
1320                 ret = ehca_rereg_mr_rereg1(shca, e_mr, iova_start, size,
 
1321                                            acl, e_pd, pginfo, lkey, rkey);
 
1326                                 goto ehca_rereg_mr_exit0;
 
1330         if (rereg_3_hcall) {
 
1331                 struct ehca_mr save_mr;
 
1333                 /* first deregister old MR */
 
1334                 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
 
1335                 if (h_ret != H_SUCCESS) {
 
1336                         ehca_err(&shca->ib_device, "hipz_free_mr failed, "
 
1337                                  "h_ret=%lx e_mr=%p hca_hndl=%lx mr_hndl=%lx "
 
1339                                  h_ret, e_mr, shca->ipz_hca_handle.handle,
 
1340                                  e_mr->ipz_mr_handle.handle,
 
1341                                  e_mr->ib.ib_mr.lkey);
 
1342                         ret = ehca2ib_return_code(h_ret);
 
1343                         goto ehca_rereg_mr_exit0;
 
1345                 /* clean ehca_mr_t, without changing struct ib_mr and lock */
 
1347                 ehca_mr_deletenew(e_mr);
 
1349                 /* set some MR values */
 
1350                 e_mr->flags = save_mr.flags;
 
1351                 e_mr->hwpage_size = save_mr.hwpage_size;
 
1352                 e_mr->fmr_page_size = save_mr.fmr_page_size;
 
1353                 e_mr->fmr_max_pages = save_mr.fmr_max_pages;
 
1354                 e_mr->fmr_max_maps = save_mr.fmr_max_maps;
 
1355                 e_mr->fmr_map_cnt = save_mr.fmr_map_cnt;
 
1357                 ret = ehca_reg_mr(shca, e_mr, iova_start, size, acl,
 
1358                                   e_pd, pginfo, lkey, rkey);
 
                             /* roll back: copy from the flags member through the
                              * end of the struct out of the saved MR */
1360                         u32 offset = (u64)(&e_mr->flags) - (u64)e_mr;
 
1361                         memcpy(&e_mr->flags, &(save_mr.flags),
 
1362                                sizeof(struct ehca_mr) - offset);
 
1363                         goto ehca_rereg_mr_exit0;
 
1367 ehca_rereg_mr_exit0:
 
1369                 ehca_err(&shca->ib_device, "ret=%x shca=%p e_mr=%p "
 
1370                          "iova_start=%p size=%lx acl=%x e_pd=%p pginfo=%p "
 
1371                          "num_kpages=%lx lkey=%x rkey=%x rereg_1_hcall=%x "
 
1372                          "rereg_3_hcall=%x", ret, shca, e_mr, iova_start, size,
 
1373                          acl, e_pd, pginfo, pginfo->num_kpages, *lkey, *rkey,
 
1374                          rereg_1_hcall, rereg_3_hcall);
 
1376 } /* end ehca_rereg_mr() */
 
1378 /*----------------------------------------------------------------------*/
 
/*
 * ehca_unmap_one_fmr() - remove the current mapping from a single FMR.
 *
 * If the FMR can hold at most MAX_RPAGES pages, a hipz_h_reregister_pmr()
 * hcall with zero address/length/ACL is tried first; on H_SUCCESS the start
 * address is cleared and the new keys are picked up. Otherwise (or if that
 * hcall fails) the FMR is freed on the HCA, the ehca_mr is reset with
 * ehca_mr_deletenew() while the FMR attributes are carried over from
 * save_fmr, and an empty MR of the maximum FMR size is registered again via
 * ehca_reg_mr(). If that registration fails, everything from the flags
 * member to the end of struct ehca_mr is rolled back from save_fmr.
 *
 * Fixes relative to the previous version:
 *  - the rollback memcpy read from a second, never-initialized local
 *    (save_mr); it now uses save_fmr and the unused local is gone;
 *  - tmp_lkey/tmp_rkey are zero-initialized because the error trace at the
 *    exit label prints them on paths where no key was obtained.
 *
 * NOTE(review): some lines (declarations of ret/h_ret, the copy into
 * save_fmr, the return statements) are not visible in this listing.
 */
1380 int ehca_unmap_one_fmr(struct ehca_shca *shca,
 
1381                        struct ehca_mr *e_fmr)
 
1385         struct ehca_pd *e_pd =
 
1386                 container_of(e_fmr->ib.ib_fmr.pd, struct ehca_pd, ib_pd);
 
1387         struct ehca_mr save_fmr;
 
1388         u32 tmp_lkey = 0, tmp_rkey = 0;
 
1389         struct ehca_mr_pginfo pginfo;
 
1390         struct ehca_mr_hipzout_parms hipzout;
 
1393         if (e_fmr->fmr_max_pages <= MAX_RPAGES) {
 
1395                  * note: after using rereg hcall with len=0,
 
1396                  * rereg hcall must be used again for registering pages
 
1398                 h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_fmr, 0,
 
1399                                               0, 0, e_pd->fw_pd, 0, &hipzout);
 
1400                 if (h_ret == H_SUCCESS) {
 
1401                         /* successful reregistration */
 
1402                         e_fmr->start = NULL;
 
1404                         tmp_lkey = hipzout.lkey;
 
1405                         tmp_rkey = hipzout.rkey;
 
1409                  * should not happen, because length checked above,
 
1410                  * FMRs are not shared and no MW bound to FMRs
 
1412                 ehca_err(&shca->ib_device, "hipz_reregister_pmr failed "
 
1413                          "(Rereg1), h_ret=%lx e_fmr=%p hca_hndl=%lx "
 
1414                          "mr_hndl=%lx lkey=%x lkey_out=%x",
 
1415                          h_ret, e_fmr, shca->ipz_hca_handle.handle,
 
1416                          e_fmr->ipz_mr_handle.handle,
 
1417                          e_fmr->ib.ib_fmr.lkey, hipzout.lkey);
 
1418                 /* try free and rereg */
 
1421         /* first free old FMR */
 
1422         h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
 
1423         if (h_ret != H_SUCCESS) {
 
1424                 ehca_err(&shca->ib_device, "hipz_free_mr failed, "
 
1425                          "h_ret=%lx e_fmr=%p hca_hndl=%lx mr_hndl=%lx "
 
1427                          h_ret, e_fmr, shca->ipz_hca_handle.handle,
 
1428                          e_fmr->ipz_mr_handle.handle,
 
1429                          e_fmr->ib.ib_fmr.lkey);
 
1430                 ret = ehca2ib_return_code(h_ret);
 
1431                 goto ehca_unmap_one_fmr_exit0;
 
1433         /* clean ehca_mr_t, without changing lock */
 
1435         ehca_mr_deletenew(e_fmr);
 
1437         /* set some MR values */
 
1438         e_fmr->flags = save_fmr.flags;
 
1439         e_fmr->hwpage_size = save_fmr.hwpage_size;
 
1440         e_fmr->fmr_page_size = save_fmr.fmr_page_size;
 
1441         e_fmr->fmr_max_pages = save_fmr.fmr_max_pages;
 
1442         e_fmr->fmr_max_maps = save_fmr.fmr_max_maps;
 
1443         e_fmr->fmr_map_cnt = save_fmr.fmr_map_cnt;
 
1444         e_fmr->acl = save_fmr.acl;
 
             /* register an empty FMR again: pginfo stays zeroed apart from type */
1446         memset(&pginfo, 0, sizeof(pginfo));
 
1447         pginfo.type = EHCA_MR_PGI_FMR;
 
1448         ret = ehca_reg_mr(shca, e_fmr, NULL,
 
1449                           (e_fmr->fmr_max_pages * e_fmr->fmr_page_size),
 
1450                           e_fmr->acl, e_pd, &pginfo, &tmp_lkey,
 
                     /* roll back from the saved FMR (save_fmr), flags member
                      * through end of struct */
1453                 u32 offset = (u64)(&e_fmr->flags) - (u64)e_fmr;
 
1454                 memcpy(&e_fmr->flags, &(save_fmr.flags),
 
1455                        sizeof(struct ehca_mr) - offset);
 
1458 ehca_unmap_one_fmr_exit0:
 
1460                 ehca_err(&shca->ib_device, "ret=%x tmp_lkey=%x tmp_rkey=%x "
 
1462                          ret, tmp_lkey, tmp_rkey, e_fmr->fmr_max_pages);
 
1464 } /* end ehca_unmap_one_fmr() */
 
1466 /*----------------------------------------------------------------------*/
 
/*
 * ehca_reg_smr() - register a shared MR (e_newmr) based on e_origmr.
 *
 * Maps the access flags to the hipz ACL, using the original MR's hardware
 * page size, and issues hipz_h_register_smr(). On success e_newmr takes
 * the page counts, hardware page size and size from e_origmr, the
 * requested iova_start as start address and the handle returned by the
 * hcall; the keys are written to *lkey / *rkey. An hcall failure is
 * translated through ehca2ib_return_code().
 *
 * NOTE(review): some parameters, declarations, the exit label and the
 * return statement are not visible in this listing.
 */
1468 int ehca_reg_smr(struct ehca_shca *shca,
 
1469                  struct ehca_mr *e_origmr,
 
1470                  struct ehca_mr *e_newmr,
 
1473                  struct ehca_pd *e_pd,
 
1480         struct ehca_mr_hipzout_parms hipzout;
 
1482         ehca_mrmw_map_acl(acl, &hipz_acl);
 
1483         ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
 
1485         h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
 
1486                                     (u64)iova_start, hipz_acl, e_pd->fw_pd,
 
1488         if (h_ret != H_SUCCESS) {
 
1489                 ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lx "
 
1490                          "shca=%p e_origmr=%p e_newmr=%p iova_start=%p acl=%x "
 
1491                          "e_pd=%p hca_hndl=%lx mr_hndl=%lx lkey=%x",
 
1492                          h_ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd,
 
1493                          shca->ipz_hca_handle.handle,
 
1494                          e_origmr->ipz_mr_handle.handle,
 
1495                          e_origmr->ib.ib_mr.lkey);
 
1496                 ret = ehca2ib_return_code(h_ret);
 
1497                 goto ehca_reg_smr_exit0;
 
1499         /* successful registration */
 
1500         e_newmr->num_kpages = e_origmr->num_kpages;
 
1501         e_newmr->num_hwpages = e_origmr->num_hwpages;
 
1502         e_newmr->hwpage_size   = e_origmr->hwpage_size;
 
1503         e_newmr->start = iova_start;
 
1504         e_newmr->size = e_origmr->size;
 
1506         e_newmr->ipz_mr_handle = hipzout.handle;
 
1507         *lkey = hipzout.lkey;
 
1508         *rkey = hipzout.rkey;
 
1513                 ehca_err(&shca->ib_device, "ret=%x shca=%p e_origmr=%p "
 
1514                          "e_newmr=%p iova_start=%p acl=%x e_pd=%p",
 
1515                          ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd);
 
1517 } /* end ehca_reg_smr() */
 
1519 /*----------------------------------------------------------------------*/
 
1521 /* register internal max-MR to internal SHCA */
 
/*
 * ehca_reg_internal_maxmr() - create and register the driver-internal max-MR.
 *
 * Allocates a new ehca_mr, marks it with EHCA_MR_FLAG_MAXMR and registers a
 * region of (u64)high_memory - PAGE_OFFSET bytes starting at KERNELBASE,
 * described as a single physical buffer, through ehca_reg_mr() with access
 * flags 0. The hardware page size comes from ehca_get_max_hwpage_size().
 * On success the embedded ib_mr is initialised (device, pd, no uobject,
 * usecnt 0) and the PD use count is incremented. If registration fails the
 * code jumps to ehca_reg_internal_maxmr_exit1, where the MR is deleted.
 *
 * NOTE(review): local declarations, the line setting ib_pbuf.addr, the
 * store to *e_maxmr and the return statement are not visible in this
 * listing.
 */
1522 int ehca_reg_internal_maxmr(
 
1523         struct ehca_shca *shca,
 
1524         struct ehca_pd *e_pd,
 
1525         struct ehca_mr **e_maxmr)  /*OUT*/
 
1528         struct ehca_mr *e_mr;
 
1531         struct ehca_mr_pginfo pginfo;
 
1532         struct ib_phys_buf ib_pbuf;
 
1537         e_mr = ehca_mr_new();
 
1539                 ehca_err(&shca->ib_device, "out of memory");
 
1541                 goto ehca_reg_internal_maxmr_exit0;
 
1543         e_mr->flags |= EHCA_MR_FLAG_MAXMR;
 
1545         /* register internal max-MR on HCA */
 
1546         size_maxmr = (u64)high_memory - PAGE_OFFSET;
 
1547         iova_start = (u64 *)KERNELBASE;
 
1549         ib_pbuf.size = size_maxmr;
 
             /* page counts include the offset of iova_start within its page */
1550         num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size_maxmr,
 
1552         hw_pgsize = ehca_get_max_hwpage_size(shca);
 
1553         num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size_maxmr,
 
1556         memset(&pginfo, 0, sizeof(pginfo));
 
1557         pginfo.type = EHCA_MR_PGI_PHYS;
 
1558         pginfo.num_kpages = num_kpages;
 
1559         pginfo.num_hwpages = num_hwpages;
 
1560         pginfo.hwpage_size = hw_pgsize;
 
1561         pginfo.u.phy.num_phys_buf = 1;
 
1562         pginfo.u.phy.phys_buf_array = &ib_pbuf;
 
1564         ret = ehca_reg_mr(shca, e_mr, iova_start, size_maxmr, 0, e_pd,
 
1565                           &pginfo, &e_mr->ib.ib_mr.lkey,
 
1566                           &e_mr->ib.ib_mr.rkey);
 
1568                 ehca_err(&shca->ib_device, "reg of internal max MR failed, "
 
1569                          "e_mr=%p iova_start=%p size_maxmr=%lx num_kpages=%x "
 
1570                          "num_hwpages=%x", e_mr, iova_start, size_maxmr,
 
1571                          num_kpages, num_hwpages);
 
1572                 goto ehca_reg_internal_maxmr_exit1;
 
1575         /* successful registration of all pages */
 
1576         e_mr->ib.ib_mr.device = e_pd->ib_pd.device;
 
1577         e_mr->ib.ib_mr.pd = &e_pd->ib_pd;
 
1578         e_mr->ib.ib_mr.uobject = NULL;
 
1579         atomic_inc(&(e_pd->ib_pd.usecnt));
 
1580         atomic_set(&(e_mr->ib.ib_mr.usecnt), 0);
 
1584 ehca_reg_internal_maxmr_exit1:
 
1585         ehca_mr_delete(e_mr);
 
1586 ehca_reg_internal_maxmr_exit0:
 
1588                 ehca_err(&shca->ib_device, "ret=%x shca=%p e_pd=%p e_maxmr=%p",
 
1589                          ret, shca, e_pd, e_maxmr);
 
1591 } /* end ehca_reg_internal_maxmr() */
 
1593 /*----------------------------------------------------------------------*/
 
/*
 * ehca_reg_maxmr() - register a new MR as a shared MR of the internal max-MR.
 *
 * Uses shca->maxmr as the original MR for hipz_h_register_smr(). On hcall
 * failure the converted error code is returned directly. On success
 * e_newmr takes page counts, hardware page size and size from the max-MR,
 * the requested iova_start as start address and the handle returned by the
 * hcall; the keys are written to *lkey / *rkey.
 *
 * NOTE(review): some parameters, declarations and the final return
 * statement are not visible in this listing.
 */
1595 int ehca_reg_maxmr(struct ehca_shca *shca,
 
1596                    struct ehca_mr *e_newmr,
 
1599                    struct ehca_pd *e_pd,
 
1604         struct ehca_mr *e_origmr = shca->maxmr;
 
1606         struct ehca_mr_hipzout_parms hipzout;
 
1608         ehca_mrmw_map_acl(acl, &hipz_acl);
 
1609         ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
 
1611         h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
 
1612                                     (u64)iova_start, hipz_acl, e_pd->fw_pd,
 
1614         if (h_ret != H_SUCCESS) {
 
1615                 ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lx "
 
1616                          "e_origmr=%p hca_hndl=%lx mr_hndl=%lx lkey=%x",
 
1617                          h_ret, e_origmr, shca->ipz_hca_handle.handle,
 
1618                          e_origmr->ipz_mr_handle.handle,
 
1619                          e_origmr->ib.ib_mr.lkey);
 
1620                 return ehca2ib_return_code(h_ret);
 
1622         /* successful registration */
 
1623         e_newmr->num_kpages = e_origmr->num_kpages;
 
1624         e_newmr->num_hwpages = e_origmr->num_hwpages;
 
1625         e_newmr->hwpage_size = e_origmr->hwpage_size;
 
1626         e_newmr->start = iova_start;
 
1627         e_newmr->size = e_origmr->size;
 
1629         e_newmr->ipz_mr_handle = hipzout.handle;
 
1630         *lkey = hipzout.lkey;
 
1631         *rkey = hipzout.rkey;
 
1633 } /* end ehca_reg_maxmr() */
 
1635 /*----------------------------------------------------------------------*/
 
/*
 * ehca_dereg_internal_maxmr() - deregister the driver-internal max-MR.
 *
 * shca->maxmr is cleared before ehca_dereg_mr() is called and is put back
 * if deregistration fails. On success the use count of the PD the max-MR
 * belonged to is decremented.
 *
 * NOTE(review): the initial sanity check (only its error trace is visible),
 * the declaration of ret and the return statement are missing from this
 * listing.
 */
1637 int ehca_dereg_internal_maxmr(struct ehca_shca *shca)
 
1640         struct ehca_mr *e_maxmr;
 
1641         struct ib_pd *ib_pd;
 
1644                 ehca_err(&shca->ib_device, "bad call, shca=%p", shca);
 
1646                 goto ehca_dereg_internal_maxmr_exit0;
 
             /* remember MR and PD first: shca->maxmr is reset before dereg */
1649         e_maxmr = shca->maxmr;
 
1650         ib_pd = e_maxmr->ib.ib_mr.pd;
 
1651         shca->maxmr = NULL; /* remove internal max-MR indication from SHCA */
 
1653         ret = ehca_dereg_mr(&e_maxmr->ib.ib_mr);
 
1655                 ehca_err(&shca->ib_device, "dereg internal max-MR failed, "
 
1656                          "ret=%x e_maxmr=%p shca=%p lkey=%x",
 
1657                          ret, e_maxmr, shca, e_maxmr->ib.ib_mr.lkey);
 
1658                 shca->maxmr = e_maxmr;
 
1659                 goto ehca_dereg_internal_maxmr_exit0;
 
1662         atomic_dec(&ib_pd->usecnt);
 
1664 ehca_dereg_internal_maxmr_exit0:
 
1666                 ehca_err(&shca->ib_device, "ret=%x shca=%p shca->maxmr=%p",
 
1667                          ret, shca, shca->maxmr);
 
1669 } /* end ehca_dereg_internal_maxmr() */
 
1671 /*----------------------------------------------------------------------*/
 
1674  * check physical buffer array of MR verbs for validity and
 
1675  * calculate the MR size
 
/*
 * ehca_mr_chk_buf_and_calc_size() - validate a physical buffer array and
 * sum up the buffer sizes.
 *
 * Rules enforced by the visible checks:
 *  - the array must not be empty;
 *  - iova_start and the first buffer address must share the same offset
 *    within a page;
 *  - with more than one buffer, the first buffer must end on a page
 *    boundary;
 *  - every buffer after the first must start page-aligned;
 *  - buffers that are neither first nor last must have a size that is a
 *    multiple of PAGE_SIZE, and no buffer may have size 0.
 * Each buffer's size is added to size_count.
 *
 * NOTE(review): remaining parameters, the error returns, the pbuf advance
 * and the final store of the size are not visible in this listing.
 */
1677 int ehca_mr_chk_buf_and_calc_size(struct ib_phys_buf *phys_buf_array,
 
1682         struct ib_phys_buf *pbuf = phys_buf_array;
 
1686         if (num_phys_buf == 0) {
 
1687                 ehca_gen_err("bad phys buf array len, num_phys_buf=0");
 
1690         /* check first buffer */
 
1691         if (((u64)iova_start & ~PAGE_MASK) != (pbuf->addr & ~PAGE_MASK)) {
 
1692                 ehca_gen_err("iova_start/addr mismatch, iova_start=%p "
 
1693                              "pbuf->addr=%lx pbuf->size=%lx",
 
1694                              iova_start, pbuf->addr, pbuf->size);
 
1697         if (((pbuf->addr + pbuf->size) % PAGE_SIZE) &&
 
1698             (num_phys_buf > 1)) {
 
1699                 ehca_gen_err("addr/size mismatch in 1st buf, pbuf->addr=%lx "
 
1700                              "pbuf->size=%lx", pbuf->addr, pbuf->size);
 
1704         for (i = 0; i < num_phys_buf; i++) {
 
1705                 if ((i > 0) && (pbuf->addr % PAGE_SIZE)) {
 
1706                         ehca_gen_err("bad address, i=%x pbuf->addr=%lx "
 
1708                                      i, pbuf->addr, pbuf->size);
 
1711                 if (((i > 0) && /* not 1st */
 
1712                      (i < (num_phys_buf - 1)) &&        /* not last */
 
1713                      (pbuf->size % PAGE_SIZE)) || (pbuf->size == 0)) {
 
1714                         ehca_gen_err("bad size, i=%x pbuf->size=%lx",
 
1718                 size_count += pbuf->size;
 
1724 } /* end ehca_mr_chk_buf_and_calc_size() */
 
1726 /*----------------------------------------------------------------------*/
 
1728 /* check page list of map FMR verb for validity */
 
/*
 * ehca_fmr_check_page_list() - validate the page list passed to map-FMR.
 *
 * list_len must be non-zero and must not exceed e_fmr->fmr_max_pages, and
 * every page address in the list must be a multiple of the FMR page size.
 *
 * NOTE(review): remaining parameters, the initialisation and advance of the
 * page pointer and all return statements are not visible in this listing.
 */
1729 int ehca_fmr_check_page_list(struct ehca_mr *e_fmr,
 
1736         if ((list_len == 0) || (list_len > e_fmr->fmr_max_pages)) {
 
1737                 ehca_gen_err("bad list_len, list_len=%x "
 
1738                              "e_fmr->fmr_max_pages=%x fmr=%p",
 
1739                              list_len, e_fmr->fmr_max_pages, e_fmr);
 
1743         /* each page must be aligned */
 
1745         for (i = 0; i < list_len; i++) {
 
1746                 if (*page % e_fmr->fmr_page_size) {
 
1747                         ehca_gen_err("bad page, i=%x *page=%lx page=%p fmr=%p "
 
1748                                      "fmr_page_size=%x", i, *page, page, e_fmr,
 
1749                                      e_fmr->fmr_page_size);
 
1756 } /* end ehca_fmr_check_page_list() */
 
1758 /*----------------------------------------------------------------------*/
 
1760 /* PAGE_SIZE >= pginfo->hwpage_size */
 
/*
 * Produce hardware page addresses for a user memory region; selected by
 * ehca_set_pagebuf() when PAGE_SIZE >= pginfo->hwpage_size, i.e. one
 * kernel page holds hwpages_per_kpage hardware pages.
 *
 * The walk resumes from the cursor kept in pginfo: the chunk list is
 * continued from pginfo->u.usr.next_chunk, the page_list index starts at
 * pginfo->u.usr.next_nmap, and pginfo->next_hwpage selects the hardware
 * page inside the current kernel page. For each hardware page the
 * address is stored through kpage and hwpage_cnt is incremented;
 * kpage_cnt and next_nmap are incremented once all hardware pages of a
 * kernel page have been produced.
 *
 * Called as ehca_set_pagebuf_user1(pginfo, number, kpage).
 * NOTE(review): the declarations and updates of i and j, the advancing of
 * kpage, the updates of prev_chunk and the return statements are not
 * visible in this excerpt - confirm against the full file.
 */
1761 static int ehca_set_pagebuf_user1(struct ehca_mr_pginfo *pginfo,
 
1766         struct ib_umem_chunk *prev_chunk;
 
1767         struct ib_umem_chunk *chunk;
 
1771         int hwpages_per_kpage = PAGE_SIZE / pginfo->hwpage_size;
 
1773         /* loop over desired chunk entries */
 
1774         chunk      = pginfo->u.usr.next_chunk;
 
1775         prev_chunk = pginfo->u.usr.next_chunk;
 
1776         list_for_each_entry_continue(
 
1777                 chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
 
                     /* no increment in the loop header; the index is advanced elsewhere in the body */
1778                 for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
 
1779                         pgaddr = page_to_pfn(chunk->page_list[i].page)
 
                             /* address of hardware page number next_hwpage, counted from pgaddr */
1781                         *kpage = phys_to_abs(pgaddr +
 
1782                                              (pginfo->next_hwpage *
 
1783                                               pginfo->hwpage_size));
 
1785                                 ehca_gen_err("pgaddr=%lx "
 
1786                                              "chunk->page_list[i]=%lx "
 
1787                                              "i=%x next_hwpage=%lx",
 
1788                                              pgaddr, (u64)sg_dma_address(
 
1789                                                      &chunk->page_list[i]),
 
1790                                              i, pginfo->next_hwpage);
 
1793                         (pginfo->hwpage_cnt)++;
 
1794                         (pginfo->next_hwpage)++;
 
                             /* all hardware pages of this kernel page done: move on to the next page_list entry */
1796                         if (pginfo->next_hwpage % hwpages_per_kpage == 0) {
 
1797                                 (pginfo->kpage_cnt)++;
 
1798                                 (pginfo->u.usr.next_nmap)++;
 
1799                                 pginfo->next_hwpage = 0;
 
1803                         if (j >= number) break;
 
                     /* a chunk whose entries are used up resets the in-chunk index for the next chunk */
1805                 if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
 
1807                         pginfo->u.usr.next_nmap = 0;
 
1810                 } else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
 
1811                         pginfo->u.usr.next_nmap = 0;
 
1813                 } else if (j >= number)
 
             /* store the chunk cursor in pginfo for the next call */
1818         pginfo->u.usr.next_chunk =
 
1819                 list_prepare_entry(prev_chunk,
 
1820                                    (&(pginfo->u.usr.region->chunk_list)),
 
1826  * check given pages for contiguous layout
 
1827  * last page addr is returned in prev_pgaddr for further check
 
/*
 * Walk page_list[start_idx] .. page_list[end_idx] (both inclusive) and
 * compare each page address with *prev_pgaddr: a page is accepted only if
 * its address is exactly PAGE_SIZE above *prev_pgaddr, otherwise an error
 * is logged. *prev_pgaddr is then set to the address of the page just
 * examined, so on entry it must hold the address of the page preceding
 * page_list[start_idx].
 *
 * The callers in this file treat a non-zero return value as failure.
 * NOTE(review): the return statements are not visible in this excerpt.
 */
1829 static int ehca_check_kpages_per_ate(struct scatterlist *page_list,
 
1830                                      int start_idx, int end_idx,
 
1834         for (t = start_idx; t <= end_idx; t++) {
 
1835                 u64 pgaddr = page_to_pfn(page_list[t].page) << PAGE_SHIFT;
 
                     /* debug output reads one u64 through the virtual mapping of the page */
1836                 ehca_gen_dbg("chunk_page=%lx value=%016lx", pgaddr,
 
1837                              *(u64 *)abs_to_virt(phys_to_abs(pgaddr)));
 
1838                 if (pgaddr - PAGE_SIZE != *prev_pgaddr) {
 
1839                         ehca_gen_err("uncontiguous page found pgaddr=%lx "
 
1840                                      "prev_pgaddr=%lx page_list_i=%x",
 
1841                                      pgaddr, *prev_pgaddr, t);
 
1844                 *prev_pgaddr = pgaddr;
 
1849 /* PAGE_SIZE < pginfo->hwpage_size */
 
/*
 * Produce hardware page addresses for a user memory region; selected by
 * ehca_set_pagebuf() when PAGE_SIZE < pginfo->hwpage_size, i.e. one
 * hardware page spans kpages_per_hwpage kernel pages.
 *
 * nr_kpages holds the number of kernel pages still needed to complete
 * the current hardware page. When it equals kpages_per_hwpage a new
 * hardware page is started: its address is stored through kpage and its
 * alignment to hwpage_size is checked. The remaining kernel pages of the
 * hardware page are checked with ehca_check_kpages_per_ate(), possibly
 * across a chunk boundary. The cursor fields in pginfo (u.usr.next_chunk,
 * u.usr.next_nmap, kpage_cnt, hwpage_cnt) are updated along the way.
 *
 * Called as ehca_set_pagebuf_user2(pginfo, number, kpage).
 * NOTE(review): several statements (declarations and updates of i and j,
 * advancing of kpage, updates of prev_chunk, parts of the alignment
 * handling, return statements) are not visible in this excerpt - confirm
 * against the full file.
 */
1850 static int ehca_set_pagebuf_user2(struct ehca_mr_pginfo *pginfo,
 
1855         struct ib_umem_chunk *prev_chunk;
 
1856         struct ib_umem_chunk *chunk;
 
1857         u64 pgaddr, prev_pgaddr;
 
1860         int kpages_per_hwpage = pginfo->hwpage_size / PAGE_SIZE;
 
1861         int nr_kpages = kpages_per_hwpage;
 
1863         /* loop over desired chunk entries */
 
1864         chunk      = pginfo->u.usr.next_chunk;
 
1865         prev_chunk = pginfo->u.usr.next_chunk;
 
1866         list_for_each_entry_continue(
 
1867                 chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
 
1868                 for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
 
                             /* full count outstanding: page_list[i] starts a new hardware page */
1869                         if (nr_kpages == kpages_per_hwpage) {
 
1870                                 pgaddr = ( page_to_pfn(chunk->page_list[i].page)
 
1872                                 *kpage = phys_to_abs(pgaddr);
 
1874                                         ehca_gen_err("pgaddr=%lx i=%x",
 
1880                                  * The first page in a hwpage must be aligned;
 
1881                                  * the first MR page is exempt from this rule.
 
1883                                 if (pgaddr & (pginfo->hwpage_size - 1)) {
 
                                             /* hwpage_cnt != 0: this is not the first hardware page of the MR */
1884                                         if (pginfo->hwpage_cnt) {
 
1886                                                         "invalid alignment "
 
1890                                                         pginfo->hwpage_size);
 
1897                                                  (pginfo->hwpage_size - 1)) >>
 
                                             /* fewer kernel pages are needed for the unaligned first hardware page */
1899                                         nr_kpages -= pginfo->kpage_cnt;
 
1900                                         *kpage = phys_to_abs(
 
1902                                                 ~(pginfo->hwpage_size - 1));
 
1904                                 ehca_gen_dbg("kpage=%lx chunk_page=%lx "
 
1905                                              "value=%016lx", *kpage, pgaddr,
 
1906                                              *(u64 *)abs_to_virt(
 
1907                                                      phys_to_abs(pgaddr)));
 
                                     /* reference address for the contiguity checks below */
1908                                 prev_pgaddr = pgaddr;
 
1910                                 pginfo->kpage_cnt++;
 
1911                                 pginfo->u.usr.next_nmap++;
 
                             /* the hardware page extends past this chunk: check and count what is left here */
1917                         if (i + nr_kpages > chunk->nmap) {
 
1918                                 ret = ehca_check_kpages_per_ate(
 
1919                                         chunk->page_list, i,
 
1920                                         chunk->nmap - 1, &prev_pgaddr);
 
1921                                 if (ret) return ret;
 
1922                                 pginfo->kpage_cnt += chunk->nmap - i;
 
1923                                 pginfo->u.usr.next_nmap += chunk->nmap - i;
 
1924                                 nr_kpages -= chunk->nmap - i;
 
                             /* presumably reached when the rest of the hardware page lies within this chunk */
1928                         ret = ehca_check_kpages_per_ate(chunk->page_list, i,
 
1931                         if (ret) return ret;
 
1933                         pginfo->kpage_cnt += nr_kpages;
 
1934                         pginfo->u.usr.next_nmap += nr_kpages;
 
                             /* hardware page complete: restart with a full count */
1936                         nr_kpages = kpages_per_hwpage;
 
1937                         (pginfo->hwpage_cnt)++;
 
1940                         if (j >= number) break;
 
1942                 if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
 
1944                         pginfo->u.usr.next_nmap = 0;
 
1947                 } else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
 
1948                         pginfo->u.usr.next_nmap = 0;
 
1950                 } else if (j >= number)
 
             /* store the chunk cursor in pginfo for the next call */
1955         pginfo->u.usr.next_chunk =
 
1956                 list_prepare_entry(prev_chunk,
 
1957                                    (&(pginfo->u.usr.region->chunk_list)),
 
/*
 * Produce hardware page addresses for a memory region described by an
 * array of physical buffers (pginfo->u.phy.phys_buf_array).
 *
 * The current buffer is selected by pginfo->u.phy.next_buf and the
 * hardware page within it by pginfo->next_hwpage. Each address is the
 * buffer address rounded down to a hwpage_size boundary plus
 * next_hwpage * hwpage_size, and is stored through kpage. hwpage_cnt and
 * kpage_cnt are updated per hardware page; exceeding num_hwpages or
 * num_kpages is reported via ehca_gen_err().
 *
 * Called as ehca_set_pagebuf_phys(pginfo, number, kpage).
 * NOTE(review): the declaration and updates of i, the advancing of kpage
 * and the return statements are not visible in this excerpt - confirm
 * against the full file.
 */
1962 int ehca_set_pagebuf_phys(struct ehca_mr_pginfo *pginfo,
 
1967         struct ib_phys_buf *pbuf;
 
1968         u64 num_hw, offs_hw;
 
1971         /* loop over desired phys_buf_array entries */
 
1972         while (i < number) {
 
1973                 pbuf   = pginfo->u.phy.phys_buf_array + pginfo->u.phy.next_buf;
 
                     /* hardware pages touched by this buffer, rounded up, counting the offset into its first page */
1974                 num_hw  = NUM_CHUNKS((pbuf->addr % pginfo->hwpage_size) +
 
1975                                      pbuf->size, pginfo->hwpage_size);
 
                     /* buffer address rounded down to a hardware page boundary, in units of hardware pages */
1976                 offs_hw = (pbuf->addr & ~(pginfo->hwpage_size - 1)) /
 
1977                         pginfo->hwpage_size;
 
                     /*
                      * NOTE(review): offs_hw is derived from the absolute buffer
                      * address, while next_hwpage is reset to 0 when moving to the
                      * next buffer and is used below as an offset from the aligned
                      * buffer start - confirm that this loop bound is intended.
                      */
1978                 while (pginfo->next_hwpage < offs_hw + num_hw) {
 
                             /* sanity check against the page counts stored in pginfo */
1980                         if ((pginfo->kpage_cnt >= pginfo->num_kpages) ||
 
1981                             (pginfo->hwpage_cnt >= pginfo->num_hwpages)) {
 
1982                                 ehca_gen_err("kpage_cnt >= num_kpages, "
 
1983                                              "kpage_cnt=%lx num_kpages=%lx "
 
1985                                              "num_hwpages=%lx i=%x",
 
1989                                              pginfo->num_hwpages, i);
 
1992                         *kpage = phys_to_abs(
 
1993                                 (pbuf->addr & ~(pginfo->hwpage_size - 1)) +
 
1994                                 (pginfo->next_hwpage * pginfo->hwpage_size));
 
                             /* a zero result is only treated as an error if the buffer address itself is non-zero */
1995                         if ( !(*kpage) && pbuf->addr ) {
 
1996                                 ehca_gen_err("pbuf->addr=%lx pbuf->size=%lx "
 
1997                                              "next_hwpage=%lx", pbuf->addr,
 
1998                                              pbuf->size, pginfo->next_hwpage);
 
2001                         (pginfo->hwpage_cnt)++;
 
2002                         (pginfo->next_hwpage)++;
 
                             /* small hardware pages: count a kernel page once all of its hardware pages are done */
2003                         if (PAGE_SIZE >= pginfo->hwpage_size) {
 
2004                                 if (pginfo->next_hwpage %
 
2005                                     (PAGE_SIZE / pginfo->hwpage_size) == 0)
 
2006                                         (pginfo->kpage_cnt)++;
 
2008                                 pginfo->kpage_cnt += pginfo->hwpage_size /
 
2012                         if (i >= number) break;
 
                     /* buffer fully consumed: continue with the next one from its first hardware page */
2014                 if (pginfo->next_hwpage >= offs_hw + num_hw) {
 
2015                         (pginfo->u.phy.next_buf)++;
 
2016                         pginfo->next_hwpage = 0;
 
/*
 * Produce up to number hardware page addresses for an FMR page list.
 *
 * Starts at pginfo->u.fmr.page_list[pginfo->u.fmr.next_listelem]. Each
 * address is the list entry rounded down to a hwpage_size boundary plus
 * next_hwpage * hwpage_size, and is stored through kpage. Two cases are
 * distinguished by comparing pginfo->u.fmr.fmr_pgsize with
 * pginfo->hwpage_size: FMR pages at least as large as a hardware page,
 * and hardware pages made up of cnt_per_hwpage FMR pages. In the latter
 * case the FMR pages are checked for contiguity.
 *
 * Called as ehca_set_pagebuf_fmr(pginfo, number, kpage).
 * NOTE(review): the declarations of i, j and prev, the advancing of kpage,
 * some branch lines and the return statements are not visible in this
 * excerpt - confirm against the full file.
 */
2022 int ehca_set_pagebuf_fmr(struct ehca_mr_pginfo *pginfo,
 
2030         /* loop over desired page_list entries */
 
2031         fmrlist = pginfo->u.fmr.page_list + pginfo->u.fmr.next_listelem;
 
2032         for (i = 0; i < number; i++) {
 
2033                 *kpage = phys_to_abs((*fmrlist & ~(pginfo->hwpage_size - 1)) +
 
2034                                      pginfo->next_hwpage * pginfo->hwpage_size);
 
2036                         ehca_gen_err("*fmrlist=%lx fmrlist=%p "
 
2037                                      "next_listelem=%lx next_hwpage=%lx",
 
2039                                      pginfo->u.fmr.next_listelem,
 
2040                                      pginfo->next_hwpage);
 
2043                 (pginfo->hwpage_cnt)++;
 
                     /* FMR page holds one or more hardware pages */
2044                 if (pginfo->u.fmr.fmr_pgsize >= pginfo->hwpage_size) {
 
2045                         if (pginfo->next_hwpage %
 
2046                             (pginfo->u.fmr.fmr_pgsize /
 
2047                              pginfo->hwpage_size) == 0) {
 
2048                                 (pginfo->kpage_cnt)++;
 
2049                                 (pginfo->u.fmr.next_listelem)++;
 
2051                                 pginfo->next_hwpage = 0;
 
2053                                 (pginfo->next_hwpage)++;
 
                             /* number of FMR pages that make up one hardware page */
2055                         unsigned int cnt_per_hwpage = pginfo->hwpage_size /
 
2056                                 pginfo->u.fmr.fmr_pgsize;
 
2059                         /* check if addresses are contiguous */
 
                             /*
                              * NOTE(review): fmrlist[j] is masked with the hardware page
                              * size, not fmr_pgsize, before being compared against
                              * prev + fmr_pgsize - verify that this mask is intended.
                              */
2060                         for (j = 1; j < cnt_per_hwpage; j++) {
 
2061                                 u64 p = phys_to_abs(fmrlist[j] &
 
2062                                                     ~(pginfo->hwpage_size - 1));
 
2063                                 if (prev + pginfo->u.fmr.fmr_pgsize != p) {
 
2064                                         ehca_gen_err("uncontiguous fmr pages "
 
2065                                                      "found prev=%lx p=%lx "
 
2066                                                      "idx=%x", prev, p, i + j);
 
                             /* one hardware page consumed cnt_per_hwpage list entries */
2071                         pginfo->kpage_cnt += cnt_per_hwpage;
 
2072                         pginfo->u.fmr.next_listelem += cnt_per_hwpage;
 
2073                         fmrlist += cnt_per_hwpage;
 
2080 /* setup page buffer from page info */
 
/*
 * Dispatch on pginfo->type to the matching page buffer routine, passing
 * pginfo, number and kpage through unchanged:
 *  - EHCA_MR_PGI_PHYS: ehca_set_pagebuf_phys()
 *  - EHCA_MR_PGI_USER: ehca_set_pagebuf_user1() if
 *    PAGE_SIZE >= pginfo->hwpage_size, else ehca_set_pagebuf_user2()
 *  - EHCA_MR_PGI_FMR:  ehca_set_pagebuf_fmr()
 * Any other type is logged via ehca_gen_err().
 *
 * NOTE(review): the remaining parameters, the break/default lines and the
 * return statement are not visible in this excerpt - confirm against the
 * full file.
 */
2081 int ehca_set_pagebuf(struct ehca_mr_pginfo *pginfo,
 
2087         switch (pginfo->type) {
 
2088         case EHCA_MR_PGI_PHYS:
 
2089                 ret = ehca_set_pagebuf_phys(pginfo, number, kpage);
 
2091         case EHCA_MR_PGI_USER:
 
                     /* the helper is chosen by comparing kernel and hardware page size */
2092                 ret = PAGE_SIZE >= pginfo->hwpage_size ?
 
2093                         ehca_set_pagebuf_user1(pginfo, number, kpage) :
 
2094                         ehca_set_pagebuf_user2(pginfo, number, kpage);
 
2096         case EHCA_MR_PGI_FMR:
 
2097                 ret = ehca_set_pagebuf_fmr(pginfo, number, kpage);
 
2100                 ehca_gen_err("bad pginfo->type=%x", pginfo->type);
 
2105 } /* end ehca_set_pagebuf() */
 
2107 /*----------------------------------------------------------------------*/
 
2110  * check MR if it is a max-MR, i.e. uses whole memory
 
2111  * in case it's a max-MR 1 is returned, else 0
 
/*
 * Test whether the given size and iova_start describe a max-MR: size
 * must equal (u64)high_memory - PAGE_OFFSET and iova_start must equal
 * KERNELBASE. A match is logged with ehca_gen_dbg().
 *
 * NOTE(review): the second parameter line and the return statements are
 * not visible in this excerpt; the comment preceding this function in the
 * file states that 1 is returned for a max-MR and 0 otherwise.
 */
2113 int ehca_mr_is_maxmr(u64 size,
 
2116         /* an MR is treated as a max-MR only if both of the following hold: */
 
2117         if ((size == ((u64)high_memory - PAGE_OFFSET)) &&
 
2118             (iova_start == (void *)KERNELBASE)) {
 
2119                 ehca_gen_dbg("this is a max-MR");
 
2123 } /* end ehca_mr_is_maxmr() */
 
2125 /*----------------------------------------------------------------------*/
 
2127 /* map access control for MR/MW. This routine is used for MR and MW. */
 
/*
 * Translate IB access flags in ib_acl into HIPZ access control bits,
 * OR-ing the corresponding bit into *hipz_acl for each flag that is set:
 *   IB_ACCESS_REMOTE_READ   -> HIPZ_ACCESSCTRL_R_READ
 *   IB_ACCESS_REMOTE_WRITE  -> HIPZ_ACCESSCTRL_R_WRITE
 *   IB_ACCESS_REMOTE_ATOMIC -> HIPZ_ACCESSCTRL_R_ATOMIC
 *   IB_ACCESS_LOCAL_WRITE   -> HIPZ_ACCESSCTRL_L_WRITE
 *   IB_ACCESS_MW_BIND       -> HIPZ_ACCESSCTRL_MW_BIND
 *
 * NOTE(review): the hipz_acl parameter declaration and any initialisation
 * of *hipz_acl are not visible in this excerpt - confirm whether the
 * caller must pre-clear it.
 */
2128 void ehca_mrmw_map_acl(int ib_acl,
 
2132         if (ib_acl & IB_ACCESS_REMOTE_READ)
 
2133                 *hipz_acl |= HIPZ_ACCESSCTRL_R_READ;
 
2134         if (ib_acl & IB_ACCESS_REMOTE_WRITE)
 
2135                 *hipz_acl |= HIPZ_ACCESSCTRL_R_WRITE;
 
2136         if (ib_acl & IB_ACCESS_REMOTE_ATOMIC)
 
2137                 *hipz_acl |= HIPZ_ACCESSCTRL_R_ATOMIC;
 
2138         if (ib_acl & IB_ACCESS_LOCAL_WRITE)
 
2139                 *hipz_acl |= HIPZ_ACCESSCTRL_L_WRITE;
 
2140         if (ib_acl & IB_ACCESS_MW_BIND)
 
2141                 *hipz_acl |= HIPZ_ACCESSCTRL_MW_BIND;
 
2142 } /* end ehca_mrmw_map_acl() */
 
2144 /*----------------------------------------------------------------------*/
 
2146 /* sets page size in hipz access control for MR/MW. */
 
/*
 * OR the value returned by ehca_encode_hwpage_size(pgsize), shifted left
 * by 24 bits, into *hipz_acl. Bits already set in *hipz_acl are kept.
 */
2147 void ehca_mrmw_set_pgsize_hipz_acl(u32 pgsize, u32 *hipz_acl) /*INOUT*/
 
2149         *hipz_acl |= (ehca_encode_hwpage_size(pgsize) << 24);
 
2150 } /* end ehca_mrmw_set_pgsize_hipz_acl() */
 
2152 /*----------------------------------------------------------------------*/
 
2155  * reverse map access control for MR/MW.
 
2156  * This routine is used for MR and MW.
 
/*
 * Translate HIPZ access control bits in *hipz_acl back into IB access
 * flags, OR-ing the corresponding flag into *ib_acl for each bit set:
 *   HIPZ_ACCESSCTRL_R_READ   -> IB_ACCESS_REMOTE_READ
 *   HIPZ_ACCESSCTRL_R_WRITE  -> IB_ACCESS_REMOTE_WRITE
 *   HIPZ_ACCESSCTRL_R_ATOMIC -> IB_ACCESS_REMOTE_ATOMIC
 *   HIPZ_ACCESSCTRL_L_WRITE  -> IB_ACCESS_LOCAL_WRITE
 *   HIPZ_ACCESSCTRL_MW_BIND  -> IB_ACCESS_MW_BIND
 * *hipz_acl is only read.
 *
 * NOTE(review): any initialisation of *ib_acl is not visible in this
 * excerpt - confirm whether the caller must pre-clear it.
 */
2158 void ehca_mrmw_reverse_map_acl(const u32 *hipz_acl,
 
2159                                int *ib_acl) /*OUT*/
 
2162         if (*hipz_acl & HIPZ_ACCESSCTRL_R_READ)
 
2163                 *ib_acl |= IB_ACCESS_REMOTE_READ;
 
2164         if (*hipz_acl & HIPZ_ACCESSCTRL_R_WRITE)
 
2165                 *ib_acl |= IB_ACCESS_REMOTE_WRITE;
 
2166         if (*hipz_acl & HIPZ_ACCESSCTRL_R_ATOMIC)
 
2167                 *ib_acl |= IB_ACCESS_REMOTE_ATOMIC;
 
2168         if (*hipz_acl & HIPZ_ACCESSCTRL_L_WRITE)
 
2169                 *ib_acl |= IB_ACCESS_LOCAL_WRITE;
 
2170         if (*hipz_acl & HIPZ_ACCESSCTRL_MW_BIND)
 
2171                 *ib_acl |= IB_ACCESS_MW_BIND;
 
2172 } /* end ehca_mrmw_reverse_map_acl() */
 
2175 /*----------------------------------------------------------------------*/
 
2178  * MR destructor and constructor
 
2179  * used in Reregister MR verb, sets all fields in ehca_mr_t to 0,
 
2180  * except struct ib_mr and spinlock
 
/*
 * Reset fields of *mr so the structure can be reused. The lines visible
 * in this excerpt set num_hwpages and the fmr_* fields to 0 and
 * zero-fill ipz_mr_handle and galpas.
 *
 * NOTE(review): some lines of this function are not visible in this
 * excerpt, so further fields may be reset as well - confirm against the
 * full file.
 */
2182 void ehca_mr_deletenew(struct ehca_mr *mr)
 
2186         mr->num_hwpages = 0;
 
2189         mr->fmr_page_size = 0;
 
2190         mr->fmr_max_pages = 0;
 
2191         mr->fmr_max_maps = 0;
 
2192         mr->fmr_map_cnt = 0;
 
             /* the handle and galpas are cleared as whole objects */
2193         memset(&mr->ipz_mr_handle, 0, sizeof(mr->ipz_mr_handle));
 
2194         memset(&mr->galpas, 0, sizeof(mr->galpas));
 
2195 } /* end ehca_mr_deletenew() */
 
/*
 * Create the two slab caches used by this file: mr_cache
 * ("ehca_cache_mr", objects of sizeof(struct ehca_mr)) and mw_cache
 * ("ehca_cache_mw", objects of sizeof(struct ehca_mw)).
 *
 * NOTE(review): the remaining kmem_cache_create() arguments, the failure
 * checks and the return statements are not visible in this excerpt; the
 * kmem_cache_destroy(mr_cache) call presumably undoes the first creation
 * when the second one fails - confirm against the full file.
 */
2197 int ehca_init_mrmw_cache(void)
 
2199         mr_cache = kmem_cache_create("ehca_cache_mr",
 
2200                                      sizeof(struct ehca_mr), 0,
 
2205         mw_cache = kmem_cache_create("ehca_cache_mw",
 
2206                                      sizeof(struct ehca_mw), 0,
 
2210                 kmem_cache_destroy(mr_cache);
 
2217 void ehca_cleanup_mrmw_cache(void)
 
2220                 kmem_cache_destroy(mr_cache);
 
2222                 kmem_cache_destroy(mw_cache);