]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blob - drivers/infiniband/hw/ehca/ehca_mrmw.c
Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/x86/linux...
[mirror_ubuntu-artful-kernel.git] / drivers / infiniband / hw / ehca / ehca_mrmw.c
1 /*
2 * IBM eServer eHCA Infiniband device driver for Linux on POWER
3 *
4 * MR/MW functions
5 *
6 * Authors: Dietmar Decker <ddecker@de.ibm.com>
7 * Christoph Raisch <raisch@de.ibm.com>
8 * Hoang-Nam Nguyen <hnguyen@de.ibm.com>
9 *
10 * Copyright (c) 2005 IBM Corporation
11 *
12 * All rights reserved.
13 *
14 * This source code is distributed under a dual license of GPL v2.0 and OpenIB
15 * BSD.
16 *
17 * OpenIB BSD License
18 *
19 * Redistribution and use in source and binary forms, with or without
20 * modification, are permitted provided that the following conditions are met:
21 *
22 * Redistributions of source code must retain the above copyright notice, this
23 * list of conditions and the following disclaimer.
24 *
25 * Redistributions in binary form must reproduce the above copyright notice,
26 * this list of conditions and the following disclaimer in the documentation
27 * and/or other materials
28 * provided with the distribution.
29 *
30 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38 * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40 * POSSIBILITY OF SUCH DAMAGE.
41 */
42
43 #include <rdma/ib_umem.h>
44
45 #include "ehca_iverbs.h"
46 #include "ehca_mrmw.h"
47 #include "hcp_if.h"
48 #include "hipz_hw.h"
49
50 #define NUM_CHUNKS(length, chunk_size) \
51 (((length) + (chunk_size - 1)) / (chunk_size))
52
53 /* max number of rpages (per hcall register_rpages) */
54 #define MAX_RPAGES 512
55
56 static struct kmem_cache *mr_cache;
57 static struct kmem_cache *mw_cache;
58
59 enum ehca_mr_pgsize {
60 EHCA_MR_PGSIZE4K = 0x1000L,
61 EHCA_MR_PGSIZE64K = 0x10000L,
62 EHCA_MR_PGSIZE1M = 0x100000L,
63 EHCA_MR_PGSIZE16M = 0x1000000L
64 };
65
66 #define EHCA_MR_PGSHIFT4K 12
67 #define EHCA_MR_PGSHIFT64K 16
68 #define EHCA_MR_PGSHIFT1M 20
69 #define EHCA_MR_PGSHIFT16M 24
70
71 static u32 ehca_encode_hwpage_size(u32 pgsize)
72 {
73 int log = ilog2(pgsize);
74 WARN_ON(log < 12 || log > 24 || log & 3);
75 return (log - 12) / 4;
76 }
77
78 static u64 ehca_get_max_hwpage_size(struct ehca_shca *shca)
79 {
80 return 1UL << ilog2(shca->hca_cap_mr_pgsize);
81 }
82
83 static struct ehca_mr *ehca_mr_new(void)
84 {
85 struct ehca_mr *me;
86
87 me = kmem_cache_zalloc(mr_cache, GFP_KERNEL);
88 if (me)
89 spin_lock_init(&me->mrlock);
90 else
91 ehca_gen_err("alloc failed");
92
93 return me;
94 }
95
96 static void ehca_mr_delete(struct ehca_mr *me)
97 {
98 kmem_cache_free(mr_cache, me);
99 }
100
101 static struct ehca_mw *ehca_mw_new(void)
102 {
103 struct ehca_mw *me;
104
105 me = kmem_cache_zalloc(mw_cache, GFP_KERNEL);
106 if (me)
107 spin_lock_init(&me->mwlock);
108 else
109 ehca_gen_err("alloc failed");
110
111 return me;
112 }
113
114 static void ehca_mw_delete(struct ehca_mw *me)
115 {
116 kmem_cache_free(mw_cache, me);
117 }
118
119 /*----------------------------------------------------------------------*/
120
121 struct ib_mr *ehca_get_dma_mr(struct ib_pd *pd, int mr_access_flags)
122 {
123 struct ib_mr *ib_mr;
124 int ret;
125 struct ehca_mr *e_maxmr;
126 struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
127 struct ehca_shca *shca =
128 container_of(pd->device, struct ehca_shca, ib_device);
129
130 if (shca->maxmr) {
131 e_maxmr = ehca_mr_new();
132 if (!e_maxmr) {
133 ehca_err(&shca->ib_device, "out of memory");
134 ib_mr = ERR_PTR(-ENOMEM);
135 goto get_dma_mr_exit0;
136 }
137
138 ret = ehca_reg_maxmr(shca, e_maxmr, (u64 *)KERNELBASE,
139 mr_access_flags, e_pd,
140 &e_maxmr->ib.ib_mr.lkey,
141 &e_maxmr->ib.ib_mr.rkey);
142 if (ret) {
143 ehca_mr_delete(e_maxmr);
144 ib_mr = ERR_PTR(ret);
145 goto get_dma_mr_exit0;
146 }
147 ib_mr = &e_maxmr->ib.ib_mr;
148 } else {
149 ehca_err(&shca->ib_device, "no internal max-MR exist!");
150 ib_mr = ERR_PTR(-EINVAL);
151 goto get_dma_mr_exit0;
152 }
153
154 get_dma_mr_exit0:
155 if (IS_ERR(ib_mr))
156 ehca_err(&shca->ib_device, "h_ret=%li pd=%p mr_access_flags=%x",
157 PTR_ERR(ib_mr), pd, mr_access_flags);
158 return ib_mr;
159 } /* end ehca_get_dma_mr() */
160
161 /*----------------------------------------------------------------------*/
162
163 struct ib_mr *ehca_reg_phys_mr(struct ib_pd *pd,
164 struct ib_phys_buf *phys_buf_array,
165 int num_phys_buf,
166 int mr_access_flags,
167 u64 *iova_start)
168 {
169 struct ib_mr *ib_mr;
170 int ret;
171 struct ehca_mr *e_mr;
172 struct ehca_shca *shca =
173 container_of(pd->device, struct ehca_shca, ib_device);
174 struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
175
176 u64 size;
177
178 if ((num_phys_buf <= 0) || !phys_buf_array) {
179 ehca_err(pd->device, "bad input values: num_phys_buf=%x "
180 "phys_buf_array=%p", num_phys_buf, phys_buf_array);
181 ib_mr = ERR_PTR(-EINVAL);
182 goto reg_phys_mr_exit0;
183 }
184 if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
185 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
186 ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
187 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
188 /*
189 * Remote Write Access requires Local Write Access
190 * Remote Atomic Access requires Local Write Access
191 */
192 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
193 mr_access_flags);
194 ib_mr = ERR_PTR(-EINVAL);
195 goto reg_phys_mr_exit0;
196 }
197
198 /* check physical buffer list and calculate size */
199 ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array, num_phys_buf,
200 iova_start, &size);
201 if (ret) {
202 ib_mr = ERR_PTR(ret);
203 goto reg_phys_mr_exit0;
204 }
205 if ((size == 0) ||
206 (((u64)iova_start + size) < (u64)iova_start)) {
207 ehca_err(pd->device, "bad input values: size=%lx iova_start=%p",
208 size, iova_start);
209 ib_mr = ERR_PTR(-EINVAL);
210 goto reg_phys_mr_exit0;
211 }
212
213 e_mr = ehca_mr_new();
214 if (!e_mr) {
215 ehca_err(pd->device, "out of memory");
216 ib_mr = ERR_PTR(-ENOMEM);
217 goto reg_phys_mr_exit0;
218 }
219
220 /* register MR on HCA */
221 if (ehca_mr_is_maxmr(size, iova_start)) {
222 e_mr->flags |= EHCA_MR_FLAG_MAXMR;
223 ret = ehca_reg_maxmr(shca, e_mr, iova_start, mr_access_flags,
224 e_pd, &e_mr->ib.ib_mr.lkey,
225 &e_mr->ib.ib_mr.rkey);
226 if (ret) {
227 ib_mr = ERR_PTR(ret);
228 goto reg_phys_mr_exit1;
229 }
230 } else {
231 struct ehca_mr_pginfo pginfo;
232 u32 num_kpages;
233 u32 num_hwpages;
234 u64 hw_pgsize;
235
236 num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size,
237 PAGE_SIZE);
238 /* for kernel space we try most possible pgsize */
239 hw_pgsize = ehca_get_max_hwpage_size(shca);
240 num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size,
241 hw_pgsize);
242 memset(&pginfo, 0, sizeof(pginfo));
243 pginfo.type = EHCA_MR_PGI_PHYS;
244 pginfo.num_kpages = num_kpages;
245 pginfo.hwpage_size = hw_pgsize;
246 pginfo.num_hwpages = num_hwpages;
247 pginfo.u.phy.num_phys_buf = num_phys_buf;
248 pginfo.u.phy.phys_buf_array = phys_buf_array;
249 pginfo.next_hwpage =
250 ((u64)iova_start & ~PAGE_MASK) / hw_pgsize;
251
252 ret = ehca_reg_mr(shca, e_mr, iova_start, size, mr_access_flags,
253 e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
254 &e_mr->ib.ib_mr.rkey);
255 if (ret) {
256 ib_mr = ERR_PTR(ret);
257 goto reg_phys_mr_exit1;
258 }
259 }
260
261 /* successful registration of all pages */
262 return &e_mr->ib.ib_mr;
263
264 reg_phys_mr_exit1:
265 ehca_mr_delete(e_mr);
266 reg_phys_mr_exit0:
267 if (IS_ERR(ib_mr))
268 ehca_err(pd->device, "h_ret=%li pd=%p phys_buf_array=%p "
269 "num_phys_buf=%x mr_access_flags=%x iova_start=%p",
270 PTR_ERR(ib_mr), pd, phys_buf_array,
271 num_phys_buf, mr_access_flags, iova_start);
272 return ib_mr;
273 } /* end ehca_reg_phys_mr() */
274
275 /*----------------------------------------------------------------------*/
276
277 struct ib_mr *ehca_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
278 u64 virt, int mr_access_flags,
279 struct ib_udata *udata)
280 {
281 struct ib_mr *ib_mr;
282 struct ehca_mr *e_mr;
283 struct ehca_shca *shca =
284 container_of(pd->device, struct ehca_shca, ib_device);
285 struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
286 struct ehca_mr_pginfo pginfo;
287 int ret, page_shift;
288 u32 num_kpages;
289 u32 num_hwpages;
290 u64 hwpage_size;
291
292 if (!pd) {
293 ehca_gen_err("bad pd=%p", pd);
294 return ERR_PTR(-EFAULT);
295 }
296
297 if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
298 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
299 ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
300 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
301 /*
302 * Remote Write Access requires Local Write Access
303 * Remote Atomic Access requires Local Write Access
304 */
305 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
306 mr_access_flags);
307 ib_mr = ERR_PTR(-EINVAL);
308 goto reg_user_mr_exit0;
309 }
310
311 if (length == 0 || virt + length < virt) {
312 ehca_err(pd->device, "bad input values: length=%lx "
313 "virt_base=%lx", length, virt);
314 ib_mr = ERR_PTR(-EINVAL);
315 goto reg_user_mr_exit0;
316 }
317
318 e_mr = ehca_mr_new();
319 if (!e_mr) {
320 ehca_err(pd->device, "out of memory");
321 ib_mr = ERR_PTR(-ENOMEM);
322 goto reg_user_mr_exit0;
323 }
324
325 e_mr->umem = ib_umem_get(pd->uobject->context, start, length,
326 mr_access_flags);
327 if (IS_ERR(e_mr->umem)) {
328 ib_mr = (void *)e_mr->umem;
329 goto reg_user_mr_exit1;
330 }
331
332 if (e_mr->umem->page_size != PAGE_SIZE) {
333 ehca_err(pd->device, "page size not supported, "
334 "e_mr->umem->page_size=%x", e_mr->umem->page_size);
335 ib_mr = ERR_PTR(-EINVAL);
336 goto reg_user_mr_exit2;
337 }
338
339 /* determine number of MR pages */
340 num_kpages = NUM_CHUNKS((virt % PAGE_SIZE) + length, PAGE_SIZE);
341 /* select proper hw_pgsize */
342 page_shift = PAGE_SHIFT;
343 if (e_mr->umem->hugetlb) {
344 /* determine page_shift, clamp between 4K and 16M */
345 page_shift = (fls64(length - 1) + 3) & ~3;
346 page_shift = min(max(page_shift, EHCA_MR_PGSHIFT4K),
347 EHCA_MR_PGSHIFT16M);
348 }
349 hwpage_size = 1UL << page_shift;
350
351 /* now that we have the desired page size, shift until it's
352 * supported, too. 4K is always supported, so this terminates.
353 */
354 while (!(hwpage_size & shca->hca_cap_mr_pgsize))
355 hwpage_size >>= 4;
356
357 reg_user_mr_fallback:
358 num_hwpages = NUM_CHUNKS((virt % hwpage_size) + length, hwpage_size);
359 /* register MR on HCA */
360 memset(&pginfo, 0, sizeof(pginfo));
361 pginfo.type = EHCA_MR_PGI_USER;
362 pginfo.hwpage_size = hwpage_size;
363 pginfo.num_kpages = num_kpages;
364 pginfo.num_hwpages = num_hwpages;
365 pginfo.u.usr.region = e_mr->umem;
366 pginfo.next_hwpage = e_mr->umem->offset / hwpage_size;
367 pginfo.u.usr.next_chunk = list_prepare_entry(pginfo.u.usr.next_chunk,
368 (&e_mr->umem->chunk_list),
369 list);
370
371 ret = ehca_reg_mr(shca, e_mr, (u64 *)virt, length, mr_access_flags,
372 e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
373 &e_mr->ib.ib_mr.rkey);
374 if (ret == -EINVAL && pginfo.hwpage_size > PAGE_SIZE) {
375 ehca_warn(pd->device, "failed to register mr "
376 "with hwpage_size=%lx", hwpage_size);
377 ehca_info(pd->device, "try to register mr with "
378 "kpage_size=%lx", PAGE_SIZE);
379 /*
380 * this means kpages are not contiguous for a hw page
381 * try kernel page size as fallback solution
382 */
383 hwpage_size = PAGE_SIZE;
384 goto reg_user_mr_fallback;
385 }
386 if (ret) {
387 ib_mr = ERR_PTR(ret);
388 goto reg_user_mr_exit2;
389 }
390
391 /* successful registration of all pages */
392 return &e_mr->ib.ib_mr;
393
394 reg_user_mr_exit2:
395 ib_umem_release(e_mr->umem);
396 reg_user_mr_exit1:
397 ehca_mr_delete(e_mr);
398 reg_user_mr_exit0:
399 if (IS_ERR(ib_mr))
400 ehca_err(pd->device, "rc=%li pd=%p mr_access_flags=%x udata=%p",
401 PTR_ERR(ib_mr), pd, mr_access_flags, udata);
402 return ib_mr;
403 } /* end ehca_reg_user_mr() */
404
405 /*----------------------------------------------------------------------*/
406
407 int ehca_rereg_phys_mr(struct ib_mr *mr,
408 int mr_rereg_mask,
409 struct ib_pd *pd,
410 struct ib_phys_buf *phys_buf_array,
411 int num_phys_buf,
412 int mr_access_flags,
413 u64 *iova_start)
414 {
415 int ret;
416
417 struct ehca_shca *shca =
418 container_of(mr->device, struct ehca_shca, ib_device);
419 struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
420 u64 new_size;
421 u64 *new_start;
422 u32 new_acl;
423 struct ehca_pd *new_pd;
424 u32 tmp_lkey, tmp_rkey;
425 unsigned long sl_flags;
426 u32 num_kpages = 0;
427 u32 num_hwpages = 0;
428 struct ehca_mr_pginfo pginfo;
429
430 if (!(mr_rereg_mask & IB_MR_REREG_TRANS)) {
431 /* TODO not supported, because PHYP rereg hCall needs pages */
432 ehca_err(mr->device, "rereg without IB_MR_REREG_TRANS not "
433 "supported yet, mr_rereg_mask=%x", mr_rereg_mask);
434 ret = -EINVAL;
435 goto rereg_phys_mr_exit0;
436 }
437
438 if (mr_rereg_mask & IB_MR_REREG_PD) {
439 if (!pd) {
440 ehca_err(mr->device, "rereg with bad pd, pd=%p "
441 "mr_rereg_mask=%x", pd, mr_rereg_mask);
442 ret = -EINVAL;
443 goto rereg_phys_mr_exit0;
444 }
445 }
446
447 if ((mr_rereg_mask &
448 ~(IB_MR_REREG_TRANS | IB_MR_REREG_PD | IB_MR_REREG_ACCESS)) ||
449 (mr_rereg_mask == 0)) {
450 ret = -EINVAL;
451 goto rereg_phys_mr_exit0;
452 }
453
454 /* check other parameters */
455 if (e_mr == shca->maxmr) {
456 /* should be impossible, however reject to be sure */
457 ehca_err(mr->device, "rereg internal max-MR impossible, mr=%p "
458 "shca->maxmr=%p mr->lkey=%x",
459 mr, shca->maxmr, mr->lkey);
460 ret = -EINVAL;
461 goto rereg_phys_mr_exit0;
462 }
463 if (mr_rereg_mask & IB_MR_REREG_TRANS) { /* transl., i.e. addr/size */
464 if (e_mr->flags & EHCA_MR_FLAG_FMR) {
465 ehca_err(mr->device, "not supported for FMR, mr=%p "
466 "flags=%x", mr, e_mr->flags);
467 ret = -EINVAL;
468 goto rereg_phys_mr_exit0;
469 }
470 if (!phys_buf_array || num_phys_buf <= 0) {
471 ehca_err(mr->device, "bad input values mr_rereg_mask=%x"
472 " phys_buf_array=%p num_phys_buf=%x",
473 mr_rereg_mask, phys_buf_array, num_phys_buf);
474 ret = -EINVAL;
475 goto rereg_phys_mr_exit0;
476 }
477 }
478 if ((mr_rereg_mask & IB_MR_REREG_ACCESS) && /* change ACL */
479 (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
480 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
481 ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
482 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)))) {
483 /*
484 * Remote Write Access requires Local Write Access
485 * Remote Atomic Access requires Local Write Access
486 */
487 ehca_err(mr->device, "bad input values: mr_rereg_mask=%x "
488 "mr_access_flags=%x", mr_rereg_mask, mr_access_flags);
489 ret = -EINVAL;
490 goto rereg_phys_mr_exit0;
491 }
492
493 /* set requested values dependent on rereg request */
494 spin_lock_irqsave(&e_mr->mrlock, sl_flags);
495 new_start = e_mr->start;
496 new_size = e_mr->size;
497 new_acl = e_mr->acl;
498 new_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
499
500 if (mr_rereg_mask & IB_MR_REREG_TRANS) {
501 u64 hw_pgsize = ehca_get_max_hwpage_size(shca);
502
503 new_start = iova_start; /* change address */
504 /* check physical buffer list and calculate size */
505 ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array,
506 num_phys_buf, iova_start,
507 &new_size);
508 if (ret)
509 goto rereg_phys_mr_exit1;
510 if ((new_size == 0) ||
511 (((u64)iova_start + new_size) < (u64)iova_start)) {
512 ehca_err(mr->device, "bad input values: new_size=%lx "
513 "iova_start=%p", new_size, iova_start);
514 ret = -EINVAL;
515 goto rereg_phys_mr_exit1;
516 }
517 num_kpages = NUM_CHUNKS(((u64)new_start % PAGE_SIZE) +
518 new_size, PAGE_SIZE);
519 num_hwpages = NUM_CHUNKS(((u64)new_start % hw_pgsize) +
520 new_size, hw_pgsize);
521 memset(&pginfo, 0, sizeof(pginfo));
522 pginfo.type = EHCA_MR_PGI_PHYS;
523 pginfo.num_kpages = num_kpages;
524 pginfo.hwpage_size = hw_pgsize;
525 pginfo.num_hwpages = num_hwpages;
526 pginfo.u.phy.num_phys_buf = num_phys_buf;
527 pginfo.u.phy.phys_buf_array = phys_buf_array;
528 pginfo.next_hwpage =
529 ((u64)iova_start & ~PAGE_MASK) / hw_pgsize;
530 }
531 if (mr_rereg_mask & IB_MR_REREG_ACCESS)
532 new_acl = mr_access_flags;
533 if (mr_rereg_mask & IB_MR_REREG_PD)
534 new_pd = container_of(pd, struct ehca_pd, ib_pd);
535
536 ret = ehca_rereg_mr(shca, e_mr, new_start, new_size, new_acl,
537 new_pd, &pginfo, &tmp_lkey, &tmp_rkey);
538 if (ret)
539 goto rereg_phys_mr_exit1;
540
541 /* successful reregistration */
542 if (mr_rereg_mask & IB_MR_REREG_PD)
543 mr->pd = pd;
544 mr->lkey = tmp_lkey;
545 mr->rkey = tmp_rkey;
546
547 rereg_phys_mr_exit1:
548 spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
549 rereg_phys_mr_exit0:
550 if (ret)
551 ehca_err(mr->device, "ret=%i mr=%p mr_rereg_mask=%x pd=%p "
552 "phys_buf_array=%p num_phys_buf=%x mr_access_flags=%x "
553 "iova_start=%p",
554 ret, mr, mr_rereg_mask, pd, phys_buf_array,
555 num_phys_buf, mr_access_flags, iova_start);
556 return ret;
557 } /* end ehca_rereg_phys_mr() */
558
559 /*----------------------------------------------------------------------*/
560
561 int ehca_query_mr(struct ib_mr *mr, struct ib_mr_attr *mr_attr)
562 {
563 int ret = 0;
564 u64 h_ret;
565 struct ehca_shca *shca =
566 container_of(mr->device, struct ehca_shca, ib_device);
567 struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
568 unsigned long sl_flags;
569 struct ehca_mr_hipzout_parms hipzout;
570
571 if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
572 ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
573 "e_mr->flags=%x", mr, e_mr, e_mr->flags);
574 ret = -EINVAL;
575 goto query_mr_exit0;
576 }
577
578 memset(mr_attr, 0, sizeof(struct ib_mr_attr));
579 spin_lock_irqsave(&e_mr->mrlock, sl_flags);
580
581 h_ret = hipz_h_query_mr(shca->ipz_hca_handle, e_mr, &hipzout);
582 if (h_ret != H_SUCCESS) {
583 ehca_err(mr->device, "hipz_mr_query failed, h_ret=%li mr=%p "
584 "hca_hndl=%lx mr_hndl=%lx lkey=%x",
585 h_ret, mr, shca->ipz_hca_handle.handle,
586 e_mr->ipz_mr_handle.handle, mr->lkey);
587 ret = ehca2ib_return_code(h_ret);
588 goto query_mr_exit1;
589 }
590 mr_attr->pd = mr->pd;
591 mr_attr->device_virt_addr = hipzout.vaddr;
592 mr_attr->size = hipzout.len;
593 mr_attr->lkey = hipzout.lkey;
594 mr_attr->rkey = hipzout.rkey;
595 ehca_mrmw_reverse_map_acl(&hipzout.acl, &mr_attr->mr_access_flags);
596
597 query_mr_exit1:
598 spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
599 query_mr_exit0:
600 if (ret)
601 ehca_err(mr->device, "ret=%i mr=%p mr_attr=%p",
602 ret, mr, mr_attr);
603 return ret;
604 } /* end ehca_query_mr() */
605
606 /*----------------------------------------------------------------------*/
607
608 int ehca_dereg_mr(struct ib_mr *mr)
609 {
610 int ret = 0;
611 u64 h_ret;
612 struct ehca_shca *shca =
613 container_of(mr->device, struct ehca_shca, ib_device);
614 struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
615
616 if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
617 ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
618 "e_mr->flags=%x", mr, e_mr, e_mr->flags);
619 ret = -EINVAL;
620 goto dereg_mr_exit0;
621 } else if (e_mr == shca->maxmr) {
622 /* should be impossible, however reject to be sure */
623 ehca_err(mr->device, "dereg internal max-MR impossible, mr=%p "
624 "shca->maxmr=%p mr->lkey=%x",
625 mr, shca->maxmr, mr->lkey);
626 ret = -EINVAL;
627 goto dereg_mr_exit0;
628 }
629
630 /* TODO: BUSY: MR still has bound window(s) */
631 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
632 if (h_ret != H_SUCCESS) {
633 ehca_err(mr->device, "hipz_free_mr failed, h_ret=%li shca=%p "
634 "e_mr=%p hca_hndl=%lx mr_hndl=%lx mr->lkey=%x",
635 h_ret, shca, e_mr, shca->ipz_hca_handle.handle,
636 e_mr->ipz_mr_handle.handle, mr->lkey);
637 ret = ehca2ib_return_code(h_ret);
638 goto dereg_mr_exit0;
639 }
640
641 if (e_mr->umem)
642 ib_umem_release(e_mr->umem);
643
644 /* successful deregistration */
645 ehca_mr_delete(e_mr);
646
647 dereg_mr_exit0:
648 if (ret)
649 ehca_err(mr->device, "ret=%i mr=%p", ret, mr);
650 return ret;
651 } /* end ehca_dereg_mr() */
652
653 /*----------------------------------------------------------------------*/
654
655 struct ib_mw *ehca_alloc_mw(struct ib_pd *pd)
656 {
657 struct ib_mw *ib_mw;
658 u64 h_ret;
659 struct ehca_mw *e_mw;
660 struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
661 struct ehca_shca *shca =
662 container_of(pd->device, struct ehca_shca, ib_device);
663 struct ehca_mw_hipzout_parms hipzout;
664
665 e_mw = ehca_mw_new();
666 if (!e_mw) {
667 ib_mw = ERR_PTR(-ENOMEM);
668 goto alloc_mw_exit0;
669 }
670
671 h_ret = hipz_h_alloc_resource_mw(shca->ipz_hca_handle, e_mw,
672 e_pd->fw_pd, &hipzout);
673 if (h_ret != H_SUCCESS) {
674 ehca_err(pd->device, "hipz_mw_allocate failed, h_ret=%li "
675 "shca=%p hca_hndl=%lx mw=%p",
676 h_ret, shca, shca->ipz_hca_handle.handle, e_mw);
677 ib_mw = ERR_PTR(ehca2ib_return_code(h_ret));
678 goto alloc_mw_exit1;
679 }
680 /* successful MW allocation */
681 e_mw->ipz_mw_handle = hipzout.handle;
682 e_mw->ib_mw.rkey = hipzout.rkey;
683 return &e_mw->ib_mw;
684
685 alloc_mw_exit1:
686 ehca_mw_delete(e_mw);
687 alloc_mw_exit0:
688 if (IS_ERR(ib_mw))
689 ehca_err(pd->device, "h_ret=%li pd=%p", PTR_ERR(ib_mw), pd);
690 return ib_mw;
691 } /* end ehca_alloc_mw() */
692
693 /*----------------------------------------------------------------------*/
694
695 int ehca_bind_mw(struct ib_qp *qp,
696 struct ib_mw *mw,
697 struct ib_mw_bind *mw_bind)
698 {
699 /* TODO: not supported up to now */
700 ehca_gen_err("bind MW currently not supported by HCAD");
701
702 return -EPERM;
703 } /* end ehca_bind_mw() */
704
705 /*----------------------------------------------------------------------*/
706
707 int ehca_dealloc_mw(struct ib_mw *mw)
708 {
709 u64 h_ret;
710 struct ehca_shca *shca =
711 container_of(mw->device, struct ehca_shca, ib_device);
712 struct ehca_mw *e_mw = container_of(mw, struct ehca_mw, ib_mw);
713
714 h_ret = hipz_h_free_resource_mw(shca->ipz_hca_handle, e_mw);
715 if (h_ret != H_SUCCESS) {
716 ehca_err(mw->device, "hipz_free_mw failed, h_ret=%li shca=%p "
717 "mw=%p rkey=%x hca_hndl=%lx mw_hndl=%lx",
718 h_ret, shca, mw, mw->rkey, shca->ipz_hca_handle.handle,
719 e_mw->ipz_mw_handle.handle);
720 return ehca2ib_return_code(h_ret);
721 }
722 /* successful deallocation */
723 ehca_mw_delete(e_mw);
724 return 0;
725 } /* end ehca_dealloc_mw() */
726
727 /*----------------------------------------------------------------------*/
728
729 struct ib_fmr *ehca_alloc_fmr(struct ib_pd *pd,
730 int mr_access_flags,
731 struct ib_fmr_attr *fmr_attr)
732 {
733 struct ib_fmr *ib_fmr;
734 struct ehca_shca *shca =
735 container_of(pd->device, struct ehca_shca, ib_device);
736 struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
737 struct ehca_mr *e_fmr;
738 int ret;
739 u32 tmp_lkey, tmp_rkey;
740 struct ehca_mr_pginfo pginfo;
741 u64 hw_pgsize;
742
743 /* check other parameters */
744 if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
745 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
746 ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
747 !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
748 /*
749 * Remote Write Access requires Local Write Access
750 * Remote Atomic Access requires Local Write Access
751 */
752 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
753 mr_access_flags);
754 ib_fmr = ERR_PTR(-EINVAL);
755 goto alloc_fmr_exit0;
756 }
757 if (mr_access_flags & IB_ACCESS_MW_BIND) {
758 ehca_err(pd->device, "bad input values: mr_access_flags=%x",
759 mr_access_flags);
760 ib_fmr = ERR_PTR(-EINVAL);
761 goto alloc_fmr_exit0;
762 }
763 if ((fmr_attr->max_pages == 0) || (fmr_attr->max_maps == 0)) {
764 ehca_err(pd->device, "bad input values: fmr_attr->max_pages=%x "
765 "fmr_attr->max_maps=%x fmr_attr->page_shift=%x",
766 fmr_attr->max_pages, fmr_attr->max_maps,
767 fmr_attr->page_shift);
768 ib_fmr = ERR_PTR(-EINVAL);
769 goto alloc_fmr_exit0;
770 }
771
772 hw_pgsize = 1 << fmr_attr->page_shift;
773 if (!(hw_pgsize & shca->hca_cap_mr_pgsize)) {
774 ehca_err(pd->device, "unsupported fmr_attr->page_shift=%x",
775 fmr_attr->page_shift);
776 ib_fmr = ERR_PTR(-EINVAL);
777 goto alloc_fmr_exit0;
778 }
779
780 e_fmr = ehca_mr_new();
781 if (!e_fmr) {
782 ib_fmr = ERR_PTR(-ENOMEM);
783 goto alloc_fmr_exit0;
784 }
785 e_fmr->flags |= EHCA_MR_FLAG_FMR;
786
787 /* register MR on HCA */
788 memset(&pginfo, 0, sizeof(pginfo));
789 pginfo.hwpage_size = hw_pgsize;
790 /*
791 * pginfo.num_hwpages==0, ie register_rpages() will not be called
792 * but deferred to map_phys_fmr()
793 */
794 ret = ehca_reg_mr(shca, e_fmr, NULL,
795 fmr_attr->max_pages * (1 << fmr_attr->page_shift),
796 mr_access_flags, e_pd, &pginfo,
797 &tmp_lkey, &tmp_rkey);
798 if (ret) {
799 ib_fmr = ERR_PTR(ret);
800 goto alloc_fmr_exit1;
801 }
802
803 /* successful */
804 e_fmr->hwpage_size = hw_pgsize;
805 e_fmr->fmr_page_size = 1 << fmr_attr->page_shift;
806 e_fmr->fmr_max_pages = fmr_attr->max_pages;
807 e_fmr->fmr_max_maps = fmr_attr->max_maps;
808 e_fmr->fmr_map_cnt = 0;
809 return &e_fmr->ib.ib_fmr;
810
811 alloc_fmr_exit1:
812 ehca_mr_delete(e_fmr);
813 alloc_fmr_exit0:
814 return ib_fmr;
815 } /* end ehca_alloc_fmr() */
816
817 /*----------------------------------------------------------------------*/
818
819 int ehca_map_phys_fmr(struct ib_fmr *fmr,
820 u64 *page_list,
821 int list_len,
822 u64 iova)
823 {
824 int ret;
825 struct ehca_shca *shca =
826 container_of(fmr->device, struct ehca_shca, ib_device);
827 struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
828 struct ehca_pd *e_pd = container_of(fmr->pd, struct ehca_pd, ib_pd);
829 struct ehca_mr_pginfo pginfo;
830 u32 tmp_lkey, tmp_rkey;
831
832 if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
833 ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
834 e_fmr, e_fmr->flags);
835 ret = -EINVAL;
836 goto map_phys_fmr_exit0;
837 }
838 ret = ehca_fmr_check_page_list(e_fmr, page_list, list_len);
839 if (ret)
840 goto map_phys_fmr_exit0;
841 if (iova % e_fmr->fmr_page_size) {
842 /* only whole-numbered pages */
843 ehca_err(fmr->device, "bad iova, iova=%lx fmr_page_size=%x",
844 iova, e_fmr->fmr_page_size);
845 ret = -EINVAL;
846 goto map_phys_fmr_exit0;
847 }
848 if (e_fmr->fmr_map_cnt >= e_fmr->fmr_max_maps) {
849 /* HCAD does not limit the maps, however trace this anyway */
850 ehca_info(fmr->device, "map limit exceeded, fmr=%p "
851 "e_fmr->fmr_map_cnt=%x e_fmr->fmr_max_maps=%x",
852 fmr, e_fmr->fmr_map_cnt, e_fmr->fmr_max_maps);
853 }
854
855 memset(&pginfo, 0, sizeof(pginfo));
856 pginfo.type = EHCA_MR_PGI_FMR;
857 pginfo.num_kpages = list_len;
858 pginfo.hwpage_size = e_fmr->hwpage_size;
859 pginfo.num_hwpages =
860 list_len * e_fmr->fmr_page_size / pginfo.hwpage_size;
861 pginfo.u.fmr.page_list = page_list;
862 pginfo.next_hwpage =
863 (iova & (e_fmr->fmr_page_size-1)) / pginfo.hwpage_size;
864 pginfo.u.fmr.fmr_pgsize = e_fmr->fmr_page_size;
865
866 ret = ehca_rereg_mr(shca, e_fmr, (u64 *)iova,
867 list_len * e_fmr->fmr_page_size,
868 e_fmr->acl, e_pd, &pginfo, &tmp_lkey, &tmp_rkey);
869 if (ret)
870 goto map_phys_fmr_exit0;
871
872 /* successful reregistration */
873 e_fmr->fmr_map_cnt++;
874 e_fmr->ib.ib_fmr.lkey = tmp_lkey;
875 e_fmr->ib.ib_fmr.rkey = tmp_rkey;
876 return 0;
877
878 map_phys_fmr_exit0:
879 if (ret)
880 ehca_err(fmr->device, "ret=%i fmr=%p page_list=%p list_len=%x "
881 "iova=%lx", ret, fmr, page_list, list_len, iova);
882 return ret;
883 } /* end ehca_map_phys_fmr() */
884
885 /*----------------------------------------------------------------------*/
886
887 int ehca_unmap_fmr(struct list_head *fmr_list)
888 {
889 int ret = 0;
890 struct ib_fmr *ib_fmr;
891 struct ehca_shca *shca = NULL;
892 struct ehca_shca *prev_shca;
893 struct ehca_mr *e_fmr;
894 u32 num_fmr = 0;
895 u32 unmap_fmr_cnt = 0;
896
897 /* check all FMR belong to same SHCA, and check internal flag */
898 list_for_each_entry(ib_fmr, fmr_list, list) {
899 prev_shca = shca;
900 if (!ib_fmr) {
901 ehca_gen_err("bad fmr=%p in list", ib_fmr);
902 ret = -EINVAL;
903 goto unmap_fmr_exit0;
904 }
905 shca = container_of(ib_fmr->device, struct ehca_shca,
906 ib_device);
907 e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
908 if ((shca != prev_shca) && prev_shca) {
909 ehca_err(&shca->ib_device, "SHCA mismatch, shca=%p "
910 "prev_shca=%p e_fmr=%p",
911 shca, prev_shca, e_fmr);
912 ret = -EINVAL;
913 goto unmap_fmr_exit0;
914 }
915 if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
916 ehca_err(&shca->ib_device, "not a FMR, e_fmr=%p "
917 "e_fmr->flags=%x", e_fmr, e_fmr->flags);
918 ret = -EINVAL;
919 goto unmap_fmr_exit0;
920 }
921 num_fmr++;
922 }
923
924 /* loop over all FMRs to unmap */
925 list_for_each_entry(ib_fmr, fmr_list, list) {
926 unmap_fmr_cnt++;
927 e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
928 shca = container_of(ib_fmr->device, struct ehca_shca,
929 ib_device);
930 ret = ehca_unmap_one_fmr(shca, e_fmr);
931 if (ret) {
932 /* unmap failed, stop unmapping of rest of FMRs */
933 ehca_err(&shca->ib_device, "unmap of one FMR failed, "
934 "stop rest, e_fmr=%p num_fmr=%x "
935 "unmap_fmr_cnt=%x lkey=%x", e_fmr, num_fmr,
936 unmap_fmr_cnt, e_fmr->ib.ib_fmr.lkey);
937 goto unmap_fmr_exit0;
938 }
939 }
940
941 unmap_fmr_exit0:
942 if (ret)
943 ehca_gen_err("ret=%i fmr_list=%p num_fmr=%x unmap_fmr_cnt=%x",
944 ret, fmr_list, num_fmr, unmap_fmr_cnt);
945 return ret;
946 } /* end ehca_unmap_fmr() */
947
948 /*----------------------------------------------------------------------*/
949
950 int ehca_dealloc_fmr(struct ib_fmr *fmr)
951 {
952 int ret;
953 u64 h_ret;
954 struct ehca_shca *shca =
955 container_of(fmr->device, struct ehca_shca, ib_device);
956 struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
957
958 if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
959 ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
960 e_fmr, e_fmr->flags);
961 ret = -EINVAL;
962 goto free_fmr_exit0;
963 }
964
965 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
966 if (h_ret != H_SUCCESS) {
967 ehca_err(fmr->device, "hipz_free_mr failed, h_ret=%li e_fmr=%p "
968 "hca_hndl=%lx fmr_hndl=%lx fmr->lkey=%x",
969 h_ret, e_fmr, shca->ipz_hca_handle.handle,
970 e_fmr->ipz_mr_handle.handle, fmr->lkey);
971 ret = ehca2ib_return_code(h_ret);
972 goto free_fmr_exit0;
973 }
974 /* successful deregistration */
975 ehca_mr_delete(e_fmr);
976 return 0;
977
978 free_fmr_exit0:
979 if (ret)
980 ehca_err(&shca->ib_device, "ret=%i fmr=%p", ret, fmr);
981 return ret;
982 } /* end ehca_dealloc_fmr() */
983
984 /*----------------------------------------------------------------------*/
985
986 int ehca_reg_mr(struct ehca_shca *shca,
987 struct ehca_mr *e_mr,
988 u64 *iova_start,
989 u64 size,
990 int acl,
991 struct ehca_pd *e_pd,
992 struct ehca_mr_pginfo *pginfo,
993 u32 *lkey, /*OUT*/
994 u32 *rkey) /*OUT*/
995 {
996 int ret;
997 u64 h_ret;
998 u32 hipz_acl;
999 struct ehca_mr_hipzout_parms hipzout;
1000
1001 ehca_mrmw_map_acl(acl, &hipz_acl);
1002 ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
1003 if (ehca_use_hp_mr == 1)
1004 hipz_acl |= 0x00000001;
1005
1006 h_ret = hipz_h_alloc_resource_mr(shca->ipz_hca_handle, e_mr,
1007 (u64)iova_start, size, hipz_acl,
1008 e_pd->fw_pd, &hipzout);
1009 if (h_ret != H_SUCCESS) {
1010 ehca_err(&shca->ib_device, "hipz_alloc_mr failed, h_ret=%li "
1011 "hca_hndl=%lx", h_ret, shca->ipz_hca_handle.handle);
1012 ret = ehca2ib_return_code(h_ret);
1013 goto ehca_reg_mr_exit0;
1014 }
1015
1016 e_mr->ipz_mr_handle = hipzout.handle;
1017
1018 ret = ehca_reg_mr_rpages(shca, e_mr, pginfo);
1019 if (ret)
1020 goto ehca_reg_mr_exit1;
1021
1022 /* successful registration */
1023 e_mr->num_kpages = pginfo->num_kpages;
1024 e_mr->num_hwpages = pginfo->num_hwpages;
1025 e_mr->hwpage_size = pginfo->hwpage_size;
1026 e_mr->start = iova_start;
1027 e_mr->size = size;
1028 e_mr->acl = acl;
1029 *lkey = hipzout.lkey;
1030 *rkey = hipzout.rkey;
1031 return 0;
1032
1033 ehca_reg_mr_exit1:
1034 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
1035 if (h_ret != H_SUCCESS) {
1036 ehca_err(&shca->ib_device, "h_ret=%li shca=%p e_mr=%p "
1037 "iova_start=%p size=%lx acl=%x e_pd=%p lkey=%x "
1038 "pginfo=%p num_kpages=%lx num_hwpages=%lx ret=%i",
1039 h_ret, shca, e_mr, iova_start, size, acl, e_pd,
1040 hipzout.lkey, pginfo, pginfo->num_kpages,
1041 pginfo->num_hwpages, ret);
1042 ehca_err(&shca->ib_device, "internal error in ehca_reg_mr, "
1043 "not recoverable");
1044 }
1045 ehca_reg_mr_exit0:
1046 if (ret)
1047 ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "
1048 "iova_start=%p size=%lx acl=%x e_pd=%p pginfo=%p "
1049 "num_kpages=%lx num_hwpages=%lx",
1050 ret, shca, e_mr, iova_start, size, acl, e_pd, pginfo,
1051 pginfo->num_kpages, pginfo->num_hwpages);
1052 return ret;
1053 } /* end ehca_reg_mr() */
1054
1055 /*----------------------------------------------------------------------*/
1056
1057 int ehca_reg_mr_rpages(struct ehca_shca *shca,
1058 struct ehca_mr *e_mr,
1059 struct ehca_mr_pginfo *pginfo)
1060 {
1061 int ret = 0;
1062 u64 h_ret;
1063 u32 rnum;
1064 u64 rpage;
1065 u32 i;
1066 u64 *kpage;
1067
1068 if (!pginfo->num_hwpages) /* in case of fmr */
1069 return 0;
1070
1071 kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
1072 if (!kpage) {
1073 ehca_err(&shca->ib_device, "kpage alloc failed");
1074 ret = -ENOMEM;
1075 goto ehca_reg_mr_rpages_exit0;
1076 }
1077
1078 /* max MAX_RPAGES ehca mr pages per register call */
1079 for (i = 0; i < NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES); i++) {
1080
1081 if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
1082 rnum = pginfo->num_hwpages % MAX_RPAGES; /* last shot */
1083 if (rnum == 0)
1084 rnum = MAX_RPAGES; /* last shot is full */
1085 } else
1086 rnum = MAX_RPAGES;
1087
1088 ret = ehca_set_pagebuf(pginfo, rnum, kpage);
1089 if (ret) {
1090 ehca_err(&shca->ib_device, "ehca_set_pagebuf "
1091 "bad rc, ret=%i rnum=%x kpage=%p",
1092 ret, rnum, kpage);
1093 goto ehca_reg_mr_rpages_exit1;
1094 }
1095
1096 if (rnum > 1) {
1097 rpage = virt_to_abs(kpage);
1098 if (!rpage) {
1099 ehca_err(&shca->ib_device, "kpage=%p i=%x",
1100 kpage, i);
1101 ret = -EFAULT;
1102 goto ehca_reg_mr_rpages_exit1;
1103 }
1104 } else
1105 rpage = *kpage;
1106
1107 h_ret = hipz_h_register_rpage_mr(
1108 shca->ipz_hca_handle, e_mr,
1109 ehca_encode_hwpage_size(pginfo->hwpage_size),
1110 0, rpage, rnum);
1111
1112 if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
1113 /*
1114 * check for 'registration complete'==H_SUCCESS
1115 * and for 'page registered'==H_PAGE_REGISTERED
1116 */
1117 if (h_ret != H_SUCCESS) {
1118 ehca_err(&shca->ib_device, "last "
1119 "hipz_reg_rpage_mr failed, h_ret=%li "
1120 "e_mr=%p i=%x hca_hndl=%lx mr_hndl=%lx"
1121 " lkey=%x", h_ret, e_mr, i,
1122 shca->ipz_hca_handle.handle,
1123 e_mr->ipz_mr_handle.handle,
1124 e_mr->ib.ib_mr.lkey);
1125 ret = ehca2ib_return_code(h_ret);
1126 break;
1127 } else
1128 ret = 0;
1129 } else if (h_ret != H_PAGE_REGISTERED) {
1130 ehca_err(&shca->ib_device, "hipz_reg_rpage_mr failed, "
1131 "h_ret=%li e_mr=%p i=%x lkey=%x hca_hndl=%lx "
1132 "mr_hndl=%lx", h_ret, e_mr, i,
1133 e_mr->ib.ib_mr.lkey,
1134 shca->ipz_hca_handle.handle,
1135 e_mr->ipz_mr_handle.handle);
1136 ret = ehca2ib_return_code(h_ret);
1137 break;
1138 } else
1139 ret = 0;
1140 } /* end for(i) */
1141
1142
1143 ehca_reg_mr_rpages_exit1:
1144 ehca_free_fw_ctrlblock(kpage);
1145 ehca_reg_mr_rpages_exit0:
1146 if (ret)
1147 ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p pginfo=%p "
1148 "num_kpages=%lx num_hwpages=%lx", ret, shca, e_mr,
1149 pginfo, pginfo->num_kpages, pginfo->num_hwpages);
1150 return ret;
1151 } /* end ehca_reg_mr_rpages() */
1152
1153 /*----------------------------------------------------------------------*/
1154
1155 inline int ehca_rereg_mr_rereg1(struct ehca_shca *shca,
1156 struct ehca_mr *e_mr,
1157 u64 *iova_start,
1158 u64 size,
1159 u32 acl,
1160 struct ehca_pd *e_pd,
1161 struct ehca_mr_pginfo *pginfo,
1162 u32 *lkey, /*OUT*/
1163 u32 *rkey) /*OUT*/
1164 {
1165 int ret;
1166 u64 h_ret;
1167 u32 hipz_acl;
1168 u64 *kpage;
1169 u64 rpage;
1170 struct ehca_mr_pginfo pginfo_save;
1171 struct ehca_mr_hipzout_parms hipzout;
1172
1173 ehca_mrmw_map_acl(acl, &hipz_acl);
1174 ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
1175
1176 kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
1177 if (!kpage) {
1178 ehca_err(&shca->ib_device, "kpage alloc failed");
1179 ret = -ENOMEM;
1180 goto ehca_rereg_mr_rereg1_exit0;
1181 }
1182
1183 pginfo_save = *pginfo;
1184 ret = ehca_set_pagebuf(pginfo, pginfo->num_hwpages, kpage);
1185 if (ret) {
1186 ehca_err(&shca->ib_device, "set pagebuf failed, e_mr=%p "
1187 "pginfo=%p type=%x num_kpages=%lx num_hwpages=%lx "
1188 "kpage=%p", e_mr, pginfo, pginfo->type,
1189 pginfo->num_kpages, pginfo->num_hwpages, kpage);
1190 goto ehca_rereg_mr_rereg1_exit1;
1191 }
1192 rpage = virt_to_abs(kpage);
1193 if (!rpage) {
1194 ehca_err(&shca->ib_device, "kpage=%p", kpage);
1195 ret = -EFAULT;
1196 goto ehca_rereg_mr_rereg1_exit1;
1197 }
1198 h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_mr,
1199 (u64)iova_start, size, hipz_acl,
1200 e_pd->fw_pd, rpage, &hipzout);
1201 if (h_ret != H_SUCCESS) {
1202 /*
1203 * reregistration unsuccessful, try it again with the 3 hCalls,
1204 * e.g. this is required in case H_MR_CONDITION
1205 * (MW bound or MR is shared)
1206 */
1207 ehca_warn(&shca->ib_device, "hipz_h_reregister_pmr failed "
1208 "(Rereg1), h_ret=%li e_mr=%p", h_ret, e_mr);
1209 *pginfo = pginfo_save;
1210 ret = -EAGAIN;
1211 } else if ((u64 *)hipzout.vaddr != iova_start) {
1212 ehca_err(&shca->ib_device, "PHYP changed iova_start in "
1213 "rereg_pmr, iova_start=%p iova_start_out=%lx e_mr=%p "
1214 "mr_handle=%lx lkey=%x lkey_out=%x", iova_start,
1215 hipzout.vaddr, e_mr, e_mr->ipz_mr_handle.handle,
1216 e_mr->ib.ib_mr.lkey, hipzout.lkey);
1217 ret = -EFAULT;
1218 } else {
1219 /*
1220 * successful reregistration
1221 * note: start and start_out are identical for eServer HCAs
1222 */
1223 e_mr->num_kpages = pginfo->num_kpages;
1224 e_mr->num_hwpages = pginfo->num_hwpages;
1225 e_mr->hwpage_size = pginfo->hwpage_size;
1226 e_mr->start = iova_start;
1227 e_mr->size = size;
1228 e_mr->acl = acl;
1229 *lkey = hipzout.lkey;
1230 *rkey = hipzout.rkey;
1231 }
1232
1233 ehca_rereg_mr_rereg1_exit1:
1234 ehca_free_fw_ctrlblock(kpage);
1235 ehca_rereg_mr_rereg1_exit0:
1236 if ( ret && (ret != -EAGAIN) )
1237 ehca_err(&shca->ib_device, "ret=%i lkey=%x rkey=%x "
1238 "pginfo=%p num_kpages=%lx num_hwpages=%lx",
1239 ret, *lkey, *rkey, pginfo, pginfo->num_kpages,
1240 pginfo->num_hwpages);
1241 return ret;
1242 } /* end ehca_rereg_mr_rereg1() */
1243
1244 /*----------------------------------------------------------------------*/
1245
1246 int ehca_rereg_mr(struct ehca_shca *shca,
1247 struct ehca_mr *e_mr,
1248 u64 *iova_start,
1249 u64 size,
1250 int acl,
1251 struct ehca_pd *e_pd,
1252 struct ehca_mr_pginfo *pginfo,
1253 u32 *lkey,
1254 u32 *rkey)
1255 {
1256 int ret = 0;
1257 u64 h_ret;
1258 int rereg_1_hcall = 1; /* 1: use hipz_h_reregister_pmr directly */
1259 int rereg_3_hcall = 0; /* 1: use 3 hipz calls for reregistration */
1260
1261 /* first determine reregistration hCall(s) */
1262 if ((pginfo->num_hwpages > MAX_RPAGES) ||
1263 (e_mr->num_hwpages > MAX_RPAGES) ||
1264 (pginfo->num_hwpages > e_mr->num_hwpages)) {
1265 ehca_dbg(&shca->ib_device, "Rereg3 case, "
1266 "pginfo->num_hwpages=%lx e_mr->num_hwpages=%x",
1267 pginfo->num_hwpages, e_mr->num_hwpages);
1268 rereg_1_hcall = 0;
1269 rereg_3_hcall = 1;
1270 }
1271
1272 if (e_mr->flags & EHCA_MR_FLAG_MAXMR) { /* check for max-MR */
1273 rereg_1_hcall = 0;
1274 rereg_3_hcall = 1;
1275 e_mr->flags &= ~EHCA_MR_FLAG_MAXMR;
1276 ehca_err(&shca->ib_device, "Rereg MR for max-MR! e_mr=%p",
1277 e_mr);
1278 }
1279
1280 if (rereg_1_hcall) {
1281 ret = ehca_rereg_mr_rereg1(shca, e_mr, iova_start, size,
1282 acl, e_pd, pginfo, lkey, rkey);
1283 if (ret) {
1284 if (ret == -EAGAIN)
1285 rereg_3_hcall = 1;
1286 else
1287 goto ehca_rereg_mr_exit0;
1288 }
1289 }
1290
1291 if (rereg_3_hcall) {
1292 struct ehca_mr save_mr;
1293
1294 /* first deregister old MR */
1295 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
1296 if (h_ret != H_SUCCESS) {
1297 ehca_err(&shca->ib_device, "hipz_free_mr failed, "
1298 "h_ret=%li e_mr=%p hca_hndl=%lx mr_hndl=%lx "
1299 "mr->lkey=%x",
1300 h_ret, e_mr, shca->ipz_hca_handle.handle,
1301 e_mr->ipz_mr_handle.handle,
1302 e_mr->ib.ib_mr.lkey);
1303 ret = ehca2ib_return_code(h_ret);
1304 goto ehca_rereg_mr_exit0;
1305 }
1306 /* clean ehca_mr_t, without changing struct ib_mr and lock */
1307 save_mr = *e_mr;
1308 ehca_mr_deletenew(e_mr);
1309
1310 /* set some MR values */
1311 e_mr->flags = save_mr.flags;
1312 e_mr->hwpage_size = save_mr.hwpage_size;
1313 e_mr->fmr_page_size = save_mr.fmr_page_size;
1314 e_mr->fmr_max_pages = save_mr.fmr_max_pages;
1315 e_mr->fmr_max_maps = save_mr.fmr_max_maps;
1316 e_mr->fmr_map_cnt = save_mr.fmr_map_cnt;
1317
1318 ret = ehca_reg_mr(shca, e_mr, iova_start, size, acl,
1319 e_pd, pginfo, lkey, rkey);
1320 if (ret) {
1321 u32 offset = (u64)(&e_mr->flags) - (u64)e_mr;
1322 memcpy(&e_mr->flags, &(save_mr.flags),
1323 sizeof(struct ehca_mr) - offset);
1324 goto ehca_rereg_mr_exit0;
1325 }
1326 }
1327
1328 ehca_rereg_mr_exit0:
1329 if (ret)
1330 ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "
1331 "iova_start=%p size=%lx acl=%x e_pd=%p pginfo=%p "
1332 "num_kpages=%lx lkey=%x rkey=%x rereg_1_hcall=%x "
1333 "rereg_3_hcall=%x", ret, shca, e_mr, iova_start, size,
1334 acl, e_pd, pginfo, pginfo->num_kpages, *lkey, *rkey,
1335 rereg_1_hcall, rereg_3_hcall);
1336 return ret;
1337 } /* end ehca_rereg_mr() */
1338
1339 /*----------------------------------------------------------------------*/
1340
1341 int ehca_unmap_one_fmr(struct ehca_shca *shca,
1342 struct ehca_mr *e_fmr)
1343 {
1344 int ret = 0;
1345 u64 h_ret;
1346 struct ehca_pd *e_pd =
1347 container_of(e_fmr->ib.ib_fmr.pd, struct ehca_pd, ib_pd);
1348 struct ehca_mr save_fmr;
1349 u32 tmp_lkey, tmp_rkey;
1350 struct ehca_mr_pginfo pginfo;
1351 struct ehca_mr_hipzout_parms hipzout;
1352 struct ehca_mr save_mr;
1353
1354 if (e_fmr->fmr_max_pages <= MAX_RPAGES) {
1355 /*
1356 * note: after using rereg hcall with len=0,
1357 * rereg hcall must be used again for registering pages
1358 */
1359 h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_fmr, 0,
1360 0, 0, e_pd->fw_pd, 0, &hipzout);
1361 if (h_ret == H_SUCCESS) {
1362 /* successful reregistration */
1363 e_fmr->start = NULL;
1364 e_fmr->size = 0;
1365 tmp_lkey = hipzout.lkey;
1366 tmp_rkey = hipzout.rkey;
1367 return 0;
1368 }
1369 /*
1370 * should not happen, because length checked above,
1371 * FMRs are not shared and no MW bound to FMRs
1372 */
1373 ehca_err(&shca->ib_device, "hipz_reregister_pmr failed "
1374 "(Rereg1), h_ret=%li e_fmr=%p hca_hndl=%lx "
1375 "mr_hndl=%lx lkey=%x lkey_out=%x",
1376 h_ret, e_fmr, shca->ipz_hca_handle.handle,
1377 e_fmr->ipz_mr_handle.handle,
1378 e_fmr->ib.ib_fmr.lkey, hipzout.lkey);
1379 /* try free and rereg */
1380 }
1381
1382 /* first free old FMR */
1383 h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
1384 if (h_ret != H_SUCCESS) {
1385 ehca_err(&shca->ib_device, "hipz_free_mr failed, "
1386 "h_ret=%li e_fmr=%p hca_hndl=%lx mr_hndl=%lx "
1387 "lkey=%x",
1388 h_ret, e_fmr, shca->ipz_hca_handle.handle,
1389 e_fmr->ipz_mr_handle.handle,
1390 e_fmr->ib.ib_fmr.lkey);
1391 ret = ehca2ib_return_code(h_ret);
1392 goto ehca_unmap_one_fmr_exit0;
1393 }
1394 /* clean ehca_mr_t, without changing lock */
1395 save_fmr = *e_fmr;
1396 ehca_mr_deletenew(e_fmr);
1397
1398 /* set some MR values */
1399 e_fmr->flags = save_fmr.flags;
1400 e_fmr->hwpage_size = save_fmr.hwpage_size;
1401 e_fmr->fmr_page_size = save_fmr.fmr_page_size;
1402 e_fmr->fmr_max_pages = save_fmr.fmr_max_pages;
1403 e_fmr->fmr_max_maps = save_fmr.fmr_max_maps;
1404 e_fmr->fmr_map_cnt = save_fmr.fmr_map_cnt;
1405 e_fmr->acl = save_fmr.acl;
1406
1407 memset(&pginfo, 0, sizeof(pginfo));
1408 pginfo.type = EHCA_MR_PGI_FMR;
1409 ret = ehca_reg_mr(shca, e_fmr, NULL,
1410 (e_fmr->fmr_max_pages * e_fmr->fmr_page_size),
1411 e_fmr->acl, e_pd, &pginfo, &tmp_lkey,
1412 &tmp_rkey);
1413 if (ret) {
1414 u32 offset = (u64)(&e_fmr->flags) - (u64)e_fmr;
1415 memcpy(&e_fmr->flags, &(save_mr.flags),
1416 sizeof(struct ehca_mr) - offset);
1417 }
1418
1419 ehca_unmap_one_fmr_exit0:
1420 if (ret)
1421 ehca_err(&shca->ib_device, "ret=%i tmp_lkey=%x tmp_rkey=%x "
1422 "fmr_max_pages=%x",
1423 ret, tmp_lkey, tmp_rkey, e_fmr->fmr_max_pages);
1424 return ret;
1425 } /* end ehca_unmap_one_fmr() */
1426
1427 /*----------------------------------------------------------------------*/
1428
1429 int ehca_reg_smr(struct ehca_shca *shca,
1430 struct ehca_mr *e_origmr,
1431 struct ehca_mr *e_newmr,
1432 u64 *iova_start,
1433 int acl,
1434 struct ehca_pd *e_pd,
1435 u32 *lkey, /*OUT*/
1436 u32 *rkey) /*OUT*/
1437 {
1438 int ret = 0;
1439 u64 h_ret;
1440 u32 hipz_acl;
1441 struct ehca_mr_hipzout_parms hipzout;
1442
1443 ehca_mrmw_map_acl(acl, &hipz_acl);
1444 ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
1445
1446 h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
1447 (u64)iova_start, hipz_acl, e_pd->fw_pd,
1448 &hipzout);
1449 if (h_ret != H_SUCCESS) {
1450 ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%li "
1451 "shca=%p e_origmr=%p e_newmr=%p iova_start=%p acl=%x "
1452 "e_pd=%p hca_hndl=%lx mr_hndl=%lx lkey=%x",
1453 h_ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd,
1454 shca->ipz_hca_handle.handle,
1455 e_origmr->ipz_mr_handle.handle,
1456 e_origmr->ib.ib_mr.lkey);
1457 ret = ehca2ib_return_code(h_ret);
1458 goto ehca_reg_smr_exit0;
1459 }
1460 /* successful registration */
1461 e_newmr->num_kpages = e_origmr->num_kpages;
1462 e_newmr->num_hwpages = e_origmr->num_hwpages;
1463 e_newmr->hwpage_size = e_origmr->hwpage_size;
1464 e_newmr->start = iova_start;
1465 e_newmr->size = e_origmr->size;
1466 e_newmr->acl = acl;
1467 e_newmr->ipz_mr_handle = hipzout.handle;
1468 *lkey = hipzout.lkey;
1469 *rkey = hipzout.rkey;
1470 return 0;
1471
1472 ehca_reg_smr_exit0:
1473 if (ret)
1474 ehca_err(&shca->ib_device, "ret=%i shca=%p e_origmr=%p "
1475 "e_newmr=%p iova_start=%p acl=%x e_pd=%p",
1476 ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd);
1477 return ret;
1478 } /* end ehca_reg_smr() */
1479
1480 /*----------------------------------------------------------------------*/
1481
1482 /* register internal max-MR to internal SHCA */
1483 int ehca_reg_internal_maxmr(
1484 struct ehca_shca *shca,
1485 struct ehca_pd *e_pd,
1486 struct ehca_mr **e_maxmr) /*OUT*/
1487 {
1488 int ret;
1489 struct ehca_mr *e_mr;
1490 u64 *iova_start;
1491 u64 size_maxmr;
1492 struct ehca_mr_pginfo pginfo;
1493 struct ib_phys_buf ib_pbuf;
1494 u32 num_kpages;
1495 u32 num_hwpages;
1496 u64 hw_pgsize;
1497
1498 e_mr = ehca_mr_new();
1499 if (!e_mr) {
1500 ehca_err(&shca->ib_device, "out of memory");
1501 ret = -ENOMEM;
1502 goto ehca_reg_internal_maxmr_exit0;
1503 }
1504 e_mr->flags |= EHCA_MR_FLAG_MAXMR;
1505
1506 /* register internal max-MR on HCA */
1507 size_maxmr = (u64)high_memory - PAGE_OFFSET;
1508 iova_start = (u64 *)KERNELBASE;
1509 ib_pbuf.addr = 0;
1510 ib_pbuf.size = size_maxmr;
1511 num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size_maxmr,
1512 PAGE_SIZE);
1513 hw_pgsize = ehca_get_max_hwpage_size(shca);
1514 num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size_maxmr,
1515 hw_pgsize);
1516
1517 memset(&pginfo, 0, sizeof(pginfo));
1518 pginfo.type = EHCA_MR_PGI_PHYS;
1519 pginfo.num_kpages = num_kpages;
1520 pginfo.num_hwpages = num_hwpages;
1521 pginfo.hwpage_size = hw_pgsize;
1522 pginfo.u.phy.num_phys_buf = 1;
1523 pginfo.u.phy.phys_buf_array = &ib_pbuf;
1524
1525 ret = ehca_reg_mr(shca, e_mr, iova_start, size_maxmr, 0, e_pd,
1526 &pginfo, &e_mr->ib.ib_mr.lkey,
1527 &e_mr->ib.ib_mr.rkey);
1528 if (ret) {
1529 ehca_err(&shca->ib_device, "reg of internal max MR failed, "
1530 "e_mr=%p iova_start=%p size_maxmr=%lx num_kpages=%x "
1531 "num_hwpages=%x", e_mr, iova_start, size_maxmr,
1532 num_kpages, num_hwpages);
1533 goto ehca_reg_internal_maxmr_exit1;
1534 }
1535
1536 /* successful registration of all pages */
1537 e_mr->ib.ib_mr.device = e_pd->ib_pd.device;
1538 e_mr->ib.ib_mr.pd = &e_pd->ib_pd;
1539 e_mr->ib.ib_mr.uobject = NULL;
1540 atomic_inc(&(e_pd->ib_pd.usecnt));
1541 atomic_set(&(e_mr->ib.ib_mr.usecnt), 0);
1542 *e_maxmr = e_mr;
1543 return 0;
1544
1545 ehca_reg_internal_maxmr_exit1:
1546 ehca_mr_delete(e_mr);
1547 ehca_reg_internal_maxmr_exit0:
1548 if (ret)
1549 ehca_err(&shca->ib_device, "ret=%i shca=%p e_pd=%p e_maxmr=%p",
1550 ret, shca, e_pd, e_maxmr);
1551 return ret;
1552 } /* end ehca_reg_internal_maxmr() */
1553
1554 /*----------------------------------------------------------------------*/
1555
1556 int ehca_reg_maxmr(struct ehca_shca *shca,
1557 struct ehca_mr *e_newmr,
1558 u64 *iova_start,
1559 int acl,
1560 struct ehca_pd *e_pd,
1561 u32 *lkey,
1562 u32 *rkey)
1563 {
1564 u64 h_ret;
1565 struct ehca_mr *e_origmr = shca->maxmr;
1566 u32 hipz_acl;
1567 struct ehca_mr_hipzout_parms hipzout;
1568
1569 ehca_mrmw_map_acl(acl, &hipz_acl);
1570 ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
1571
1572 h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
1573 (u64)iova_start, hipz_acl, e_pd->fw_pd,
1574 &hipzout);
1575 if (h_ret != H_SUCCESS) {
1576 ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%li "
1577 "e_origmr=%p hca_hndl=%lx mr_hndl=%lx lkey=%x",
1578 h_ret, e_origmr, shca->ipz_hca_handle.handle,
1579 e_origmr->ipz_mr_handle.handle,
1580 e_origmr->ib.ib_mr.lkey);
1581 return ehca2ib_return_code(h_ret);
1582 }
1583 /* successful registration */
1584 e_newmr->num_kpages = e_origmr->num_kpages;
1585 e_newmr->num_hwpages = e_origmr->num_hwpages;
1586 e_newmr->hwpage_size = e_origmr->hwpage_size;
1587 e_newmr->start = iova_start;
1588 e_newmr->size = e_origmr->size;
1589 e_newmr->acl = acl;
1590 e_newmr->ipz_mr_handle = hipzout.handle;
1591 *lkey = hipzout.lkey;
1592 *rkey = hipzout.rkey;
1593 return 0;
1594 } /* end ehca_reg_maxmr() */
1595
1596 /*----------------------------------------------------------------------*/
1597
1598 int ehca_dereg_internal_maxmr(struct ehca_shca *shca)
1599 {
1600 int ret;
1601 struct ehca_mr *e_maxmr;
1602 struct ib_pd *ib_pd;
1603
1604 if (!shca->maxmr) {
1605 ehca_err(&shca->ib_device, "bad call, shca=%p", shca);
1606 ret = -EINVAL;
1607 goto ehca_dereg_internal_maxmr_exit0;
1608 }
1609
1610 e_maxmr = shca->maxmr;
1611 ib_pd = e_maxmr->ib.ib_mr.pd;
1612 shca->maxmr = NULL; /* remove internal max-MR indication from SHCA */
1613
1614 ret = ehca_dereg_mr(&e_maxmr->ib.ib_mr);
1615 if (ret) {
1616 ehca_err(&shca->ib_device, "dereg internal max-MR failed, "
1617 "ret=%i e_maxmr=%p shca=%p lkey=%x",
1618 ret, e_maxmr, shca, e_maxmr->ib.ib_mr.lkey);
1619 shca->maxmr = e_maxmr;
1620 goto ehca_dereg_internal_maxmr_exit0;
1621 }
1622
1623 atomic_dec(&ib_pd->usecnt);
1624
1625 ehca_dereg_internal_maxmr_exit0:
1626 if (ret)
1627 ehca_err(&shca->ib_device, "ret=%i shca=%p shca->maxmr=%p",
1628 ret, shca, shca->maxmr);
1629 return ret;
1630 } /* end ehca_dereg_internal_maxmr() */
1631
1632 /*----------------------------------------------------------------------*/
1633
1634 /*
1635 * check physical buffer array of MR verbs for validness and
1636 * calculates MR size
1637 */
1638 int ehca_mr_chk_buf_and_calc_size(struct ib_phys_buf *phys_buf_array,
1639 int num_phys_buf,
1640 u64 *iova_start,
1641 u64 *size)
1642 {
1643 struct ib_phys_buf *pbuf = phys_buf_array;
1644 u64 size_count = 0;
1645 u32 i;
1646
1647 if (num_phys_buf == 0) {
1648 ehca_gen_err("bad phys buf array len, num_phys_buf=0");
1649 return -EINVAL;
1650 }
1651 /* check first buffer */
1652 if (((u64)iova_start & ~PAGE_MASK) != (pbuf->addr & ~PAGE_MASK)) {
1653 ehca_gen_err("iova_start/addr mismatch, iova_start=%p "
1654 "pbuf->addr=%lx pbuf->size=%lx",
1655 iova_start, pbuf->addr, pbuf->size);
1656 return -EINVAL;
1657 }
1658 if (((pbuf->addr + pbuf->size) % PAGE_SIZE) &&
1659 (num_phys_buf > 1)) {
1660 ehca_gen_err("addr/size mismatch in 1st buf, pbuf->addr=%lx "
1661 "pbuf->size=%lx", pbuf->addr, pbuf->size);
1662 return -EINVAL;
1663 }
1664
1665 for (i = 0; i < num_phys_buf; i++) {
1666 if ((i > 0) && (pbuf->addr % PAGE_SIZE)) {
1667 ehca_gen_err("bad address, i=%x pbuf->addr=%lx "
1668 "pbuf->size=%lx",
1669 i, pbuf->addr, pbuf->size);
1670 return -EINVAL;
1671 }
1672 if (((i > 0) && /* not 1st */
1673 (i < (num_phys_buf - 1)) && /* not last */
1674 (pbuf->size % PAGE_SIZE)) || (pbuf->size == 0)) {
1675 ehca_gen_err("bad size, i=%x pbuf->size=%lx",
1676 i, pbuf->size);
1677 return -EINVAL;
1678 }
1679 size_count += pbuf->size;
1680 pbuf++;
1681 }
1682
1683 *size = size_count;
1684 return 0;
1685 } /* end ehca_mr_chk_buf_and_calc_size() */
1686
1687 /*----------------------------------------------------------------------*/
1688
1689 /* check page list of map FMR verb for validness */
1690 int ehca_fmr_check_page_list(struct ehca_mr *e_fmr,
1691 u64 *page_list,
1692 int list_len)
1693 {
1694 u32 i;
1695 u64 *page;
1696
1697 if ((list_len == 0) || (list_len > e_fmr->fmr_max_pages)) {
1698 ehca_gen_err("bad list_len, list_len=%x "
1699 "e_fmr->fmr_max_pages=%x fmr=%p",
1700 list_len, e_fmr->fmr_max_pages, e_fmr);
1701 return -EINVAL;
1702 }
1703
1704 /* each page must be aligned */
1705 page = page_list;
1706 for (i = 0; i < list_len; i++) {
1707 if (*page % e_fmr->fmr_page_size) {
1708 ehca_gen_err("bad page, i=%x *page=%lx page=%p fmr=%p "
1709 "fmr_page_size=%x", i, *page, page, e_fmr,
1710 e_fmr->fmr_page_size);
1711 return -EINVAL;
1712 }
1713 page++;
1714 }
1715
1716 return 0;
1717 } /* end ehca_fmr_check_page_list() */
1718
1719 /*----------------------------------------------------------------------*/
1720
1721 /* PAGE_SIZE >= pginfo->hwpage_size */
1722 static int ehca_set_pagebuf_user1(struct ehca_mr_pginfo *pginfo,
1723 u32 number,
1724 u64 *kpage)
1725 {
1726 int ret = 0;
1727 struct ib_umem_chunk *prev_chunk;
1728 struct ib_umem_chunk *chunk;
1729 u64 pgaddr;
1730 u32 i = 0;
1731 u32 j = 0;
1732 int hwpages_per_kpage = PAGE_SIZE / pginfo->hwpage_size;
1733
1734 /* loop over desired chunk entries */
1735 chunk = pginfo->u.usr.next_chunk;
1736 prev_chunk = pginfo->u.usr.next_chunk;
1737 list_for_each_entry_continue(
1738 chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
1739 for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
1740 pgaddr = page_to_pfn(sg_page(&chunk->page_list[i]))
1741 << PAGE_SHIFT ;
1742 *kpage = phys_to_abs(pgaddr +
1743 (pginfo->next_hwpage *
1744 pginfo->hwpage_size));
1745 if ( !(*kpage) ) {
1746 ehca_gen_err("pgaddr=%lx "
1747 "chunk->page_list[i]=%lx "
1748 "i=%x next_hwpage=%lx",
1749 pgaddr, (u64)sg_dma_address(
1750 &chunk->page_list[i]),
1751 i, pginfo->next_hwpage);
1752 return -EFAULT;
1753 }
1754 (pginfo->hwpage_cnt)++;
1755 (pginfo->next_hwpage)++;
1756 kpage++;
1757 if (pginfo->next_hwpage % hwpages_per_kpage == 0) {
1758 (pginfo->kpage_cnt)++;
1759 (pginfo->u.usr.next_nmap)++;
1760 pginfo->next_hwpage = 0;
1761 i++;
1762 }
1763 j++;
1764 if (j >= number) break;
1765 }
1766 if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
1767 (j >= number)) {
1768 pginfo->u.usr.next_nmap = 0;
1769 prev_chunk = chunk;
1770 break;
1771 } else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
1772 pginfo->u.usr.next_nmap = 0;
1773 prev_chunk = chunk;
1774 } else if (j >= number)
1775 break;
1776 else
1777 prev_chunk = chunk;
1778 }
1779 pginfo->u.usr.next_chunk =
1780 list_prepare_entry(prev_chunk,
1781 (&(pginfo->u.usr.region->chunk_list)),
1782 list);
1783 return ret;
1784 }
1785
1786 /*
1787 * check given pages for contiguous layout
1788 * last page addr is returned in prev_pgaddr for further check
1789 */
1790 static int ehca_check_kpages_per_ate(struct scatterlist *page_list,
1791 int start_idx, int end_idx,
1792 u64 *prev_pgaddr)
1793 {
1794 int t;
1795 for (t = start_idx; t <= end_idx; t++) {
1796 u64 pgaddr = page_to_pfn(sg_page(&page_list[t])) << PAGE_SHIFT;
1797 ehca_gen_dbg("chunk_page=%lx value=%016lx", pgaddr,
1798 *(u64 *)abs_to_virt(phys_to_abs(pgaddr)));
1799 if (pgaddr - PAGE_SIZE != *prev_pgaddr) {
1800 ehca_gen_err("uncontiguous page found pgaddr=%lx "
1801 "prev_pgaddr=%lx page_list_i=%x",
1802 pgaddr, *prev_pgaddr, t);
1803 return -EINVAL;
1804 }
1805 *prev_pgaddr = pgaddr;
1806 }
1807 return 0;
1808 }
1809
1810 /* PAGE_SIZE < pginfo->hwpage_size */
1811 static int ehca_set_pagebuf_user2(struct ehca_mr_pginfo *pginfo,
1812 u32 number,
1813 u64 *kpage)
1814 {
1815 int ret = 0;
1816 struct ib_umem_chunk *prev_chunk;
1817 struct ib_umem_chunk *chunk;
1818 u64 pgaddr, prev_pgaddr;
1819 u32 i = 0;
1820 u32 j = 0;
1821 int kpages_per_hwpage = pginfo->hwpage_size / PAGE_SIZE;
1822 int nr_kpages = kpages_per_hwpage;
1823
1824 /* loop over desired chunk entries */
1825 chunk = pginfo->u.usr.next_chunk;
1826 prev_chunk = pginfo->u.usr.next_chunk;
1827 list_for_each_entry_continue(
1828 chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
1829 for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
1830 if (nr_kpages == kpages_per_hwpage) {
1831 pgaddr = ( page_to_pfn(sg_page(&chunk->page_list[i]))
1832 << PAGE_SHIFT );
1833 *kpage = phys_to_abs(pgaddr);
1834 if ( !(*kpage) ) {
1835 ehca_gen_err("pgaddr=%lx i=%x",
1836 pgaddr, i);
1837 ret = -EFAULT;
1838 return ret;
1839 }
1840 /*
1841 * The first page in a hwpage must be aligned;
1842 * the first MR page is exempt from this rule.
1843 */
1844 if (pgaddr & (pginfo->hwpage_size - 1)) {
1845 if (pginfo->hwpage_cnt) {
1846 ehca_gen_err(
1847 "invalid alignment "
1848 "pgaddr=%lx i=%x "
1849 "mr_pgsize=%lx",
1850 pgaddr, i,
1851 pginfo->hwpage_size);
1852 ret = -EFAULT;
1853 return ret;
1854 }
1855 /* first MR page */
1856 pginfo->kpage_cnt =
1857 (pgaddr &
1858 (pginfo->hwpage_size - 1)) >>
1859 PAGE_SHIFT;
1860 nr_kpages -= pginfo->kpage_cnt;
1861 *kpage = phys_to_abs(
1862 pgaddr &
1863 ~(pginfo->hwpage_size - 1));
1864 }
1865 ehca_gen_dbg("kpage=%lx chunk_page=%lx "
1866 "value=%016lx", *kpage, pgaddr,
1867 *(u64 *)abs_to_virt(
1868 phys_to_abs(pgaddr)));
1869 prev_pgaddr = pgaddr;
1870 i++;
1871 pginfo->kpage_cnt++;
1872 pginfo->u.usr.next_nmap++;
1873 nr_kpages--;
1874 if (!nr_kpages)
1875 goto next_kpage;
1876 continue;
1877 }
1878 if (i + nr_kpages > chunk->nmap) {
1879 ret = ehca_check_kpages_per_ate(
1880 chunk->page_list, i,
1881 chunk->nmap - 1, &prev_pgaddr);
1882 if (ret) return ret;
1883 pginfo->kpage_cnt += chunk->nmap - i;
1884 pginfo->u.usr.next_nmap += chunk->nmap - i;
1885 nr_kpages -= chunk->nmap - i;
1886 break;
1887 }
1888
1889 ret = ehca_check_kpages_per_ate(chunk->page_list, i,
1890 i + nr_kpages - 1,
1891 &prev_pgaddr);
1892 if (ret) return ret;
1893 i += nr_kpages;
1894 pginfo->kpage_cnt += nr_kpages;
1895 pginfo->u.usr.next_nmap += nr_kpages;
1896 next_kpage:
1897 nr_kpages = kpages_per_hwpage;
1898 (pginfo->hwpage_cnt)++;
1899 kpage++;
1900 j++;
1901 if (j >= number) break;
1902 }
1903 if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
1904 (j >= number)) {
1905 pginfo->u.usr.next_nmap = 0;
1906 prev_chunk = chunk;
1907 break;
1908 } else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
1909 pginfo->u.usr.next_nmap = 0;
1910 prev_chunk = chunk;
1911 } else if (j >= number)
1912 break;
1913 else
1914 prev_chunk = chunk;
1915 }
1916 pginfo->u.usr.next_chunk =
1917 list_prepare_entry(prev_chunk,
1918 (&(pginfo->u.usr.region->chunk_list)),
1919 list);
1920 return ret;
1921 }
1922
1923 static int ehca_set_pagebuf_phys(struct ehca_mr_pginfo *pginfo,
1924 u32 number, u64 *kpage)
1925 {
1926 int ret = 0;
1927 struct ib_phys_buf *pbuf;
1928 u64 num_hw, offs_hw;
1929 u32 i = 0;
1930
1931 /* loop over desired phys_buf_array entries */
1932 while (i < number) {
1933 pbuf = pginfo->u.phy.phys_buf_array + pginfo->u.phy.next_buf;
1934 num_hw = NUM_CHUNKS((pbuf->addr % pginfo->hwpage_size) +
1935 pbuf->size, pginfo->hwpage_size);
1936 offs_hw = (pbuf->addr & ~(pginfo->hwpage_size - 1)) /
1937 pginfo->hwpage_size;
1938 while (pginfo->next_hwpage < offs_hw + num_hw) {
1939 /* sanity check */
1940 if ((pginfo->kpage_cnt >= pginfo->num_kpages) ||
1941 (pginfo->hwpage_cnt >= pginfo->num_hwpages)) {
1942 ehca_gen_err("kpage_cnt >= num_kpages, "
1943 "kpage_cnt=%lx num_kpages=%lx "
1944 "hwpage_cnt=%lx "
1945 "num_hwpages=%lx i=%x",
1946 pginfo->kpage_cnt,
1947 pginfo->num_kpages,
1948 pginfo->hwpage_cnt,
1949 pginfo->num_hwpages, i);
1950 return -EFAULT;
1951 }
1952 *kpage = phys_to_abs(
1953 (pbuf->addr & ~(pginfo->hwpage_size - 1)) +
1954 (pginfo->next_hwpage * pginfo->hwpage_size));
1955 if ( !(*kpage) && pbuf->addr ) {
1956 ehca_gen_err("pbuf->addr=%lx pbuf->size=%lx "
1957 "next_hwpage=%lx", pbuf->addr,
1958 pbuf->size, pginfo->next_hwpage);
1959 return -EFAULT;
1960 }
1961 (pginfo->hwpage_cnt)++;
1962 (pginfo->next_hwpage)++;
1963 if (PAGE_SIZE >= pginfo->hwpage_size) {
1964 if (pginfo->next_hwpage %
1965 (PAGE_SIZE / pginfo->hwpage_size) == 0)
1966 (pginfo->kpage_cnt)++;
1967 } else
1968 pginfo->kpage_cnt += pginfo->hwpage_size /
1969 PAGE_SIZE;
1970 kpage++;
1971 i++;
1972 if (i >= number) break;
1973 }
1974 if (pginfo->next_hwpage >= offs_hw + num_hw) {
1975 (pginfo->u.phy.next_buf)++;
1976 pginfo->next_hwpage = 0;
1977 }
1978 }
1979 return ret;
1980 }
1981
1982 static int ehca_set_pagebuf_fmr(struct ehca_mr_pginfo *pginfo,
1983 u32 number, u64 *kpage)
1984 {
1985 int ret = 0;
1986 u64 *fmrlist;
1987 u32 i;
1988
1989 /* loop over desired page_list entries */
1990 fmrlist = pginfo->u.fmr.page_list + pginfo->u.fmr.next_listelem;
1991 for (i = 0; i < number; i++) {
1992 *kpage = phys_to_abs((*fmrlist & ~(pginfo->hwpage_size - 1)) +
1993 pginfo->next_hwpage * pginfo->hwpage_size);
1994 if ( !(*kpage) ) {
1995 ehca_gen_err("*fmrlist=%lx fmrlist=%p "
1996 "next_listelem=%lx next_hwpage=%lx",
1997 *fmrlist, fmrlist,
1998 pginfo->u.fmr.next_listelem,
1999 pginfo->next_hwpage);
2000 return -EFAULT;
2001 }
2002 (pginfo->hwpage_cnt)++;
2003 if (pginfo->u.fmr.fmr_pgsize >= pginfo->hwpage_size) {
2004 if (pginfo->next_hwpage %
2005 (pginfo->u.fmr.fmr_pgsize /
2006 pginfo->hwpage_size) == 0) {
2007 (pginfo->kpage_cnt)++;
2008 (pginfo->u.fmr.next_listelem)++;
2009 fmrlist++;
2010 pginfo->next_hwpage = 0;
2011 } else
2012 (pginfo->next_hwpage)++;
2013 } else {
2014 unsigned int cnt_per_hwpage = pginfo->hwpage_size /
2015 pginfo->u.fmr.fmr_pgsize;
2016 unsigned int j;
2017 u64 prev = *kpage;
2018 /* check if adrs are contiguous */
2019 for (j = 1; j < cnt_per_hwpage; j++) {
2020 u64 p = phys_to_abs(fmrlist[j] &
2021 ~(pginfo->hwpage_size - 1));
2022 if (prev + pginfo->u.fmr.fmr_pgsize != p) {
2023 ehca_gen_err("uncontiguous fmr pages "
2024 "found prev=%lx p=%lx "
2025 "idx=%x", prev, p, i + j);
2026 return -EINVAL;
2027 }
2028 prev = p;
2029 }
2030 pginfo->kpage_cnt += cnt_per_hwpage;
2031 pginfo->u.fmr.next_listelem += cnt_per_hwpage;
2032 fmrlist += cnt_per_hwpage;
2033 }
2034 kpage++;
2035 }
2036 return ret;
2037 }
2038
2039 /* setup page buffer from page info */
2040 int ehca_set_pagebuf(struct ehca_mr_pginfo *pginfo,
2041 u32 number,
2042 u64 *kpage)
2043 {
2044 int ret;
2045
2046 switch (pginfo->type) {
2047 case EHCA_MR_PGI_PHYS:
2048 ret = ehca_set_pagebuf_phys(pginfo, number, kpage);
2049 break;
2050 case EHCA_MR_PGI_USER:
2051 ret = PAGE_SIZE >= pginfo->hwpage_size ?
2052 ehca_set_pagebuf_user1(pginfo, number, kpage) :
2053 ehca_set_pagebuf_user2(pginfo, number, kpage);
2054 break;
2055 case EHCA_MR_PGI_FMR:
2056 ret = ehca_set_pagebuf_fmr(pginfo, number, kpage);
2057 break;
2058 default:
2059 ehca_gen_err("bad pginfo->type=%x", pginfo->type);
2060 ret = -EFAULT;
2061 break;
2062 }
2063 return ret;
2064 } /* end ehca_set_pagebuf() */
2065
2066 /*----------------------------------------------------------------------*/
2067
2068 /*
2069 * check MR if it is a max-MR, i.e. uses whole memory
2070 * in case it's a max-MR 1 is returned, else 0
2071 */
2072 int ehca_mr_is_maxmr(u64 size,
2073 u64 *iova_start)
2074 {
2075 /* a MR is treated as max-MR only if it fits following: */
2076 if ((size == ((u64)high_memory - PAGE_OFFSET)) &&
2077 (iova_start == (void *)KERNELBASE)) {
2078 ehca_gen_dbg("this is a max-MR");
2079 return 1;
2080 } else
2081 return 0;
2082 } /* end ehca_mr_is_maxmr() */
2083
2084 /*----------------------------------------------------------------------*/
2085
2086 /* map access control for MR/MW. This routine is used for MR and MW. */
2087 void ehca_mrmw_map_acl(int ib_acl,
2088 u32 *hipz_acl)
2089 {
2090 *hipz_acl = 0;
2091 if (ib_acl & IB_ACCESS_REMOTE_READ)
2092 *hipz_acl |= HIPZ_ACCESSCTRL_R_READ;
2093 if (ib_acl & IB_ACCESS_REMOTE_WRITE)
2094 *hipz_acl |= HIPZ_ACCESSCTRL_R_WRITE;
2095 if (ib_acl & IB_ACCESS_REMOTE_ATOMIC)
2096 *hipz_acl |= HIPZ_ACCESSCTRL_R_ATOMIC;
2097 if (ib_acl & IB_ACCESS_LOCAL_WRITE)
2098 *hipz_acl |= HIPZ_ACCESSCTRL_L_WRITE;
2099 if (ib_acl & IB_ACCESS_MW_BIND)
2100 *hipz_acl |= HIPZ_ACCESSCTRL_MW_BIND;
2101 } /* end ehca_mrmw_map_acl() */
2102
2103 /*----------------------------------------------------------------------*/
2104
2105 /* sets page size in hipz access control for MR/MW. */
2106 void ehca_mrmw_set_pgsize_hipz_acl(u32 pgsize, u32 *hipz_acl) /*INOUT*/
2107 {
2108 *hipz_acl |= (ehca_encode_hwpage_size(pgsize) << 24);
2109 } /* end ehca_mrmw_set_pgsize_hipz_acl() */
2110
2111 /*----------------------------------------------------------------------*/
2112
2113 /*
2114 * reverse map access control for MR/MW.
2115 * This routine is used for MR and MW.
2116 */
2117 void ehca_mrmw_reverse_map_acl(const u32 *hipz_acl,
2118 int *ib_acl) /*OUT*/
2119 {
2120 *ib_acl = 0;
2121 if (*hipz_acl & HIPZ_ACCESSCTRL_R_READ)
2122 *ib_acl |= IB_ACCESS_REMOTE_READ;
2123 if (*hipz_acl & HIPZ_ACCESSCTRL_R_WRITE)
2124 *ib_acl |= IB_ACCESS_REMOTE_WRITE;
2125 if (*hipz_acl & HIPZ_ACCESSCTRL_R_ATOMIC)
2126 *ib_acl |= IB_ACCESS_REMOTE_ATOMIC;
2127 if (*hipz_acl & HIPZ_ACCESSCTRL_L_WRITE)
2128 *ib_acl |= IB_ACCESS_LOCAL_WRITE;
2129 if (*hipz_acl & HIPZ_ACCESSCTRL_MW_BIND)
2130 *ib_acl |= IB_ACCESS_MW_BIND;
2131 } /* end ehca_mrmw_reverse_map_acl() */
2132
2133
2134 /*----------------------------------------------------------------------*/
2135
2136 /*
2137 * MR destructor and constructor
2138 * used in Reregister MR verb, sets all fields in ehca_mr_t to 0,
2139 * except struct ib_mr and spinlock
2140 */
2141 void ehca_mr_deletenew(struct ehca_mr *mr)
2142 {
2143 mr->flags = 0;
2144 mr->num_kpages = 0;
2145 mr->num_hwpages = 0;
2146 mr->acl = 0;
2147 mr->start = NULL;
2148 mr->fmr_page_size = 0;
2149 mr->fmr_max_pages = 0;
2150 mr->fmr_max_maps = 0;
2151 mr->fmr_map_cnt = 0;
2152 memset(&mr->ipz_mr_handle, 0, sizeof(mr->ipz_mr_handle));
2153 memset(&mr->galpas, 0, sizeof(mr->galpas));
2154 } /* end ehca_mr_deletenew() */
2155
2156 int ehca_init_mrmw_cache(void)
2157 {
2158 mr_cache = kmem_cache_create("ehca_cache_mr",
2159 sizeof(struct ehca_mr), 0,
2160 SLAB_HWCACHE_ALIGN,
2161 NULL);
2162 if (!mr_cache)
2163 return -ENOMEM;
2164 mw_cache = kmem_cache_create("ehca_cache_mw",
2165 sizeof(struct ehca_mw), 0,
2166 SLAB_HWCACHE_ALIGN,
2167 NULL);
2168 if (!mw_cache) {
2169 kmem_cache_destroy(mr_cache);
2170 mr_cache = NULL;
2171 return -ENOMEM;
2172 }
2173 return 0;
2174 }
2175
2176 void ehca_cleanup_mrmw_cache(void)
2177 {
2178 if (mr_cache)
2179 kmem_cache_destroy(mr_cache);
2180 if (mw_cache)
2181 kmem_cache_destroy(mw_cache);
2182 }