1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  MR/MW functions
5  *
6  *  Authors: Dietmar Decker <ddecker@de.ibm.com>
7  *           Christoph Raisch <raisch@de.ibm.com>
8  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42 
43 #include <rdma/ib_umem.h>
44 
45 #include "ehca_iverbs.h"
46 #include "ehca_mrmw.h"
47 #include "hcp_if.h"
48 #include "hipz_hw.h"
49 
50 #define NUM_CHUNKS(length, chunk_size) \
51 	(((length) + (chunk_size - 1)) / (chunk_size))
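/*
 * NUM_CHUNKS() is a ceiling division: how many chunk_size pieces are
 * needed to cover length bytes. Illustrative example:
 * NUM_CHUNKS(8193, 4096) = (8193 + 4095) / 4096 = 3, because 8193 bytes
 * spill one byte into a third 4 KiB chunk.
 */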
52 
53 /* max number of rpages (per hcall register_rpages) */
54 #define MAX_RPAGES 512
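/*
 * Illustrative: at the smallest hw page size (4 KiB), one
 * register_rpages hcall can thus post 512 * 4 KiB = 2 MiB of
 * translations.
 */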
55 
56 static struct kmem_cache *mr_cache;
57 static struct kmem_cache *mw_cache;
58 
59 enum ehca_mr_pgsize {
60 	EHCA_MR_PGSIZE4K  = 0x1000L,
61 	EHCA_MR_PGSIZE64K = 0x10000L,
62 	EHCA_MR_PGSIZE1M  = 0x100000L,
63 	EHCA_MR_PGSIZE16M = 0x1000000L
64 };
65 
66 #define EHCA_MR_PGSHIFT4K  12
67 #define EHCA_MR_PGSHIFT64K 16
68 #define EHCA_MR_PGSHIFT1M  20
69 #define EHCA_MR_PGSHIFT16M 24
70 
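/*
 * The supported hw page sizes are a factor of 16 (4 bits) apart, so the
 * firmware encoding below maps the log2 sizes as:
 *   4K (12) -> 0, 64K (16) -> 1, 1M (20) -> 2, 16M (24) -> 3
 */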
71 static u32 ehca_encode_hwpage_size(u32 pgsize)
72 {
73 	int log = ilog2(pgsize);
74 	WARN_ON(log < 12 || log > 24 || log & 3);
75 	return (log - 12) / 4;
76 }
77 
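/*
 * shca->hca_cap_mr_pgsize is a bitmask of supported MR page sizes (it is
 * tested bit-wise in ehca_reg_user_mr() below); ilog2() picks its highest
 * set bit, i.e. the largest page size the HCA supports.
 */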
78 static u64 ehca_get_max_hwpage_size(struct ehca_shca *shca)
79 {
80 	return 1UL << ilog2(shca->hca_cap_mr_pgsize);
81 }
82 
83 static struct ehca_mr *ehca_mr_new(void)
84 {
85 	struct ehca_mr *me;
86 
87 	me = kmem_cache_zalloc(mr_cache, GFP_KERNEL);
88 	if (me)
89 		spin_lock_init(&me->mrlock);
90 	else
91 		ehca_gen_err("alloc failed");
92 
93 	return me;
94 }
95 
96 static void ehca_mr_delete(struct ehca_mr *me)
97 {
98 	kmem_cache_free(mr_cache, me);
99 }
100 
101 static struct ehca_mw *ehca_mw_new(void)
102 {
103 	struct ehca_mw *me;
104 
105 	me = kmem_cache_zalloc(mw_cache, GFP_KERNEL);
106 	if (me)
107 		spin_lock_init(&me->mwlock);
108 	else
109 		ehca_gen_err("alloc failed");
110 
111 	return me;
112 }
113 
114 static void ehca_mw_delete(struct ehca_mw *me)
115 {
116 	kmem_cache_free(mw_cache, me);
117 }
118 
119 /*----------------------------------------------------------------------*/
120 
121 struct ib_mr *ehca_get_dma_mr(struct ib_pd *pd, int mr_access_flags)
122 {
123 	struct ib_mr *ib_mr;
124 	int ret;
125 	struct ehca_mr *e_maxmr;
126 	struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
127 	struct ehca_shca *shca =
128 		container_of(pd->device, struct ehca_shca, ib_device);
129 
130 	if (shca->maxmr) {
131 		e_maxmr = ehca_mr_new();
132 		if (!e_maxmr) {
133 			ehca_err(&shca->ib_device, "out of memory");
134 			ib_mr = ERR_PTR(-ENOMEM);
135 			goto get_dma_mr_exit0;
136 		}
137 
138 		ret = ehca_reg_maxmr(shca, e_maxmr, (u64 *)KERNELBASE,
139 				     mr_access_flags, e_pd,
140 				     &e_maxmr->ib.ib_mr.lkey,
141 				     &e_maxmr->ib.ib_mr.rkey);
142 		if (ret) {
143 			ehca_mr_delete(e_maxmr);
144 			ib_mr = ERR_PTR(ret);
145 			goto get_dma_mr_exit0;
146 		}
147 		ib_mr = &e_maxmr->ib.ib_mr;
148 	} else {
149 		ehca_err(&shca->ib_device, "no internal max-MR exists!");
150 		ib_mr = ERR_PTR(-EINVAL);
151 		goto get_dma_mr_exit0;
152 	}
153 
154 get_dma_mr_exit0:
155 	if (IS_ERR(ib_mr))
156 		ehca_err(&shca->ib_device, "h_ret=%li pd=%p mr_access_flags=%x",
157 			 PTR_ERR(ib_mr), pd, mr_access_flags);
158 	return ib_mr;
159 } /* end ehca_get_dma_mr() */
160 
161 /*----------------------------------------------------------------------*/
162 
163 struct ib_mr *ehca_reg_phys_mr(struct ib_pd *pd,
164 			       struct ib_phys_buf *phys_buf_array,
165 			       int num_phys_buf,
166 			       int mr_access_flags,
167 			       u64 *iova_start)
168 {
169 	struct ib_mr *ib_mr;
170 	int ret;
171 	struct ehca_mr *e_mr;
172 	struct ehca_shca *shca =
173 		container_of(pd->device, struct ehca_shca, ib_device);
174 	struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
175 
176 	u64 size;
177 
178 	if ((num_phys_buf <= 0) || !phys_buf_array) {
179 		ehca_err(pd->device, "bad input values: num_phys_buf=%x "
180 			 "phys_buf_array=%p", num_phys_buf, phys_buf_array);
181 		ib_mr = ERR_PTR(-EINVAL);
182 		goto reg_phys_mr_exit0;
183 	}
184 	if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
185 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
186 	    ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
187 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
188 		/*
189 		 * Remote Write Access requires Local Write Access
190 		 * Remote Atomic Access requires Local Write Access
191 		 */
192 		ehca_err(pd->device, "bad input values: mr_access_flags=%x",
193 			 mr_access_flags);
194 		ib_mr = ERR_PTR(-EINVAL);
195 		goto reg_phys_mr_exit0;
196 	}
197 
198 	/* check physical buffer list and calculate size */
199 	ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array, num_phys_buf,
200 					    iova_start, &size);
201 	if (ret) {
202 		ib_mr = ERR_PTR(ret);
203 		goto reg_phys_mr_exit0;
204 	}
205 	if ((size == 0) ||
206 	    (((u64)iova_start + size) < (u64)iova_start)) {
207 		ehca_err(pd->device, "bad input values: size=%llx iova_start=%p",
208 			 size, iova_start);
209 		ib_mr = ERR_PTR(-EINVAL);
210 		goto reg_phys_mr_exit0;
211 	}
212 
213 	e_mr = ehca_mr_new();
214 	if (!e_mr) {
215 		ehca_err(pd->device, "out of memory");
216 		ib_mr = ERR_PTR(-ENOMEM);
217 		goto reg_phys_mr_exit0;
218 	}
219 
220 	/* register MR on HCA */
221 	if (ehca_mr_is_maxmr(size, iova_start)) {
222 		e_mr->flags |= EHCA_MR_FLAG_MAXMR;
223 		ret = ehca_reg_maxmr(shca, e_mr, iova_start, mr_access_flags,
224 				     e_pd, &e_mr->ib.ib_mr.lkey,
225 				     &e_mr->ib.ib_mr.rkey);
226 		if (ret) {
227 			ib_mr = ERR_PTR(ret);
228 			goto reg_phys_mr_exit1;
229 		}
230 	} else {
231 		struct ehca_mr_pginfo pginfo;
232 		u32 num_kpages;
233 		u32 num_hwpages;
234 		u64 hw_pgsize;
235 
236 		num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size,
237 					PAGE_SIZE);
238 		/* for kernel space we try the largest possible pgsize */
239 		hw_pgsize = ehca_get_max_hwpage_size(shca);
240 		num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size,
241 					 hw_pgsize);
242 		memset(&pginfo, 0, sizeof(pginfo));
243 		pginfo.type = EHCA_MR_PGI_PHYS;
244 		pginfo.num_kpages = num_kpages;
245 		pginfo.hwpage_size = hw_pgsize;
246 		pginfo.num_hwpages = num_hwpages;
247 		pginfo.u.phy.num_phys_buf = num_phys_buf;
248 		pginfo.u.phy.phys_buf_array = phys_buf_array;
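		/*
		 * Offset of iova_start within its kernel page, in hw pages.
		 * Illustrative, assuming 64 KiB kernel pages and 4 KiB hw
		 * pages: an offset of 0x3000 gives next_hwpage = 3; once
		 * hw_pgsize >= PAGE_SIZE the result is always 0.
		 */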
249 		pginfo.next_hwpage =
250 			((u64)iova_start & ~PAGE_MASK) / hw_pgsize;
251 
252 		ret = ehca_reg_mr(shca, e_mr, iova_start, size, mr_access_flags,
253 				  e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
254 				  &e_mr->ib.ib_mr.rkey);
255 		if (ret) {
256 			ib_mr = ERR_PTR(ret);
257 			goto reg_phys_mr_exit1;
258 		}
259 	}
260 
261 	/* successful registration of all pages */
262 	return &e_mr->ib.ib_mr;
263 
264 reg_phys_mr_exit1:
265 	ehca_mr_delete(e_mr);
266 reg_phys_mr_exit0:
267 	if (IS_ERR(ib_mr))
268 		ehca_err(pd->device, "h_ret=%li pd=%p phys_buf_array=%p "
269 			 "num_phys_buf=%x mr_access_flags=%x iova_start=%p",
270 			 PTR_ERR(ib_mr), pd, phys_buf_array,
271 			 num_phys_buf, mr_access_flags, iova_start);
272 	return ib_mr;
273 } /* end ehca_reg_phys_mr() */
274 
275 /*----------------------------------------------------------------------*/
276 
277 struct ib_mr *ehca_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
278 			       u64 virt, int mr_access_flags,
279 			       struct ib_udata *udata)
280 {
281 	struct ib_mr *ib_mr;
282 	struct ehca_mr *e_mr;
283 	struct ehca_shca *shca =
284 		container_of(pd->device, struct ehca_shca, ib_device);
285 	struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
286 	struct ehca_mr_pginfo pginfo;
287 	int ret, page_shift;
288 	u32 num_kpages;
289 	u32 num_hwpages;
290 	u64 hwpage_size;
291 
292 	if (!pd) {
293 		ehca_gen_err("bad pd=%p", pd);
294 		return ERR_PTR(-EFAULT);
295 	}
296 
297 	if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
298 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
299 	    ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
300 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
301 		/*
302 		 * Remote Write Access requires Local Write Access
303 		 * Remote Atomic Access requires Local Write Access
304 		 */
305 		ehca_err(pd->device, "bad input values: mr_access_flags=%x",
306 			 mr_access_flags);
307 		ib_mr = ERR_PTR(-EINVAL);
308 		goto reg_user_mr_exit0;
309 	}
310 
311 	if (length == 0 || virt + length < virt) {
312 		ehca_err(pd->device, "bad input values: length=%llx "
313 			 "virt_base=%llx", length, virt);
314 		ib_mr = ERR_PTR(-EINVAL);
315 		goto reg_user_mr_exit0;
316 	}
317 
318 	e_mr = ehca_mr_new();
319 	if (!e_mr) {
320 		ehca_err(pd->device, "out of memory");
321 		ib_mr = ERR_PTR(-ENOMEM);
322 		goto reg_user_mr_exit0;
323 	}
324 
325 	e_mr->umem = ib_umem_get(pd->uobject->context, start, length,
326 				 mr_access_flags, 0);
327 	if (IS_ERR(e_mr->umem)) {
328 		ib_mr = ERR_CAST(e_mr->umem);
329 		goto reg_user_mr_exit1;
330 	}
331 
332 	if (e_mr->umem->page_size != PAGE_SIZE) {
333 		ehca_err(pd->device, "page size not supported, "
334 			 "e_mr->umem->page_size=%x", e_mr->umem->page_size);
335 		ib_mr = ERR_PTR(-EINVAL);
336 		goto reg_user_mr_exit2;
337 	}
338 
339 	/* determine number of MR pages */
340 	num_kpages = NUM_CHUNKS((virt % PAGE_SIZE) + length, PAGE_SIZE);
341 	/* select proper hw_pgsize */
342 	page_shift = PAGE_SHIFT;
343 	if (e_mr->umem->hugetlb) {
344 		/* determine page_shift, clamp between 4K and 16M */
345 		page_shift = (fls64(length - 1) + 3) & ~3;
346 		page_shift = min(max(page_shift, EHCA_MR_PGSHIFT4K),
347 				 EHCA_MR_PGSHIFT16M);
348 	}
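	/*
	 * Illustrative: for a 5 MiB hugetlb region, fls64(length - 1) = 23;
	 * rounding up to a multiple of 4 bits gives page_shift = 24, i.e.
	 * 16 MiB hw pages (kept within the 4K..16M clamp above).
	 */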
349 	hwpage_size = 1UL << page_shift;
350 
351 	/* now that we have the desired page size, shift until it's
352 	 * supported, too. 4K is always supported, so this terminates.
353 	 */
354 	while (!(hwpage_size & shca->hca_cap_mr_pgsize))
355 		hwpage_size >>= 4;
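	/*
	 * The shift above divides by 16, stepping through the supported
	 * sizes from the top, e.g. 16M -> 1M -> 64K -> 4K.
	 */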
356 
357 reg_user_mr_fallback:
358 	num_hwpages = NUM_CHUNKS((virt % hwpage_size) + length, hwpage_size);
359 	/* register MR on HCA */
360 	memset(&pginfo, 0, sizeof(pginfo));
361 	pginfo.type = EHCA_MR_PGI_USER;
362 	pginfo.hwpage_size = hwpage_size;
363 	pginfo.num_kpages = num_kpages;
364 	pginfo.num_hwpages = num_hwpages;
365 	pginfo.u.usr.region = e_mr->umem;
366 	pginfo.next_hwpage = e_mr->umem->offset / hwpage_size;
367 	pginfo.u.usr.next_chunk = list_prepare_entry(pginfo.u.usr.next_chunk,
368 						     (&e_mr->umem->chunk_list),
369 						     list);
370 
371 	ret = ehca_reg_mr(shca, e_mr, (u64 *)virt, length, mr_access_flags,
372 			  e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,
373 			  &e_mr->ib.ib_mr.rkey);
374 	if (ret == -EINVAL && pginfo.hwpage_size > PAGE_SIZE) {
375 		ehca_warn(pd->device, "failed to register mr "
376 			  "with hwpage_size=%llx", hwpage_size);
377 		ehca_info(pd->device, "try to register mr with "
378 			  "kpage_size=%lx", PAGE_SIZE);
379 		/*
380 		 * this means kpages are not contiguous for a hw page
381 		 * try kernel page size as fallback solution
382 		 */
383 		hwpage_size = PAGE_SIZE;
384 		goto reg_user_mr_fallback;
385 	}
386 	if (ret) {
387 		ib_mr = ERR_PTR(ret);
388 		goto reg_user_mr_exit2;
389 	}
390 
391 	/* successful registration of all pages */
392 	return &e_mr->ib.ib_mr;
393 
394 reg_user_mr_exit2:
395 	ib_umem_release(e_mr->umem);
396 reg_user_mr_exit1:
397 	ehca_mr_delete(e_mr);
398 reg_user_mr_exit0:
399 	if (IS_ERR(ib_mr))
400 		ehca_err(pd->device, "rc=%li pd=%p mr_access_flags=%x udata=%p",
401 			 PTR_ERR(ib_mr), pd, mr_access_flags, udata);
402 	return ib_mr;
403 } /* end ehca_reg_user_mr() */
404 
405 /*----------------------------------------------------------------------*/
406 
407 int ehca_rereg_phys_mr(struct ib_mr *mr,
408 		       int mr_rereg_mask,
409 		       struct ib_pd *pd,
410 		       struct ib_phys_buf *phys_buf_array,
411 		       int num_phys_buf,
412 		       int mr_access_flags,
413 		       u64 *iova_start)
414 {
415 	int ret;
416 
417 	struct ehca_shca *shca =
418 		container_of(mr->device, struct ehca_shca, ib_device);
419 	struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
420 	u64 new_size;
421 	u64 *new_start;
422 	u32 new_acl;
423 	struct ehca_pd *new_pd;
424 	u32 tmp_lkey, tmp_rkey;
425 	unsigned long sl_flags;
426 	u32 num_kpages = 0;
427 	u32 num_hwpages = 0;
428 	struct ehca_mr_pginfo pginfo;
429 
430 	if (!(mr_rereg_mask & IB_MR_REREG_TRANS)) {
431 		/* TODO not supported, because PHYP rereg hCall needs pages */
432 		ehca_err(mr->device, "rereg without IB_MR_REREG_TRANS not "
433 			 "supported yet, mr_rereg_mask=%x", mr_rereg_mask);
434 		ret = -EINVAL;
435 		goto rereg_phys_mr_exit0;
436 	}
437 
438 	if (mr_rereg_mask & IB_MR_REREG_PD) {
439 		if (!pd) {
440 			ehca_err(mr->device, "rereg with bad pd, pd=%p "
441 				 "mr_rereg_mask=%x", pd, mr_rereg_mask);
442 			ret = -EINVAL;
443 			goto rereg_phys_mr_exit0;
444 		}
445 	}
446 
447 	if ((mr_rereg_mask &
448 	     ~(IB_MR_REREG_TRANS | IB_MR_REREG_PD | IB_MR_REREG_ACCESS)) ||
449 	    (mr_rereg_mask == 0)) {
450 		ret = -EINVAL;
451 		goto rereg_phys_mr_exit0;
452 	}
453 
454 	/* check other parameters */
455 	if (e_mr == shca->maxmr) {
456 		/* should be impossible, but reject to be sure */
457 		ehca_err(mr->device, "rereg internal max-MR impossible, mr=%p "
458 			 "shca->maxmr=%p mr->lkey=%x",
459 			 mr, shca->maxmr, mr->lkey);
460 		ret = -EINVAL;
461 		goto rereg_phys_mr_exit0;
462 	}
463 	if (mr_rereg_mask & IB_MR_REREG_TRANS) { /* transl., i.e. addr/size */
464 		if (e_mr->flags & EHCA_MR_FLAG_FMR) {
465 			ehca_err(mr->device, "not supported for FMR, mr=%p "
466 				 "flags=%x", mr, e_mr->flags);
467 			ret = -EINVAL;
468 			goto rereg_phys_mr_exit0;
469 		}
470 		if (!phys_buf_array || num_phys_buf <= 0) {
471 			ehca_err(mr->device, "bad input values mr_rereg_mask=%x"
472 				 " phys_buf_array=%p num_phys_buf=%x",
473 				 mr_rereg_mask, phys_buf_array, num_phys_buf);
474 			ret = -EINVAL;
475 			goto rereg_phys_mr_exit0;
476 		}
477 	}
478 	if ((mr_rereg_mask & IB_MR_REREG_ACCESS) &&	/* change ACL */
479 	    (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
480 	      !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
481 	     ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
482 	      !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)))) {
483 		/*
484 		 * Remote Write Access requires Local Write Access
485 		 * Remote Atomic Access requires Local Write Access
486 		 */
487 		ehca_err(mr->device, "bad input values: mr_rereg_mask=%x "
488 			 "mr_access_flags=%x", mr_rereg_mask, mr_access_flags);
489 		ret = -EINVAL;
490 		goto rereg_phys_mr_exit0;
491 	}
492 
493 	/* set requested values dependent on rereg request */
494 	spin_lock_irqsave(&e_mr->mrlock, sl_flags);
495 	new_start = e_mr->start;
496 	new_size = e_mr->size;
497 	new_acl = e_mr->acl;
498 	new_pd = container_of(mr->pd, struct ehca_pd, ib_pd);
499 
500 	if (mr_rereg_mask & IB_MR_REREG_TRANS) {
501 		u64 hw_pgsize = ehca_get_max_hwpage_size(shca);
502 
503 		new_start = iova_start;	/* change address */
504 		/* check physical buffer list and calculate size */
505 		ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array,
506 						    num_phys_buf, iova_start,
507 						    &new_size);
508 		if (ret)
509 			goto rereg_phys_mr_exit1;
510 		if ((new_size == 0) ||
511 		    (((u64)iova_start + new_size) < (u64)iova_start)) {
512 			ehca_err(mr->device, "bad input values: new_size=%llx "
513 				 "iova_start=%p", new_size, iova_start);
514 			ret = -EINVAL;
515 			goto rereg_phys_mr_exit1;
516 		}
517 		num_kpages = NUM_CHUNKS(((u64)new_start % PAGE_SIZE) +
518 					new_size, PAGE_SIZE);
519 		num_hwpages = NUM_CHUNKS(((u64)new_start % hw_pgsize) +
520 					 new_size, hw_pgsize);
521 		memset(&pginfo, 0, sizeof(pginfo));
522 		pginfo.type = EHCA_MR_PGI_PHYS;
523 		pginfo.num_kpages = num_kpages;
524 		pginfo.hwpage_size = hw_pgsize;
525 		pginfo.num_hwpages = num_hwpages;
526 		pginfo.u.phy.num_phys_buf = num_phys_buf;
527 		pginfo.u.phy.phys_buf_array = phys_buf_array;
528 		pginfo.next_hwpage =
529 			((u64)iova_start & ~PAGE_MASK) / hw_pgsize;
530 	}
531 	if (mr_rereg_mask & IB_MR_REREG_ACCESS)
532 		new_acl = mr_access_flags;
533 	if (mr_rereg_mask & IB_MR_REREG_PD)
534 		new_pd = container_of(pd, struct ehca_pd, ib_pd);
535 
536 	ret = ehca_rereg_mr(shca, e_mr, new_start, new_size, new_acl,
537 			    new_pd, &pginfo, &tmp_lkey, &tmp_rkey);
538 	if (ret)
539 		goto rereg_phys_mr_exit1;
540 
541 	/* successful reregistration */
542 	if (mr_rereg_mask & IB_MR_REREG_PD)
543 		mr->pd = pd;
544 	mr->lkey = tmp_lkey;
545 	mr->rkey = tmp_rkey;
546 
547 rereg_phys_mr_exit1:
548 	spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
549 rereg_phys_mr_exit0:
550 	if (ret)
551 		ehca_err(mr->device, "ret=%i mr=%p mr_rereg_mask=%x pd=%p "
552 			 "phys_buf_array=%p num_phys_buf=%x mr_access_flags=%x "
553 			 "iova_start=%p",
554 			 ret, mr, mr_rereg_mask, pd, phys_buf_array,
555 			 num_phys_buf, mr_access_flags, iova_start);
556 	return ret;
557 } /* end ehca_rereg_phys_mr() */
558 
559 /*----------------------------------------------------------------------*/
560 
561 int ehca_query_mr(struct ib_mr *mr, struct ib_mr_attr *mr_attr)
562 {
563 	int ret = 0;
564 	u64 h_ret;
565 	struct ehca_shca *shca =
566 		container_of(mr->device, struct ehca_shca, ib_device);
567 	struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
568 	unsigned long sl_flags;
569 	struct ehca_mr_hipzout_parms hipzout;
570 
571 	if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
572 		ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
573 			 "e_mr->flags=%x", mr, e_mr, e_mr->flags);
574 		ret = -EINVAL;
575 		goto query_mr_exit0;
576 	}
577 
578 	memset(mr_attr, 0, sizeof(struct ib_mr_attr));
579 	spin_lock_irqsave(&e_mr->mrlock, sl_flags);
580 
581 	h_ret = hipz_h_query_mr(shca->ipz_hca_handle, e_mr, &hipzout);
582 	if (h_ret != H_SUCCESS) {
583 		ehca_err(mr->device, "hipz_mr_query failed, h_ret=%lli mr=%p "
584 			 "hca_hndl=%llx mr_hndl=%llx lkey=%x",
585 			 h_ret, mr, shca->ipz_hca_handle.handle,
586 			 e_mr->ipz_mr_handle.handle, mr->lkey);
587 		ret = ehca2ib_return_code(h_ret);
588 		goto query_mr_exit1;
589 	}
590 	mr_attr->pd = mr->pd;
591 	mr_attr->device_virt_addr = hipzout.vaddr;
592 	mr_attr->size = hipzout.len;
593 	mr_attr->lkey = hipzout.lkey;
594 	mr_attr->rkey = hipzout.rkey;
595 	ehca_mrmw_reverse_map_acl(&hipzout.acl, &mr_attr->mr_access_flags);
596 
597 query_mr_exit1:
598 	spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);
599 query_mr_exit0:
600 	if (ret)
601 		ehca_err(mr->device, "ret=%i mr=%p mr_attr=%p",
602 			 ret, mr, mr_attr);
603 	return ret;
604 } /* end ehca_query_mr() */
605 
606 /*----------------------------------------------------------------------*/
607 
608 int ehca_dereg_mr(struct ib_mr *mr)
609 {
610 	int ret = 0;
611 	u64 h_ret;
612 	struct ehca_shca *shca =
613 		container_of(mr->device, struct ehca_shca, ib_device);
614 	struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);
615 
616 	if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {
617 		ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "
618 			 "e_mr->flags=%x", mr, e_mr, e_mr->flags);
619 		ret = -EINVAL;
620 		goto dereg_mr_exit0;
621 	} else if (e_mr == shca->maxmr) {
622 		/* should be impossible, but reject to be sure */
623 		ehca_err(mr->device, "dereg internal max-MR impossible, mr=%p "
624 			 "shca->maxmr=%p mr->lkey=%x",
625 			 mr, shca->maxmr, mr->lkey);
626 		ret = -EINVAL;
627 		goto dereg_mr_exit0;
628 	}
629 
630 	/* TODO: BUSY: MR still has bound window(s) */
631 	h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
632 	if (h_ret != H_SUCCESS) {
633 		ehca_err(mr->device, "hipz_free_mr failed, h_ret=%lli shca=%p "
634 			 "e_mr=%p hca_hndl=%llx mr_hndl=%llx mr->lkey=%x",
635 			 h_ret, shca, e_mr, shca->ipz_hca_handle.handle,
636 			 e_mr->ipz_mr_handle.handle, mr->lkey);
637 		ret = ehca2ib_return_code(h_ret);
638 		goto dereg_mr_exit0;
639 	}
640 
641 	if (e_mr->umem)
642 		ib_umem_release(e_mr->umem);
643 
644 	/* successful deregistration */
645 	ehca_mr_delete(e_mr);
646 
647 dereg_mr_exit0:
648 	if (ret)
649 		ehca_err(mr->device, "ret=%i mr=%p", ret, mr);
650 	return ret;
651 } /* end ehca_dereg_mr() */
652 
653 /*----------------------------------------------------------------------*/
654 
655 struct ib_mw *ehca_alloc_mw(struct ib_pd *pd)
656 {
657 	struct ib_mw *ib_mw;
658 	u64 h_ret;
659 	struct ehca_mw *e_mw;
660 	struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
661 	struct ehca_shca *shca =
662 		container_of(pd->device, struct ehca_shca, ib_device);
663 	struct ehca_mw_hipzout_parms hipzout;
664 
665 	e_mw = ehca_mw_new();
666 	if (!e_mw) {
667 		ib_mw = ERR_PTR(-ENOMEM);
668 		goto alloc_mw_exit0;
669 	}
670 
671 	h_ret = hipz_h_alloc_resource_mw(shca->ipz_hca_handle, e_mw,
672 					 e_pd->fw_pd, &hipzout);
673 	if (h_ret != H_SUCCESS) {
674 		ehca_err(pd->device, "hipz_mw_allocate failed, h_ret=%lli "
675 			 "shca=%p hca_hndl=%llx mw=%p",
676 			 h_ret, shca, shca->ipz_hca_handle.handle, e_mw);
677 		ib_mw = ERR_PTR(ehca2ib_return_code(h_ret));
678 		goto alloc_mw_exit1;
679 	}
680 	/* successful MW allocation */
681 	e_mw->ipz_mw_handle = hipzout.handle;
682 	e_mw->ib_mw.rkey    = hipzout.rkey;
683 	return &e_mw->ib_mw;
684 
685 alloc_mw_exit1:
686 	ehca_mw_delete(e_mw);
687 alloc_mw_exit0:
688 	if (IS_ERR(ib_mw))
689 		ehca_err(pd->device, "h_ret=%li pd=%p", PTR_ERR(ib_mw), pd);
690 	return ib_mw;
691 } /* end ehca_alloc_mw() */
692 
693 /*----------------------------------------------------------------------*/
694 
695 int ehca_bind_mw(struct ib_qp *qp,
696 		 struct ib_mw *mw,
697 		 struct ib_mw_bind *mw_bind)
698 {
699 	/* TODO: not supported up to now */
700 	ehca_gen_err("bind MW currently not supported by HCAD");
701 
702 	return -EPERM;
703 } /* end ehca_bind_mw() */
704 
705 /*----------------------------------------------------------------------*/
706 
707 int ehca_dealloc_mw(struct ib_mw *mw)
708 {
709 	u64 h_ret;
710 	struct ehca_shca *shca =
711 		container_of(mw->device, struct ehca_shca, ib_device);
712 	struct ehca_mw *e_mw = container_of(mw, struct ehca_mw, ib_mw);
713 
714 	h_ret = hipz_h_free_resource_mw(shca->ipz_hca_handle, e_mw);
715 	if (h_ret != H_SUCCESS) {
716 		ehca_err(mw->device, "hipz_free_mw failed, h_ret=%lli shca=%p "
717 			 "mw=%p rkey=%x hca_hndl=%llx mw_hndl=%llx",
718 			 h_ret, shca, mw, mw->rkey, shca->ipz_hca_handle.handle,
719 			 e_mw->ipz_mw_handle.handle);
720 		return ehca2ib_return_code(h_ret);
721 	}
722 	/* successful deallocation */
723 	ehca_mw_delete(e_mw);
724 	return 0;
725 } /* end ehca_dealloc_mw() */
726 
727 /*----------------------------------------------------------------------*/
728 
729 struct ib_fmr *ehca_alloc_fmr(struct ib_pd *pd,
730 			      int mr_access_flags,
731 			      struct ib_fmr_attr *fmr_attr)
732 {
733 	struct ib_fmr *ib_fmr;
734 	struct ehca_shca *shca =
735 		container_of(pd->device, struct ehca_shca, ib_device);
736 	struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);
737 	struct ehca_mr *e_fmr;
738 	int ret;
739 	u32 tmp_lkey, tmp_rkey;
740 	struct ehca_mr_pginfo pginfo;
741 	u64 hw_pgsize;
742 
743 	/* check other parameters */
744 	if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&
745 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||
746 	    ((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&
747 	     !(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {
748 		/*
749 		 * Remote Write Access requires Local Write Access
750 		 * Remote Atomic Access requires Local Write Access
751 		 */
752 		ehca_err(pd->device, "bad input values: mr_access_flags=%x",
753 			 mr_access_flags);
754 		ib_fmr = ERR_PTR(-EINVAL);
755 		goto alloc_fmr_exit0;
756 	}
757 	if (mr_access_flags & IB_ACCESS_MW_BIND) {
758 		ehca_err(pd->device, "bad input values: mr_access_flags=%x",
759 			 mr_access_flags);
760 		ib_fmr = ERR_PTR(-EINVAL);
761 		goto alloc_fmr_exit0;
762 	}
763 	if ((fmr_attr->max_pages == 0) || (fmr_attr->max_maps == 0)) {
764 		ehca_err(pd->device, "bad input values: fmr_attr->max_pages=%x "
765 			 "fmr_attr->max_maps=%x fmr_attr->page_shift=%x",
766 			 fmr_attr->max_pages, fmr_attr->max_maps,
767 			 fmr_attr->page_shift);
768 		ib_fmr = ERR_PTR(-EINVAL);
769 		goto alloc_fmr_exit0;
770 	}
771 
772 	hw_pgsize = 1 << fmr_attr->page_shift;
773 	if (!(hw_pgsize & shca->hca_cap_mr_pgsize)) {
774 		ehca_err(pd->device, "unsupported fmr_attr->page_shift=%x",
775 			 fmr_attr->page_shift);
776 		ib_fmr = ERR_PTR(-EINVAL);
777 		goto alloc_fmr_exit0;
778 	}
779 
780 	e_fmr = ehca_mr_new();
781 	if (!e_fmr) {
782 		ib_fmr = ERR_PTR(-ENOMEM);
783 		goto alloc_fmr_exit0;
784 	}
785 	e_fmr->flags |= EHCA_MR_FLAG_FMR;
786 
787 	/* register MR on HCA */
788 	memset(&pginfo, 0, sizeof(pginfo));
789 	pginfo.hwpage_size = hw_pgsize;
790 	/*
791 	 * pginfo.num_hwpages == 0, i.e. register_rpages() will not be called
792 	 * here but deferred to map_phys_fmr()
793 	 */
794 	ret = ehca_reg_mr(shca, e_fmr, NULL,
795 			  fmr_attr->max_pages * (1 << fmr_attr->page_shift),
796 			  mr_access_flags, e_pd, &pginfo,
797 			  &tmp_lkey, &tmp_rkey);
798 	if (ret) {
799 		ib_fmr = ERR_PTR(ret);
800 		goto alloc_fmr_exit1;
801 	}
802 
803 	/* successful */
804 	e_fmr->hwpage_size = hw_pgsize;
805 	e_fmr->fmr_page_size = 1 << fmr_attr->page_shift;
806 	e_fmr->fmr_max_pages = fmr_attr->max_pages;
807 	e_fmr->fmr_max_maps = fmr_attr->max_maps;
808 	e_fmr->fmr_map_cnt = 0;
809 	return &e_fmr->ib.ib_fmr;
810 
811 alloc_fmr_exit1:
812 	ehca_mr_delete(e_fmr);
813 alloc_fmr_exit0:
814 	return ib_fmr;
815 } /* end ehca_alloc_fmr() */
816 
817 /*----------------------------------------------------------------------*/
818 
819 int ehca_map_phys_fmr(struct ib_fmr *fmr,
820 		      u64 *page_list,
821 		      int list_len,
822 		      u64 iova)
823 {
824 	int ret;
825 	struct ehca_shca *shca =
826 		container_of(fmr->device, struct ehca_shca, ib_device);
827 	struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
828 	struct ehca_pd *e_pd = container_of(fmr->pd, struct ehca_pd, ib_pd);
829 	struct ehca_mr_pginfo pginfo;
830 	u32 tmp_lkey, tmp_rkey;
831 
832 	if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
833 		ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
834 			 e_fmr, e_fmr->flags);
835 		ret = -EINVAL;
836 		goto map_phys_fmr_exit0;
837 	}
838 	ret = ehca_fmr_check_page_list(e_fmr, page_list, list_len);
839 	if (ret)
840 		goto map_phys_fmr_exit0;
841 	if (iova % e_fmr->fmr_page_size) {
842 		/* iova must be aligned to the FMR page size */
843 		ehca_err(fmr->device, "bad iova, iova=%llx fmr_page_size=%x",
844 			 iova, e_fmr->fmr_page_size);
845 		ret = -EINVAL;
846 		goto map_phys_fmr_exit0;
847 	}
848 	if (e_fmr->fmr_map_cnt >= e_fmr->fmr_max_maps) {
849 		/* HCAD does not limit the maps; trace this anyway */
850 		ehca_info(fmr->device, "map limit exceeded, fmr=%p "
851 			  "e_fmr->fmr_map_cnt=%x e_fmr->fmr_max_maps=%x",
852 			  fmr, e_fmr->fmr_map_cnt, e_fmr->fmr_max_maps);
853 	}
854 
855 	memset(&pginfo, 0, sizeof(pginfo));
856 	pginfo.type = EHCA_MR_PGI_FMR;
857 	pginfo.num_kpages = list_len;
858 	pginfo.hwpage_size = e_fmr->hwpage_size;
859 	pginfo.num_hwpages =
860 		list_len * e_fmr->fmr_page_size / pginfo.hwpage_size;
861 	pginfo.u.fmr.page_list = page_list;
862 	pginfo.next_hwpage =
863 		(iova & (e_fmr->fmr_page_size-1)) / pginfo.hwpage_size;
864 	pginfo.u.fmr.fmr_pgsize = e_fmr->fmr_page_size;
865 
866 	ret = ehca_rereg_mr(shca, e_fmr, (u64 *)iova,
867 			    list_len * e_fmr->fmr_page_size,
868 			    e_fmr->acl, e_pd, &pginfo, &tmp_lkey, &tmp_rkey);
869 	if (ret)
870 		goto map_phys_fmr_exit0;
871 
872 	/* successful reregistration */
873 	e_fmr->fmr_map_cnt++;
874 	e_fmr->ib.ib_fmr.lkey = tmp_lkey;
875 	e_fmr->ib.ib_fmr.rkey = tmp_rkey;
876 	return 0;
877 
878 map_phys_fmr_exit0:
879 	if (ret)
880 		ehca_err(fmr->device, "ret=%i fmr=%p page_list=%p list_len=%x "
881 			 "iova=%llx", ret, fmr, page_list, list_len, iova);
882 	return ret;
883 } /* end ehca_map_phys_fmr() */
884 
885 /*----------------------------------------------------------------------*/
886 
887 int ehca_unmap_fmr(struct list_head *fmr_list)
888 {
889 	int ret = 0;
890 	struct ib_fmr *ib_fmr;
891 	struct ehca_shca *shca = NULL;
892 	struct ehca_shca *prev_shca;
893 	struct ehca_mr *e_fmr;
894 	u32 num_fmr = 0;
895 	u32 unmap_fmr_cnt = 0;
896 
897 	/* check that all FMRs belong to the same SHCA, and check the internal flag */
898 	list_for_each_entry(ib_fmr, fmr_list, list) {
899 		prev_shca = shca;
900 		if (!ib_fmr) {
901 			ehca_gen_err("bad fmr=%p in list", ib_fmr);
902 			ret = -EINVAL;
903 			goto unmap_fmr_exit0;
904 		}
905 		shca = container_of(ib_fmr->device, struct ehca_shca,
906 				    ib_device);
907 		e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
908 		if ((shca != prev_shca) && prev_shca) {
909 			ehca_err(&shca->ib_device, "SHCA mismatch, shca=%p "
910 				 "prev_shca=%p e_fmr=%p",
911 				 shca, prev_shca, e_fmr);
912 			ret = -EINVAL;
913 			goto unmap_fmr_exit0;
914 		}
915 		if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
916 			ehca_err(&shca->ib_device, "not a FMR, e_fmr=%p "
917 				 "e_fmr->flags=%x", e_fmr, e_fmr->flags);
918 			ret = -EINVAL;
919 			goto unmap_fmr_exit0;
920 		}
921 		num_fmr++;
922 	}
923 
924 	/* loop over all FMRs to unmap */
925 	list_for_each_entry(ib_fmr, fmr_list, list) {
926 		unmap_fmr_cnt++;
927 		e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);
928 		shca = container_of(ib_fmr->device, struct ehca_shca,
929 				    ib_device);
930 		ret = ehca_unmap_one_fmr(shca, e_fmr);
931 		if (ret) {
932 			/* unmap failed, stop unmapping of rest of FMRs */
933 			ehca_err(&shca->ib_device, "unmap of one FMR failed, "
934 				 "stop rest, e_fmr=%p num_fmr=%x "
935 				 "unmap_fmr_cnt=%x lkey=%x", e_fmr, num_fmr,
936 				 unmap_fmr_cnt, e_fmr->ib.ib_fmr.lkey);
937 			goto unmap_fmr_exit0;
938 		}
939 	}
940 
941 unmap_fmr_exit0:
942 	if (ret)
943 		ehca_gen_err("ret=%i fmr_list=%p num_fmr=%x unmap_fmr_cnt=%x",
944 			     ret, fmr_list, num_fmr, unmap_fmr_cnt);
945 	return ret;
946 } /* end ehca_unmap_fmr() */
947 
948 /*----------------------------------------------------------------------*/
949 
950 int ehca_dealloc_fmr(struct ib_fmr *fmr)
951 {
952 	int ret;
953 	u64 h_ret;
954 	struct ehca_shca *shca =
955 		container_of(fmr->device, struct ehca_shca, ib_device);
956 	struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);
957 
958 	if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {
959 		ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",
960 			 e_fmr, e_fmr->flags);
961 		ret = -EINVAL;
962 		goto free_fmr_exit0;
963 	}
964 
965 	h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
966 	if (h_ret != H_SUCCESS) {
967 		ehca_err(fmr->device, "hipz_free_mr failed, h_ret=%lli e_fmr=%p "
968 			 "hca_hndl=%llx fmr_hndl=%llx fmr->lkey=%x",
969 			 h_ret, e_fmr, shca->ipz_hca_handle.handle,
970 			 e_fmr->ipz_mr_handle.handle, fmr->lkey);
971 		ret = ehca2ib_return_code(h_ret);
972 		goto free_fmr_exit0;
973 	}
974 	/* successful deregistration */
975 	ehca_mr_delete(e_fmr);
976 	return 0;
977 
978 free_fmr_exit0:
979 	if (ret)
980 		ehca_err(&shca->ib_device, "ret=%i fmr=%p", ret, fmr);
981 	return ret;
982 } /* end ehca_dealloc_fmr() */
983 
984 /*----------------------------------------------------------------------*/
985 
986 int ehca_reg_mr(struct ehca_shca *shca,
987 		struct ehca_mr *e_mr,
988 		u64 *iova_start,
989 		u64 size,
990 		int acl,
991 		struct ehca_pd *e_pd,
992 		struct ehca_mr_pginfo *pginfo,
993 		u32 *lkey, /*OUT*/
994 		u32 *rkey) /*OUT*/
995 {
996 	int ret;
997 	u64 h_ret;
998 	u32 hipz_acl;
999 	struct ehca_mr_hipzout_parms hipzout;
1000 
1001 	ehca_mrmw_map_acl(acl, &hipz_acl);
1002 	ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
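	/*
	 * Bit 0 of the ACL presumably requests a "high performance" MR when
	 * the ehca_use_hp_mr module option is set (assumption).
	 */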
1003 	if (ehca_use_hp_mr == 1)
1004 		hipz_acl |= 0x00000001;
1005 
1006 	h_ret = hipz_h_alloc_resource_mr(shca->ipz_hca_handle, e_mr,
1007 					 (u64)iova_start, size, hipz_acl,
1008 					 e_pd->fw_pd, &hipzout);
1009 	if (h_ret != H_SUCCESS) {
1010 		ehca_err(&shca->ib_device, "hipz_alloc_mr failed, h_ret=%lli "
1011 			 "hca_hndl=%llx", h_ret, shca->ipz_hca_handle.handle);
1012 		ret = ehca2ib_return_code(h_ret);
1013 		goto ehca_reg_mr_exit0;
1014 	}
1015 
1016 	e_mr->ipz_mr_handle = hipzout.handle;
1017 
1018 	ret = ehca_reg_mr_rpages(shca, e_mr, pginfo);
1019 	if (ret)
1020 		goto ehca_reg_mr_exit1;
1021 
1022 	/* successful registration */
1023 	e_mr->num_kpages = pginfo->num_kpages;
1024 	e_mr->num_hwpages = pginfo->num_hwpages;
1025 	e_mr->hwpage_size = pginfo->hwpage_size;
1026 	e_mr->start = iova_start;
1027 	e_mr->size = size;
1028 	e_mr->acl = acl;
1029 	*lkey = hipzout.lkey;
1030 	*rkey = hipzout.rkey;
1031 	return 0;
1032 
1033 ehca_reg_mr_exit1:
1034 	h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
1035 	if (h_ret != H_SUCCESS) {
1036 		ehca_err(&shca->ib_device, "h_ret=%lli shca=%p e_mr=%p "
1037 			 "iova_start=%p size=%llx acl=%x e_pd=%p lkey=%x "
1038 			 "pginfo=%p num_kpages=%llx num_hwpages=%llx ret=%i",
1039 			 h_ret, shca, e_mr, iova_start, size, acl, e_pd,
1040 			 hipzout.lkey, pginfo, pginfo->num_kpages,
1041 			 pginfo->num_hwpages, ret);
1042 		ehca_err(&shca->ib_device, "internal error in ehca_reg_mr, "
1043 			 "not recoverable");
1044 	}
1045 ehca_reg_mr_exit0:
1046 	if (ret)
1047 		ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "
1048 			 "iova_start=%p size=%llx acl=%x e_pd=%p pginfo=%p "
1049 			 "num_kpages=%llx num_hwpages=%llx",
1050 			 ret, shca, e_mr, iova_start, size, acl, e_pd, pginfo,
1051 			 pginfo->num_kpages, pginfo->num_hwpages);
1052 	return ret;
1053 } /* end ehca_reg_mr() */
1054 
1055 /*----------------------------------------------------------------------*/
1056 
1057 int ehca_reg_mr_rpages(struct ehca_shca *shca,
1058 		       struct ehca_mr *e_mr,
1059 		       struct ehca_mr_pginfo *pginfo)
1060 {
1061 	int ret = 0;
1062 	u64 h_ret;
1063 	u32 rnum;
1064 	u64 rpage;
1065 	u32 i;
1066 	u64 *kpage;
1067 
1068 	if (!pginfo->num_hwpages) /* in case of fmr */
1069 		return 0;
1070 
1071 	kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
1072 	if (!kpage) {
1073 		ehca_err(&shca->ib_device, "kpage alloc failed");
1074 		ret = -ENOMEM;
1075 		goto ehca_reg_mr_rpages_exit0;
1076 	}
1077 
1078 	/* at most MAX_RPAGES ehca MR pages per register call */
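	/*
	 * Illustrative: 1000 hw pages go out as NUM_CHUNKS(1000, 512) = 2
	 * hcalls, the first with rnum = 512 and the last with
	 * rnum = 1000 % 512 = 488.
	 */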
1079 	for (i = 0; i < NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES); i++) {
1080 
1081 		if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
1082 			rnum = pginfo->num_hwpages % MAX_RPAGES; /* last shot */
1083 			if (rnum == 0)
1084 				rnum = MAX_RPAGES;      /* last shot is full */
1085 		} else
1086 			rnum = MAX_RPAGES;
1087 
1088 		ret = ehca_set_pagebuf(pginfo, rnum, kpage);
1089 		if (ret) {
1090 			ehca_err(&shca->ib_device, "ehca_set_pagebuf "
1091 				 "bad rc, ret=%i rnum=%x kpage=%p",
1092 				 ret, rnum, kpage);
1093 			goto ehca_reg_mr_rpages_exit1;
1094 		}
1095 
1096 		if (rnum > 1) {
1097 			rpage = virt_to_abs(kpage);
1098 			if (!rpage) {
1099 				ehca_err(&shca->ib_device, "kpage=%p i=%x",
1100 					 kpage, i);
1101 				ret = -EFAULT;
1102 				goto ehca_reg_mr_rpages_exit1;
1103 			}
1104 		} else
1105 			rpage = *kpage;
1106 
1107 		h_ret = hipz_h_register_rpage_mr(
1108 			shca->ipz_hca_handle, e_mr,
1109 			ehca_encode_hwpage_size(pginfo->hwpage_size),
1110 			0, rpage, rnum);
1111 
1112 		if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {
1113 			/*
1114 			 * check for 'registration complete'==H_SUCCESS
1115 			 * and for 'page registered'==H_PAGE_REGISTERED
1116 			 */
1117 			if (h_ret != H_SUCCESS) {
1118 				ehca_err(&shca->ib_device, "last "
1119 					 "hipz_reg_rpage_mr failed, h_ret=%lli "
1120 					 "e_mr=%p i=%x hca_hndl=%llx mr_hndl=%llx"
1121 					 " lkey=%x", h_ret, e_mr, i,
1122 					 shca->ipz_hca_handle.handle,
1123 					 e_mr->ipz_mr_handle.handle,
1124 					 e_mr->ib.ib_mr.lkey);
1125 				ret = ehca2ib_return_code(h_ret);
1126 				break;
1127 			} else
1128 				ret = 0;
1129 		} else if (h_ret != H_PAGE_REGISTERED) {
1130 			ehca_err(&shca->ib_device, "hipz_reg_rpage_mr failed, "
1131 				 "h_ret=%lli e_mr=%p i=%x lkey=%x hca_hndl=%llx "
1132 				 "mr_hndl=%llx", h_ret, e_mr, i,
1133 				 e_mr->ib.ib_mr.lkey,
1134 				 shca->ipz_hca_handle.handle,
1135 				 e_mr->ipz_mr_handle.handle);
1136 			ret = ehca2ib_return_code(h_ret);
1137 			break;
1138 		} else
1139 			ret = 0;
1140 	} /* end for(i) */
1141 
1142 
1143 ehca_reg_mr_rpages_exit1:
1144 	ehca_free_fw_ctrlblock(kpage);
1145 ehca_reg_mr_rpages_exit0:
1146 	if (ret)
1147 		ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p pginfo=%p "
1148 			 "num_kpages=%llx num_hwpages=%llx", ret, shca, e_mr,
1149 			 pginfo, pginfo->num_kpages, pginfo->num_hwpages);
1150 	return ret;
1151 } /* end ehca_reg_mr_rpages() */
1152 
1153 /*----------------------------------------------------------------------*/
1154 
1155 inline int ehca_rereg_mr_rereg1(struct ehca_shca *shca,
1156 				struct ehca_mr *e_mr,
1157 				u64 *iova_start,
1158 				u64 size,
1159 				u32 acl,
1160 				struct ehca_pd *e_pd,
1161 				struct ehca_mr_pginfo *pginfo,
1162 				u32 *lkey, /*OUT*/
1163 				u32 *rkey) /*OUT*/
1164 {
1165 	int ret;
1166 	u64 h_ret;
1167 	u32 hipz_acl;
1168 	u64 *kpage;
1169 	u64 rpage;
1170 	struct ehca_mr_pginfo pginfo_save;
1171 	struct ehca_mr_hipzout_parms hipzout;
1172 
1173 	ehca_mrmw_map_acl(acl, &hipz_acl);
1174 	ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);
1175 
1176 	kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
1177 	if (!kpage) {
1178 		ehca_err(&shca->ib_device, "kpage alloc failed");
1179 		ret = -ENOMEM;
1180 		goto ehca_rereg_mr_rereg1_exit0;
1181 	}
1182 
1183 	pginfo_save = *pginfo;
1184 	ret = ehca_set_pagebuf(pginfo, pginfo->num_hwpages, kpage);
1185 	if (ret) {
1186 		ehca_err(&shca->ib_device, "set pagebuf failed, e_mr=%p "
1187 			 "pginfo=%p type=%x num_kpages=%llx num_hwpages=%llx "
1188 			 "kpage=%p", e_mr, pginfo, pginfo->type,
1189 			 pginfo->num_kpages, pginfo->num_hwpages, kpage);
1190 		goto ehca_rereg_mr_rereg1_exit1;
1191 	}
1192 	rpage = virt_to_abs(kpage);
1193 	if (!rpage) {
1194 		ehca_err(&shca->ib_device, "kpage=%p", kpage);
1195 		ret = -EFAULT;
1196 		goto ehca_rereg_mr_rereg1_exit1;
1197 	}
1198 	h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_mr,
1199 				      (u64)iova_start, size, hipz_acl,
1200 				      e_pd->fw_pd, rpage, &hipzout);
1201 	if (h_ret != H_SUCCESS) {
1202 		/*
1203 		 * reregistration unsuccessful, try it again with the 3 hCalls,
1204 		 * e.g. this is required in case H_MR_CONDITION
1205 		 * (MW bound or MR is shared)
1206 		 */
1207 		ehca_warn(&shca->ib_device, "hipz_h_reregister_pmr failed "
1208 			  "(Rereg1), h_ret=%lli e_mr=%p", h_ret, e_mr);
1209 		*pginfo = pginfo_save;
1210 		ret = -EAGAIN;
1211 	} else if ((u64 *)hipzout.vaddr != iova_start) {
1212 		ehca_err(&shca->ib_device, "PHYP changed iova_start in "
1213 			 "rereg_pmr, iova_start=%p iova_start_out=%llx e_mr=%p "
1214 			 "mr_handle=%llx lkey=%x lkey_out=%x", iova_start,
1215 			 hipzout.vaddr, e_mr, e_mr->ipz_mr_handle.handle,
1216 			 e_mr->ib.ib_mr.lkey, hipzout.lkey);
1217 		ret = -EFAULT;
1218 	} else {
1219 		/*
1220 		 * successful reregistration
1221 		 * note: start and start_out are identical for eServer HCAs
1222 		 */
1223 		e_mr->num_kpages = pginfo->num_kpages;
1224 		e_mr->num_hwpages = pginfo->num_hwpages;
1225 		e_mr->hwpage_size = pginfo->hwpage_size;
1226 		e_mr->start = iova_start;
1227 		e_mr->size = size;
1228 		e_mr->acl = acl;
1229 		*lkey = hipzout.lkey;
1230 		*rkey = hipzout.rkey;
1231 	}
1232 
1233 ehca_rereg_mr_rereg1_exit1:
1234 	ehca_free_fw_ctrlblock(kpage);
1235 ehca_rereg_mr_rereg1_exit0:
1236 	if (ret && (ret != -EAGAIN))
1237 		ehca_err(&shca->ib_device, "ret=%i lkey=%x rkey=%x "
1238 			 "pginfo=%p num_kpages=%llx num_hwpages=%llx",
1239 			 ret, *lkey, *rkey, pginfo, pginfo->num_kpages,
1240 			 pginfo->num_hwpages);
1241 	return ret;
1242 } /* end ehca_rereg_mr_rereg1() */
1243 
1244 /*----------------------------------------------------------------------*/
1245 
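/*
 * Reregistration strategy, as implemented below: "Rereg1" issues the
 * single hipz_h_reregister_pmr hcall and is used while old and new page
 * counts fit within MAX_RPAGES and the page count does not grow;
 * otherwise, or if Rereg1 fails with -EAGAIN, "Rereg3" falls back to
 * three hcalls: free, alloc and register_rpages.
 */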
1246 int ehca_rereg_mr(struct ehca_shca *shca,
1247 		  struct ehca_mr *e_mr,
1248 		  u64 *iova_start,
1249 		  u64 size,
1250 		  int acl,
1251 		  struct ehca_pd *e_pd,
1252 		  struct ehca_mr_pginfo *pginfo,
1253 		  u32 *lkey,
1254 		  u32 *rkey)
1255 {
1256 	int ret = 0;
1257 	u64 h_ret;
1258 	int rereg_1_hcall = 1; /* 1: use hipz_h_reregister_pmr directly */
1259 	int rereg_3_hcall = 0; /* 1: use 3 hipz calls for reregistration */
1260 
1261 	/* first determine reregistration hCall(s) */
1262 	if ((pginfo->num_hwpages > MAX_RPAGES) ||
1263 	    (e_mr->num_hwpages > MAX_RPAGES) ||
1264 	    (pginfo->num_hwpages > e_mr->num_hwpages)) {
1265 		ehca_dbg(&shca->ib_device, "Rereg3 case, "
1266 			 "pginfo->num_hwpages=%llx e_mr->num_hwpages=%x",
1267 			 pginfo->num_hwpages, e_mr->num_hwpages);
1268 		rereg_1_hcall = 0;
1269 		rereg_3_hcall = 1;
1270 	}
1271 
1272 	if (e_mr->flags & EHCA_MR_FLAG_MAXMR) {	/* check for max-MR */
1273 		rereg_1_hcall = 0;
1274 		rereg_3_hcall = 1;
1275 		e_mr->flags &= ~EHCA_MR_FLAG_MAXMR;
1276 		ehca_err(&shca->ib_device, "Rereg MR for max-MR! e_mr=%p",
1277 			 e_mr);
1278 	}
1279 
1280 	if (rereg_1_hcall) {
1281 		ret = ehca_rereg_mr_rereg1(shca, e_mr, iova_start, size,
1282 					   acl, e_pd, pginfo, lkey, rkey);
1283 		if (ret) {
1284 			if (ret == -EAGAIN)
1285 				rereg_3_hcall = 1;
1286 			else
1287 				goto ehca_rereg_mr_exit0;
1288 		}
1289 	}
1290 
1291 	if (rereg_3_hcall) {
1292 		struct ehca_mr save_mr;
1293 
1294 		/* first deregister old MR */
1295 		h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);
1296 		if (h_ret != H_SUCCESS) {
1297 			ehca_err(&shca->ib_device, "hipz_free_mr failed, "
1298 				 "h_ret=%lli e_mr=%p hca_hndl=%llx mr_hndl=%llx "
1299 				 "mr->lkey=%x",
1300 				 h_ret, e_mr, shca->ipz_hca_handle.handle,
1301 				 e_mr->ipz_mr_handle.handle,
1302 				 e_mr->ib.ib_mr.lkey);
1303 			ret = ehca2ib_return_code(h_ret);
1304 			goto ehca_rereg_mr_exit0;
1305 		}
1306 		/* clean ehca_mr_t, without changing struct ib_mr and lock */
1307 		save_mr = *e_mr;
1308 		ehca_mr_deletenew(e_mr);
1309 
1310 		/* set some MR values */
1311 		e_mr->flags = save_mr.flags;
1312 		e_mr->hwpage_size = save_mr.hwpage_size;
1313 		e_mr->fmr_page_size = save_mr.fmr_page_size;
1314 		e_mr->fmr_max_pages = save_mr.fmr_max_pages;
1315 		e_mr->fmr_max_maps = save_mr.fmr_max_maps;
1316 		e_mr->fmr_map_cnt = save_mr.fmr_map_cnt;
1317 
1318 		ret = ehca_reg_mr(shca, e_mr, iova_start, size, acl,
1319 				  e_pd, pginfo, lkey, rkey);
1320 		if (ret) {
1321 			u32 offset = (u64)(&e_mr->flags) - (u64)e_mr;
1322 			memcpy(&e_mr->flags, &(save_mr.flags),
1323 			       sizeof(struct ehca_mr) - offset);
1324 			goto ehca_rereg_mr_exit0;
1325 		}
1326 	}
1327 
1328 ehca_rereg_mr_exit0:
1329 	if (ret)
1330 		ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "
1331 			 "iova_start=%p size=%llx acl=%x e_pd=%p pginfo=%p "
1332 			 "num_kpages=%llx lkey=%x rkey=%x rereg_1_hcall=%x "
1333 			 "rereg_3_hcall=%x", ret, shca, e_mr, iova_start, size,
1334 			 acl, e_pd, pginfo, pginfo->num_kpages, *lkey, *rkey,
1335 			 rereg_1_hcall, rereg_3_hcall);
1336 	return ret;
1337 } /* end ehca_rereg_mr() */
1338 
1339 /*----------------------------------------------------------------------*/
1340 
1341 int ehca_unmap_one_fmr(struct ehca_shca *shca,
1342 		       struct ehca_mr *e_fmr)
1343 {
1344 	int ret = 0;
1345 	u64 h_ret;
1346 	struct ehca_pd *e_pd =
1347 		container_of(e_fmr->ib.ib_fmr.pd, struct ehca_pd, ib_pd);
1348 	struct ehca_mr save_fmr;
1349 	u32 tmp_lkey, tmp_rkey;
1350 	struct ehca_mr_pginfo pginfo;
1351 	struct ehca_mr_hipzout_parms hipzout;
1352
1353 
1354 	if (e_fmr->fmr_max_pages <= MAX_RPAGES) {
1355 		/*
1356 		 * note: after using rereg hcall with len=0,
1357 		 * rereg hcall must be used again for registering pages
1358 		 */
1359 		h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_fmr, 0,
1360 					      0, 0, e_pd->fw_pd, 0, &hipzout);
1361 		if (h_ret == H_SUCCESS) {
1362 			/* successful reregistration */
1363 			e_fmr->start = NULL;
1364 			e_fmr->size = 0;
1365 			tmp_lkey = hipzout.lkey;
1366 			tmp_rkey = hipzout.rkey;
1367 			return 0;
1368 		}
1369 		/*
1370 		 * should not happen, because the length was checked above,
1371 		 * FMRs are not shared and no MW bound to FMRs
1372 		 */
1373 		ehca_err(&shca->ib_device, "hipz_reregister_pmr failed "
1374 			 "(Rereg1), h_ret=%lli e_fmr=%p hca_hndl=%llx "
1375 			 "mr_hndl=%llx lkey=%x lkey_out=%x",
1376 			 h_ret, e_fmr, shca->ipz_hca_handle.handle,
1377 			 e_fmr->ipz_mr_handle.handle,
1378 			 e_fmr->ib.ib_fmr.lkey, hipzout.lkey);
1379 		/* try free and rereg */
1380 	}
1381 
1382 	/* first free old FMR */
1383 	h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);
1384 	if (h_ret != H_SUCCESS) {
1385 		ehca_err(&shca->ib_device, "hipz_free_mr failed, "
1386 			 "h_ret=%lli e_fmr=%p hca_hndl=%llx mr_hndl=%llx "
1387 			 "lkey=%x",
1388 			 h_ret, e_fmr, shca->ipz_hca_handle.handle,
1389 			 e_fmr->ipz_mr_handle.handle,
1390 			 e_fmr->ib.ib_fmr.lkey);
1391 		ret = ehca2ib_return_code(h_ret);
1392 		goto ehca_unmap_one_fmr_exit0;
1393 	}
1394 	/* clean ehca_mr_t, without changing lock */
1395 	save_fmr = *e_fmr;
1396 	ehca_mr_deletenew(e_fmr);
1397 
1398 	/* set some MR values */
1399 	e_fmr->flags = save_fmr.flags;
1400 	e_fmr->hwpage_size = save_fmr.hwpage_size;
1401 	e_fmr->fmr_page_size = save_fmr.fmr_page_size;
1402 	e_fmr->fmr_max_pages = save_fmr.fmr_max_pages;
1403 	e_fmr->fmr_max_maps = save_fmr.fmr_max_maps;
1404 	e_fmr->fmr_map_cnt = save_fmr.fmr_map_cnt;
1405 	e_fmr->acl = save_fmr.acl;
1406 
1407 	memset(&pginfo, 0, sizeof(pginfo));
1408 	pginfo.type = EHCA_MR_PGI_FMR;
1409 	ret = ehca_reg_mr(shca, e_fmr, NULL,
1410 			  (e_fmr->fmr_max_pages * e_fmr->fmr_page_size),
1411 			  e_fmr->acl, e_pd, &pginfo, &tmp_lkey,
1412 			  &tmp_rkey);
1413 	if (ret) {
1414 		u32 offset = (u64)(&e_fmr->flags) - (u64)e_fmr;
1415 		memcpy(&e_fmr->flags, &(save_fmr.flags),
1416 		       sizeof(struct ehca_mr) - offset);
1417 	}
1418 
1419 ehca_unmap_one_fmr_exit0:
1420 	if (ret)
1421 		ehca_err(&shca->ib_device, "ret=%i tmp_lkey=%x tmp_rkey=%x "
1422 			 "fmr_max_pages=%x",
1423 			 ret, tmp_lkey, tmp_rkey, e_fmr->fmr_max_pages);
1424 	return ret;
1425 } /* end ehca_unmap_one_fmr() */
1426 
1427 /*----------------------------------------------------------------------*/
1428 
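/*
 * Register a shared MR: the new MR maps the same physical pages as
 * e_origmr; ehca_reg_maxmr() below issues the same hcall to hand out
 * copies of the internal max-MR.
 */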
1429 int ehca_reg_smr(struct ehca_shca *shca,
1430 		 struct ehca_mr *e_origmr,
1431 		 struct ehca_mr *e_newmr,
1432 		 u64 *iova_start,
1433 		 int acl,
1434 		 struct ehca_pd *e_pd,
1435 		 u32 *lkey, /*OUT*/
1436 		 u32 *rkey) /*OUT*/
1437 {
1438 	int ret = 0;
1439 	u64 h_ret;
1440 	u32 hipz_acl;
1441 	struct ehca_mr_hipzout_parms hipzout;
1442 
1443 	ehca_mrmw_map_acl(acl, &hipz_acl);
1444 	ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
1445 
1446 	h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
1447 				    (u64)iova_start, hipz_acl, e_pd->fw_pd,
1448 				    &hipzout);
1449 	if (h_ret != H_SUCCESS) {
1450 		ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lli "
1451 			 "shca=%p e_origmr=%p e_newmr=%p iova_start=%p acl=%x "
1452 			 "e_pd=%p hca_hndl=%llx mr_hndl=%llx lkey=%x",
1453 			 h_ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd,
1454 			 shca->ipz_hca_handle.handle,
1455 			 e_origmr->ipz_mr_handle.handle,
1456 			 e_origmr->ib.ib_mr.lkey);
1457 		ret = ehca2ib_return_code(h_ret);
1458 		goto ehca_reg_smr_exit0;
1459 	}
1460 	/* successful registration */
1461 	e_newmr->num_kpages = e_origmr->num_kpages;
1462 	e_newmr->num_hwpages = e_origmr->num_hwpages;
1463 	e_newmr->hwpage_size   = e_origmr->hwpage_size;
1464 	e_newmr->start = iova_start;
1465 	e_newmr->size = e_origmr->size;
1466 	e_newmr->acl = acl;
1467 	e_newmr->ipz_mr_handle = hipzout.handle;
1468 	*lkey = hipzout.lkey;
1469 	*rkey = hipzout.rkey;
1470 	return 0;
1471 
1472 ehca_reg_smr_exit0:
1473 	if (ret)
1474 		ehca_err(&shca->ib_device, "ret=%i shca=%p e_origmr=%p "
1475 			 "e_newmr=%p iova_start=%p acl=%x e_pd=%p",
1476 			 ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd);
1477 	return ret;
1478 } /* end ehca_reg_smr() */
1479 
1480 /*----------------------------------------------------------------------*/
1481 
1482 /* register internal max-MR to internal SHCA */
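/*
 * The max-MR covers the whole kernel linear mapping (KERNELBASE for
 * high_memory - PAGE_OFFSET bytes), which lets ehca_get_dma_mr() above
 * hand kernel consumers a single MR spanning all of kernel memory.
 */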
1483 int ehca_reg_internal_maxmr(
1484 	struct ehca_shca *shca,
1485 	struct ehca_pd *e_pd,
1486 	struct ehca_mr **e_maxmr)  /*OUT*/
1487 {
1488 	int ret;
1489 	struct ehca_mr *e_mr;
1490 	u64 *iova_start;
1491 	u64 size_maxmr;
1492 	struct ehca_mr_pginfo pginfo;
1493 	struct ib_phys_buf ib_pbuf;
1494 	u32 num_kpages;
1495 	u32 num_hwpages;
1496 	u64 hw_pgsize;
1497 
1498 	e_mr = ehca_mr_new();
1499 	if (!e_mr) {
1500 		ehca_err(&shca->ib_device, "out of memory");
1501 		ret = -ENOMEM;
1502 		goto ehca_reg_internal_maxmr_exit0;
1503 	}
1504 	e_mr->flags |= EHCA_MR_FLAG_MAXMR;
1505 
1506 	/* register internal max-MR on HCA */
1507 	size_maxmr = (u64)high_memory - PAGE_OFFSET;
1508 	iova_start = (u64 *)KERNELBASE;
1509 	ib_pbuf.addr = 0;
1510 	ib_pbuf.size = size_maxmr;
1511 	num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size_maxmr,
1512 				PAGE_SIZE);
1513 	hw_pgsize = ehca_get_max_hwpage_size(shca);
1514 	num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size_maxmr,
1515 				 hw_pgsize);
1516 
1517 	memset(&pginfo, 0, sizeof(pginfo));
1518 	pginfo.type = EHCA_MR_PGI_PHYS;
1519 	pginfo.num_kpages = num_kpages;
1520 	pginfo.num_hwpages = num_hwpages;
1521 	pginfo.hwpage_size = hw_pgsize;
1522 	pginfo.u.phy.num_phys_buf = 1;
1523 	pginfo.u.phy.phys_buf_array = &ib_pbuf;
1524 
1525 	ret = ehca_reg_mr(shca, e_mr, iova_start, size_maxmr, 0, e_pd,
1526 			  &pginfo, &e_mr->ib.ib_mr.lkey,
1527 			  &e_mr->ib.ib_mr.rkey);
1528 	if (ret) {
1529 		ehca_err(&shca->ib_device, "reg of internal max MR failed, "
1530 			 "e_mr=%p iova_start=%p size_maxmr=%llx num_kpages=%x "
1531 			 "num_hwpages=%x", e_mr, iova_start, size_maxmr,
1532 			 num_kpages, num_hwpages);
1533 		goto ehca_reg_internal_maxmr_exit1;
1534 	}
1535 
1536 	/* successful registration of all pages */
1537 	e_mr->ib.ib_mr.device = e_pd->ib_pd.device;
1538 	e_mr->ib.ib_mr.pd = &e_pd->ib_pd;
1539 	e_mr->ib.ib_mr.uobject = NULL;
1540 	atomic_inc(&(e_pd->ib_pd.usecnt));
1541 	atomic_set(&(e_mr->ib.ib_mr.usecnt), 0);
1542 	*e_maxmr = e_mr;
1543 	return 0;
1544 
1545 ehca_reg_internal_maxmr_exit1:
1546 	ehca_mr_delete(e_mr);
1547 ehca_reg_internal_maxmr_exit0:
1548 	if (ret)
1549 		ehca_err(&shca->ib_device, "ret=%i shca=%p e_pd=%p e_maxmr=%p",
1550 			 ret, shca, e_pd, e_maxmr);
1551 	return ret;
1552 } /* end ehca_reg_internal_maxmr() */
1553 
1554 /*----------------------------------------------------------------------*/
1555 
1556 int ehca_reg_maxmr(struct ehca_shca *shca,
1557 		   struct ehca_mr *e_newmr,
1558 		   u64 *iova_start,
1559 		   int acl,
1560 		   struct ehca_pd *e_pd,
1561 		   u32 *lkey,
1562 		   u32 *rkey)
1563 {
1564 	u64 h_ret;
1565 	struct ehca_mr *e_origmr = shca->maxmr;
1566 	u32 hipz_acl;
1567 	struct ehca_mr_hipzout_parms hipzout;
1568 
1569 	ehca_mrmw_map_acl(acl, &hipz_acl);
1570 	ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);
1571 
1572 	h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,
1573 				    (u64)iova_start, hipz_acl, e_pd->fw_pd,
1574 				    &hipzout);
1575 	if (h_ret != H_SUCCESS) {
1576 		ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lli "
1577 			 "e_origmr=%p hca_hndl=%llx mr_hndl=%llx lkey=%x",
1578 			 h_ret, e_origmr, shca->ipz_hca_handle.handle,
1579 			 e_origmr->ipz_mr_handle.handle,
1580 			 e_origmr->ib.ib_mr.lkey);
1581 		return ehca2ib_return_code(h_ret);
1582 	}
1583 	/* successful registration */
1584 	e_newmr->num_kpages = e_origmr->num_kpages;
1585 	e_newmr->num_hwpages = e_origmr->num_hwpages;
1586 	e_newmr->hwpage_size = e_origmr->hwpage_size;
1587 	e_newmr->start = iova_start;
1588 	e_newmr->size = e_origmr->size;
1589 	e_newmr->acl = acl;
1590 	e_newmr->ipz_mr_handle = hipzout.handle;
1591 	*lkey = hipzout.lkey;
1592 	*rkey = hipzout.rkey;
1593 	return 0;
1594 } /* end ehca_reg_maxmr() */
1595 
1596 /*----------------------------------------------------------------------*/
1597 
1598 int ehca_dereg_internal_maxmr(struct ehca_shca *shca)
1599 {
1600 	int ret;
1601 	struct ehca_mr *e_maxmr;
1602 	struct ib_pd *ib_pd;
1603 
1604 	if (!shca->maxmr) {
1605 		ehca_err(&shca->ib_device, "bad call, shca=%p", shca);
1606 		ret = -EINVAL;
1607 		goto ehca_dereg_internal_maxmr_exit0;
1608 	}
1609 
1610 	e_maxmr = shca->maxmr;
1611 	ib_pd = e_maxmr->ib.ib_mr.pd;
1612 	shca->maxmr = NULL; /* remove internal max-MR indication from SHCA */
1613 
1614 	ret = ehca_dereg_mr(&e_maxmr->ib.ib_mr);
1615 	if (ret) {
1616 		ehca_err(&shca->ib_device, "dereg internal max-MR failed, "
1617 			 "ret=%i e_maxmr=%p shca=%p lkey=%x",
1618 			 ret, e_maxmr, shca, e_maxmr->ib.ib_mr.lkey);
1619 		shca->maxmr = e_maxmr;
1620 		goto ehca_dereg_internal_maxmr_exit0;
1621 	}
1622 
1623 	atomic_dec(&ib_pd->usecnt);
1624 
1625 ehca_dereg_internal_maxmr_exit0:
1626 	if (ret)
1627 		ehca_err(&shca->ib_device, "ret=%i shca=%p shca->maxmr=%p",
1628 			 ret, shca, shca->maxmr);
1629 	return ret;
1630 } /* end ehca_dereg_internal_maxmr() */
1631 
1632 /*----------------------------------------------------------------------*/
1633 
1634 /*
1635  * check the physical buffer array of the MR verbs for validity and
1636  * calculate the MR size
1637  */
1638 int ehca_mr_chk_buf_and_calc_size(struct ib_phys_buf *phys_buf_array,
1639 				  int num_phys_buf,
1640 				  u64 *iova_start,
1641 				  u64 *size)
1642 {
1643 	struct ib_phys_buf *pbuf = phys_buf_array;
1644 	u64 size_count = 0;
1645 	u32 i;
1646 
1647 	if (num_phys_buf == 0) {
1648 		ehca_gen_err("bad phys buf array len, num_phys_buf=0");
1649 		return -EINVAL;
1650 	}
1651 	/* check first buffer */
1652 	if (((u64)iova_start & ~PAGE_MASK) != (pbuf->addr & ~PAGE_MASK)) {
1653 		ehca_gen_err("iova_start/addr mismatch, iova_start=%p "
1654 			     "pbuf->addr=%llx pbuf->size=%llx",
1655 			     iova_start, pbuf->addr, pbuf->size);
1656 		return -EINVAL;
1657 	}
1658 	if (((pbuf->addr + pbuf->size) % PAGE_SIZE) &&
1659 	    (num_phys_buf > 1)) {
1660 		ehca_gen_err("addr/size mismatch in 1st buf, pbuf->addr=%llx "
1661 			     "pbuf->size=%llx", pbuf->addr, pbuf->size);
1662 		return -EINVAL;
1663 	}
1664 
1665 	for (i = 0; i < num_phys_buf; i++) {
1666 		if ((i > 0) && (pbuf->addr % PAGE_SIZE)) {
1667 			ehca_gen_err("bad address, i=%x pbuf->addr=%llx "
1668 				     "pbuf->size=%llx",
1669 				     i, pbuf->addr, pbuf->size);
1670 			return -EINVAL;
1671 		}
1672 		if (((i > 0) &&	/* not 1st */
1673 		     (i < (num_phys_buf - 1)) &&	/* not last */
1674 		     (pbuf->size % PAGE_SIZE)) || (pbuf->size == 0)) {
1675 			ehca_gen_err("bad size, i=%x pbuf->size=%llx",
1676 				     i, pbuf->size);
1677 			return -EINVAL;
1678 		}
1679 		size_count += pbuf->size;
1680 		pbuf++;
1681 	}
1682 
1683 	*size = size_count;
1684 	return 0;
1685 } /* end ehca_mr_chk_buf_and_calc_size() */
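
/*
 * Illustrative layout accepted by the check above (hypothetical
 * addresses, assuming PAGE_SIZE == 0x1000):
 *
 *	struct ib_phys_buf bufs[] = {
 *		{ .addr = 0x10000100, .size = 0x0f00 },	(first buffer may
 *		start mid-page, but must end page aligned)
 *		{ .addr = 0x20000000, .size = 0x2000 },	(middle buffers need
 *		page-aligned addr and size)
 *		{ .addr = 0x30000000, .size = 0x0123 },	(the last size may
 *		stay unaligned)
 *	};
 *
 * iova_start must share the in-page offset 0x100 with bufs[0].addr;
 * *size is returned as the plain sum of the three buffer sizes.
 */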
1686 
1687 /*----------------------------------------------------------------------*/
1688 
1689 /* check the page list of the map FMR verb for validity */
1690 int ehca_fmr_check_page_list(struct ehca_mr *e_fmr,
1691 			     u64 *page_list,
1692 			     int list_len)
1693 {
1694 	u32 i;
1695 	u64 *page;
1696 
1697 	if ((list_len == 0) || (list_len > e_fmr->fmr_max_pages)) {
1698 		ehca_gen_err("bad list_len, list_len=%x "
1699 			     "e_fmr->fmr_max_pages=%x fmr=%p",
1700 			     list_len, e_fmr->fmr_max_pages, e_fmr);
1701 		return -EINVAL;
1702 	}
1703 
1704 	/* each page must be aligned */
1705 	page = page_list;
1706 	for (i = 0; i < list_len; i++) {
1707 		if (*page % e_fmr->fmr_page_size) {
1708 			ehca_gen_err("bad page, i=%x *page=%llx page=%p fmr=%p "
1709 				     "fmr_page_size=%x", i, *page, page, e_fmr,
1710 				     e_fmr->fmr_page_size);
1711 			return -EINVAL;
1712 		}
1713 		page++;
1714 	}
1715 
1716 	return 0;
1717 } /* end ehca_fmr_check_page_list() */
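
/*
 * Illustrative values: with e_fmr->fmr_page_size == 0x1000, a
 * page_list entry of 0x10002000 passes the alignment test above,
 * while 0x10002100 would fail it and return -EINVAL.
 */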
1718 
1719 /*----------------------------------------------------------------------*/
1720 
1721 /* PAGE_SIZE >= pginfo->hwpage_size */
1722 static int ehca_set_pagebuf_user1(struct ehca_mr_pginfo *pginfo,
1723 				  u32 number,
1724 				  u64 *kpage)
1725 {
1726 	int ret = 0;
1727 	struct ib_umem_chunk *prev_chunk;
1728 	struct ib_umem_chunk *chunk;
1729 	u64 pgaddr;
1730 	u32 i = 0;
1731 	u32 j = 0;
1732 	int hwpages_per_kpage = PAGE_SIZE / pginfo->hwpage_size;
1733 
1734 	/* loop over desired chunk entries */
1735 	chunk      = pginfo->u.usr.next_chunk;
1736 	prev_chunk = pginfo->u.usr.next_chunk;
1737 	list_for_each_entry_continue(
1738 		chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
1739 		for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
1740 			pgaddr = page_to_pfn(sg_page(&chunk->page_list[i]))
1741 				<< PAGE_SHIFT;
1742 			*kpage = phys_to_abs(pgaddr +
1743 					     (pginfo->next_hwpage *
1744 					      pginfo->hwpage_size));
1745 			if (!(*kpage)) {
1746 				ehca_gen_err("pgaddr=%llx "
1747 					     "chunk->page_list[i]=%llx "
1748 					     "i=%x next_hwpage=%llx",
1749 					     pgaddr, (u64)sg_dma_address(
1750 						     &chunk->page_list[i]),
1751 					     i, pginfo->next_hwpage);
1752 				return -EFAULT;
1753 			}
1754 			(pginfo->hwpage_cnt)++;
1755 			(pginfo->next_hwpage)++;
1756 			kpage++;
1757 			if (pginfo->next_hwpage % hwpages_per_kpage == 0) {
1758 				(pginfo->kpage_cnt)++;
1759 				(pginfo->u.usr.next_nmap)++;
1760 				pginfo->next_hwpage = 0;
1761 				i++;
1762 			}
1763 			j++;
1764 			if (j >= number) break;
1765 		}
1766 		if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
1767 		    (j >= number)) {
1768 			pginfo->u.usr.next_nmap = 0;
1769 			prev_chunk = chunk;
1770 			break;
1771 		} else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
1772 			pginfo->u.usr.next_nmap = 0;
1773 			prev_chunk = chunk;
1774 		} else if (j >= number)
1775 			break;
1776 		else
1777 			prev_chunk = chunk;
1778 	}
1779 	pginfo->u.usr.next_chunk =
1780 		list_prepare_entry(prev_chunk,
1781 				   (&(pginfo->u.usr.region->chunk_list)),
1782 				   list);
1783 	return ret;
1784 }
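
/*
 * Worked example for the user1 case (assumed sizes): with PAGE_SIZE ==
 * 64K and pginfo->hwpage_size == 4K, hwpages_per_kpage == 16, so each
 * umem page emits 16 consecutive hwpage addresses (pgaddr + 0x0000,
 * pgaddr + 0x1000, ..., pgaddr + 0xf000) before next_nmap advances to
 * the next page_list entry.
 */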
1785 
1786 /*
1787  * check the given pages for a contiguous layout;
1788  * the last page address is returned in *prev_pgaddr for further checks
1789  */
1790 static int ehca_check_kpages_per_ate(struct scatterlist *page_list,
1791 				     int start_idx, int end_idx,
1792 				     u64 *prev_pgaddr)
1793 {
1794 	int t;
1795 	for (t = start_idx; t <= end_idx; t++) {
1796 		u64 pgaddr = page_to_pfn(sg_page(&page_list[t])) << PAGE_SHIFT;
1797 		if (ehca_debug_level >= 3)
1798 			ehca_gen_dbg("chunk_page=%llx value=%016llx", pgaddr,
1799 				     *(u64 *)abs_to_virt(phys_to_abs(pgaddr)));
1800 		if (pgaddr - PAGE_SIZE != *prev_pgaddr) {
1801 			ehca_gen_err("uncontiguous page found pgaddr=%llx "
1802 				     "prev_pgaddr=%llx page_list_i=%x",
1803 				     pgaddr, *prev_pgaddr, t);
1804 			return -EINVAL;
1805 		}
1806 		*prev_pgaddr = pgaddr;
1807 	}
1808 	return 0;
1809 }
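
/*
 * Example (illustrative): with *prev_pgaddr == 0x10000000 and PAGE_SIZE
 * == 0x1000, entries mapping to 0x10001000, 0x10002000, ... pass; an
 * entry at 0x10003000 directly following 0x10001000 triggers the
 * "uncontiguous page" error above.
 */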
1810 
1811 /* PAGE_SIZE < pginfo->hwpage_size */
1812 static int ehca_set_pagebuf_user2(struct ehca_mr_pginfo *pginfo,
1813 				  u32 number,
1814 				  u64 *kpage)
1815 {
1816 	int ret = 0;
1817 	struct ib_umem_chunk *prev_chunk;
1818 	struct ib_umem_chunk *chunk;
1819 	u64 pgaddr, prev_pgaddr;
1820 	u32 i = 0;
1821 	u32 j = 0;
1822 	int kpages_per_hwpage = pginfo->hwpage_size / PAGE_SIZE;
1823 	int nr_kpages = kpages_per_hwpage;
1824 
1825 	/* loop over desired chunk entries */
1826 	chunk      = pginfo->u.usr.next_chunk;
1827 	prev_chunk = pginfo->u.usr.next_chunk;
1828 	list_for_each_entry_continue(
1829 		chunk, (&(pginfo->u.usr.region->chunk_list)), list) {
1830 		for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {
1831 			if (nr_kpages == kpages_per_hwpage) {
1832 				pgaddr = page_to_pfn(sg_page(&chunk->page_list[i]))
1833 					<< PAGE_SHIFT;
1834 				*kpage = phys_to_abs(pgaddr);
1835 				if (!(*kpage)) {
1836 					ehca_gen_err("pgaddr=%llx i=%x",
1837 						     pgaddr, i);
1838 					ret = -EFAULT;
1839 					return ret;
1840 				}
1841 				/*
1842 				 * The first page in a hwpage must be aligned;
1843 				 * the first MR page is exempt from this rule.
1844 				 */
1845 				if (pgaddr & (pginfo->hwpage_size - 1)) {
1846 					if (pginfo->hwpage_cnt) {
1847 						ehca_gen_err(
1848 							"invalid alignment "
1849 							"pgaddr=%llx i=%x "
1850 							"mr_pgsize=%llx",
1851 							pgaddr, i,
1852 							pginfo->hwpage_size);
1853 						ret = -EFAULT;
1854 						return ret;
1855 					}
1856 					/* first MR page */
1857 					pginfo->kpage_cnt =
1858 						(pgaddr &
1859 						 (pginfo->hwpage_size - 1)) >>
1860 						PAGE_SHIFT;
1861 					nr_kpages -= pginfo->kpage_cnt;
1862 					*kpage = phys_to_abs(
1863 						pgaddr &
1864 						~(pginfo->hwpage_size - 1));
1865 				}
1866 				if (ehca_debug_level >= 3) {
1867 					u64 val = *(u64 *)abs_to_virt(
1868 						phys_to_abs(pgaddr));
1869 					ehca_gen_dbg("kpage=%llx chunk_page=%llx "
1870 						     "value=%016llx",
1871 						     *kpage, pgaddr, val);
1872 				}
1873 				prev_pgaddr = pgaddr;
1874 				i++;
1875 				pginfo->kpage_cnt++;
1876 				pginfo->u.usr.next_nmap++;
1877 				nr_kpages--;
1878 				if (!nr_kpages)
1879 					goto next_kpage;
1880 				continue;
1881 			}
1882 			if (i + nr_kpages > chunk->nmap) {
1883 				ret = ehca_check_kpages_per_ate(
1884 					chunk->page_list, i,
1885 					chunk->nmap - 1, &prev_pgaddr);
1886 				if (ret) return ret;
1887 				pginfo->kpage_cnt += chunk->nmap - i;
1888 				pginfo->u.usr.next_nmap += chunk->nmap - i;
1889 				nr_kpages -= chunk->nmap - i;
1890 				break;
1891 			}
1892 
1893 			ret = ehca_check_kpages_per_ate(chunk->page_list, i,
1894 							i + nr_kpages - 1,
1895 							&prev_pgaddr);
1896 			if (ret) return ret;
1897 			i += nr_kpages;
1898 			pginfo->kpage_cnt += nr_kpages;
1899 			pginfo->u.usr.next_nmap += nr_kpages;
1900 next_kpage:
1901 			nr_kpages = kpages_per_hwpage;
1902 			(pginfo->hwpage_cnt)++;
1903 			kpage++;
1904 			j++;
1905 			if (j >= number) break;
1906 		}
1907 		if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&
1908 		    (j >= number)) {
1909 			pginfo->u.usr.next_nmap = 0;
1910 			prev_chunk = chunk;
1911 			break;
1912 		} else if (pginfo->u.usr.next_nmap >= chunk->nmap) {
1913 			pginfo->u.usr.next_nmap = 0;
1914 			prev_chunk = chunk;
1915 		} else if (j >= number)
1916 			break;
1917 		else
1918 			prev_chunk = chunk;
1919 	}
1920 	pginfo->u.usr.next_chunk =
1921 		list_prepare_entry(prev_chunk,
1922 				   (&(pginfo->u.usr.region->chunk_list)),
1923 				   list);
1924 	return ret;
1925 }
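
/*
 * Worked example for the user2 case (assumed sizes): with
 * pginfo->hwpage_size == 16M and PAGE_SIZE == 4K, kpages_per_hwpage ==
 * 4096, so every emitted hwpage address must be backed by 4096
 * physically contiguous kernel pages. Only the very first MR page may
 * start mid-hwpage; its address is rounded down to the hwpage boundary
 * and only the remaining kpages of that hwpage are consumed.
 */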
1926 
1927 static int ehca_set_pagebuf_phys(struct ehca_mr_pginfo *pginfo,
1928 				 u32 number, u64 *kpage)
1929 {
1930 	int ret = 0;
1931 	struct ib_phys_buf *pbuf;
1932 	u64 num_hw, offs_hw;
1933 	u32 i = 0;
1934 
1935 	/* loop over desired phys_buf_array entries */
1936 	while (i < number) {
1937 		pbuf   = pginfo->u.phy.phys_buf_array + pginfo->u.phy.next_buf;
1938 		num_hw  = NUM_CHUNKS((pbuf->addr % pginfo->hwpage_size) +
1939 				     pbuf->size, pginfo->hwpage_size);
1940 		offs_hw = (pbuf->addr & ~(pginfo->hwpage_size - 1)) /
1941 			pginfo->hwpage_size;
1942 		while (pginfo->next_hwpage < offs_hw + num_hw) {
1943 			/* sanity check */
1944 			if ((pginfo->kpage_cnt >= pginfo->num_kpages) ||
1945 			    (pginfo->hwpage_cnt >= pginfo->num_hwpages)) {
1946 				ehca_gen_err("kpage_cnt or hwpage_cnt overflow, "
1947 					     "kpage_cnt=%llx num_kpages=%llx "
1948 					     "hwpage_cnt=%llx "
1949 					     "num_hwpages=%llx i=%x",
1950 					     pginfo->kpage_cnt,
1951 					     pginfo->num_kpages,
1952 					     pginfo->hwpage_cnt,
1953 					     pginfo->num_hwpages, i);
1954 				return -EFAULT;
1955 			}
1956 			*kpage = phys_to_abs(
1957 				(pbuf->addr & ~(pginfo->hwpage_size - 1)) +
1958 				(pginfo->next_hwpage * pginfo->hwpage_size));
1959 			if (!(*kpage) && pbuf->addr) {
1960 				ehca_gen_err("pbuf->addr=%llx pbuf->size=%llx "
1961 					     "next_hwpage=%llx", pbuf->addr,
1962 					     pbuf->size, pginfo->next_hwpage);
1963 				return -EFAULT;
1964 			}
1965 			(pginfo->hwpage_cnt)++;
1966 			(pginfo->next_hwpage)++;
1967 			if (PAGE_SIZE >= pginfo->hwpage_size) {
1968 				if (pginfo->next_hwpage %
1969 				    (PAGE_SIZE / pginfo->hwpage_size) == 0)
1970 					(pginfo->kpage_cnt)++;
1971 			} else
1972 				pginfo->kpage_cnt += pginfo->hwpage_size /
1973 					PAGE_SIZE;
1974 			kpage++;
1975 			i++;
1976 			if (i >= number) break;
1977 		}
1978 		if (pginfo->next_hwpage >= offs_hw + num_hw) {
1979 			(pginfo->u.phy.next_buf)++;
1980 			pginfo->next_hwpage = 0;
1981 		}
1982 	}
1983 	return ret;
1984 }
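
/*
 * Sketch of the chunk arithmetic above (hypothetical values): for
 * pbuf->addr == 0x1100, pbuf->size == 0x2000 and hwpage_size == 0x1000,
 * num_hw = NUM_CHUNKS(0x100 + 0x2000, 0x1000) == 3, i.e. the buffer
 * spans three hwpages once the leading in-page offset is counted.
 */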
1985 
1986 static int ehca_set_pagebuf_fmr(struct ehca_mr_pginfo *pginfo,
1987 				u32 number, u64 *kpage)
1988 {
1989 	int ret = 0;
1990 	u64 *fmrlist;
1991 	u32 i;
1992 
1993 	/* loop over desired page_list entries */
1994 	fmrlist = pginfo->u.fmr.page_list + pginfo->u.fmr.next_listelem;
1995 	for (i = 0; i < number; i++) {
1996 		*kpage = phys_to_abs((*fmrlist & ~(pginfo->hwpage_size - 1)) +
1997 				     pginfo->next_hwpage * pginfo->hwpage_size);
1998 		if (!(*kpage)) {
1999 			ehca_gen_err("*fmrlist=%llx fmrlist=%p "
2000 				     "next_listelem=%llx next_hwpage=%llx",
2001 				     *fmrlist, fmrlist,
2002 				     pginfo->u.fmr.next_listelem,
2003 				     pginfo->next_hwpage);
2004 			return -EFAULT;
2005 		}
2006 		(pginfo->hwpage_cnt)++;
2007 		if (pginfo->u.fmr.fmr_pgsize >= pginfo->hwpage_size) {
2008 			if (pginfo->next_hwpage %
2009 			    (pginfo->u.fmr.fmr_pgsize /
2010 			     pginfo->hwpage_size) == 0) {
2011 				(pginfo->kpage_cnt)++;
2012 				(pginfo->u.fmr.next_listelem)++;
2013 				fmrlist++;
2014 				pginfo->next_hwpage = 0;
2015 			} else
2016 				(pginfo->next_hwpage)++;
2017 		} else {
2018 			unsigned int cnt_per_hwpage = pginfo->hwpage_size /
2019 				pginfo->u.fmr.fmr_pgsize;
2020 			unsigned int j;
2021 			u64 prev = *kpage;
2022 			/* check if adrs are contiguous */
2023 			for (j = 1; j < cnt_per_hwpage; j++) {
2024 				u64 p = phys_to_abs(fmrlist[j] &
2025 						    ~(pginfo->hwpage_size - 1));
2026 				if (prev + pginfo->u.fmr.fmr_pgsize != p) {
2027 					ehca_gen_err("uncontiguous fmr pages "
2028 						     "found prev=%llx p=%llx "
2029 						     "idx=%x", prev, p, i + j);
2030 					return -EINVAL;
2031 				}
2032 				prev = p;
2033 			}
2034 			pginfo->kpage_cnt += cnt_per_hwpage;
2035 			pginfo->u.fmr.next_listelem += cnt_per_hwpage;
2036 			fmrlist += cnt_per_hwpage;
2037 		}
2038 		kpage++;
2039 	}
2040 	return ret;
2041 }
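
/*
 * Example for the small-FMR-page case (assumed sizes): with
 * fmr_pgsize == 4K and hwpage_size == 64K, cnt_per_hwpage == 16, so
 * each emitted hwpage consumes 16 page_list entries, which must be
 * physically contiguous in steps of fmr_pgsize.
 */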
2042 
2043 /* setup page buffer from page info */
2044 int ehca_set_pagebuf(struct ehca_mr_pginfo *pginfo,
2045 		     u32 number,
2046 		     u64 *kpage)
2047 {
2048 	int ret;
2049 
2050 	switch (pginfo->type) {
2051 	case EHCA_MR_PGI_PHYS:
2052 		ret = ehca_set_pagebuf_phys(pginfo, number, kpage);
2053 		break;
2054 	case EHCA_MR_PGI_USER:
2055 		ret = PAGE_SIZE >= pginfo->hwpage_size ?
2056 			ehca_set_pagebuf_user1(pginfo, number, kpage) :
2057 			ehca_set_pagebuf_user2(pginfo, number, kpage);
2058 		break;
2059 	case EHCA_MR_PGI_FMR:
2060 		ret = ehca_set_pagebuf_fmr(pginfo, number, kpage);
2061 		break;
2062 	default:
2063 		ehca_gen_err("bad pginfo->type=%x", pginfo->type);
2064 		ret = -EFAULT;
2065 		break;
2066 	}
2067 	return ret;
2068 } /* end ehca_set_pagebuf() */
2069 
2070 /*----------------------------------------------------------------------*/
2071 
2072 /*
2073  * check whether an MR covers the whole of memory, i.e. is a max-MR;
2074  * returns 1 if it is a max-MR, else 0
2075  */
2076 int ehca_mr_is_maxmr(u64 size,
2077 		     u64 *iova_start)
2078 {
2079 	/* an MR is treated as a max-MR only if it meets the following: */
2080 	if ((size == ((u64)high_memory - PAGE_OFFSET)) &&
2081 	    (iova_start == (void *)KERNELBASE)) {
2082 		ehca_gen_dbg("this is a max-MR");
2083 		return 1;
2084 	} else
2085 		return 0;
2086 } /* end ehca_mr_is_maxmr() */
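
/*
 * Hypothetical caller's view: only a registration that covers
 * [KERNELBASE, high_memory) in one piece qualifies, e.g.
 *
 *	ehca_mr_is_maxmr((u64)high_memory - PAGE_OFFSET,
 *			 (u64 *)KERNELBASE)
 *
 * returns 1; any other size/iova_start combination returns 0.
 */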
2087 
2088 /*----------------------------------------------------------------------*/
2089 
2090 /* map IB access control to hipz access control; used for both MRs and MWs */
2091 void ehca_mrmw_map_acl(int ib_acl,
2092 		       u32 *hipz_acl)
2093 {
2094 	*hipz_acl = 0;
2095 	if (ib_acl & IB_ACCESS_REMOTE_READ)
2096 		*hipz_acl |= HIPZ_ACCESSCTRL_R_READ;
2097 	if (ib_acl & IB_ACCESS_REMOTE_WRITE)
2098 		*hipz_acl |= HIPZ_ACCESSCTRL_R_WRITE;
2099 	if (ib_acl & IB_ACCESS_REMOTE_ATOMIC)
2100 		*hipz_acl |= HIPZ_ACCESSCTRL_R_ATOMIC;
2101 	if (ib_acl & IB_ACCESS_LOCAL_WRITE)
2102 		*hipz_acl |= HIPZ_ACCESSCTRL_L_WRITE;
2103 	if (ib_acl & IB_ACCESS_MW_BIND)
2104 		*hipz_acl |= HIPZ_ACCESSCTRL_MW_BIND;
2105 } /* end ehca_mrmw_map_acl() */
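
/*
 * Example (illustrative): for a typical RDMA-read-capable MR,
 *
 *	u32 hipz_acl;
 *	ehca_mrmw_map_acl(IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_READ,
 *			  &hipz_acl);
 *
 * leaves hipz_acl == HIPZ_ACCESSCTRL_L_WRITE | HIPZ_ACCESSCTRL_R_READ.
 */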
2106 
2107 /*----------------------------------------------------------------------*/
2108 
2109 /* sets page size in hipz access control for MR/MW. */
2110 void ehca_mrmw_set_pgsize_hipz_acl(u32 pgsize, u32 *hipz_acl) /*INOUT*/
2111 {
2112 	*hipz_acl |= (ehca_encode_hwpage_size(pgsize) << 24);
2113 } /* end ehca_mrmw_set_pgsize_hipz_acl() */
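
/*
 * Worked example (illustrative): a 64K hwpage encodes to page-size
 * selector 1, so after
 *
 *	u32 hipz_acl = 0;
 *	ehca_mrmw_set_pgsize_hipz_acl(EHCA_MR_PGSIZE64K, &hipz_acl);
 *
 * hipz_acl == 0x01000000, i.e. the selector occupies bits 31:24.
 */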
2114 
2115 /*----------------------------------------------------------------------*/
2116 
2117 /*
2118  * reverse map hipz access control to IB access control.
2119  * This routine is used for both MRs and MWs.
2120  */
2121 void ehca_mrmw_reverse_map_acl(const u32 *hipz_acl,
2122 			       int *ib_acl) /*OUT*/
2123 {
2124 	*ib_acl = 0;
2125 	if (*hipz_acl & HIPZ_ACCESSCTRL_R_READ)
2126 		*ib_acl |= IB_ACCESS_REMOTE_READ;
2127 	if (*hipz_acl & HIPZ_ACCESSCTRL_R_WRITE)
2128 		*ib_acl |= IB_ACCESS_REMOTE_WRITE;
2129 	if (*hipz_acl & HIPZ_ACCESSCTRL_R_ATOMIC)
2130 		*ib_acl |= IB_ACCESS_REMOTE_ATOMIC;
2131 	if (*hipz_acl & HIPZ_ACCESSCTRL_L_WRITE)
2132 		*ib_acl |= IB_ACCESS_LOCAL_WRITE;
2133 	if (*hipz_acl & HIPZ_ACCESSCTRL_MW_BIND)
2134 		*ib_acl |= IB_ACCESS_MW_BIND;
2135 } /* end ehca_mrmw_reverse_map_acl() */
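
/*
 * Note: this is the exact inverse of ehca_mrmw_map_acl() for the five
 * flags handled here, so mapping an ib_acl value to hipz access control
 * and back reproduces the original bits.
 */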
2136 
2137 
2138 /*----------------------------------------------------------------------*/
2139 
2140 /*
2141  * MR destructor and constructor:
2142  * used in the reregister MR verb; sets all fields of struct ehca_mr
2143  * to 0, except for struct ib_mr and the spinlock
2144  */
2145 void ehca_mr_deletenew(struct ehca_mr *mr)
2146 {
2147 	mr->flags = 0;
2148 	mr->num_kpages = 0;
2149 	mr->num_hwpages = 0;
2150 	mr->acl = 0;
2151 	mr->start = NULL;
2152 	mr->fmr_page_size = 0;
2153 	mr->fmr_max_pages = 0;
2154 	mr->fmr_max_maps = 0;
2155 	mr->fmr_map_cnt = 0;
2156 	memset(&mr->ipz_mr_handle, 0, sizeof(mr->ipz_mr_handle));
2157 	memset(&mr->galpas, 0, sizeof(mr->galpas));
2158 } /* end ehca_mr_deletenew() */
2159 
2160 int ehca_init_mrmw_cache(void)
2161 {
2162 	mr_cache = kmem_cache_create("ehca_cache_mr",
2163 				     sizeof(struct ehca_mr), 0,
2164 				     SLAB_HWCACHE_ALIGN,
2165 				     NULL);
2166 	if (!mr_cache)
2167 		return -ENOMEM;
2168 	mw_cache = kmem_cache_create("ehca_cache_mw",
2169 				     sizeof(struct ehca_mw), 0,
2170 				     SLAB_HWCACHE_ALIGN,
2171 				     NULL);
2172 	if (!mw_cache) {
2173 		kmem_cache_destroy(mr_cache);
2174 		mr_cache = NULL;
2175 		return -ENOMEM;
2176 	}
2177 	return 0;
2178 }
2179 
2180 void ehca_cleanup_mrmw_cache(void)
2181 {
2182 	if (mr_cache)
2183 		kmem_cache_destroy(mr_cache);
2184 	if (mw_cache)
2185 		kmem_cache_destroy(mw_cache);
2186 }
2187