1 // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
2 /*
3 * Copyright (c) 2018 Hisilicon Limited.
4 */
5
6 #include <rdma/ib_umem.h>
7 #include <rdma/hns-abi.h>
8 #include "hns_roce_device.h"
9 #include "hns_roce_cmd.h"
10 #include "hns_roce_hem.h"
11
/*
 * hns_roce_srq_event - hand an asynchronous event to the SRQ it names.
 * @hr_dev: device that reported the event
 * @srqn: SRQ number carried by the event; masked with (num_srqs - 1)
 *        before the lookup
 * @event_type: event code passed unchanged to the SRQ's event callback
 *
 * The SRQ is looked up and pinned with a reference while the xarray lock
 * is held, so it stays valid while its callback runs. Dropping the last
 * reference completes srq->free.
 */
void hns_roce_srq_event(struct hns_roce_dev *hr_dev, u32 srqn, int event_type)
{
	struct hns_roce_srq_table *table = &hr_dev->srq_table;
	unsigned long index = srqn & (hr_dev->caps.num_srqs - 1);
	struct hns_roce_srq *target;

	xa_lock(&table->xa);
	target = xa_load(&table->xa, index);
	if (target)
		atomic_inc(&target->refcount);
	xa_unlock(&table->xa);

	if (!target) {
		dev_warn(hr_dev->dev, "Async event for bogus SRQ %08x\n", srqn);
		return;
	}

	target->event(target, event_type);

	/* Release the reference taken above; wake a waiter if it was the last. */
	if (atomic_dec_and_test(&target->refcount))
		complete(&target->free);
}
33
hns_roce_ib_srq_event(struct hns_roce_srq * srq,enum hns_roce_event event_type)34 static void hns_roce_ib_srq_event(struct hns_roce_srq *srq,
35 enum hns_roce_event event_type)
36 {
37 struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
38 struct ib_srq *ibsrq = &srq->ibsrq;
39 struct ib_event event;
40
41 if (ibsrq->event_handler) {
42 event.device = ibsrq->device;
43 event.element.srq = ibsrq;
44 switch (event_type) {
45 case HNS_ROCE_EVENT_TYPE_SRQ_LIMIT_REACH:
46 event.event = IB_EVENT_SRQ_LIMIT_REACHED;
47 break;
48 case HNS_ROCE_EVENT_TYPE_SRQ_CATAS_ERROR:
49 event.event = IB_EVENT_SRQ_ERR;
50 break;
51 default:
52 dev_err(hr_dev->dev,
53 "hns_roce:Unexpected event type 0x%x on SRQ %06lx\n",
54 event_type, srq->srqn);
55 return;
56 }
57
58 ibsrq->event_handler(&event, ibsrq->srq_context);
59 }
60 }
61
hns_roce_hw_create_srq(struct hns_roce_dev * dev,struct hns_roce_cmd_mailbox * mailbox,unsigned long srq_num)62 static int hns_roce_hw_create_srq(struct hns_roce_dev *dev,
63 struct hns_roce_cmd_mailbox *mailbox,
64 unsigned long srq_num)
65 {
66 return hns_roce_cmd_mbox(dev, mailbox->dma, 0, srq_num, 0,
67 HNS_ROCE_CMD_CREATE_SRQ,
68 HNS_ROCE_CMD_TIMEOUT_MSECS);
69 }
70
hns_roce_hw_destroy_srq(struct hns_roce_dev * dev,struct hns_roce_cmd_mailbox * mailbox,unsigned long srq_num)71 static int hns_roce_hw_destroy_srq(struct hns_roce_dev *dev,
72 struct hns_roce_cmd_mailbox *mailbox,
73 unsigned long srq_num)
74 {
75 return hns_roce_cmd_mbox(dev, 0, mailbox ? mailbox->dma : 0, srq_num,
76 mailbox ? 0 : 1, HNS_ROCE_CMD_DESTROY_SRQ,
77 HNS_ROCE_CMD_TIMEOUT_MSECS);
78 }
79
/*
 * alloc_srqc - reserve an SRQ number and hand the SRQ context to hardware.
 * @hr_dev: device owning the SRQ table
 * @srq: SRQ whose WQE buffer (buf_mtr) and index queue (idx_que.mtr) have
 *       already been created
 * @pdn: protection domain number, passed to the write_srqc hook
 * @cqn: completion queue number, passed to the write_srqc hook
 * @xrcd: XRC domain value, passed to the write_srqc hook
 * @db_rec_addr: not used by this function
 *
 * Steps: look up the buffer addresses, allocate an SRQ number, take a
 * reference on the SRQC table entry, publish the SRQ in the xarray, fill
 * a mailbox via the write_srqc hook and issue CREATE_SRQ. Every step is
 * undone in reverse order on failure.
 *
 * Return: 0 on success; -ENOBUFS if a buffer address lookup fails, -ENOMEM
 * if no SRQ number or mailbox can be allocated, otherwise the error code of
 * the failing step.
 */
static int alloc_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
		      u32 pdn, u32 cqn, u16 xrcd, u64 db_rec_addr)
{
	struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
	struct ib_device *ibdev = &hr_dev->ib_dev;
	struct hns_roce_cmd_mailbox *mailbox;
	u64 mtts_wqe[MTT_MIN_COUNT] = { 0 };
	u64 mtts_idx[MTT_MIN_COUNT] = { 0 };
	dma_addr_t dma_handle_wqe = 0;
	dma_addr_t dma_handle_idx = 0;
	int ret;

	/* Get the physical address of srq buf */
	ret = hns_roce_mtr_find(hr_dev, &srq->buf_mtr, 0, mtts_wqe,
				ARRAY_SIZE(mtts_wqe), &dma_handle_wqe);
	if (ret < 1) {
		ibdev_err(ibdev, "failed to find mtr for SRQ WQE, ret = %d.\n",
			  ret);
		return -ENOBUFS;
	}

	/* Get physical address of idx que buf */
	ret = hns_roce_mtr_find(hr_dev, &srq->idx_que.mtr, 0, mtts_idx,
				ARRAY_SIZE(mtts_idx), &dma_handle_idx);
	if (ret < 1) {
		ibdev_err(ibdev, "failed to find mtr for SRQ idx, ret = %d.\n",
			  ret);
		return -ENOBUFS;
	}

	ret = hns_roce_bitmap_alloc(&srq_table->bitmap, &srq->srqn);
	if (ret) {
		ibdev_err(ibdev,
			  "failed to alloc SRQ number, ret = %d.\n", ret);
		return -ENOMEM;
	}

	ret = hns_roce_table_get(hr_dev, &srq_table->table, srq->srqn);
	if (ret) {
		ibdev_err(ibdev, "failed to get SRQC table, ret = %d.\n", ret);
		goto err_out;
	}

	/*
	 * Set up the lifetime-tracking state before the SRQ becomes reachable
	 * through the xarray: hns_roce_srq_event() takes and drops a reference
	 * on whatever it finds there and may complete srq->free, so both must
	 * be valid from the moment of publication.
	 */
	atomic_set(&srq->refcount, 1);
	init_completion(&srq->free);

	ret = xa_err(xa_store(&srq_table->xa, srq->srqn, srq, GFP_KERNEL));
	if (ret) {
		ibdev_err(ibdev, "failed to store SRQC, ret = %d.\n", ret);
		goto err_put;
	}

	mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
	if (IS_ERR_OR_NULL(mailbox)) {
		ret = -ENOMEM;
		ibdev_err(ibdev, "failed to alloc mailbox for SRQC.\n");
		goto err_xa;
	}

	hr_dev->hw->write_srqc(hr_dev, srq, pdn, xrcd, cqn, mailbox->buf,
			       mtts_wqe, mtts_idx, dma_handle_wqe,
			       dma_handle_idx);

	ret = hns_roce_hw_create_srq(hr_dev, mailbox, srq->srqn);
	/* The mailbox is only needed for the command itself. */
	hns_roce_free_cmd_mailbox(hr_dev, mailbox);
	if (ret) {
		ibdev_err(ibdev, "failed to config SRQC, ret = %d.\n", ret);
		goto err_xa;
	}

	return 0;

err_xa:
	xa_erase(&srq_table->xa, srq->srqn);

err_put:
	hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);

err_out:
	hns_roce_bitmap_free(&srq_table->bitmap, srq->srqn, BITMAP_NO_RR);
	return ret;
}
161
free_srqc(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq)162 static void free_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
163 {
164 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
165 int ret;
166
167 ret = hns_roce_hw_destroy_srq(hr_dev, NULL, srq->srqn);
168 if (ret)
169 dev_err(hr_dev->dev, "DESTROY_SRQ failed (%d) for SRQN %06lx\n",
170 ret, srq->srqn);
171
172 xa_erase(&srq_table->xa, srq->srqn);
173
174 if (atomic_dec_and_test(&srq->refcount))
175 complete(&srq->free);
176 wait_for_completion(&srq->free);
177
178 hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
179 hns_roce_bitmap_free(&srq_table->bitmap, srq->srqn, BITMAP_NO_RR);
180 }
181
alloc_srq_buf(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq,struct ib_udata * udata,unsigned long addr)182 static int alloc_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
183 struct ib_udata *udata, unsigned long addr)
184 {
185 struct ib_device *ibdev = &hr_dev->ib_dev;
186 struct hns_roce_buf_attr buf_attr = {};
187 int err;
188
189 srq->wqe_shift = ilog2(roundup_pow_of_two(max(HNS_ROCE_SGE_SIZE,
190 HNS_ROCE_SGE_SIZE *
191 srq->max_gs)));
192
193 buf_attr.page_shift = hr_dev->caps.srqwqe_buf_pg_sz + HNS_HW_PAGE_SHIFT;
194 buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
195 srq->wqe_shift);
196 buf_attr.region[0].hopnum = hr_dev->caps.srqwqe_hop_num;
197 buf_attr.region_count = 1;
198 buf_attr.fixed_page = true;
199
200 err = hns_roce_mtr_create(hr_dev, &srq->buf_mtr, &buf_attr,
201 hr_dev->caps.srqwqe_ba_pg_sz +
202 HNS_HW_PAGE_SHIFT, udata, addr);
203 if (err)
204 ibdev_err(ibdev,
205 "failed to alloc SRQ buf mtr, ret = %d.\n", err);
206
207 return err;
208 }
209
free_srq_buf(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq)210 static void free_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
211 {
212 hns_roce_mtr_destroy(hr_dev, &srq->buf_mtr);
213 }
214
alloc_srq_idx(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq,struct ib_udata * udata,unsigned long addr)215 static int alloc_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
216 struct ib_udata *udata, unsigned long addr)
217 {
218 struct hns_roce_idx_que *idx_que = &srq->idx_que;
219 struct ib_device *ibdev = &hr_dev->ib_dev;
220 struct hns_roce_buf_attr buf_attr = {};
221 int err;
222
223 srq->idx_que.entry_shift = ilog2(HNS_ROCE_IDX_QUE_ENTRY_SZ);
224
225 buf_attr.page_shift = hr_dev->caps.idx_buf_pg_sz + HNS_HW_PAGE_SHIFT;
226 buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
227 srq->idx_que.entry_shift);
228 buf_attr.region[0].hopnum = hr_dev->caps.idx_hop_num;
229 buf_attr.region_count = 1;
230 buf_attr.fixed_page = true;
231
232 err = hns_roce_mtr_create(hr_dev, &idx_que->mtr, &buf_attr,
233 hr_dev->caps.idx_ba_pg_sz + HNS_HW_PAGE_SHIFT,
234 udata, addr);
235 if (err) {
236 ibdev_err(ibdev,
237 "failed to alloc SRQ idx mtr, ret = %d.\n", err);
238 return err;
239 }
240
241 if (!udata) {
242 idx_que->bitmap = bitmap_zalloc(srq->wqe_cnt, GFP_KERNEL);
243 if (!idx_que->bitmap) {
244 ibdev_err(ibdev, "failed to alloc SRQ idx bitmap.\n");
245 err = -ENOMEM;
246 goto err_idx_mtr;
247 }
248
249 }
250
251 return 0;
252 err_idx_mtr:
253 hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
254
255 return err;
256 }
257
free_srq_idx(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq)258 static void free_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
259 {
260 struct hns_roce_idx_que *idx_que = &srq->idx_que;
261
262 bitmap_free(idx_que->bitmap);
263 idx_que->bitmap = NULL;
264 hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
265 }
266
alloc_srq_wrid(struct hns_roce_dev * hr_dev,struct hns_roce_srq * srq)267 static int alloc_srq_wrid(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
268 {
269 srq->head = 0;
270 srq->tail = srq->wqe_cnt - 1;
271 srq->wrid = kvmalloc_array(srq->wqe_cnt, sizeof(u64), GFP_KERNEL);
272 if (!srq->wrid)
273 return -ENOMEM;
274
275 return 0;
276 }
277
free_srq_wrid(struct hns_roce_srq * srq)278 static void free_srq_wrid(struct hns_roce_srq *srq)
279 {
280 kvfree(srq->wrid);
281 srq->wrid = NULL;
282 }
283
hns_roce_create_srq(struct ib_srq * ib_srq,struct ib_srq_init_attr * init_attr,struct ib_udata * udata)284 int hns_roce_create_srq(struct ib_srq *ib_srq,
285 struct ib_srq_init_attr *init_attr,
286 struct ib_udata *udata)
287 {
288 struct hns_roce_dev *hr_dev = to_hr_dev(ib_srq->device);
289 struct hns_roce_ib_create_srq_resp resp = {};
290 struct hns_roce_srq *srq = to_hr_srq(ib_srq);
291 struct ib_device *ibdev = &hr_dev->ib_dev;
292 struct hns_roce_ib_create_srq ucmd = {};
293 int ret;
294 u32 cqn;
295
296 /* Check the actual SRQ wqe and SRQ sge num */
297 if (init_attr->attr.max_wr >= hr_dev->caps.max_srq_wrs ||
298 init_attr->attr.max_sge > hr_dev->caps.max_srq_sges)
299 return -EINVAL;
300
301 mutex_init(&srq->mutex);
302 spin_lock_init(&srq->lock);
303
304 srq->wqe_cnt = roundup_pow_of_two(init_attr->attr.max_wr + 1);
305 srq->max_gs = init_attr->attr.max_sge;
306
307 if (udata) {
308 ret = ib_copy_from_udata(&ucmd, udata,
309 min(udata->inlen, sizeof(ucmd)));
310 if (ret) {
311 ibdev_err(ibdev, "failed to copy SRQ udata, ret = %d.\n",
312 ret);
313 return ret;
314 }
315 }
316
317 ret = alloc_srq_buf(hr_dev, srq, udata, ucmd.buf_addr);
318 if (ret) {
319 ibdev_err(ibdev,
320 "failed to alloc SRQ buffer, ret = %d.\n", ret);
321 return ret;
322 }
323
324 ret = alloc_srq_idx(hr_dev, srq, udata, ucmd.que_addr);
325 if (ret) {
326 ibdev_err(ibdev, "failed to alloc SRQ idx, ret = %d.\n", ret);
327 goto err_buf_alloc;
328 }
329
330 if (!udata) {
331 ret = alloc_srq_wrid(hr_dev, srq);
332 if (ret) {
333 ibdev_err(ibdev, "failed to alloc SRQ wrid, ret = %d.\n",
334 ret);
335 goto err_idx_alloc;
336 }
337 }
338
339 cqn = ib_srq_has_cq(init_attr->srq_type) ?
340 to_hr_cq(init_attr->ext.cq)->cqn : 0;
341 srq->db_reg_l = hr_dev->reg_base + SRQ_DB_REG;
342
343 ret = alloc_srqc(hr_dev, srq, to_hr_pd(ib_srq->pd)->pdn, cqn, 0, 0);
344 if (ret) {
345 ibdev_err(ibdev,
346 "failed to alloc SRQ context, ret = %d.\n", ret);
347 goto err_wrid_alloc;
348 }
349
350 srq->event = hns_roce_ib_srq_event;
351 resp.srqn = srq->srqn;
352
353 if (udata) {
354 ret = ib_copy_to_udata(udata, &resp,
355 min(udata->outlen, sizeof(resp)));
356 if (ret)
357 goto err_srqc_alloc;
358 }
359
360 return 0;
361
362 err_srqc_alloc:
363 free_srqc(hr_dev, srq);
364 err_wrid_alloc:
365 free_srq_wrid(srq);
366 err_idx_alloc:
367 free_srq_idx(hr_dev, srq);
368 err_buf_alloc:
369 free_srq_buf(hr_dev, srq);
370 return ret;
371 }
372
hns_roce_destroy_srq(struct ib_srq * ibsrq,struct ib_udata * udata)373 int hns_roce_destroy_srq(struct ib_srq *ibsrq, struct ib_udata *udata)
374 {
375 struct hns_roce_dev *hr_dev = to_hr_dev(ibsrq->device);
376 struct hns_roce_srq *srq = to_hr_srq(ibsrq);
377
378 free_srqc(hr_dev, srq);
379 free_srq_idx(hr_dev, srq);
380 free_srq_wrid(srq);
381 free_srq_buf(hr_dev, srq);
382 return 0;
383 }
384
hns_roce_init_srq_table(struct hns_roce_dev * hr_dev)385 int hns_roce_init_srq_table(struct hns_roce_dev *hr_dev)
386 {
387 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
388
389 xa_init(&srq_table->xa);
390
391 return hns_roce_bitmap_init(&srq_table->bitmap, hr_dev->caps.num_srqs,
392 hr_dev->caps.num_srqs - 1,
393 hr_dev->caps.reserved_srqs, 0);
394 }
395
hns_roce_cleanup_srq_table(struct hns_roce_dev * hr_dev)396 void hns_roce_cleanup_srq_table(struct hns_roce_dev *hr_dev)
397 {
398 hns_roce_bitmap_cleanup(&hr_dev->srq_table.bitmap);
399 }
400