// SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
/*
 * Copyright (c) 2018 Hisilicon Limited.
 */

#include <rdma/ib_umem.h>
#include <rdma/uverbs_ioctl.h>
#include "hns_roce_device.h"
#include "hns_roce_cmd.h"
#include "hns_roce_hem.h"

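/*
 * Dispatch an asynchronous hardware event to the SRQ that owns @srqn. The
 * reference taken under the xarray lock keeps the SRQ alive while its event
 * handler runs; free_srqc() waits on &srq->free until the last such
 * reference is dropped before tearing the context down.
 */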
void hns_roce_srq_event(struct hns_roce_dev *hr_dev, u32 srqn, int event_type)
{
        struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
        struct hns_roce_srq *srq;

        xa_lock(&srq_table->xa);
        srq = xa_load(&srq_table->xa, srqn & (hr_dev->caps.num_srqs - 1));
        if (srq)
                refcount_inc(&srq->refcount);
        xa_unlock(&srq_table->xa);

        if (!srq) {
                dev_warn(hr_dev->dev, "Async event for bogus SRQ %08x\n", srqn);
                return;
        }

        srq->event(srq, event_type);

        if (refcount_dec_and_test(&srq->refcount))
                complete(&srq->free);
}

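/*
 * Translate a hardware SRQ event into an ib_event and deliver it to the
 * consumer's registered event handler. Only the limit-reached and
 * catastrophic-error events are forwarded; anything else is logged and
 * dropped.
 */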
static void hns_roce_ib_srq_event(struct hns_roce_srq *srq,
                                  enum hns_roce_event event_type)
{
        struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
        struct ib_srq *ibsrq = &srq->ibsrq;
        struct ib_event event;

        if (ibsrq->event_handler) {
                event.device = ibsrq->device;
                event.element.srq = ibsrq;
                switch (event_type) {
                case HNS_ROCE_EVENT_TYPE_SRQ_LIMIT_REACH:
                        event.event = IB_EVENT_SRQ_LIMIT_REACHED;
                        break;
                case HNS_ROCE_EVENT_TYPE_SRQ_CATAS_ERROR:
                        event.event = IB_EVENT_SRQ_ERR;
                        break;
                default:
                        dev_err(hr_dev->dev,
                                "hns_roce: unexpected event type %d on SRQ %06lx\n",
                                event_type, srq->srqn);
                        return;
                }

                ibsrq->event_handler(&event, ibsrq->srq_context);
        }
}

static int alloc_srqn(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        struct hns_roce_ida *srq_ida = &hr_dev->srq_table.srq_ida;
        int id;

        id = ida_alloc_range(&srq_ida->ida, srq_ida->min, srq_ida->max,
                             GFP_KERNEL);
        if (id < 0) {
                ibdev_err(&hr_dev->ib_dev, "failed to alloc srq(%d).\n", id);
                return -ENOMEM;
        }

        srq->srqn = id;

        return 0;
}

static void free_srqn(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        ida_free(&hr_dev->srq_table.srq_ida.ida, (int)srq->srqn);
}

static int hns_roce_create_srqc(struct hns_roce_dev *hr_dev,
                                struct hns_roce_srq *srq)
{
        struct ib_device *ibdev = &hr_dev->ib_dev;
        struct hns_roce_cmd_mailbox *mailbox;
        int ret;

        mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
        if (IS_ERR(mailbox)) {
                ibdev_err(ibdev, "failed to alloc mailbox for SRQC.\n");
                return PTR_ERR(mailbox);
        }

        ret = hr_dev->hw->write_srqc(srq, mailbox->buf);
        if (ret) {
                ibdev_err(ibdev, "failed to write SRQC.\n");
                goto err_mbox;
        }

        ret = hns_roce_create_hw_ctx(hr_dev, mailbox, HNS_ROCE_CMD_CREATE_SRQ,
                                     srq->srqn);
        if (ret)
                ibdev_err(ibdev, "failed to config SRQC, ret = %d.\n", ret);

err_mbox:
        hns_roce_free_cmd_mailbox(hr_dev, mailbox);
        return ret;
}

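/*
 * Install the SRQ context: reserve the SRQC HEM table slot, publish the SRQ
 * in the xarray so hns_roce_srq_event() can find it, then ask the hardware
 * to create the context. Each completed step is unwound in reverse order on
 * failure.
 */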
static int alloc_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
        struct ib_device *ibdev = &hr_dev->ib_dev;
        int ret;

        ret = hns_roce_table_get(hr_dev, &srq_table->table, srq->srqn);
        if (ret) {
                ibdev_err(ibdev, "failed to get SRQC table, ret = %d.\n", ret);
                return ret;
        }

        ret = xa_err(xa_store_irq(&srq_table->xa, srq->srqn, srq, GFP_KERNEL));
        if (ret) {
                ibdev_err(ibdev, "failed to store SRQC, ret = %d.\n", ret);
                goto err_put;
        }

        ret = hns_roce_create_srqc(hr_dev, srq);
        if (ret)
                goto err_xa;

        return 0;

err_xa:
        xa_erase_irq(&srq_table->xa, srq->srqn);
err_put:
        hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);

        return ret;
}

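/*
 * Tear down the SRQ context in the reverse order of alloc_srqc(): destroy
 * the hardware context, unpublish the SRQ from the xarray, then drop the
 * initial reference and wait for any in-flight event handlers to release
 * theirs before the HEM table slot is returned.
 */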
static void free_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
        int ret;

        ret = hns_roce_destroy_hw_ctx(hr_dev, HNS_ROCE_CMD_DESTROY_SRQ,
                                      srq->srqn);
        if (ret)
                dev_err_ratelimited(hr_dev->dev, "DESTROY_SRQ failed (%d) for SRQN %06lx\n",
                                    ret, srq->srqn);

        xa_erase_irq(&srq_table->xa, srq->srqn);

        if (refcount_dec_and_test(&srq->refcount))
                complete(&srq->free);
        wait_for_completion(&srq->free);

        hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
}

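/*
 * Allocate the index queue, which holds one entry per WQE. The buffer is
 * mapped through an mtr (the driver's multi-hop address translation
 * abstraction). Only kernel-owned SRQs (no udata) get a bitmap to track
 * free index entries; for user SRQs the userspace driver manages the queue.
 */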
static int alloc_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
                         struct ib_udata *udata, unsigned long addr)
{
        struct hns_roce_idx_que *idx_que = &srq->idx_que;
        struct ib_device *ibdev = &hr_dev->ib_dev;
        struct hns_roce_buf_attr buf_attr = {};
        int ret;

        srq->idx_que.entry_shift = ilog2(HNS_ROCE_IDX_QUE_ENTRY_SZ);

        buf_attr.page_shift = hr_dev->caps.idx_buf_pg_sz + PAGE_SHIFT;
        buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
                                                         srq->idx_que.entry_shift);
        buf_attr.region[0].hopnum = hr_dev->caps.idx_hop_num;
        buf_attr.region_count = 1;

        ret = hns_roce_mtr_create(hr_dev, &idx_que->mtr, &buf_attr,
                                  hr_dev->caps.idx_ba_pg_sz + PAGE_SHIFT,
                                  udata, addr);
        if (ret) {
                ibdev_err(ibdev,
                          "failed to alloc SRQ idx mtr, ret = %d.\n", ret);
                return ret;
        }

        if (!udata) {
                idx_que->bitmap = bitmap_zalloc(srq->wqe_cnt, GFP_KERNEL);
                if (!idx_que->bitmap) {
                        ibdev_err(ibdev, "failed to alloc SRQ idx bitmap.\n");
                        ret = -ENOMEM;
                        goto err_idx_mtr;
                }
        }

        idx_que->head = 0;
        idx_que->tail = 0;

        return 0;

err_idx_mtr:
        hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);

        return ret;
}

static void free_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        struct hns_roce_idx_que *idx_que = &srq->idx_que;

        bitmap_free(idx_que->bitmap);
        idx_que->bitmap = NULL;
        hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
}

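/*
 * Allocate the WQE buffer. The WQE stride is the SGE size times max_gs,
 * rounded up to a power of two so that wqe_shift is an exact log2 of it.
 */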
static int alloc_srq_wqe_buf(struct hns_roce_dev *hr_dev,
                             struct hns_roce_srq *srq,
                             struct ib_udata *udata, unsigned long addr)
{
        struct ib_device *ibdev = &hr_dev->ib_dev;
        struct hns_roce_buf_attr buf_attr = {};
        int ret;

        srq->wqe_shift = ilog2(roundup_pow_of_two(max(HNS_ROCE_SGE_SIZE,
                                                      HNS_ROCE_SGE_SIZE *
                                                      srq->max_gs)));

        buf_attr.page_shift = hr_dev->caps.srqwqe_buf_pg_sz + PAGE_SHIFT;
        buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
                                                         srq->wqe_shift);
        buf_attr.region[0].hopnum = hr_dev->caps.srqwqe_hop_num;
        buf_attr.region_count = 1;

        ret = hns_roce_mtr_create(hr_dev, &srq->buf_mtr, &buf_attr,
                                  hr_dev->caps.srqwqe_ba_pg_sz + PAGE_SHIFT,
                                  udata, addr);
        if (ret)
                ibdev_err(ibdev,
                          "failed to alloc SRQ buf mtr, ret = %d.\n", ret);

        return ret;
}

static void free_srq_wqe_buf(struct hns_roce_dev *hr_dev,
                             struct hns_roce_srq *srq)
{
        hns_roce_mtr_destroy(hr_dev, &srq->buf_mtr);
}

static int alloc_srq_wrid(struct hns_roce_srq *srq)
{
        srq->wrid = kvmalloc_array(srq->wqe_cnt, sizeof(u64), GFP_KERNEL);
        if (!srq->wrid)
                return -ENOMEM;

        return 0;
}

static void free_srq_wrid(struct hns_roce_srq *srq)
{
        kvfree(srq->wrid);
        srq->wrid = NULL;
}

static u32 proc_srq_sge(struct hns_roce_dev *dev, struct hns_roce_srq *hr_srq,
                        bool user)
{
        u32 max_sge = dev->caps.max_srq_sges;

        if (dev->pci_dev->revision >= PCI_REVISION_ID_HIP09)
                return max_sge;

        /* Reserve SGEs only for HIP08 in kernel; the userspace driver will
         * calculate the number of max_sge with reserved SGEs when allocating
         * the wqe buffer, so there is no need to do this again in the kernel.
         * But the number may exceed the SGE capacity recorded in the firmware,
         * so the kernel driver should just adapt the value accordingly.
         */
        if (user)
                max_sge = roundup_pow_of_two(max_sge + 1);
        else
                hr_srq->rsv_sge = 1;

        return max_sge;
}

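/*
 * Validate and normalize the requested queue sizes. Depth and SGE count are
 * both rounded up to powers of two, and the rounded values are written back
 * into @attr so the caller sees the actual capacities: e.g. a requested
 * max_wr of 100 (above the minimum depth) yields wqe_cnt = 128, and any
 * reserved SGE is hidden from the reported max_sge.
 */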
static int set_srq_basic_param(struct hns_roce_srq *srq,
                               struct ib_srq_init_attr *init_attr,
                               struct ib_udata *udata)
{
        struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
        struct ib_srq_attr *attr = &init_attr->attr;
        u32 max_sge;

        max_sge = proc_srq_sge(hr_dev, srq, !!udata);
        if (attr->max_wr > hr_dev->caps.max_srq_wrs ||
            attr->max_sge > max_sge || !attr->max_sge) {
                ibdev_err(&hr_dev->ib_dev,
                          "invalid SRQ attr, depth = %u, sge = %u.\n",
                          attr->max_wr, attr->max_sge);
                return -EINVAL;
        }

        attr->max_wr = max_t(u32, attr->max_wr, HNS_ROCE_MIN_SRQ_WQE_NUM);
        srq->wqe_cnt = roundup_pow_of_two(attr->max_wr);
        srq->max_gs = roundup_pow_of_two(attr->max_sge + srq->rsv_sge);

        attr->max_wr = srq->wqe_cnt;
        attr->max_sge = srq->max_gs - srq->rsv_sge;
        attr->srq_limit = 0;

        return 0;
}

static void set_srq_ext_param(struct hns_roce_srq *srq,
                              struct ib_srq_init_attr *init_attr)
{
        srq->cqn = ib_srq_has_cq(init_attr->srq_type) ?
                   to_hr_cq(init_attr->ext.cq)->cqn : 0;

        srq->xrcdn = (init_attr->srq_type == IB_SRQT_XRC) ?
                     to_hr_xrcd(init_attr->ext.xrc.xrcd)->xrcdn : 0;
}

static int set_srq_param(struct hns_roce_srq *srq,
                         struct ib_srq_init_attr *init_attr,
                         struct ib_udata *udata)
{
        int ret;

        ret = set_srq_basic_param(srq, init_attr, udata);
        if (ret)
                return ret;

        set_srq_ext_param(srq, init_attr);

        return 0;
}

static int alloc_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
                         struct ib_udata *udata)
{
        struct hns_roce_ib_create_srq ucmd = {};
        int ret;

        if (udata) {
                ret = ib_copy_from_udata(&ucmd, udata,
                                         min(udata->inlen, sizeof(ucmd)));
                if (ret) {
                        ibdev_err(&hr_dev->ib_dev,
                                  "failed to copy SRQ udata, ret = %d.\n",
                                  ret);
                        return ret;
                }
        }

        ret = alloc_srq_idx(hr_dev, srq, udata, ucmd.que_addr);
        if (ret)
                return ret;

        ret = alloc_srq_wqe_buf(hr_dev, srq, udata, ucmd.buf_addr);
        if (ret)
                goto err_idx;

        if (!udata) {
                ret = alloc_srq_wrid(srq);
                if (ret)
                        goto err_wqe_buf;
        }

        return 0;

err_wqe_buf:
        free_srq_wqe_buf(hr_dev, srq);
err_idx:
        free_srq_idx(hr_dev, srq);

        return ret;
}

static void free_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        free_srq_wrid(srq);
        free_srq_wqe_buf(hr_dev, srq);
        free_srq_idx(hr_dev, srq);
}

static int get_srq_ucmd(struct hns_roce_srq *srq, struct ib_udata *udata,
                        struct hns_roce_ib_create_srq *ucmd)
{
        struct ib_device *ibdev = srq->ibsrq.device;
        int ret;

        ret = ib_copy_from_udata(ucmd, udata, min(udata->inlen, sizeof(*ucmd)));
        if (ret) {
                ibdev_err(ibdev, "failed to copy SRQ udata, ret = %d.\n", ret);
                return ret;
        }

        return 0;
}

static void free_srq_db(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
                        struct ib_udata *udata)
{
        struct hns_roce_ucontext *uctx;

        if (!(srq->cap_flags & HNS_ROCE_SRQ_CAP_RECORD_DB))
                return;

        srq->cap_flags &= ~HNS_ROCE_SRQ_CAP_RECORD_DB;
        if (udata) {
                uctx = rdma_udata_to_drv_context(udata,
                                                 struct hns_roce_ucontext,
                                                 ibucontext);
                hns_roce_db_unmap_user(uctx, &srq->rdb);
        } else {
                hns_roce_free_db(hr_dev, &srq->rdb);
        }
}

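/*
 * Set up the SRQ doorbell. If the device supports record doorbells, a user
 * SRQ maps the page supplied in the ucmd while a kernel SRQ allocates a
 * software doorbell record; a kernel SRQ additionally gets the hardware
 * doorbell register address.
 */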
static int alloc_srq_db(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
                        struct ib_udata *udata,
                        struct hns_roce_ib_create_srq_resp *resp)
{
        struct hns_roce_ib_create_srq ucmd = {};
        struct hns_roce_ucontext *uctx;
        int ret;

        if (udata) {
                ret = get_srq_ucmd(srq, udata, &ucmd);
                if (ret)
                        return ret;

                if ((hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ_RECORD_DB) &&
                    (ucmd.req_cap_flags & HNS_ROCE_SRQ_CAP_RECORD_DB)) {
                        uctx = rdma_udata_to_drv_context(udata,
                                        struct hns_roce_ucontext, ibucontext);
                        ret = hns_roce_db_map_user(uctx, ucmd.db_addr,
                                                   &srq->rdb);
                        if (ret)
                                return ret;

                        srq->cap_flags |= HNS_ROCE_RSP_SRQ_CAP_RECORD_DB;
                }
        } else {
                if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ_RECORD_DB) {
                        ret = hns_roce_alloc_db(hr_dev, &srq->rdb, 1);
                        if (ret)
                                return ret;

                        *srq->rdb.db_record = 0;
                        srq->cap_flags |= HNS_ROCE_RSP_SRQ_CAP_RECORD_DB;
                }
                srq->db_reg = hr_dev->reg_base + SRQ_DB_REG;
        }

        return 0;
}

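/*
 * Create an SRQ: validate the parameters, then set up the buffers, the
 * doorbell, the SRQN and the hardware context in order, unwinding each
 * completed step in reverse on failure. The response (capability flags and
 * SRQN) is copied to userspace last so that a failed copy can still unwind
 * everything.
 */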
int hns_roce_create_srq(struct ib_srq *ib_srq,
                        struct ib_srq_init_attr *init_attr,
                        struct ib_udata *udata)
{
        struct hns_roce_dev *hr_dev = to_hr_dev(ib_srq->device);
        struct hns_roce_ib_create_srq_resp resp = {};
        struct hns_roce_srq *srq = to_hr_srq(ib_srq);
        int ret;

        mutex_init(&srq->mutex);
        spin_lock_init(&srq->lock);

        ret = set_srq_param(srq, init_attr, udata);
        if (ret)
                goto err_out;

        ret = alloc_srq_buf(hr_dev, srq, udata);
        if (ret)
                goto err_out;

        ret = alloc_srq_db(hr_dev, srq, udata, &resp);
        if (ret)
                goto err_srq_buf;

        ret = alloc_srqn(hr_dev, srq);
        if (ret)
                goto err_srq_db;

        ret = alloc_srqc(hr_dev, srq);
        if (ret)
                goto err_srqn;

        if (udata) {
                resp.cap_flags = srq->cap_flags;
                resp.srqn = srq->srqn;
                if (ib_copy_to_udata(udata, &resp,
                                     min(udata->outlen, sizeof(resp)))) {
                        ret = -EFAULT;
                        goto err_srqc;
                }
        }

        srq->event = hns_roce_ib_srq_event;
        refcount_set(&srq->refcount, 1);
        init_completion(&srq->free);

        return 0;

err_srqc:
        free_srqc(hr_dev, srq);
err_srqn:
        free_srqn(hr_dev, srq);
err_srq_db:
        free_srq_db(hr_dev, srq, udata);
err_srq_buf:
        free_srq_buf(hr_dev, srq);
err_out:
        mutex_destroy(&srq->mutex);
        atomic64_inc(&hr_dev->dfx_cnt[HNS_ROCE_DFX_SRQ_CREATE_ERR_CNT]);

        return ret;
}

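/*
 * Destroy an SRQ by releasing its resources in the reverse order of
 * hns_roce_create_srq(). free_srqc() blocks until any event handlers still
 * referencing the SRQ have finished.
 */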
int hns_roce_destroy_srq(struct ib_srq *ibsrq, struct ib_udata *udata)
{
        struct hns_roce_dev *hr_dev = to_hr_dev(ibsrq->device);
        struct hns_roce_srq *srq = to_hr_srq(ibsrq);

        free_srqc(hr_dev, srq);
        free_srqn(hr_dev, srq);
        free_srq_db(hr_dev, srq, udata);
        free_srq_buf(hr_dev, srq);
        mutex_destroy(&srq->mutex);

        return 0;
}

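/*
 * Initialize the per-device SRQ table: the xarray used to look up SRQs in
 * the event path and the IDA used to allocate SRQNs, with the reserved
 * SRQNs excluded from the allocatable range.
 */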
void hns_roce_init_srq_table(struct hns_roce_dev *hr_dev)
{
        struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
        struct hns_roce_ida *srq_ida = &srq_table->srq_ida;

        xa_init(&srq_table->xa);

        ida_init(&srq_ida->ida);
        srq_ida->max = hr_dev->caps.num_srqs - 1;
        srq_ida->min = hr_dev->caps.reserved_srqs;
}