1 // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
3 * Copyright (c) 2018 Hisilicon Limited.
7 #include <rdma/ib_umem.h>
8 #include "hns_roce_device.h"
9 #include "hns_roce_cmd.h"
10 #include "hns_roce_hem.h"
/*
 * Deliver an asynchronous event to the SRQ identified by @srqn.
 *
 * @hr_dev:     device whose srq_table is searched
 * @srqn:       SRQ number reported with the event
 * @event_type: event code forwarded unchanged to the SRQ's ->event callback
 *
 * NOTE(review): several lines of this function are elided in this view
 * (the conditions around the refcount_inc/dev_warn and the statement run
 * when the last reference is dropped), so the comments below describe only
 * the statements that are visible.
 */
12 void hns_roce_srq_event(struct hns_roce_dev *hr_dev, u32 srqn, int event_type)
14 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
15 struct hns_roce_srq *srq;
/*
 * The lookup and the refcount_inc both happen between xa_lock and
 * xa_unlock on the table's xarray.
 */
17 xa_lock(&srq_table->xa);
/* The lookup index is srqn masked with (caps.num_srqs - 1). */
18 srq = xa_load(&srq_table->xa, srqn & (hr_dev->caps.num_srqs - 1));
20 refcount_inc(&srq->refcount);
21 xa_unlock(&srq_table->xa);
/* Presumably reached only when the lookup found nothing - TODO confirm. */
24 dev_warn(hr_dev->dev, "Async event for bogus SRQ %08x\n", srqn);
/* Hand the event to the per-SRQ callback. */
28 srq->event(srq, event_type);
/* Drop the reference taken above; the last-reference action is elided. */
30 if (refcount_dec_and_test(&srq->refcount))
/*
 * Translate a driver SRQ event into an ib_event and pass it to the
 * consumer's handler.
 *
 * @srq:        SRQ the event refers to
 * @event_type: driver event code
 *
 * Nothing is reported unless ibsrq->event_handler is set. The visible
 * cases map HNS_ROCE_EVENT_TYPE_SRQ_LIMIT_REACH to
 * IB_EVENT_SRQ_LIMIT_REACHED and HNS_ROCE_EVENT_TYPE_SRQ_CATAS_ERROR to
 * IB_EVENT_SRQ_ERR. An "Unexpected event type" message exists for other
 * values; the statement that emits it and what follows it are elided in
 * this view.
 */
34 static void hns_roce_ib_srq_event(struct hns_roce_srq *srq,
35 enum hns_roce_event event_type)
37 struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
38 struct ib_srq *ibsrq = &srq->ibsrq;
39 struct ib_event event;
41 if (ibsrq->event_handler) {
/* Fill in the fields that do not depend on the event type. */
42 event.device = ibsrq->device;
43 event.element.srq = ibsrq;
45 case HNS_ROCE_EVENT_TYPE_SRQ_LIMIT_REACH:
46 event.event = IB_EVENT_SRQ_LIMIT_REACHED;
48 case HNS_ROCE_EVENT_TYPE_SRQ_CATAS_ERROR:
49 event.event = IB_EVENT_SRQ_ERR;
53 "hns_roce:Unexpected event type 0x%x on SRQ %06lx\n",
54 event_type, srq->srqn);
/* Invoke the consumer's handler with its registered context. */
58 ibsrq->event_handler(&event, ibsrq->srq_context);
/*
 * Allocate an SRQ number from the device's SRQ IDA.
 *
 * The id is requested from the range [srq_ida->min, srq_ida->max]; an
 * error message containing the returned id is available for the failure
 * case. Storing the id into @srq and the return statements are elided in
 * this view - presumably srq->srqn receives the id; TODO confirm.
 */
62 static int alloc_srqn(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
64 struct hns_roce_ida *srq_ida = &hr_dev->srq_table.srq_ida;
67 id = ida_alloc_range(&srq_ida->ida, srq_ida->min, srq_ida->max,
70 ibdev_err(&hr_dev->ib_dev, "failed to alloc srq(%d).\n", id);
/*
 * Return srq->srqn to the device's SRQ IDA.
 *
 * srq->srqn is cast to int because that is the id type ida_free() takes.
 */
79 static void free_srqn(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
81 ida_free(&hr_dev->srq_table.srq_ida.ida, (int)srq->srqn);
/*
 * Build the SRQ context in a command mailbox and submit it to hardware.
 *
 * Steps visible here: allocate a mailbox, let the hw-specific write_srqc()
 * fill mailbox->buf, issue HNS_ROCE_CMD_CREATE_SRQ through
 * hns_roce_create_hw_ctx(), then free the mailbox.
 *
 * Returns PTR_ERR(mailbox) when the mailbox cannot be allocated. The other
 * return paths and the error checks guarding the two later messages are
 * elided in this view.
 */
84 static int hns_roce_create_srqc(struct hns_roce_dev *hr_dev,
85 struct hns_roce_srq *srq)
87 struct ib_device *ibdev = &hr_dev->ib_dev;
88 struct hns_roce_cmd_mailbox *mailbox;
91 mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
92 if (IS_ERR(mailbox)) {
93 ibdev_err(ibdev, "failed to alloc mailbox for SRQC.\n");
94 return PTR_ERR(mailbox);
/* Hardware-generation specific encoding of the SRQ context. */
97 ret = hr_dev->hw->write_srqc(srq, mailbox->buf);
99 ibdev_err(ibdev, "failed to write SRQC.\n");
103 ret = hns_roce_create_hw_ctx(hr_dev, mailbox, HNS_ROCE_CMD_CREATE_SRQ,
106 ibdev_err(ibdev, "failed to config SRQC, ret = %d.\n", ret);
/* Release the mailbox allocated above. */
109 hns_roce_free_cmd_mailbox(hr_dev, mailbox);
/*
 * Set up the SRQ context for srq->srqn.
 *
 * Visible sequence: take a reference on the SRQC table entry for
 * srq->srqn, store @srq in srq_table->xa under that number, then create
 * the hardware context with hns_roce_create_srqc(). The trailing xa_erase()
 * and hns_roce_table_put() undo the first two steps; the labels and checks
 * that route failures to them are elided in this view.
 */
113 static int alloc_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
115 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
116 struct ib_device *ibdev = &hr_dev->ib_dev;
119 ret = hns_roce_table_get(hr_dev, &srq_table->table, srq->srqn);
121 ibdev_err(ibdev, "failed to get SRQC table, ret = %d.\n", ret);
/* From this store on, the SRQ can be found by lookups in srq_table->xa. */
125 ret = xa_err(xa_store(&srq_table->xa, srq->srqn, srq, GFP_KERNEL));
127 ibdev_err(ibdev, "failed to store SRQC, ret = %d.\n", ret);
131 ret = hns_roce_create_srqc(hr_dev, srq);
/* Undo steps, in reverse order of the setup above. */
138 xa_erase(&srq_table->xa, srq->srqn);
140 hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
/*
 * Tear down the SRQ context for srq->srqn.
 *
 * The hardware context is destroyed with HNS_ROCE_CMD_DESTROY_SRQ; a
 * failure is only logged and teardown continues. The SRQ is then removed
 * from srq_table->xa, this function drops one reference on srq->refcount
 * and waits on srq->free before releasing the SRQC table entry.
 *
 * This function relies on srq->refcount and srq->free having been
 * initialised by the caller.
 */
145 static void free_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
147 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
150 ret = hns_roce_destroy_hw_ctx(hr_dev, HNS_ROCE_CMD_DESTROY_SRQ,
153 dev_err(hr_dev->dev, "DESTROY_SRQ failed (%d) for SRQN %06lx\n",
/* After this, lookups by SRQ number no longer find this SRQ. */
156 xa_erase(&srq_table->xa, srq->srqn);
/*
 * Drop one reference here; if it was the last one, signal the completion
 * ourselves so the wait below returns immediately. Otherwise the wait
 * blocks until some other path completes srq->free (presumably the event
 * path once it drops its reference - TODO confirm).
 */
158 if (refcount_dec_and_test(&srq->refcount))
159 complete(&srq->free);
160 wait_for_completion(&srq->free);
162 hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
/*
 * Allocate the SRQ index queue: its MTR-backed buffer and, as far as is
 * visible here, a bitmap with one bit per WQE.
 *
 * @udata and @addr are not used on any visible line; presumably they are
 * passed on to hns_roce_mtr_create() in the elided continuation lines -
 * TODO confirm. The condition guarding the bitmap allocation, any other
 * index-queue initialisation and the return statements are also elided.
 */
165 static int alloc_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
166 struct ib_udata *udata, unsigned long addr)
168 struct hns_roce_idx_que *idx_que = &srq->idx_que;
169 struct ib_device *ibdev = &hr_dev->ib_dev;
170 struct hns_roce_buf_attr buf_attr = {};
/* Entry size is kept as a shift: log2 of HNS_ROCE_IDX_QUE_ENTRY_SZ. */
173 srq->idx_que.entry_shift = ilog2(HNS_ROCE_IDX_QUE_ENTRY_SZ);
/* Single buffer region sized from wqe_cnt entries of that entry shift. */
175 buf_attr.page_shift = hr_dev->caps.idx_buf_pg_sz + PAGE_SHIFT;
176 buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
177 srq->idx_que.entry_shift);
178 buf_attr.region[0].hopnum = hr_dev->caps.idx_hop_num;
179 buf_attr.region_count = 1;
181 ret = hns_roce_mtr_create(hr_dev, &idx_que->mtr, &buf_attr,
182 hr_dev->caps.idx_ba_pg_sz + PAGE_SHIFT,
186 "failed to alloc SRQ idx mtr, ret = %d.\n", ret);
/* Zero-initialised bitmap holding srq->wqe_cnt bits. */
191 idx_que->bitmap = bitmap_zalloc(srq->wqe_cnt, GFP_KERNEL);
192 if (!idx_que->bitmap) {
193 ibdev_err(ibdev, "failed to alloc SRQ idx bitmap.\n");
/* Presumably the unwind path for a bitmap allocation failure. */
204 hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
/*
 * Release the index queue resources of @srq: free the bitmap, clear the
 * pointer so it does not dangle, and destroy the index queue MTR.
 */
209 static void free_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
211 struct hns_roce_idx_que *idx_que = &srq->idx_que;
213 bitmap_free(idx_que->bitmap);
214 idx_que->bitmap = NULL;
215 hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
/*
 * Allocate the MTR-backed WQE buffer of @srq.
 *
 * srq->wqe_shift is derived as ilog2() of a power-of-two rounded size that
 * is at least HNS_ROCE_SGE_SIZE; the remaining operands of that expression
 * are elided in this view. The buffer is described as a single region
 * sized from srq->wqe_cnt entries.
 *
 * @udata and @addr are not used on any visible line; presumably they are
 * forwarded to hns_roce_mtr_create() in the elided continuation lines -
 * TODO confirm. Return statements are elided as well.
 */
218 static int alloc_srq_wqe_buf(struct hns_roce_dev *hr_dev,
219 struct hns_roce_srq *srq,
220 struct ib_udata *udata, unsigned long addr)
222 struct ib_device *ibdev = &hr_dev->ib_dev;
223 struct hns_roce_buf_attr buf_attr = {};
226 srq->wqe_shift = ilog2(roundup_pow_of_two(max(HNS_ROCE_SGE_SIZE,
230 buf_attr.page_shift = hr_dev->caps.srqwqe_buf_pg_sz + PAGE_SHIFT;
231 buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
233 buf_attr.region[0].hopnum = hr_dev->caps.srqwqe_hop_num;
234 buf_attr.region_count = 1;
236 ret = hns_roce_mtr_create(hr_dev, &srq->buf_mtr, &buf_attr,
237 hr_dev->caps.srqwqe_ba_pg_sz + PAGE_SHIFT,
241 "failed to alloc SRQ buf mtr, ret = %d.\n", ret);
/* Destroy the MTR that backs the WQE buffer of @srq (srq->buf_mtr). */
246 static void free_srq_wqe_buf(struct hns_roce_dev *hr_dev,
247 struct hns_roce_srq *srq)
249 hns_roce_mtr_destroy(hr_dev, &srq->buf_mtr);
/*
 * Allocate srq->wrid as an array of srq->wqe_cnt u64 entries.
 *
 * kvmalloc_array() is used for the allocation, so the memory must be
 * released with kvfree(). The failure check and return statements are
 * elided in this view; @hr_dev is not used on the visible line.
 */
252 static int alloc_srq_wrid(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
254 srq->wrid = kvmalloc_array(srq->wqe_cnt, sizeof(u64), GFP_KERNEL);
/*
 * Counterpart of alloc_srq_wrid().
 *
 * NOTE(review): the body is elided in this view; presumably it releases
 * srq->wrid - TODO confirm against the full file.
 */
261 static void free_srq_wrid(struct hns_roce_srq *srq)
/*
 * Compute the SGE limit used when validating a requested SRQ.
 *
 * The starting point is the device capability caps.max_srq_sges. Devices
 * whose PCI revision is PCI_REVISION_ID_HIP09 or newer take a separate
 * path whose statements are elided in this view. On the remaining path the
 * limit becomes roundup_pow_of_two(max_sge + 1).
 *
 * NOTE(review): the rest of the parameter list, the branch bodies, the end
 * of the block comment below and the return statement are elided here; the
 * only visible caller passes !!udata as the third argument.
 */
267 static u32 proc_srq_sge(struct hns_roce_dev *dev, struct hns_roce_srq *hr_srq,
270 u32 max_sge = dev->caps.max_srq_sges;
272 if (dev->pci_dev->revision >= PCI_REVISION_ID_HIP09)
275 /* Reserve SGEs only for HIP08 in kernel; The userspace driver will
276 * calculate number of max_sge with reserved SGEs when allocating wqe
277 * buf, so there is no need to do this again in kernel. But the number
278 * may exceed the capacity of SGEs recorded in the firmware, so the
279 * kernel driver should just adapt the value accordingly.
282 max_sge = roundup_pow_of_two(max_sge + 1);
/*
 * Validate the requested SRQ depth and SGE count and derive the sizes
 * actually used.
 *
 * @srq:       SRQ being created; wqe_cnt and max_gs are written here
 * @init_attr: requested attributes; attr.max_wr and attr.max_sge are
 *             overwritten with the values actually granted
 * @udata:     only tested for being non-NULL when computing the SGE limit
 *
 * A request is rejected with an "invalid SRQ attr" message when max_wr
 * exceeds caps.max_srq_wrs or max_sge exceeds the limit returned by
 * proc_srq_sge(). The error code returned in that case and the final
 * return are elided in this view.
 */
289 static int set_srq_basic_param(struct hns_roce_srq *srq,
290 struct ib_srq_init_attr *init_attr,
291 struct ib_udata *udata)
293 struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
294 struct ib_srq_attr *attr = &init_attr->attr;
297 max_sge = proc_srq_sge(hr_dev, srq, !!udata);
298 if (attr->max_wr > hr_dev->caps.max_srq_wrs ||
299 attr->max_sge > max_sge) {
300 ibdev_err(&hr_dev->ib_dev,
301 "invalid SRQ attr, depth = %u, sge = %u.\n",
302 attr->max_wr, attr->max_sge);
/* Enforce the minimum depth, then round depth and SGE count up to powers of two. */
306 attr->max_wr = max_t(u32, attr->max_wr, HNS_ROCE_MIN_SRQ_WQE_NUM);
307 srq->wqe_cnt = roundup_pow_of_two(attr->max_wr);
308 srq->max_gs = roundup_pow_of_two(attr->max_sge + srq->rsv_sge);
/* Report the granted values back; reserved SGEs are not exposed to the caller. */
310 attr->max_wr = srq->wqe_cnt;
311 attr->max_sge = srq->max_gs - srq->rsv_sge;
/*
 * Record the CQ number and XRC domain number associated with the SRQ.
 *
 * srq->cqn is taken from init_attr->ext.cq when ib_srq_has_cq() reports
 * that the SRQ type has a CQ, otherwise it is 0. srq->xrcdn is taken from
 * init_attr->ext.xrc.xrcd for IB_SRQT_XRC SRQs, otherwise it is 0.
 */
317 static void set_srq_ext_param(struct hns_roce_srq *srq,
318 struct ib_srq_init_attr *init_attr)
320 srq->cqn = ib_srq_has_cq(init_attr->srq_type) ?
321 to_hr_cq(init_attr->ext.cq)->cqn : 0;
323 srq->xrcdn = (init_attr->srq_type == IB_SRQT_XRC) ?
324 to_hr_xrcd(init_attr->ext.xrc.xrcd)->xrcdn : 0;
/*
 * Fill in the SRQ parameters from @init_attr: first the basic ones (depth
 * and SGE count, which can fail), then the extended ones (CQ and XRC
 * domain numbers).
 *
 * The check of the first call's result and the return statements are
 * elided in this view.
 */
327 static int set_srq_param(struct hns_roce_srq *srq,
328 struct ib_srq_init_attr *init_attr,
329 struct ib_udata *udata)
333 ret = set_srq_basic_param(srq, init_attr, udata);
337 set_srq_ext_param(srq, init_attr);
/*
 * Allocate all buffers of an SRQ: index queue, WQE buffer and wrid array.
 *
 * The user command is copied from @udata, limited to the smaller of
 * udata->inlen and sizeof(ucmd); ucmd is zero-initialised beforehand.
 * ucmd.que_addr and ucmd.buf_addr are handed to the index queue and WQE
 * buffer allocators respectively.
 *
 * NOTE(review): the conditions around these calls are elided in this view.
 * The copy dereferences @udata, so it is presumably guarded by a NULL
 * check - TODO confirm. The trailing free_* calls undo earlier steps; the
 * labels that route failures to them are elided as well.
 */
342 static int alloc_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
343 struct ib_udata *udata)
345 struct hns_roce_ib_create_srq ucmd = {};
349 ret = ib_copy_from_udata(&ucmd, udata,
350 min(udata->inlen, sizeof(ucmd)));
352 ibdev_err(&hr_dev->ib_dev,
353 "failed to copy SRQ udata, ret = %d.\n",
359 ret = alloc_srq_idx(hr_dev, srq, udata, ucmd.que_addr);
363 ret = alloc_srq_wqe_buf(hr_dev, srq, udata, ucmd.buf_addr);
368 ret = alloc_srq_wrid(hr_dev, srq);
/* Undo steps, in reverse order of the allocations above. */
376 free_srq_wqe_buf(hr_dev, srq);
378 free_srq_idx(hr_dev, srq);
/*
 * Release the buffers of @srq: the WQE buffer, then the index queue.
 *
 * NOTE(review): a line ahead of these two calls is elided in this view;
 * presumably it releases the wrid array - TODO confirm.
 */
383 static void free_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
386 free_srq_wqe_buf(hr_dev, srq);
387 free_srq_idx(hr_dev, srq);
/*
 * Create an SRQ.
 *
 * @ib_srq:    SRQ object embedded in the driver's hns_roce_srq
 * @init_attr: requested attributes; adjusted by set_srq_param()
 * @udata:     user data; the response carrying the SRQ number is copied
 *             to it
 *
 * Visible sequence: initialise the locks, derive the parameters, allocate
 * the buffers, allocate an SRQ number, set up the SRQ context, copy the
 * response to @udata, then set the doorbell register address, the event
 * callback, the reference count and the completion. The trailing free_*
 * calls undo the setup in reverse order; the checks, labels and return
 * statements are elided in this view.
 *
 * NOTE(review): srq->event, srq->refcount and srq->free are initialised
 * only after alloc_srqc() has stored the SRQ in srq_table->xa, where
 * hns_roce_srq_event() can look it up and call srq->event. In addition,
 * free_srqc() - called below - does refcount_dec_and_test() on
 * srq->refcount and wait_for_completion() on srq->free. If that call is an
 * error-unwind path reachable when ib_copy_to_udata() fails, it would run
 * before either field is initialised. Confirm against the full file and
 * consider moving the three initialisations ahead of alloc_srqc().
 */
390 int hns_roce_create_srq(struct ib_srq *ib_srq,
391 struct ib_srq_init_attr *init_attr,
392 struct ib_udata *udata)
394 struct hns_roce_dev *hr_dev = to_hr_dev(ib_srq->device);
395 struct hns_roce_ib_create_srq_resp resp = {};
396 struct hns_roce_srq *srq = to_hr_srq(ib_srq);
399 mutex_init(&srq->mutex);
400 spin_lock_init(&srq->lock);
402 ret = set_srq_param(srq, init_attr, udata);
406 ret = alloc_srq_buf(hr_dev, srq, udata);
410 ret = alloc_srqn(hr_dev, srq);
414 ret = alloc_srqc(hr_dev, srq);
/*
 * Report the SRQ number to user space, copying no more than the caller's
 * output buffer can hold. This dereferences udata, so it is presumably
 * guarded by a NULL check on an elided line - TODO confirm.
 */
419 resp.srqn = srq->srqn;
420 if (ib_copy_to_udata(udata, &resp,
421 min(udata->outlen, sizeof(resp)))) {
427 srq->db_reg = hr_dev->reg_base + SRQ_DB_REG;
428 srq->event = hns_roce_ib_srq_event;
/* Initial reference; free_srqc() drops one reference during teardown. */
429 refcount_set(&srq->refcount, 1);
430 init_completion(&srq->free);
/* Undo steps, in reverse order of the setup above. */
435 free_srqc(hr_dev, srq);
437 free_srqn(hr_dev, srq);
439 free_srq_buf(hr_dev, srq);
/*
 * Destroy an SRQ, releasing resources in the reverse order of creation:
 * the SRQ context, the SRQ number, then the buffers.
 *
 * @udata is not used on any visible line. The return statement is elided
 * in this view.
 */
444 int hns_roce_destroy_srq(struct ib_srq *ibsrq, struct ib_udata *udata)
446 struct hns_roce_dev *hr_dev = to_hr_dev(ibsrq->device);
447 struct hns_roce_srq *srq = to_hr_srq(ibsrq);
449 free_srqc(hr_dev, srq);
450 free_srqn(hr_dev, srq);
451 free_srq_buf(hr_dev, srq);
/*
 * Initialise the per-device SRQ table: the xarray that maps SRQ numbers to
 * SRQs and the IDA from which SRQ numbers are allocated.
 *
 * The allocatable range is [caps.reserved_srqs, caps.num_srqs - 1], so
 * numbers below caps.reserved_srqs are never handed out.
 */
455 void hns_roce_init_srq_table(struct hns_roce_dev *hr_dev)
457 struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
458 struct hns_roce_ida *srq_ida = &srq_table->srq_ida;
460 xa_init(&srq_table->xa);
462 ida_init(&srq_ida->ida);
463 srq_ida->max = hr_dev->caps.num_srqs - 1;
464 srq_ida->min = hr_dev->caps.reserved_srqs;