Merge tag 'io_uring-worker.v3-2021-02-25' of git://git.kernel.dk/linux-block
[linux-2.6-microblaze.git] / drivers / infiniband / hw / hns / hns_roce_srq.c
1 // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
2 /*
3  * Copyright (c) 2018 Hisilicon Limited.
4  */
5
6 #include <linux/pci.h>
7 #include <rdma/ib_umem.h>
8 #include "hns_roce_device.h"
9 #include "hns_roce_cmd.h"
10 #include "hns_roce_hem.h"
11
12 void hns_roce_srq_event(struct hns_roce_dev *hr_dev, u32 srqn, int event_type)
13 {
14         struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
15         struct hns_roce_srq *srq;
16
17         xa_lock(&srq_table->xa);
18         srq = xa_load(&srq_table->xa, srqn & (hr_dev->caps.num_srqs - 1));
19         if (srq)
20                 atomic_inc(&srq->refcount);
21         xa_unlock(&srq_table->xa);
22
23         if (!srq) {
24                 dev_warn(hr_dev->dev, "Async event for bogus SRQ %08x\n", srqn);
25                 return;
26         }
27
28         srq->event(srq, event_type);
29
30         if (atomic_dec_and_test(&srq->refcount))
31                 complete(&srq->free);
32 }
33
34 static void hns_roce_ib_srq_event(struct hns_roce_srq *srq,
35                                   enum hns_roce_event event_type)
36 {
37         struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
38         struct ib_srq *ibsrq = &srq->ibsrq;
39         struct ib_event event;
40
41         if (ibsrq->event_handler) {
42                 event.device      = ibsrq->device;
43                 event.element.srq = ibsrq;
44                 switch (event_type) {
45                 case HNS_ROCE_EVENT_TYPE_SRQ_LIMIT_REACH:
46                         event.event = IB_EVENT_SRQ_LIMIT_REACHED;
47                         break;
48                 case HNS_ROCE_EVENT_TYPE_SRQ_CATAS_ERROR:
49                         event.event = IB_EVENT_SRQ_ERR;
50                         break;
51                 default:
52                         dev_err(hr_dev->dev,
53                            "hns_roce:Unexpected event type 0x%x on SRQ %06lx\n",
54                            event_type, srq->srqn);
55                         return;
56                 }
57
58                 ibsrq->event_handler(&event, ibsrq->srq_context);
59         }
60 }
61
62 static int hns_roce_hw_create_srq(struct hns_roce_dev *dev,
63                                   struct hns_roce_cmd_mailbox *mailbox,
64                                   unsigned long srq_num)
65 {
66         return hns_roce_cmd_mbox(dev, mailbox->dma, 0, srq_num, 0,
67                                  HNS_ROCE_CMD_CREATE_SRQ,
68                                  HNS_ROCE_CMD_TIMEOUT_MSECS);
69 }
70
71 static int hns_roce_hw_destroy_srq(struct hns_roce_dev *dev,
72                                    struct hns_roce_cmd_mailbox *mailbox,
73                                    unsigned long srq_num)
74 {
75         return hns_roce_cmd_mbox(dev, 0, mailbox ? mailbox->dma : 0, srq_num,
76                                  mailbox ? 0 : 1, HNS_ROCE_CMD_DESTROY_SRQ,
77                                  HNS_ROCE_CMD_TIMEOUT_MSECS);
78 }
79
80 static int alloc_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
81 {
82         struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
83         struct ib_device *ibdev = &hr_dev->ib_dev;
84         struct hns_roce_cmd_mailbox *mailbox;
85         int ret;
86
87         ret = hns_roce_bitmap_alloc(&srq_table->bitmap, &srq->srqn);
88         if (ret) {
89                 ibdev_err(ibdev, "failed to alloc SRQ number.\n");
90                 return -ENOMEM;
91         }
92
93         ret = hns_roce_table_get(hr_dev, &srq_table->table, srq->srqn);
94         if (ret) {
95                 ibdev_err(ibdev, "failed to get SRQC table, ret = %d.\n", ret);
96                 goto err_out;
97         }
98
99         ret = xa_err(xa_store(&srq_table->xa, srq->srqn, srq, GFP_KERNEL));
100         if (ret) {
101                 ibdev_err(ibdev, "failed to store SRQC, ret = %d.\n", ret);
102                 goto err_put;
103         }
104
105         mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
106         if (IS_ERR_OR_NULL(mailbox)) {
107                 ibdev_err(ibdev, "failed to alloc mailbox for SRQC.\n");
108                 ret = -ENOMEM;
109                 goto err_xa;
110         }
111
112         ret = hr_dev->hw->write_srqc(srq, mailbox->buf);
113         if (ret) {
114                 ibdev_err(ibdev, "failed to write SRQC.\n");
115                 goto err_mbox;
116         }
117
118         ret = hns_roce_hw_create_srq(hr_dev, mailbox, srq->srqn);
119         if (ret) {
120                 ibdev_err(ibdev, "failed to config SRQC, ret = %d.\n", ret);
121                 goto err_mbox;
122         }
123
124         hns_roce_free_cmd_mailbox(hr_dev, mailbox);
125
126         return 0;
127
128 err_mbox:
129         hns_roce_free_cmd_mailbox(hr_dev, mailbox);
130 err_xa:
131         xa_erase(&srq_table->xa, srq->srqn);
132 err_put:
133         hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
134 err_out:
135         hns_roce_bitmap_free(&srq_table->bitmap, srq->srqn, BITMAP_NO_RR);
136
137         return ret;
138 }
139
140 static void free_srqc(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
141 {
142         struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
143         int ret;
144
145         ret = hns_roce_hw_destroy_srq(hr_dev, NULL, srq->srqn);
146         if (ret)
147                 dev_err(hr_dev->dev, "DESTROY_SRQ failed (%d) for SRQN %06lx\n",
148                         ret, srq->srqn);
149
150         xa_erase(&srq_table->xa, srq->srqn);
151
152         if (atomic_dec_and_test(&srq->refcount))
153                 complete(&srq->free);
154         wait_for_completion(&srq->free);
155
156         hns_roce_table_put(hr_dev, &srq_table->table, srq->srqn);
157         hns_roce_bitmap_free(&srq_table->bitmap, srq->srqn, BITMAP_NO_RR);
158 }
159
160 static int alloc_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
161                          struct ib_udata *udata, unsigned long addr)
162 {
163         struct hns_roce_idx_que *idx_que = &srq->idx_que;
164         struct ib_device *ibdev = &hr_dev->ib_dev;
165         struct hns_roce_buf_attr buf_attr = {};
166         int ret;
167
168         srq->idx_que.entry_shift = ilog2(HNS_ROCE_IDX_QUE_ENTRY_SZ);
169
170         buf_attr.page_shift = hr_dev->caps.idx_buf_pg_sz + HNS_HW_PAGE_SHIFT;
171         buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
172                                         srq->idx_que.entry_shift);
173         buf_attr.region[0].hopnum = hr_dev->caps.idx_hop_num;
174         buf_attr.region_count = 1;
175
176         ret = hns_roce_mtr_create(hr_dev, &idx_que->mtr, &buf_attr,
177                                   hr_dev->caps.idx_ba_pg_sz + HNS_HW_PAGE_SHIFT,
178                                   udata, addr);
179         if (ret) {
180                 ibdev_err(ibdev,
181                           "failed to alloc SRQ idx mtr, ret = %d.\n", ret);
182                 return ret;
183         }
184
185         if (!udata) {
186                 idx_que->bitmap = bitmap_zalloc(srq->wqe_cnt, GFP_KERNEL);
187                 if (!idx_que->bitmap) {
188                         ibdev_err(ibdev, "failed to alloc SRQ idx bitmap.\n");
189                         ret = -ENOMEM;
190                         goto err_idx_mtr;
191                 }
192         }
193
194         idx_que->head = 0;
195         idx_que->tail = 0;
196
197         return 0;
198 err_idx_mtr:
199         hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
200
201         return ret;
202 }
203
204 static void free_srq_idx(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
205 {
206         struct hns_roce_idx_que *idx_que = &srq->idx_que;
207
208         bitmap_free(idx_que->bitmap);
209         idx_que->bitmap = NULL;
210         hns_roce_mtr_destroy(hr_dev, &idx_que->mtr);
211 }
212
213 static int alloc_srq_wqe_buf(struct hns_roce_dev *hr_dev,
214                              struct hns_roce_srq *srq,
215                              struct ib_udata *udata, unsigned long addr)
216 {
217         struct ib_device *ibdev = &hr_dev->ib_dev;
218         struct hns_roce_buf_attr buf_attr = {};
219         int ret;
220
221         srq->wqe_shift = ilog2(roundup_pow_of_two(max(HNS_ROCE_SGE_SIZE,
222                                                       HNS_ROCE_SGE_SIZE *
223                                                       srq->max_gs)));
224
225         buf_attr.page_shift = hr_dev->caps.srqwqe_buf_pg_sz + HNS_HW_PAGE_SHIFT;
226         buf_attr.region[0].size = to_hr_hem_entries_size(srq->wqe_cnt,
227                                                          srq->wqe_shift);
228         buf_attr.region[0].hopnum = hr_dev->caps.srqwqe_hop_num;
229         buf_attr.region_count = 1;
230
231         ret = hns_roce_mtr_create(hr_dev, &srq->buf_mtr, &buf_attr,
232                                   hr_dev->caps.srqwqe_ba_pg_sz +
233                                   HNS_HW_PAGE_SHIFT, udata, addr);
234         if (ret)
235                 ibdev_err(ibdev,
236                           "failed to alloc SRQ buf mtr, ret = %d.\n", ret);
237
238         return ret;
239 }
240
241 static void free_srq_wqe_buf(struct hns_roce_dev *hr_dev,
242                              struct hns_roce_srq *srq)
243 {
244         hns_roce_mtr_destroy(hr_dev, &srq->buf_mtr);
245 }
246
247 static int alloc_srq_wrid(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
248 {
249         srq->wrid = kvmalloc_array(srq->wqe_cnt, sizeof(u64), GFP_KERNEL);
250         if (!srq->wrid)
251                 return -ENOMEM;
252
253         return 0;
254 }
255
256 static void free_srq_wrid(struct hns_roce_srq *srq)
257 {
258         kfree(srq->wrid);
259         srq->wrid = NULL;
260 }
261
262 static u32 proc_srq_sge(struct hns_roce_dev *dev, struct hns_roce_srq *hr_srq,
263                         bool user)
264 {
265         u32 max_sge = dev->caps.max_srq_sges;
266
267         if (dev->pci_dev->revision >= PCI_REVISION_ID_HIP09)
268                 return max_sge;
269
270         /* Reserve SGEs only for HIP08 in kernel; The userspace driver will
271          * calculate number of max_sge with reserved SGEs when allocating wqe
272          * buf, so there is no need to do this again in kernel. But the number
273          * may exceed the capacity of SGEs recorded in the firmware, so the
274          * kernel driver should just adapt the value accordingly.
275          */
276         if (user)
277                 max_sge = roundup_pow_of_two(max_sge + 1);
278         else
279                 hr_srq->rsv_sge = 1;
280
281         return max_sge;
282 }
283
284 static int set_srq_basic_param(struct hns_roce_srq *srq,
285                                struct ib_srq_init_attr *init_attr,
286                                struct ib_udata *udata)
287 {
288         struct hns_roce_dev *hr_dev = to_hr_dev(srq->ibsrq.device);
289         struct ib_srq_attr *attr = &init_attr->attr;
290         u32 max_sge;
291
292         max_sge = proc_srq_sge(hr_dev, srq, !!udata);
293         if (attr->max_wr > hr_dev->caps.max_srq_wrs ||
294             attr->max_sge > max_sge) {
295                 ibdev_err(&hr_dev->ib_dev,
296                           "invalid SRQ attr, depth = %u, sge = %u.\n",
297                           attr->max_wr, attr->max_sge);
298                 return -EINVAL;
299         }
300
301         attr->max_wr = max_t(u32, attr->max_wr, HNS_ROCE_MIN_SRQ_WQE_NUM);
302         srq->wqe_cnt = roundup_pow_of_two(attr->max_wr);
303         srq->max_gs = roundup_pow_of_two(attr->max_sge + srq->rsv_sge);
304
305         attr->max_wr = srq->wqe_cnt;
306         attr->max_sge = srq->max_gs - srq->rsv_sge;
307         attr->srq_limit = 0;
308
309         return 0;
310 }
311
312 static void set_srq_ext_param(struct hns_roce_srq *srq,
313                               struct ib_srq_init_attr *init_attr)
314 {
315         srq->cqn = ib_srq_has_cq(init_attr->srq_type) ?
316                    to_hr_cq(init_attr->ext.cq)->cqn : 0;
317 }
318
/*
 * Fill in the basic and extended parameters of @srq from @init_attr.
 *
 * The extended parameters are only set when the basic ones validated.
 * Returns 0 on success or the error from set_srq_basic_param().
 */
static int set_srq_param(struct hns_roce_srq *srq,
                         struct ib_srq_init_attr *init_attr,
                         struct ib_udata *udata)
{
        int ret = set_srq_basic_param(srq, init_attr, udata);

        if (!ret)
                set_srq_ext_param(srq, init_attr);

        return ret;
}
333
334 static int alloc_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq,
335                          struct ib_udata *udata)
336 {
337         struct hns_roce_ib_create_srq ucmd = {};
338         int ret;
339
340         if (udata) {
341                 ret = ib_copy_from_udata(&ucmd, udata,
342                                          min(udata->inlen, sizeof(ucmd)));
343                 if (ret) {
344                         ibdev_err(&hr_dev->ib_dev,
345                                   "failed to copy SRQ udata, ret = %d.\n",
346                                   ret);
347                         return ret;
348                 }
349         }
350
351         ret = alloc_srq_idx(hr_dev, srq, udata, ucmd.que_addr);
352         if (ret)
353                 return ret;
354
355         ret = alloc_srq_wqe_buf(hr_dev, srq, udata, ucmd.buf_addr);
356         if (ret)
357                 goto err_idx;
358
359         if (!udata) {
360                 ret = alloc_srq_wrid(hr_dev, srq);
361                 if (ret)
362                         goto err_wqe_buf;
363         }
364
365         return 0;
366
367 err_wqe_buf:
368         free_srq_wqe_buf(hr_dev, srq);
369 err_idx:
370         free_srq_idx(hr_dev, srq);
371
372         return ret;
373 }
374
/*
 * Free the buffers of @srq in this order: the wrid array, the WQE buffer,
 * then the index queue.
 */
static void free_srq_buf(struct hns_roce_dev *hr_dev, struct hns_roce_srq *srq)
{
        free_srq_wrid(srq);

        free_srq_wqe_buf(hr_dev, srq);
        free_srq_idx(hr_dev, srq);
}
381
382 int hns_roce_create_srq(struct ib_srq *ib_srq,
383                         struct ib_srq_init_attr *init_attr,
384                         struct ib_udata *udata)
385 {
386         struct hns_roce_dev *hr_dev = to_hr_dev(ib_srq->device);
387         struct hns_roce_ib_create_srq_resp resp = {};
388         struct hns_roce_srq *srq = to_hr_srq(ib_srq);
389         int ret;
390
391         mutex_init(&srq->mutex);
392         spin_lock_init(&srq->lock);
393
394         ret = set_srq_param(srq, init_attr, udata);
395         if (ret)
396                 return ret;
397
398         ret = alloc_srq_buf(hr_dev, srq, udata);
399         if (ret)
400                 return ret;
401
402         ret = alloc_srqc(hr_dev, srq);
403         if (ret)
404                 goto err_srq_buf;
405
406         if (udata) {
407                 resp.srqn = srq->srqn;
408                 if (ib_copy_to_udata(udata, &resp,
409                                      min(udata->outlen, sizeof(resp)))) {
410                         ret = -EFAULT;
411                         goto err_srqc;
412                 }
413         }
414
415         srq->db_reg_l = hr_dev->reg_base + SRQ_DB_REG;
416         srq->event = hns_roce_ib_srq_event;
417         atomic_set(&srq->refcount, 1);
418         init_completion(&srq->free);
419
420         return 0;
421
422 err_srqc:
423         free_srqc(hr_dev, srq);
424 err_srq_buf:
425         free_srq_buf(hr_dev, srq);
426
427         return ret;
428 }
429
430 int hns_roce_destroy_srq(struct ib_srq *ibsrq, struct ib_udata *udata)
431 {
432         struct hns_roce_dev *hr_dev = to_hr_dev(ibsrq->device);
433         struct hns_roce_srq *srq = to_hr_srq(ibsrq);
434
435         free_srqc(hr_dev, srq);
436         free_srq_buf(hr_dev, srq);
437         return 0;
438 }
439
440 int hns_roce_init_srq_table(struct hns_roce_dev *hr_dev)
441 {
442         struct hns_roce_srq_table *srq_table = &hr_dev->srq_table;
443
444         xa_init(&srq_table->xa);
445
446         return hns_roce_bitmap_init(&srq_table->bitmap, hr_dev->caps.num_srqs,
447                                     hr_dev->caps.num_srqs - 1,
448                                     hr_dev->caps.reserved_srqs, 0);
449 }
450
451 void hns_roce_cleanup_srq_table(struct hns_roce_dev *hr_dev)
452 {
453         hns_roce_bitmap_cleanup(&hr_dev->srq_table.bitmap);
454 }