1 // SPDX-License-Identifier: GPL-2.0-only
/*
 * Intel MIC Platform Software Stack (MPSS)
 *
 * Copyright(c) 2015 Intel Corporation.
 */
10 #include "scif_main.h"
13 * scif_recv_mark: Handle SCIF_MARK request
14 * @scifdev: SCIF device
15 * @msg: Interrupt message
17 * The peer has requested a mark.
19 void scif_recv_mark(struct scif_dev *scifdev, struct scifmsg *msg)
21 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
25 err = _scif_fence_mark(ep, &mark);
27 msg->uop = SCIF_MARK_NACK;
29 msg->uop = SCIF_MARK_ACK;
30 msg->payload[0] = ep->remote_ep;
31 msg->payload[2] = mark;
32 scif_nodeqp_send(ep->remote_dev, msg);
36 * scif_recv_mark_resp: Handle SCIF_MARK_(N)ACK messages.
37 * @scifdev: SCIF device
38 * @msg: Interrupt message
40 * The peer has responded to a SCIF_MARK message.
42 void scif_recv_mark_resp(struct scif_dev *scifdev, struct scifmsg *msg)
44 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
45 struct scif_fence_info *fence_req =
46 (struct scif_fence_info *)msg->payload[1];
48 mutex_lock(&ep->rma_info.rma_lock);
49 if (msg->uop == SCIF_MARK_ACK) {
50 fence_req->state = OP_COMPLETED;
51 fence_req->dma_mark = (int)msg->payload[2];
53 fence_req->state = OP_FAILED;
55 mutex_unlock(&ep->rma_info.rma_lock);
56 complete(&fence_req->comp);
60 * scif_recv_wait: Handle SCIF_WAIT request
61 * @scifdev: SCIF device
62 * @msg: Interrupt message
64 * The peer has requested waiting on a fence.
66 void scif_recv_wait(struct scif_dev *scifdev, struct scifmsg *msg)
68 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
69 struct scif_remote_fence_info *fence;
72 * Allocate structure for remote fence information and
73 * send a NACK if the allocation failed. The peer will
74 * return ENOMEM upon receiving a NACK.
76 fence = kmalloc(sizeof(*fence), GFP_KERNEL);
78 msg->payload[0] = ep->remote_ep;
79 msg->uop = SCIF_WAIT_NACK;
80 scif_nodeqp_send(ep->remote_dev, msg);
84 /* Prepare the fence request */
85 memcpy(&fence->msg, msg, sizeof(struct scifmsg));
86 INIT_LIST_HEAD(&fence->list);
88 /* Insert to the global remote fence request list */
89 mutex_lock(&scif_info.fencelock);
90 atomic_inc(&ep->rma_info.fence_refcount);
91 list_add_tail(&fence->list, &scif_info.fence);
92 mutex_unlock(&scif_info.fencelock);
94 schedule_work(&scif_info.misc_work);
98 * scif_recv_wait_resp: Handle SCIF_WAIT_(N)ACK messages.
99 * @scifdev: SCIF device
100 * @msg: Interrupt message
102 * The peer has responded to a SCIF_WAIT message.
104 void scif_recv_wait_resp(struct scif_dev *scifdev, struct scifmsg *msg)
106 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
107 struct scif_fence_info *fence_req =
108 (struct scif_fence_info *)msg->payload[1];
110 mutex_lock(&ep->rma_info.rma_lock);
111 if (msg->uop == SCIF_WAIT_ACK)
112 fence_req->state = OP_COMPLETED;
114 fence_req->state = OP_FAILED;
115 mutex_unlock(&ep->rma_info.rma_lock);
116 complete(&fence_req->comp);
120 * scif_recv_sig_local: Handle SCIF_SIG_LOCAL request
121 * @scifdev: SCIF device
122 * @msg: Interrupt message
124 * The peer has requested a signal on a local offset.
126 void scif_recv_sig_local(struct scif_dev *scifdev, struct scifmsg *msg)
128 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
131 err = scif_prog_signal(ep, msg->payload[1], msg->payload[2],
134 msg->uop = SCIF_SIG_NACK;
136 msg->uop = SCIF_SIG_ACK;
137 msg->payload[0] = ep->remote_ep;
138 scif_nodeqp_send(ep->remote_dev, msg);
142 * scif_recv_sig_remote: Handle SCIF_SIGNAL_REMOTE request
143 * @scifdev: SCIF device
144 * @msg: Interrupt message
146 * The peer has requested a signal on a remote offset.
148 void scif_recv_sig_remote(struct scif_dev *scifdev, struct scifmsg *msg)
150 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
153 err = scif_prog_signal(ep, msg->payload[1], msg->payload[2],
156 msg->uop = SCIF_SIG_NACK;
158 msg->uop = SCIF_SIG_ACK;
159 msg->payload[0] = ep->remote_ep;
160 scif_nodeqp_send(ep->remote_dev, msg);
164 * scif_recv_sig_resp: Handle SCIF_SIG_(N)ACK messages.
165 * @scifdev: SCIF device
166 * @msg: Interrupt message
168 * The peer has responded to a signal request.
170 void scif_recv_sig_resp(struct scif_dev *scifdev, struct scifmsg *msg)
172 struct scif_endpt *ep = (struct scif_endpt *)msg->payload[0];
173 struct scif_fence_info *fence_req =
174 (struct scif_fence_info *)msg->payload[3];
176 mutex_lock(&ep->rma_info.rma_lock);
177 if (msg->uop == SCIF_SIG_ACK)
178 fence_req->state = OP_COMPLETED;
180 fence_req->state = OP_FAILED;
181 mutex_unlock(&ep->rma_info.rma_lock);
182 complete(&fence_req->comp);
185 static inline void *scif_get_local_va(off_t off, struct scif_window *window)
187 struct page **pages = window->pinned_pages->pages;
188 int page_nr = (off - window->offset) >> PAGE_SHIFT;
189 off_t page_off = off & ~PAGE_MASK;
191 return page_address(pages[page_nr]) + page_off;
194 static void scif_prog_signal_cb(void *arg)
196 struct scif_cb_arg *cb_arg = arg;
198 dma_pool_free(cb_arg->ep->remote_dev->signal_pool, cb_arg->status,
199 cb_arg->src_dma_addr);
203 static int _scif_prog_signal(scif_epd_t epd, dma_addr_t dst, u64 val)
205 struct scif_endpt *ep = (struct scif_endpt *)epd;
206 struct dma_chan *chan = ep->rma_info.dma_chan;
207 struct dma_device *ddev = chan->device;
208 bool x100 = !is_dma_copy_aligned(chan->device, 1, 1, 1);
209 struct dma_async_tx_descriptor *tx;
210 struct scif_status *status = NULL;
211 struct scif_cb_arg *cb_arg = NULL;
216 tx = ddev->device_prep_dma_memcpy(chan, 0, 0, 0, DMA_PREP_FENCE);
219 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
220 __func__, __LINE__, err);
223 cookie = tx->tx_submit(tx);
224 if (dma_submit_error(cookie)) {
226 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
227 __func__, __LINE__, err);
230 dma_async_issue_pending(chan);
233 * For X100 use the status descriptor to write the value to
236 tx = ddev->device_prep_dma_imm_data(chan, dst, val, 0);
238 status = dma_pool_alloc(ep->remote_dev->signal_pool, GFP_KERNEL,
242 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
243 __func__, __LINE__, err);
247 status->src_dma_addr = src;
249 src += offsetof(struct scif_status, val);
250 tx = ddev->device_prep_dma_memcpy(chan, dst, src, sizeof(val),
255 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
256 __func__, __LINE__, err);
260 cb_arg = kmalloc(sizeof(*cb_arg), GFP_KERNEL);
265 cb_arg->src_dma_addr = src;
266 cb_arg->status = status;
268 tx->callback = scif_prog_signal_cb;
269 tx->callback_param = cb_arg;
271 cookie = tx->tx_submit(tx);
272 if (dma_submit_error(cookie)) {
274 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
275 __func__, __LINE__, err);
278 dma_async_issue_pending(chan);
282 dma_pool_free(ep->remote_dev->signal_pool, status,
283 src - offsetof(struct scif_status, val));
292 * @epd: Endpoint Descriptor
293 * @offset: registered address to write @val to
294 * @val: Value to be written at @offset
295 * @type: Type of the window.
297 * Arrange to write a value to the registered offset after ensuring that the
298 * offset provided is indeed valid.
300 int scif_prog_signal(scif_epd_t epd, off_t offset, u64 val,
301 enum scif_window_type type)
303 struct scif_endpt *ep = (struct scif_endpt *)epd;
304 struct scif_window *window = NULL;
305 struct scif_rma_req req;
306 dma_addr_t dst_dma_addr;
309 mutex_lock(&ep->rma_info.rma_lock);
310 req.out_window = &window;
312 req.nr_bytes = sizeof(u64);
313 req.prot = SCIF_PROT_WRITE;
314 req.type = SCIF_WINDOW_SINGLE;
315 if (type == SCIF_WINDOW_SELF)
316 req.head = &ep->rma_info.reg_list;
318 req.head = &ep->rma_info.remote_reg_list;
319 /* Does a valid window exist? */
320 err = scif_query_window(&req);
322 dev_err(scif_info.mdev.this_device,
323 "%s %d err %d\n", __func__, __LINE__, err);
327 if (scif_is_mgmt_node() && scifdev_self(ep->remote_dev)) {
330 if (type == SCIF_WINDOW_SELF)
331 dst_virt = scif_get_local_va(offset, window);
334 scif_get_local_va(offset, (struct scif_window *)
335 window->peer_window);
338 dst_dma_addr = __scif_off_to_dma_addr(window, offset);
339 err = _scif_prog_signal(epd, dst_dma_addr, val);
342 mutex_unlock(&ep->rma_info.rma_lock);
346 static int _scif_fence_wait(scif_epd_t epd, int mark)
348 struct scif_endpt *ep = (struct scif_endpt *)epd;
349 dma_cookie_t cookie = mark & ~SCIF_REMOTE_FENCE;
352 /* Wait for DMA callback in scif_fence_mark_cb(..) */
353 err = wait_event_interruptible_timeout(ep->rma_info.markwq,
354 dma_async_is_tx_complete(
355 ep->rma_info.dma_chan,
356 cookie, NULL, NULL) ==
358 SCIF_NODE_ALIVE_TIMEOUT);
367 * scif_rma_handle_remote_fences:
369 * This routine services remote fence requests.
371 void scif_rma_handle_remote_fences(void)
373 struct list_head *item, *tmp;
374 struct scif_remote_fence_info *fence;
375 struct scif_endpt *ep;
379 mutex_lock(&scif_info.fencelock);
380 list_for_each_safe(item, tmp, &scif_info.fence) {
381 fence = list_entry(item, struct scif_remote_fence_info,
383 /* Remove fence from global list */
384 list_del(&fence->list);
386 /* Initiate the fence operation */
387 ep = (struct scif_endpt *)fence->msg.payload[0];
388 mark = fence->msg.payload[2];
389 err = _scif_fence_wait(ep, mark);
391 fence->msg.uop = SCIF_WAIT_NACK;
393 fence->msg.uop = SCIF_WAIT_ACK;
394 fence->msg.payload[0] = ep->remote_ep;
395 scif_nodeqp_send(ep->remote_dev, &fence->msg);
397 if (!atomic_sub_return(1, &ep->rma_info.fence_refcount))
398 schedule_work(&scif_info.misc_work);
400 mutex_unlock(&scif_info.fencelock);
403 static int _scif_send_fence(scif_epd_t epd, int uop, int mark, int *out_mark)
407 struct scif_fence_info *fence_req;
408 struct scif_endpt *ep = (struct scif_endpt *)epd;
410 fence_req = kmalloc(sizeof(*fence_req), GFP_KERNEL);
416 fence_req->state = OP_IN_PROGRESS;
417 init_completion(&fence_req->comp);
421 msg.payload[0] = ep->remote_ep;
422 msg.payload[1] = (u64)fence_req;
423 if (uop == SCIF_WAIT)
424 msg.payload[2] = mark;
425 spin_lock(&ep->lock);
426 if (ep->state == SCIFEP_CONNECTED)
427 err = scif_nodeqp_send(ep->remote_dev, &msg);
430 spin_unlock(&ep->lock);
434 /* Wait for a SCIF_WAIT_(N)ACK message */
435 err = wait_for_completion_timeout(&fence_req->comp,
436 SCIF_NODE_ALIVE_TIMEOUT);
437 if (!err && scifdev_alive(ep))
443 mutex_lock(&ep->rma_info.rma_lock);
445 if (fence_req->state == OP_IN_PROGRESS)
446 fence_req->state = OP_FAILED;
448 if (fence_req->state == OP_FAILED && !err)
450 if (uop == SCIF_MARK && fence_req->state == OP_COMPLETED)
451 *out_mark = SCIF_REMOTE_FENCE | fence_req->dma_mark;
452 mutex_unlock(&ep->rma_info.rma_lock);
460 * scif_send_fence_mark:
461 * @epd: end point descriptor.
462 * @out_mark: Output DMA mark reported by peer.
464 * Send a remote fence mark request.
466 static int scif_send_fence_mark(scif_epd_t epd, int *out_mark)
468 return _scif_send_fence(epd, SCIF_MARK, 0, out_mark);
472 * scif_send_fence_wait:
473 * @epd: end point descriptor.
474 * @mark: DMA mark to wait for.
476 * Send a remote fence wait request.
478 static int scif_send_fence_wait(scif_epd_t epd, int mark)
480 return _scif_send_fence(epd, SCIF_WAIT, mark, NULL);
483 static int _scif_send_fence_signal_wait(struct scif_endpt *ep,
484 struct scif_fence_info *fence_req)
489 /* Wait for a SCIF_SIG_(N)ACK message */
490 err = wait_for_completion_timeout(&fence_req->comp,
491 SCIF_NODE_ALIVE_TIMEOUT);
492 if (!err && scifdev_alive(ep))
499 mutex_lock(&ep->rma_info.rma_lock);
500 if (fence_req->state == OP_IN_PROGRESS)
501 fence_req->state = OP_FAILED;
502 mutex_unlock(&ep->rma_info.rma_lock);
504 if (fence_req->state == OP_FAILED && !err)
510 * scif_send_fence_signal:
511 * @epd: endpoint descriptor
512 * @loff: local offset
513 * @lval: local value to write to loffset
514 * @roff: remote offset
515 * @rval: remote value to write to roffset
518 * Sends a remote fence signal request
520 static int scif_send_fence_signal(scif_epd_t epd, off_t roff, u64 rval,
521 off_t loff, u64 lval, int flags)
525 struct scif_fence_info *fence_req;
526 struct scif_endpt *ep = (struct scif_endpt *)epd;
528 fence_req = kmalloc(sizeof(*fence_req), GFP_KERNEL);
534 fence_req->state = OP_IN_PROGRESS;
535 init_completion(&fence_req->comp);
537 if (flags & SCIF_SIGNAL_LOCAL) {
538 msg.uop = SCIF_SIG_LOCAL;
539 msg.payload[0] = ep->remote_ep;
540 msg.payload[1] = roff;
541 msg.payload[2] = rval;
542 msg.payload[3] = (u64)fence_req;
543 spin_lock(&ep->lock);
544 if (ep->state == SCIFEP_CONNECTED)
545 err = scif_nodeqp_send(ep->remote_dev, &msg);
548 spin_unlock(&ep->lock);
551 err = _scif_send_fence_signal_wait(ep, fence_req);
555 fence_req->state = OP_IN_PROGRESS;
557 if (flags & SCIF_SIGNAL_REMOTE) {
558 msg.uop = SCIF_SIG_REMOTE;
559 msg.payload[0] = ep->remote_ep;
560 msg.payload[1] = loff;
561 msg.payload[2] = lval;
562 msg.payload[3] = (u64)fence_req;
563 spin_lock(&ep->lock);
564 if (ep->state == SCIFEP_CONNECTED)
565 err = scif_nodeqp_send(ep->remote_dev, &msg);
568 spin_unlock(&ep->lock);
571 err = _scif_send_fence_signal_wait(ep, fence_req);
579 static void scif_fence_mark_cb(void *arg)
581 struct scif_endpt *ep = (struct scif_endpt *)arg;
583 wake_up_interruptible(&ep->rma_info.markwq);
584 atomic_dec(&ep->rma_info.fence_refcount);
589 * @epd: endpoint descriptor
590 * @mark: DMA mark to set-up
592 * Set up a mark for this endpoint and return the value of the mark.
594 int _scif_fence_mark(scif_epd_t epd, int *mark)
596 struct scif_endpt *ep = (struct scif_endpt *)epd;
597 struct dma_chan *chan = ep->rma_info.dma_chan;
598 struct dma_device *ddev = chan->device;
599 struct dma_async_tx_descriptor *tx;
603 tx = ddev->device_prep_dma_memcpy(chan, 0, 0, 0, DMA_PREP_FENCE);
606 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
607 __func__, __LINE__, err);
610 cookie = tx->tx_submit(tx);
611 if (dma_submit_error(cookie)) {
613 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
614 __func__, __LINE__, err);
617 dma_async_issue_pending(chan);
618 tx = ddev->device_prep_dma_interrupt(chan, DMA_PREP_INTERRUPT);
621 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
622 __func__, __LINE__, err);
625 tx->callback = scif_fence_mark_cb;
626 tx->callback_param = ep;
627 *mark = cookie = tx->tx_submit(tx);
628 if (dma_submit_error(cookie)) {
630 dev_err(&ep->remote_dev->sdev->dev, "%s %d err %d\n",
631 __func__, __LINE__, err);
634 atomic_inc(&ep->rma_info.fence_refcount);
635 dma_async_issue_pending(chan);
639 #define SCIF_LOOPB_MAGIC_MARK 0xdead
641 int scif_fence_mark(scif_epd_t epd, int flags, int *mark)
643 struct scif_endpt *ep = (struct scif_endpt *)epd;
646 dev_dbg(scif_info.mdev.this_device,
647 "SCIFAPI fence_mark: ep %p flags 0x%x mark 0x%x\n",
649 err = scif_verify_epd(ep);
654 if (flags & ~(SCIF_FENCE_INIT_SELF | SCIF_FENCE_INIT_PEER))
657 /* At least one of init self or peer RMA should be set */
658 if (!(flags & (SCIF_FENCE_INIT_SELF | SCIF_FENCE_INIT_PEER)))
661 /* Exactly one of init self or peer RMA should be set but not both */
662 if ((flags & SCIF_FENCE_INIT_SELF) && (flags & SCIF_FENCE_INIT_PEER))
666 * Management node loopback does not need to use DMA.
667 * Return a valid mark to be symmetric.
669 if (scifdev_self(ep->remote_dev) && scif_is_mgmt_node()) {
670 *mark = SCIF_LOOPB_MAGIC_MARK;
674 if (flags & SCIF_FENCE_INIT_SELF)
675 err = _scif_fence_mark(epd, mark);
677 err = scif_send_fence_mark(ep, mark);
680 dev_err(scif_info.mdev.this_device,
681 "%s %d err %d\n", __func__, __LINE__, err);
682 dev_dbg(scif_info.mdev.this_device,
683 "SCIFAPI fence_mark: ep %p flags 0x%x mark 0x%x err %d\n",
684 ep, flags, *mark, err);
687 EXPORT_SYMBOL_GPL(scif_fence_mark);
689 int scif_fence_wait(scif_epd_t epd, int mark)
691 struct scif_endpt *ep = (struct scif_endpt *)epd;
694 dev_dbg(scif_info.mdev.this_device,
695 "SCIFAPI fence_wait: ep %p mark 0x%x\n",
697 err = scif_verify_epd(ep);
701 * Management node loopback does not need to use DMA.
702 * The only valid mark provided is 0 so simply
703 * return success if the mark is valid.
705 if (scifdev_self(ep->remote_dev) && scif_is_mgmt_node()) {
706 if (mark == SCIF_LOOPB_MAGIC_MARK)
711 if (mark & SCIF_REMOTE_FENCE)
712 err = scif_send_fence_wait(epd, mark);
714 err = _scif_fence_wait(epd, mark);
716 dev_err(scif_info.mdev.this_device,
717 "%s %d err %d\n", __func__, __LINE__, err);
720 EXPORT_SYMBOL_GPL(scif_fence_wait);
722 int scif_fence_signal(scif_epd_t epd, off_t loff, u64 lval,
723 off_t roff, u64 rval, int flags)
725 struct scif_endpt *ep = (struct scif_endpt *)epd;
728 dev_dbg(scif_info.mdev.this_device,
729 "SCIFAPI fence_signal: ep %p loff 0x%lx lval 0x%llx roff 0x%lx rval 0x%llx flags 0x%x\n",
730 ep, loff, lval, roff, rval, flags);
731 err = scif_verify_epd(ep);
736 if (flags & ~(SCIF_FENCE_INIT_SELF | SCIF_FENCE_INIT_PEER |
737 SCIF_SIGNAL_LOCAL | SCIF_SIGNAL_REMOTE))
740 /* At least one of init self or peer RMA should be set */
741 if (!(flags & (SCIF_FENCE_INIT_SELF | SCIF_FENCE_INIT_PEER)))
744 /* Exactly one of init self or peer RMA should be set but not both */
745 if ((flags & SCIF_FENCE_INIT_SELF) && (flags & SCIF_FENCE_INIT_PEER))
748 /* At least one of SCIF_SIGNAL_LOCAL or SCIF_SIGNAL_REMOTE required */
749 if (!(flags & (SCIF_SIGNAL_LOCAL | SCIF_SIGNAL_REMOTE)))
752 /* Only Dword offsets allowed */
753 if ((flags & SCIF_SIGNAL_LOCAL) && (loff & (sizeof(u32) - 1)))
756 /* Only Dword aligned offsets allowed */
757 if ((flags & SCIF_SIGNAL_REMOTE) && (roff & (sizeof(u32) - 1)))
760 if (flags & SCIF_FENCE_INIT_PEER) {
761 err = scif_send_fence_signal(epd, roff, rval, loff,
764 /* Local Signal in Local RAS */
765 if (flags & SCIF_SIGNAL_LOCAL) {
766 err = scif_prog_signal(epd, loff, lval,
772 /* Signal in Remote RAS */
773 if (flags & SCIF_SIGNAL_REMOTE)
774 err = scif_prog_signal(epd, roff,
775 rval, SCIF_WINDOW_PEER);
779 dev_err(scif_info.mdev.this_device,
780 "%s %d err %d\n", __func__, __LINE__, err);
783 EXPORT_SYMBOL_GPL(scif_fence_signal);