1 // SPDX-License-Identifier: GPL-2.0
3 * Shared Memory Communications over RDMA (SMC-R) and RoCE
5 * Link Layer Control (LLC)
7 * Copyright IBM Corp. 2016
9 * Author(s): Klaus Wacker <Klaus.Wacker@de.ibm.com>
10 * Ursula Braun <ubraun@linux.vnet.ibm.com>
14 #include <rdma/ib_verbs.h>
21 #define SMC_LLC_DATA_LEN 40
24 struct smc_wr_rx_hdr common;
26 #if defined(__BIG_ENDIAN_BITFIELD)
29 #elif defined(__LITTLE_ENDIAN_BITFIELD)
30 u8 add_link_rej_rsn:4,
36 #define SMC_LLC_FLAG_NO_RMBE_EYEC 0x03
38 struct smc_llc_msg_confirm_link { /* type 0x01 */
39 struct smc_llc_hdr hd;
40 u8 sender_mac[ETH_ALEN];
41 u8 sender_gid[SMC_GID_SIZE];
44 u8 link_uid[SMC_LGR_ID_SIZE];
49 #define SMC_LLC_FLAG_ADD_LNK_REJ 0x40
50 #define SMC_LLC_REJ_RSN_NO_ALT_PATH 1
52 #define SMC_LLC_ADD_LNK_MAX_LINKS 2
54 struct smc_llc_msg_add_link { /* type 0x02 */
55 struct smc_llc_hdr hd;
56 u8 sender_mac[ETH_ALEN];
58 u8 sender_gid[SMC_GID_SIZE];
61 u8 flags2; /* QP mtu */
66 #define SMC_LLC_FLAG_DEL_LINK_ALL 0x40
67 #define SMC_LLC_FLAG_DEL_LINK_ORDERLY 0x20
69 struct smc_llc_msg_del_link { /* type 0x04 */
70 struct smc_llc_hdr hd;
74 } __packed; /* format defined in RFC7609 */
76 struct smc_llc_msg_test_link { /* type 0x07 */
77 struct smc_llc_hdr hd;
82 struct smc_rmb_rtoken {
84 u8 num_rkeys; /* first rtoken byte of CONFIRM LINK msg */
85 /* is actually the num of rtokens, first */
86 /* rtoken is always for the current link */
87 u8 link_id; /* link id of the rtoken */
91 } __packed; /* format defined in RFC7609 */
93 #define SMC_LLC_RKEYS_PER_MSG 3
95 struct smc_llc_msg_confirm_rkey { /* type 0x06 */
96 struct smc_llc_hdr hd;
97 struct smc_rmb_rtoken rtoken[SMC_LLC_RKEYS_PER_MSG];
101 #define SMC_LLC_DEL_RKEY_MAX 8
102 #define SMC_LLC_FLAG_RKEY_RETRY 0x10
103 #define SMC_LLC_FLAG_RKEY_NEG 0x20
105 struct smc_llc_msg_delete_rkey { /* type 0x09 */
106 struct smc_llc_hdr hd;
115 struct smc_llc_msg_confirm_link confirm_link;
116 struct smc_llc_msg_add_link add_link;
117 struct smc_llc_msg_del_link delete_link;
119 struct smc_llc_msg_confirm_rkey confirm_rkey;
120 struct smc_llc_msg_delete_rkey delete_rkey;
122 struct smc_llc_msg_test_link test_link;
124 struct smc_llc_hdr hdr;
125 u8 data[SMC_LLC_DATA_LEN];
129 #define SMC_LLC_FLAG_RESP 0x80
131 struct smc_llc_qentry {
132 struct list_head list;
133 struct smc_link *link;
134 union smc_llc_msg msg;
137 struct smc_llc_qentry *smc_llc_flow_qentry_clr(struct smc_llc_flow *flow)
139 struct smc_llc_qentry *qentry = flow->qentry;
145 void smc_llc_flow_qentry_del(struct smc_llc_flow *flow)
147 struct smc_llc_qentry *qentry;
150 qentry = flow->qentry;
156 static inline void smc_llc_flow_qentry_set(struct smc_llc_flow *flow,
157 struct smc_llc_qentry *qentry)
159 flow->qentry = qentry;
162 /* try to start a new llc flow, initiated by an incoming llc msg */
163 static bool smc_llc_flow_start(struct smc_llc_flow *flow,
164 struct smc_llc_qentry *qentry)
166 struct smc_link_group *lgr = qentry->link->lgr;
168 spin_lock_bh(&lgr->llc_flow_lock);
170 /* a flow is already active */
171 if ((qentry->msg.raw.hdr.common.type == SMC_LLC_ADD_LINK ||
172 qentry->msg.raw.hdr.common.type == SMC_LLC_DELETE_LINK) &&
173 !lgr->delayed_event) {
174 lgr->delayed_event = qentry;
176 /* forget this llc request */
179 spin_unlock_bh(&lgr->llc_flow_lock);
182 switch (qentry->msg.raw.hdr.common.type) {
183 case SMC_LLC_ADD_LINK:
184 flow->type = SMC_LLC_FLOW_ADD_LINK;
186 case SMC_LLC_DELETE_LINK:
187 flow->type = SMC_LLC_FLOW_DEL_LINK;
189 case SMC_LLC_CONFIRM_RKEY:
190 case SMC_LLC_DELETE_RKEY:
191 flow->type = SMC_LLC_FLOW_RKEY;
194 flow->type = SMC_LLC_FLOW_NONE;
196 if (qentry == lgr->delayed_event)
197 lgr->delayed_event = NULL;
198 spin_unlock_bh(&lgr->llc_flow_lock);
199 smc_llc_flow_qentry_set(flow, qentry);
203 /* start a new local llc flow, wait till current flow finished */
204 int smc_llc_flow_initiate(struct smc_link_group *lgr,
205 enum smc_llc_flowtype type)
207 enum smc_llc_flowtype allowed_remote = SMC_LLC_FLOW_NONE;
210 /* all flows except confirm_rkey and delete_rkey are exclusive,
211 * confirm/delete rkey flows can run concurrently (local and remote)
213 if (type == SMC_LLC_FLOW_RKEY)
214 allowed_remote = SMC_LLC_FLOW_RKEY;
216 if (list_empty(&lgr->list))
218 spin_lock_bh(&lgr->llc_flow_lock);
219 if (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
220 (lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
221 lgr->llc_flow_rmt.type == allowed_remote)) {
222 lgr->llc_flow_lcl.type = type;
223 spin_unlock_bh(&lgr->llc_flow_lock);
226 spin_unlock_bh(&lgr->llc_flow_lock);
227 rc = wait_event_interruptible_timeout(lgr->llc_waiter,
228 (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
229 (lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
230 lgr->llc_flow_rmt.type == allowed_remote)),
237 /* finish the current llc flow */
238 void smc_llc_flow_stop(struct smc_link_group *lgr, struct smc_llc_flow *flow)
240 spin_lock_bh(&lgr->llc_flow_lock);
241 memset(flow, 0, sizeof(*flow));
242 flow->type = SMC_LLC_FLOW_NONE;
243 spin_unlock_bh(&lgr->llc_flow_lock);
244 if (!list_empty(&lgr->list) && lgr->delayed_event &&
245 flow == &lgr->llc_flow_lcl)
246 schedule_work(&lgr->llc_event_work);
248 wake_up_interruptible(&lgr->llc_waiter);
251 /* lnk is optional and used for early wakeup when link goes down, useful in
252 * cases where we wait for a response on the link after we sent a request
254 struct smc_llc_qentry *smc_llc_wait(struct smc_link_group *lgr,
255 struct smc_link *lnk,
256 int time_out, u8 exp_msg)
258 struct smc_llc_flow *flow = &lgr->llc_flow_lcl;
260 wait_event_interruptible_timeout(lgr->llc_waiter,
262 (lnk && !smc_link_usable(lnk)) ||
263 list_empty(&lgr->list)),
266 (lnk && !smc_link_usable(lnk)) || list_empty(&lgr->list)) {
267 smc_llc_flow_qentry_del(flow);
270 if (exp_msg && flow->qentry->msg.raw.hdr.common.type != exp_msg) {
271 if (exp_msg == SMC_LLC_ADD_LINK &&
272 flow->qentry->msg.raw.hdr.common.type ==
273 SMC_LLC_DELETE_LINK) {
274 /* flow_start will delay the unexpected msg */
275 smc_llc_flow_start(&lgr->llc_flow_lcl,
276 smc_llc_flow_qentry_clr(flow));
279 smc_llc_flow_qentry_del(flow);
285 /********************************** send *************************************/
287 struct smc_llc_tx_pend {
290 /* handler for send/transmission completion of an LLC msg */
291 static void smc_llc_tx_handler(struct smc_wr_tx_pend_priv *pend,
292 struct smc_link *link,
293 enum ib_wc_status wc_status)
295 /* future work: handle wc_status error for recovery and failover */
299 * smc_llc_add_pending_send() - add LLC control message to pending WQE transmits
300 * @link: Pointer to SMC link used for sending LLC control message.
301 * @wr_buf: Out variable returning pointer to work request payload buffer.
302 * @pend: Out variable returning pointer to private pending WR tracking.
303 * It's the context the transmit complete handler will get.
305 * Reserves and pre-fills an entry for a pending work request send/tx.
306 * Used by mid-level smc_llc_send_msg() to prepare for later actual send/tx.
307 * Can sleep due to smc_get_ctrl_buf (if not in softirq context).
309 * Return: 0 on success, otherwise an error value.
311 static int smc_llc_add_pending_send(struct smc_link *link,
312 struct smc_wr_buf **wr_buf,
313 struct smc_wr_tx_pend_priv **pend)
317 rc = smc_wr_tx_get_free_slot(link, smc_llc_tx_handler, wr_buf, NULL,
322 sizeof(union smc_llc_msg) > SMC_WR_BUF_SIZE,
323 "must increase SMC_WR_BUF_SIZE to at least sizeof(struct smc_llc_msg)");
325 sizeof(union smc_llc_msg) != SMC_WR_TX_SIZE,
326 "must adapt SMC_WR_TX_SIZE to sizeof(struct smc_llc_msg); if not all smc_wr upper layer protocols use the same message size any more, must start to set link->wr_tx_sges[i].length on each individual smc_wr_tx_send()");
328 sizeof(struct smc_llc_tx_pend) > SMC_WR_TX_PEND_PRIV_SIZE,
329 "must increase SMC_WR_TX_PEND_PRIV_SIZE to at least sizeof(struct smc_llc_tx_pend)");
333 /* high-level API to send LLC confirm link */
334 int smc_llc_send_confirm_link(struct smc_link *link,
335 enum smc_llc_reqresp reqresp)
337 struct smc_link_group *lgr = smc_get_lgr(link);
338 struct smc_llc_msg_confirm_link *confllc;
339 struct smc_wr_tx_pend_priv *pend;
340 struct smc_wr_buf *wr_buf;
343 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
346 confllc = (struct smc_llc_msg_confirm_link *)wr_buf;
347 memset(confllc, 0, sizeof(*confllc));
348 confllc->hd.common.type = SMC_LLC_CONFIRM_LINK;
349 confllc->hd.length = sizeof(struct smc_llc_msg_confirm_link);
350 confllc->hd.flags |= SMC_LLC_FLAG_NO_RMBE_EYEC;
351 if (reqresp == SMC_LLC_RESP)
352 confllc->hd.flags |= SMC_LLC_FLAG_RESP;
353 memcpy(confllc->sender_mac, link->smcibdev->mac[link->ibport - 1],
355 memcpy(confllc->sender_gid, link->gid, SMC_GID_SIZE);
356 hton24(confllc->sender_qp_num, link->roce_qp->qp_num);
357 confllc->link_num = link->link_id;
358 memcpy(confllc->link_uid, lgr->id, SMC_LGR_ID_SIZE);
359 confllc->max_links = SMC_LLC_ADD_LNK_MAX_LINKS; /* enforce peer resp. */
360 /* send llc message */
361 rc = smc_wr_tx_send(link, pend);
365 /* send LLC confirm rkey request */
366 static int smc_llc_send_confirm_rkey(struct smc_link *send_link,
367 struct smc_buf_desc *rmb_desc)
369 struct smc_llc_msg_confirm_rkey *rkeyllc;
370 struct smc_wr_tx_pend_priv *pend;
371 struct smc_wr_buf *wr_buf;
372 struct smc_link *link;
375 rc = smc_llc_add_pending_send(send_link, &wr_buf, &pend);
378 rkeyllc = (struct smc_llc_msg_confirm_rkey *)wr_buf;
379 memset(rkeyllc, 0, sizeof(*rkeyllc));
380 rkeyllc->hd.common.type = SMC_LLC_CONFIRM_RKEY;
381 rkeyllc->hd.length = sizeof(struct smc_llc_msg_confirm_rkey);
384 for (i = 0; i < SMC_LINKS_PER_LGR_MAX; i++) {
385 link = &send_link->lgr->lnk[i];
386 if (link->state == SMC_LNK_ACTIVE && link != send_link) {
387 rkeyllc->rtoken[rtok_ix].link_id = link->link_id;
388 rkeyllc->rtoken[rtok_ix].rmb_key =
389 htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
390 rkeyllc->rtoken[rtok_ix].rmb_vaddr = cpu_to_be64(
392 rmb_desc->sgt[link->link_idx].sgl));
396 /* rkey of send_link is in rtoken[0] */
397 rkeyllc->rtoken[0].num_rkeys = rtok_ix - 1;
398 rkeyllc->rtoken[0].rmb_key =
399 htonl(rmb_desc->mr_rx[send_link->link_idx]->rkey);
400 rkeyllc->rtoken[0].rmb_vaddr = cpu_to_be64(
401 (u64)sg_dma_address(rmb_desc->sgt[send_link->link_idx].sgl));
402 /* send llc message */
403 rc = smc_wr_tx_send(send_link, pend);
407 /* send LLC delete rkey request */
408 static int smc_llc_send_delete_rkey(struct smc_link *link,
409 struct smc_buf_desc *rmb_desc)
411 struct smc_llc_msg_delete_rkey *rkeyllc;
412 struct smc_wr_tx_pend_priv *pend;
413 struct smc_wr_buf *wr_buf;
416 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
419 rkeyllc = (struct smc_llc_msg_delete_rkey *)wr_buf;
420 memset(rkeyllc, 0, sizeof(*rkeyllc));
421 rkeyllc->hd.common.type = SMC_LLC_DELETE_RKEY;
422 rkeyllc->hd.length = sizeof(struct smc_llc_msg_delete_rkey);
423 rkeyllc->num_rkeys = 1;
424 rkeyllc->rkey[0] = htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
425 /* send llc message */
426 rc = smc_wr_tx_send(link, pend);
430 /* prepare an add link message */
431 static void smc_llc_prep_add_link(struct smc_llc_msg_add_link *addllc,
432 struct smc_link *link, u8 mac[], u8 gid[],
433 enum smc_llc_reqresp reqresp)
435 memset(addllc, 0, sizeof(*addllc));
436 addllc->hd.common.type = SMC_LLC_ADD_LINK;
437 addllc->hd.length = sizeof(struct smc_llc_msg_add_link);
438 if (reqresp == SMC_LLC_RESP) {
439 addllc->hd.flags |= SMC_LLC_FLAG_RESP;
440 /* always reject more links for now */
441 addllc->hd.flags |= SMC_LLC_FLAG_ADD_LNK_REJ;
442 addllc->hd.add_link_rej_rsn = SMC_LLC_REJ_RSN_NO_ALT_PATH;
444 memcpy(addllc->sender_mac, mac, ETH_ALEN);
445 memcpy(addllc->sender_gid, gid, SMC_GID_SIZE);
448 /* send ADD LINK request or response */
449 int smc_llc_send_add_link(struct smc_link *link, u8 mac[], u8 gid[],
450 enum smc_llc_reqresp reqresp)
452 struct smc_llc_msg_add_link *addllc;
453 struct smc_wr_tx_pend_priv *pend;
454 struct smc_wr_buf *wr_buf;
457 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
460 addllc = (struct smc_llc_msg_add_link *)wr_buf;
461 smc_llc_prep_add_link(addllc, link, mac, gid, reqresp);
462 /* send llc message */
463 rc = smc_wr_tx_send(link, pend);
467 /* prepare a delete link message */
468 static void smc_llc_prep_delete_link(struct smc_llc_msg_del_link *delllc,
469 struct smc_link *link,
470 enum smc_llc_reqresp reqresp, bool orderly)
472 memset(delllc, 0, sizeof(*delllc));
473 delllc->hd.common.type = SMC_LLC_DELETE_LINK;
474 delllc->hd.length = sizeof(struct smc_llc_msg_add_link);
475 if (reqresp == SMC_LLC_RESP)
476 delllc->hd.flags |= SMC_LLC_FLAG_RESP;
477 /* DEL_LINK_ALL because only 1 link supported */
478 delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ALL;
480 delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ORDERLY;
481 delllc->link_num = link->link_id;
484 /* send DELETE LINK request or response */
485 int smc_llc_send_delete_link(struct smc_link *link,
486 enum smc_llc_reqresp reqresp, bool orderly)
488 struct smc_llc_msg_del_link *delllc;
489 struct smc_wr_tx_pend_priv *pend;
490 struct smc_wr_buf *wr_buf;
493 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
496 delllc = (struct smc_llc_msg_del_link *)wr_buf;
497 smc_llc_prep_delete_link(delllc, link, reqresp, orderly);
498 /* send llc message */
499 rc = smc_wr_tx_send(link, pend);
503 /* send LLC test link request */
504 static int smc_llc_send_test_link(struct smc_link *link, u8 user_data[16])
506 struct smc_llc_msg_test_link *testllc;
507 struct smc_wr_tx_pend_priv *pend;
508 struct smc_wr_buf *wr_buf;
511 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
514 testllc = (struct smc_llc_msg_test_link *)wr_buf;
515 memset(testllc, 0, sizeof(*testllc));
516 testllc->hd.common.type = SMC_LLC_TEST_LINK;
517 testllc->hd.length = sizeof(struct smc_llc_msg_test_link);
518 memcpy(testllc->user_data, user_data, sizeof(testllc->user_data));
519 /* send llc message */
520 rc = smc_wr_tx_send(link, pend);
524 /* schedule an llc send on link, may wait for buffers */
525 static int smc_llc_send_message(struct smc_link *link, void *llcbuf)
527 struct smc_wr_tx_pend_priv *pend;
528 struct smc_wr_buf *wr_buf;
531 if (!smc_link_usable(link))
533 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
536 memcpy(wr_buf, llcbuf, sizeof(union smc_llc_msg));
537 return smc_wr_tx_send(link, pend);
540 /********************************* receive ***********************************/
542 static void smc_llc_rx_delete_link(struct smc_link *link,
543 struct smc_llc_msg_del_link *llc)
545 struct smc_link_group *lgr = smc_get_lgr(link);
548 smc_llc_link_deleting(link);
549 if (lgr->role == SMC_SERV) {
550 /* client asks to delete this link, send request */
551 smc_llc_prep_delete_link(llc, link, SMC_LLC_REQ, true);
553 /* server requests to delete this link, send response */
554 smc_llc_prep_delete_link(llc, link, SMC_LLC_RESP, true);
556 smc_llc_send_message(link, llc);
557 smc_lgr_terminate_sched(lgr);
560 /* process a confirm_rkey request from peer, remote flow */
561 static void smc_llc_rmt_conf_rkey(struct smc_link_group *lgr)
563 struct smc_llc_msg_confirm_rkey *llc;
564 struct smc_llc_qentry *qentry;
565 struct smc_link *link;
570 qentry = lgr->llc_flow_rmt.qentry;
571 llc = &qentry->msg.confirm_rkey;
574 num_entries = llc->rtoken[0].num_rkeys;
575 /* first rkey entry is for receiving link */
576 rk_idx = smc_rtoken_add(link,
577 llc->rtoken[0].rmb_vaddr,
578 llc->rtoken[0].rmb_key);
582 for (i = 1; i <= min_t(u8, num_entries, SMC_LLC_RKEYS_PER_MSG - 1); i++)
583 smc_rtoken_set2(lgr, rk_idx, llc->rtoken[i].link_id,
584 llc->rtoken[i].rmb_vaddr,
585 llc->rtoken[i].rmb_key);
586 /* max links is 3 so there is no need to support conf_rkey_cont msgs */
589 llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
590 llc->hd.flags |= SMC_LLC_FLAG_RKEY_RETRY;
592 llc->hd.flags |= SMC_LLC_FLAG_RESP;
593 smc_llc_send_message(link, &qentry->msg);
594 smc_llc_flow_qentry_del(&lgr->llc_flow_rmt);
597 /* process a delete_rkey request from peer, remote flow */
598 static void smc_llc_rmt_delete_rkey(struct smc_link_group *lgr)
600 struct smc_llc_msg_delete_rkey *llc;
601 struct smc_llc_qentry *qentry;
602 struct smc_link *link;
606 qentry = lgr->llc_flow_rmt.qentry;
607 llc = &qentry->msg.delete_rkey;
610 max = min_t(u8, llc->num_rkeys, SMC_LLC_DEL_RKEY_MAX);
611 for (i = 0; i < max; i++) {
612 if (smc_rtoken_delete(link, llc->rkey[i]))
613 err_mask |= 1 << (SMC_LLC_DEL_RKEY_MAX - 1 - i);
616 llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
617 llc->err_mask = err_mask;
619 llc->hd.flags |= SMC_LLC_FLAG_RESP;
620 smc_llc_send_message(link, &qentry->msg);
621 smc_llc_flow_qentry_del(&lgr->llc_flow_rmt);
624 /* flush the llc event queue */
625 static void smc_llc_event_flush(struct smc_link_group *lgr)
627 struct smc_llc_qentry *qentry, *q;
629 spin_lock_bh(&lgr->llc_event_q_lock);
630 list_for_each_entry_safe(qentry, q, &lgr->llc_event_q, list) {
631 list_del_init(&qentry->list);
634 spin_unlock_bh(&lgr->llc_event_q_lock);
637 static void smc_llc_event_handler(struct smc_llc_qentry *qentry)
639 union smc_llc_msg *llc = &qentry->msg;
640 struct smc_link *link = qentry->link;
641 struct smc_link_group *lgr = link->lgr;
643 if (!smc_link_usable(link))
646 switch (llc->raw.hdr.common.type) {
647 case SMC_LLC_TEST_LINK:
648 llc->test_link.hd.flags |= SMC_LLC_FLAG_RESP;
649 smc_llc_send_message(link, llc);
651 case SMC_LLC_ADD_LINK:
652 if (list_empty(&lgr->list))
653 goto out; /* lgr is terminating */
654 if (lgr->role == SMC_CLNT) {
655 if (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_ADD_LINK) {
656 /* a flow is waiting for this message */
657 smc_llc_flow_qentry_set(&lgr->llc_flow_lcl,
659 wake_up_interruptible(&lgr->llc_waiter);
660 } else if (smc_llc_flow_start(&lgr->llc_flow_lcl,
662 /* tbd: schedule_work(&lgr->llc_add_link_work); */
664 } else if (smc_llc_flow_start(&lgr->llc_flow_lcl, qentry)) {
665 /* as smc server, handle client suggestion */
666 /* tbd: schedule_work(&lgr->llc_add_link_work); */
669 case SMC_LLC_CONFIRM_LINK:
670 if (lgr->llc_flow_lcl.type != SMC_LLC_FLOW_NONE) {
671 /* a flow is waiting for this message */
672 smc_llc_flow_qentry_set(&lgr->llc_flow_lcl, qentry);
673 wake_up_interruptible(&lgr->llc_waiter);
677 case SMC_LLC_DELETE_LINK:
678 smc_llc_rx_delete_link(link, &llc->delete_link);
680 case SMC_LLC_CONFIRM_RKEY:
681 /* new request from remote, assign to remote flow */
682 if (smc_llc_flow_start(&lgr->llc_flow_rmt, qentry)) {
683 /* process here, does not wait for more llc msgs */
684 smc_llc_rmt_conf_rkey(lgr);
685 smc_llc_flow_stop(lgr, &lgr->llc_flow_rmt);
688 case SMC_LLC_CONFIRM_RKEY_CONT:
689 /* not used because max links is 3, and 3 rkeys fit into
690 * one CONFIRM_RKEY message
693 case SMC_LLC_DELETE_RKEY:
694 /* new request from remote, assign to remote flow */
695 if (smc_llc_flow_start(&lgr->llc_flow_rmt, qentry)) {
696 /* process here, does not wait for more llc msgs */
697 smc_llc_rmt_delete_rkey(lgr);
698 smc_llc_flow_stop(lgr, &lgr->llc_flow_rmt);
706 /* worker to process llc messages on the event queue */
707 static void smc_llc_event_work(struct work_struct *work)
709 struct smc_link_group *lgr = container_of(work, struct smc_link_group,
711 struct smc_llc_qentry *qentry;
713 if (!lgr->llc_flow_lcl.type && lgr->delayed_event) {
714 if (smc_link_usable(lgr->delayed_event->link)) {
715 smc_llc_event_handler(lgr->delayed_event);
717 qentry = lgr->delayed_event;
718 lgr->delayed_event = NULL;
724 spin_lock_bh(&lgr->llc_event_q_lock);
725 if (!list_empty(&lgr->llc_event_q)) {
726 qentry = list_first_entry(&lgr->llc_event_q,
727 struct smc_llc_qentry, list);
728 list_del_init(&qentry->list);
729 spin_unlock_bh(&lgr->llc_event_q_lock);
730 smc_llc_event_handler(qentry);
733 spin_unlock_bh(&lgr->llc_event_q_lock);
736 /* process llc responses in tasklet context */
737 static void smc_llc_rx_response(struct smc_link *link,
738 struct smc_llc_qentry *qentry)
740 u8 llc_type = qentry->msg.raw.hdr.common.type;
743 case SMC_LLC_TEST_LINK:
744 if (link->state == SMC_LNK_ACTIVE)
745 complete(&link->llc_testlink_resp);
747 case SMC_LLC_ADD_LINK:
748 case SMC_LLC_CONFIRM_LINK:
749 case SMC_LLC_CONFIRM_RKEY:
750 case SMC_LLC_DELETE_RKEY:
751 /* assign responses to the local flow, we requested them */
752 smc_llc_flow_qentry_set(&link->lgr->llc_flow_lcl, qentry);
753 wake_up_interruptible(&link->lgr->llc_waiter);
755 case SMC_LLC_DELETE_LINK:
756 if (link->lgr->role == SMC_SERV)
757 smc_lgr_schedule_free_work_fast(link->lgr);
759 case SMC_LLC_CONFIRM_RKEY_CONT:
760 /* not used because max links is 3 */
766 static void smc_llc_enqueue(struct smc_link *link, union smc_llc_msg *llc)
768 struct smc_link_group *lgr = link->lgr;
769 struct smc_llc_qentry *qentry;
772 qentry = kmalloc(sizeof(*qentry), GFP_ATOMIC);
776 INIT_LIST_HEAD(&qentry->list);
777 memcpy(&qentry->msg, llc, sizeof(union smc_llc_msg));
779 /* process responses immediately */
780 if (llc->raw.hdr.flags & SMC_LLC_FLAG_RESP) {
781 smc_llc_rx_response(link, qentry);
785 /* add requests to event queue */
786 spin_lock_irqsave(&lgr->llc_event_q_lock, flags);
787 list_add_tail(&qentry->list, &lgr->llc_event_q);
788 spin_unlock_irqrestore(&lgr->llc_event_q_lock, flags);
789 schedule_work(&link->lgr->llc_event_work);
792 /* copy received msg and add it to the event queue */
793 static void smc_llc_rx_handler(struct ib_wc *wc, void *buf)
795 struct smc_link *link = (struct smc_link *)wc->qp->qp_context;
796 union smc_llc_msg *llc = buf;
798 if (wc->byte_len < sizeof(*llc))
799 return; /* short message */
800 if (llc->raw.hdr.length != sizeof(*llc))
801 return; /* invalid message */
803 smc_llc_enqueue(link, llc);
806 /***************************** worker, utils *********************************/
808 static void smc_llc_testlink_work(struct work_struct *work)
810 struct smc_link *link = container_of(to_delayed_work(work),
811 struct smc_link, llc_testlink_wrk);
812 unsigned long next_interval;
813 unsigned long expire_time;
814 u8 user_data[16] = { 0 };
817 if (link->state != SMC_LNK_ACTIVE)
818 return; /* don't reschedule worker */
819 expire_time = link->wr_rx_tstamp + link->llc_testlink_time;
820 if (time_is_after_jiffies(expire_time)) {
821 next_interval = expire_time - jiffies;
824 reinit_completion(&link->llc_testlink_resp);
825 smc_llc_send_test_link(link, user_data);
826 /* receive TEST LINK response over RoCE fabric */
827 rc = wait_for_completion_interruptible_timeout(&link->llc_testlink_resp,
829 if (link->state != SMC_LNK_ACTIVE)
830 return; /* link state changed */
832 smc_lgr_terminate_sched(smc_get_lgr(link));
835 next_interval = link->llc_testlink_time;
837 schedule_delayed_work(&link->llc_testlink_wrk, next_interval);
840 void smc_llc_lgr_init(struct smc_link_group *lgr, struct smc_sock *smc)
842 struct net *net = sock_net(smc->clcsock->sk);
844 INIT_WORK(&lgr->llc_event_work, smc_llc_event_work);
845 INIT_LIST_HEAD(&lgr->llc_event_q);
846 spin_lock_init(&lgr->llc_event_q_lock);
847 spin_lock_init(&lgr->llc_flow_lock);
848 init_waitqueue_head(&lgr->llc_waiter);
849 lgr->llc_testlink_time = net->ipv4.sysctl_tcp_keepalive_time;
852 /* called after lgr was removed from lgr_list */
853 void smc_llc_lgr_clear(struct smc_link_group *lgr)
855 smc_llc_event_flush(lgr);
856 wake_up_interruptible_all(&lgr->llc_waiter);
857 cancel_work_sync(&lgr->llc_event_work);
858 if (lgr->delayed_event) {
859 kfree(lgr->delayed_event);
860 lgr->delayed_event = NULL;
864 int smc_llc_link_init(struct smc_link *link)
866 init_completion(&link->llc_testlink_resp);
867 INIT_DELAYED_WORK(&link->llc_testlink_wrk, smc_llc_testlink_work);
871 void smc_llc_link_active(struct smc_link *link)
873 link->state = SMC_LNK_ACTIVE;
874 if (link->lgr->llc_testlink_time) {
875 link->llc_testlink_time = link->lgr->llc_testlink_time * HZ;
876 schedule_delayed_work(&link->llc_testlink_wrk,
877 link->llc_testlink_time);
881 void smc_llc_link_deleting(struct smc_link *link)
883 link->state = SMC_LNK_DELETING;
884 smc_wr_wakeup_tx_wait(link);
887 /* called in worker context */
888 void smc_llc_link_clear(struct smc_link *link)
890 complete(&link->llc_testlink_resp);
891 cancel_delayed_work_sync(&link->llc_testlink_wrk);
892 smc_wr_wakeup_reg_wait(link);
893 smc_wr_wakeup_tx_wait(link);
896 /* register a new rtoken at the remote peer (for all links) */
897 int smc_llc_do_confirm_rkey(struct smc_link *send_link,
898 struct smc_buf_desc *rmb_desc)
900 struct smc_link_group *lgr = send_link->lgr;
901 struct smc_llc_qentry *qentry = NULL;
904 rc = smc_llc_flow_initiate(lgr, SMC_LLC_FLOW_RKEY);
907 rc = smc_llc_send_confirm_rkey(send_link, rmb_desc);
910 /* receive CONFIRM RKEY response from server over RoCE fabric */
911 qentry = smc_llc_wait(lgr, send_link, SMC_LLC_WAIT_TIME,
912 SMC_LLC_CONFIRM_RKEY);
913 if (!qentry || (qentry->msg.raw.hdr.flags & SMC_LLC_FLAG_RKEY_NEG))
917 smc_llc_flow_qentry_del(&lgr->llc_flow_lcl);
918 smc_llc_flow_stop(lgr, &lgr->llc_flow_lcl);
922 /* unregister an rtoken at the remote peer */
923 int smc_llc_do_delete_rkey(struct smc_link_group *lgr,
924 struct smc_buf_desc *rmb_desc)
926 struct smc_llc_qentry *qentry = NULL;
927 struct smc_link *send_link;
930 send_link = smc_llc_usable_link(lgr);
934 rc = smc_llc_flow_initiate(lgr, SMC_LLC_FLOW_RKEY);
937 /* protected by llc_flow control */
938 rc = smc_llc_send_delete_rkey(send_link, rmb_desc);
941 /* receive DELETE RKEY response from server over RoCE fabric */
942 qentry = smc_llc_wait(lgr, send_link, SMC_LLC_WAIT_TIME,
943 SMC_LLC_DELETE_RKEY);
944 if (!qentry || (qentry->msg.raw.hdr.flags & SMC_LLC_FLAG_RKEY_NEG))
948 smc_llc_flow_qentry_del(&lgr->llc_flow_lcl);
949 smc_llc_flow_stop(lgr, &lgr->llc_flow_lcl);
953 /* evaluate confirm link request or response */
954 int smc_llc_eval_conf_link(struct smc_llc_qentry *qentry,
955 enum smc_llc_reqresp type)
957 if (type == SMC_LLC_REQ) /* SMC server assigns link_id */
958 qentry->link->link_id = qentry->msg.confirm_link.link_num;
959 if (!(qentry->msg.raw.hdr.flags & SMC_LLC_FLAG_NO_RMBE_EYEC))
964 /***************************** init, exit, misc ******************************/
966 static struct smc_wr_rx_handler smc_llc_rx_handlers[] = {
968 .handler = smc_llc_rx_handler,
969 .type = SMC_LLC_CONFIRM_LINK
972 .handler = smc_llc_rx_handler,
973 .type = SMC_LLC_TEST_LINK
976 .handler = smc_llc_rx_handler,
977 .type = SMC_LLC_ADD_LINK
980 .handler = smc_llc_rx_handler,
981 .type = SMC_LLC_DELETE_LINK
984 .handler = smc_llc_rx_handler,
985 .type = SMC_LLC_CONFIRM_RKEY
988 .handler = smc_llc_rx_handler,
989 .type = SMC_LLC_CONFIRM_RKEY_CONT
992 .handler = smc_llc_rx_handler,
993 .type = SMC_LLC_DELETE_RKEY
1000 int __init smc_llc_init(void)
1002 struct smc_wr_rx_handler *handler;
1005 for (handler = smc_llc_rx_handlers; handler->handler; handler++) {
1006 INIT_HLIST_NODE(&handler->list);
1007 rc = smc_wr_rx_register_handler(handler);