1 // SPDX-License-Identifier: GPL-2.0
3 * Shared Memory Communications over RDMA (SMC-R) and RoCE
5 * Link Layer Control (LLC)
7 * Copyright IBM Corp. 2016
9 * Author(s): Klaus Wacker <Klaus.Wacker@de.ibm.com>
10 * Ursula Braun <ubraun@linux.vnet.ibm.com>
14 #include <rdma/ib_verbs.h>
21 #define SMC_LLC_DATA_LEN 40
24 struct smc_wr_rx_hdr common;
26 #if defined(__BIG_ENDIAN_BITFIELD)
29 #elif defined(__LITTLE_ENDIAN_BITFIELD)
30 u8 add_link_rej_rsn:4,
36 #define SMC_LLC_FLAG_NO_RMBE_EYEC 0x03
38 struct smc_llc_msg_confirm_link { /* type 0x01 */
39 struct smc_llc_hdr hd;
40 u8 sender_mac[ETH_ALEN];
41 u8 sender_gid[SMC_GID_SIZE];
44 u8 link_uid[SMC_LGR_ID_SIZE];
49 #define SMC_LLC_FLAG_ADD_LNK_REJ 0x40
50 #define SMC_LLC_REJ_RSN_NO_ALT_PATH 1
52 #define SMC_LLC_ADD_LNK_MAX_LINKS 2
54 struct smc_llc_msg_add_link { /* type 0x02 */
55 struct smc_llc_hdr hd;
56 u8 sender_mac[ETH_ALEN];
58 u8 sender_gid[SMC_GID_SIZE];
61 u8 flags2; /* QP mtu */
66 #define SMC_LLC_FLAG_DEL_LINK_ALL 0x40
67 #define SMC_LLC_FLAG_DEL_LINK_ORDERLY 0x20
69 struct smc_llc_msg_del_link { /* type 0x04 */
70 struct smc_llc_hdr hd;
74 } __packed; /* format defined in RFC7609 */
76 struct smc_llc_msg_test_link { /* type 0x07 */
77 struct smc_llc_hdr hd;
82 struct smc_rmb_rtoken {
84 u8 num_rkeys; /* first rtoken byte of CONFIRM LINK msg */
85 /* is actually the num of rtokens, first */
86 /* rtoken is always for the current link */
87 u8 link_id; /* link id of the rtoken */
91 } __packed; /* format defined in RFC7609 */
93 #define SMC_LLC_RKEYS_PER_MSG 3
95 struct smc_llc_msg_confirm_rkey { /* type 0x06 */
96 struct smc_llc_hdr hd;
97 struct smc_rmb_rtoken rtoken[SMC_LLC_RKEYS_PER_MSG];
101 struct smc_llc_msg_confirm_rkey_cont { /* type 0x08 */
102 struct smc_llc_hdr hd;
104 struct smc_rmb_rtoken rtoken[SMC_LLC_RKEYS_PER_MSG];
107 #define SMC_LLC_DEL_RKEY_MAX 8
108 #define SMC_LLC_FLAG_RKEY_NEG 0x20
110 struct smc_llc_msg_delete_rkey { /* type 0x09 */
111 struct smc_llc_hdr hd;
120 struct smc_llc_msg_confirm_link confirm_link;
121 struct smc_llc_msg_add_link add_link;
122 struct smc_llc_msg_del_link delete_link;
124 struct smc_llc_msg_confirm_rkey confirm_rkey;
125 struct smc_llc_msg_confirm_rkey_cont confirm_rkey_cont;
126 struct smc_llc_msg_delete_rkey delete_rkey;
128 struct smc_llc_msg_test_link test_link;
130 struct smc_llc_hdr hdr;
131 u8 data[SMC_LLC_DATA_LEN];
135 #define SMC_LLC_FLAG_RESP 0x80
137 struct smc_llc_qentry {
138 struct list_head list;
139 struct smc_link *link;
140 union smc_llc_msg msg;
143 struct smc_llc_qentry *smc_llc_flow_qentry_clr(struct smc_llc_flow *flow)
145 struct smc_llc_qentry *qentry = flow->qentry;
151 void smc_llc_flow_qentry_del(struct smc_llc_flow *flow)
153 struct smc_llc_qentry *qentry;
156 qentry = flow->qentry;
162 static inline void smc_llc_flow_qentry_set(struct smc_llc_flow *flow,
163 struct smc_llc_qentry *qentry)
165 flow->qentry = qentry;
168 /* try to start a new llc flow, initiated by an incoming llc msg */
169 static bool smc_llc_flow_start(struct smc_llc_flow *flow,
170 struct smc_llc_qentry *qentry)
172 struct smc_link_group *lgr = qentry->link->lgr;
174 spin_lock_bh(&lgr->llc_flow_lock);
176 /* a flow is already active */
177 if ((qentry->msg.raw.hdr.common.type == SMC_LLC_ADD_LINK ||
178 qentry->msg.raw.hdr.common.type == SMC_LLC_DELETE_LINK) &&
179 !lgr->delayed_event) {
180 lgr->delayed_event = qentry;
182 /* forget this llc request */
185 spin_unlock_bh(&lgr->llc_flow_lock);
188 switch (qentry->msg.raw.hdr.common.type) {
189 case SMC_LLC_ADD_LINK:
190 flow->type = SMC_LLC_FLOW_ADD_LINK;
192 case SMC_LLC_DELETE_LINK:
193 flow->type = SMC_LLC_FLOW_DEL_LINK;
195 case SMC_LLC_CONFIRM_RKEY:
196 case SMC_LLC_DELETE_RKEY:
197 flow->type = SMC_LLC_FLOW_RKEY;
200 flow->type = SMC_LLC_FLOW_NONE;
202 if (qentry == lgr->delayed_event)
203 lgr->delayed_event = NULL;
204 spin_unlock_bh(&lgr->llc_flow_lock);
205 smc_llc_flow_qentry_set(flow, qentry);
209 /* start a new local llc flow, wait till current flow finished */
210 int smc_llc_flow_initiate(struct smc_link_group *lgr,
211 enum smc_llc_flowtype type)
213 enum smc_llc_flowtype allowed_remote = SMC_LLC_FLOW_NONE;
216 /* all flows except confirm_rkey and delete_rkey are exclusive,
217 * confirm/delete rkey flows can run concurrently (local and remote)
219 if (type == SMC_LLC_FLOW_RKEY)
220 allowed_remote = SMC_LLC_FLOW_RKEY;
222 if (list_empty(&lgr->list))
224 spin_lock_bh(&lgr->llc_flow_lock);
225 if (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
226 (lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
227 lgr->llc_flow_rmt.type == allowed_remote)) {
228 lgr->llc_flow_lcl.type = type;
229 spin_unlock_bh(&lgr->llc_flow_lock);
232 spin_unlock_bh(&lgr->llc_flow_lock);
233 rc = wait_event_interruptible_timeout(lgr->llc_waiter,
234 (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
235 (lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
236 lgr->llc_flow_rmt.type == allowed_remote)),
243 /* finish the current llc flow */
244 void smc_llc_flow_stop(struct smc_link_group *lgr, struct smc_llc_flow *flow)
246 spin_lock_bh(&lgr->llc_flow_lock);
247 memset(flow, 0, sizeof(*flow));
248 flow->type = SMC_LLC_FLOW_NONE;
249 spin_unlock_bh(&lgr->llc_flow_lock);
250 if (!list_empty(&lgr->list) && lgr->delayed_event &&
251 flow == &lgr->llc_flow_lcl)
252 schedule_work(&lgr->llc_event_work);
254 wake_up_interruptible(&lgr->llc_waiter);
257 /* lnk is optional and used for early wakeup when link goes down, useful in
258 * cases where we wait for a response on the link after we sent a request
260 struct smc_llc_qentry *smc_llc_wait(struct smc_link_group *lgr,
261 struct smc_link *lnk,
262 int time_out, u8 exp_msg)
264 struct smc_llc_flow *flow = &lgr->llc_flow_lcl;
266 wait_event_interruptible_timeout(lgr->llc_waiter,
268 (lnk && !smc_link_usable(lnk)) ||
269 list_empty(&lgr->list)),
272 (lnk && !smc_link_usable(lnk)) || list_empty(&lgr->list)) {
273 smc_llc_flow_qentry_del(flow);
276 if (exp_msg && flow->qentry->msg.raw.hdr.common.type != exp_msg) {
277 if (exp_msg == SMC_LLC_ADD_LINK &&
278 flow->qentry->msg.raw.hdr.common.type ==
279 SMC_LLC_DELETE_LINK) {
280 /* flow_start will delay the unexpected msg */
281 smc_llc_flow_start(&lgr->llc_flow_lcl,
282 smc_llc_flow_qentry_clr(flow));
285 smc_llc_flow_qentry_del(flow);
291 /********************************** send *************************************/
293 struct smc_llc_tx_pend {
296 /* handler for send/transmission completion of an LLC msg */
297 static void smc_llc_tx_handler(struct smc_wr_tx_pend_priv *pend,
298 struct smc_link *link,
299 enum ib_wc_status wc_status)
301 /* future work: handle wc_status error for recovery and failover */
305 * smc_llc_add_pending_send() - add LLC control message to pending WQE transmits
306 * @link: Pointer to SMC link used for sending LLC control message.
307 * @wr_buf: Out variable returning pointer to work request payload buffer.
308 * @pend: Out variable returning pointer to private pending WR tracking.
309 * It's the context the transmit complete handler will get.
311 * Reserves and pre-fills an entry for a pending work request send/tx.
312 * Used by mid-level smc_llc_send_msg() to prepare for later actual send/tx.
313 * Can sleep due to smc_get_ctrl_buf (if not in softirq context).
315 * Return: 0 on success, otherwise an error value.
317 static int smc_llc_add_pending_send(struct smc_link *link,
318 struct smc_wr_buf **wr_buf,
319 struct smc_wr_tx_pend_priv **pend)
323 rc = smc_wr_tx_get_free_slot(link, smc_llc_tx_handler, wr_buf, NULL,
328 sizeof(union smc_llc_msg) > SMC_WR_BUF_SIZE,
329 "must increase SMC_WR_BUF_SIZE to at least sizeof(struct smc_llc_msg)");
331 sizeof(union smc_llc_msg) != SMC_WR_TX_SIZE,
332 "must adapt SMC_WR_TX_SIZE to sizeof(struct smc_llc_msg); if not all smc_wr upper layer protocols use the same message size any more, must start to set link->wr_tx_sges[i].length on each individual smc_wr_tx_send()");
334 sizeof(struct smc_llc_tx_pend) > SMC_WR_TX_PEND_PRIV_SIZE,
335 "must increase SMC_WR_TX_PEND_PRIV_SIZE to at least sizeof(struct smc_llc_tx_pend)");
339 /* high-level API to send LLC confirm link */
340 int smc_llc_send_confirm_link(struct smc_link *link,
341 enum smc_llc_reqresp reqresp)
343 struct smc_link_group *lgr = smc_get_lgr(link);
344 struct smc_llc_msg_confirm_link *confllc;
345 struct smc_wr_tx_pend_priv *pend;
346 struct smc_wr_buf *wr_buf;
349 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
352 confllc = (struct smc_llc_msg_confirm_link *)wr_buf;
353 memset(confllc, 0, sizeof(*confllc));
354 confllc->hd.common.type = SMC_LLC_CONFIRM_LINK;
355 confllc->hd.length = sizeof(struct smc_llc_msg_confirm_link);
356 confllc->hd.flags |= SMC_LLC_FLAG_NO_RMBE_EYEC;
357 if (reqresp == SMC_LLC_RESP)
358 confllc->hd.flags |= SMC_LLC_FLAG_RESP;
359 memcpy(confllc->sender_mac, link->smcibdev->mac[link->ibport - 1],
361 memcpy(confllc->sender_gid, link->gid, SMC_GID_SIZE);
362 hton24(confllc->sender_qp_num, link->roce_qp->qp_num);
363 confllc->link_num = link->link_id;
364 memcpy(confllc->link_uid, lgr->id, SMC_LGR_ID_SIZE);
365 confllc->max_links = SMC_LLC_ADD_LNK_MAX_LINKS; /* enforce peer resp. */
366 /* send llc message */
367 rc = smc_wr_tx_send(link, pend);
371 /* send LLC confirm rkey request */
372 static int smc_llc_send_confirm_rkey(struct smc_link *link,
373 struct smc_buf_desc *rmb_desc)
375 struct smc_llc_msg_confirm_rkey *rkeyllc;
376 struct smc_wr_tx_pend_priv *pend;
377 struct smc_wr_buf *wr_buf;
380 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
383 rkeyllc = (struct smc_llc_msg_confirm_rkey *)wr_buf;
384 memset(rkeyllc, 0, sizeof(*rkeyllc));
385 rkeyllc->hd.common.type = SMC_LLC_CONFIRM_RKEY;
386 rkeyllc->hd.length = sizeof(struct smc_llc_msg_confirm_rkey);
387 rkeyllc->rtoken[0].rmb_key =
388 htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
389 rkeyllc->rtoken[0].rmb_vaddr = cpu_to_be64(
390 (u64)sg_dma_address(rmb_desc->sgt[link->link_idx].sgl));
391 /* send llc message */
392 rc = smc_wr_tx_send(link, pend);
396 /* send LLC delete rkey request */
397 static int smc_llc_send_delete_rkey(struct smc_link *link,
398 struct smc_buf_desc *rmb_desc)
400 struct smc_llc_msg_delete_rkey *rkeyllc;
401 struct smc_wr_tx_pend_priv *pend;
402 struct smc_wr_buf *wr_buf;
405 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
408 rkeyllc = (struct smc_llc_msg_delete_rkey *)wr_buf;
409 memset(rkeyllc, 0, sizeof(*rkeyllc));
410 rkeyllc->hd.common.type = SMC_LLC_DELETE_RKEY;
411 rkeyllc->hd.length = sizeof(struct smc_llc_msg_delete_rkey);
412 rkeyllc->num_rkeys = 1;
413 rkeyllc->rkey[0] = htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
414 /* send llc message */
415 rc = smc_wr_tx_send(link, pend);
419 /* prepare an add link message */
420 static void smc_llc_prep_add_link(struct smc_llc_msg_add_link *addllc,
421 struct smc_link *link, u8 mac[], u8 gid[],
422 enum smc_llc_reqresp reqresp)
424 memset(addllc, 0, sizeof(*addllc));
425 addllc->hd.common.type = SMC_LLC_ADD_LINK;
426 addllc->hd.length = sizeof(struct smc_llc_msg_add_link);
427 if (reqresp == SMC_LLC_RESP) {
428 addllc->hd.flags |= SMC_LLC_FLAG_RESP;
429 /* always reject more links for now */
430 addllc->hd.flags |= SMC_LLC_FLAG_ADD_LNK_REJ;
431 addllc->hd.add_link_rej_rsn = SMC_LLC_REJ_RSN_NO_ALT_PATH;
433 memcpy(addllc->sender_mac, mac, ETH_ALEN);
434 memcpy(addllc->sender_gid, gid, SMC_GID_SIZE);
437 /* send ADD LINK request or response */
438 int smc_llc_send_add_link(struct smc_link *link, u8 mac[], u8 gid[],
439 enum smc_llc_reqresp reqresp)
441 struct smc_llc_msg_add_link *addllc;
442 struct smc_wr_tx_pend_priv *pend;
443 struct smc_wr_buf *wr_buf;
446 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
449 addllc = (struct smc_llc_msg_add_link *)wr_buf;
450 smc_llc_prep_add_link(addllc, link, mac, gid, reqresp);
451 /* send llc message */
452 rc = smc_wr_tx_send(link, pend);
456 /* prepare a delete link message */
457 static void smc_llc_prep_delete_link(struct smc_llc_msg_del_link *delllc,
458 struct smc_link *link,
459 enum smc_llc_reqresp reqresp, bool orderly)
461 memset(delllc, 0, sizeof(*delllc));
462 delllc->hd.common.type = SMC_LLC_DELETE_LINK;
463 delllc->hd.length = sizeof(struct smc_llc_msg_add_link);
464 if (reqresp == SMC_LLC_RESP)
465 delllc->hd.flags |= SMC_LLC_FLAG_RESP;
466 /* DEL_LINK_ALL because only 1 link supported */
467 delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ALL;
469 delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ORDERLY;
470 delllc->link_num = link->link_id;
473 /* send DELETE LINK request or response */
474 int smc_llc_send_delete_link(struct smc_link *link,
475 enum smc_llc_reqresp reqresp, bool orderly)
477 struct smc_llc_msg_del_link *delllc;
478 struct smc_wr_tx_pend_priv *pend;
479 struct smc_wr_buf *wr_buf;
482 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
485 delllc = (struct smc_llc_msg_del_link *)wr_buf;
486 smc_llc_prep_delete_link(delllc, link, reqresp, orderly);
487 /* send llc message */
488 rc = smc_wr_tx_send(link, pend);
492 /* send LLC test link request */
493 static int smc_llc_send_test_link(struct smc_link *link, u8 user_data[16])
495 struct smc_llc_msg_test_link *testllc;
496 struct smc_wr_tx_pend_priv *pend;
497 struct smc_wr_buf *wr_buf;
500 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
503 testllc = (struct smc_llc_msg_test_link *)wr_buf;
504 memset(testllc, 0, sizeof(*testllc));
505 testllc->hd.common.type = SMC_LLC_TEST_LINK;
506 testllc->hd.length = sizeof(struct smc_llc_msg_test_link);
507 memcpy(testllc->user_data, user_data, sizeof(testllc->user_data));
508 /* send llc message */
509 rc = smc_wr_tx_send(link, pend);
513 /* schedule an llc send on link, may wait for buffers */
514 static int smc_llc_send_message(struct smc_link *link, void *llcbuf)
516 struct smc_wr_tx_pend_priv *pend;
517 struct smc_wr_buf *wr_buf;
520 if (!smc_link_usable(link))
522 rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
525 memcpy(wr_buf, llcbuf, sizeof(union smc_llc_msg));
526 return smc_wr_tx_send(link, pend);
529 /********************************* receive ***********************************/
531 static void smc_llc_rx_confirm_link(struct smc_link *link,
532 struct smc_llc_msg_confirm_link *llc)
534 struct smc_link_group *lgr = smc_get_lgr(link);
537 /* RMBE eyecatchers are not supported */
538 if (!(llc->hd.flags & SMC_LLC_FLAG_NO_RMBE_EYEC))
541 if (lgr->role == SMC_CLNT &&
542 link->state == SMC_LNK_ACTIVATING) {
543 link->llc_confirm_rc = conf_rc;
544 link->link_id = llc->link_num;
545 complete(&link->llc_confirm);
549 static void smc_llc_rx_add_link(struct smc_link *link,
550 struct smc_llc_msg_add_link *llc)
552 struct smc_link_group *lgr = smc_get_lgr(link);
554 if (link->state == SMC_LNK_ACTIVATING) {
555 complete(&link->llc_add);
559 if (lgr->role == SMC_SERV) {
560 smc_llc_prep_add_link(llc, link,
561 link->smcibdev->mac[link->ibport - 1],
562 link->gid, SMC_LLC_REQ);
565 smc_llc_prep_add_link(llc, link,
566 link->smcibdev->mac[link->ibport - 1],
567 link->gid, SMC_LLC_RESP);
569 smc_llc_send_message(link, llc);
572 static void smc_llc_rx_delete_link(struct smc_link *link,
573 struct smc_llc_msg_del_link *llc)
575 struct smc_link_group *lgr = smc_get_lgr(link);
578 smc_llc_link_deleting(link);
579 if (lgr->role == SMC_SERV) {
580 /* client asks to delete this link, send request */
581 smc_llc_prep_delete_link(llc, link, SMC_LLC_REQ, true);
583 /* server requests to delete this link, send response */
584 smc_llc_prep_delete_link(llc, link, SMC_LLC_RESP, true);
586 smc_llc_send_message(link, llc);
587 smc_lgr_terminate_sched(lgr);
590 static void smc_llc_rx_test_link(struct smc_link *link,
591 struct smc_llc_msg_test_link *llc)
593 llc->hd.flags |= SMC_LLC_FLAG_RESP;
594 smc_llc_send_message(link, llc);
597 static void smc_llc_rx_confirm_rkey(struct smc_link *link,
598 struct smc_llc_msg_confirm_rkey *llc)
602 rc = smc_rtoken_add(link,
603 llc->rtoken[0].rmb_vaddr,
604 llc->rtoken[0].rmb_key);
606 /* ignore rtokens for other links, we have only one link */
608 llc->hd.flags |= SMC_LLC_FLAG_RESP;
610 llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
611 smc_llc_send_message(link, llc);
614 static void smc_llc_rx_confirm_rkey_cont(struct smc_link *link,
615 struct smc_llc_msg_confirm_rkey_cont *llc)
617 /* ignore rtokens for other links, we have only one link */
618 llc->hd.flags |= SMC_LLC_FLAG_RESP;
619 smc_llc_send_message(link, llc);
622 static void smc_llc_rx_delete_rkey(struct smc_link *link,
623 struct smc_llc_msg_delete_rkey *llc)
628 max = min_t(u8, llc->num_rkeys, SMC_LLC_DEL_RKEY_MAX);
629 for (i = 0; i < max; i++) {
630 if (smc_rtoken_delete(link, llc->rkey[i]))
631 err_mask |= 1 << (SMC_LLC_DEL_RKEY_MAX - 1 - i);
635 llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
636 llc->err_mask = err_mask;
639 llc->hd.flags |= SMC_LLC_FLAG_RESP;
640 smc_llc_send_message(link, llc);
643 /* flush the llc event queue */
644 static void smc_llc_event_flush(struct smc_link_group *lgr)
646 struct smc_llc_qentry *qentry, *q;
648 spin_lock_bh(&lgr->llc_event_q_lock);
649 list_for_each_entry_safe(qentry, q, &lgr->llc_event_q, list) {
650 list_del_init(&qentry->list);
653 spin_unlock_bh(&lgr->llc_event_q_lock);
656 static void smc_llc_event_handler(struct smc_llc_qentry *qentry)
658 union smc_llc_msg *llc = &qentry->msg;
659 struct smc_link *link = qentry->link;
661 if (!smc_link_usable(link))
664 switch (llc->raw.hdr.common.type) {
665 case SMC_LLC_TEST_LINK:
666 smc_llc_rx_test_link(link, &llc->test_link);
668 case SMC_LLC_CONFIRM_LINK:
669 smc_llc_rx_confirm_link(link, &llc->confirm_link);
671 case SMC_LLC_ADD_LINK:
672 smc_llc_rx_add_link(link, &llc->add_link);
674 case SMC_LLC_DELETE_LINK:
675 smc_llc_rx_delete_link(link, &llc->delete_link);
677 case SMC_LLC_CONFIRM_RKEY:
678 smc_llc_rx_confirm_rkey(link, &llc->confirm_rkey);
680 case SMC_LLC_CONFIRM_RKEY_CONT:
681 smc_llc_rx_confirm_rkey_cont(link, &llc->confirm_rkey_cont);
683 case SMC_LLC_DELETE_RKEY:
684 smc_llc_rx_delete_rkey(link, &llc->delete_rkey);
691 /* worker to process llc messages on the event queue */
692 static void smc_llc_event_work(struct work_struct *work)
694 struct smc_link_group *lgr = container_of(work, struct smc_link_group,
696 struct smc_llc_qentry *qentry;
698 if (!lgr->llc_flow_lcl.type && lgr->delayed_event) {
699 if (smc_link_usable(lgr->delayed_event->link)) {
700 smc_llc_event_handler(lgr->delayed_event);
702 qentry = lgr->delayed_event;
703 lgr->delayed_event = NULL;
709 spin_lock_bh(&lgr->llc_event_q_lock);
710 if (!list_empty(&lgr->llc_event_q)) {
711 qentry = list_first_entry(&lgr->llc_event_q,
712 struct smc_llc_qentry, list);
713 list_del_init(&qentry->list);
714 spin_unlock_bh(&lgr->llc_event_q_lock);
715 smc_llc_event_handler(qentry);
718 spin_unlock_bh(&lgr->llc_event_q_lock);
721 /* process llc responses in tasklet context */
722 static void smc_llc_rx_response(struct smc_link *link,
723 struct smc_llc_qentry *qentry)
725 u8 llc_type = qentry->msg.raw.hdr.common.type;
726 union smc_llc_msg *llc = &qentry->msg;
730 case SMC_LLC_TEST_LINK:
731 if (link->state == SMC_LNK_ACTIVE)
732 complete(&link->llc_testlink_resp);
734 case SMC_LLC_CONFIRM_LINK:
735 if (!(llc->raw.hdr.flags & SMC_LLC_FLAG_NO_RMBE_EYEC))
737 if (link->lgr->role == SMC_SERV &&
738 link->state == SMC_LNK_ACTIVATING) {
739 link->llc_confirm_resp_rc = rc;
740 complete(&link->llc_confirm_resp);
743 case SMC_LLC_ADD_LINK:
744 if (link->state == SMC_LNK_ACTIVATING)
745 complete(&link->llc_add_resp);
747 case SMC_LLC_DELETE_LINK:
748 if (link->lgr->role == SMC_SERV)
749 smc_lgr_schedule_free_work_fast(link->lgr);
751 case SMC_LLC_CONFIRM_RKEY:
752 link->llc_confirm_rkey_resp_rc = llc->raw.hdr.flags &
753 SMC_LLC_FLAG_RKEY_NEG;
754 complete(&link->llc_confirm_rkey_resp);
756 case SMC_LLC_CONFIRM_RKEY_CONT:
757 /* unused as long as we don't send this type of msg */
759 case SMC_LLC_DELETE_RKEY:
760 link->llc_delete_rkey_resp_rc = llc->raw.hdr.flags &
761 SMC_LLC_FLAG_RKEY_NEG;
762 complete(&link->llc_delete_rkey_resp);
768 static void smc_llc_enqueue(struct smc_link *link, union smc_llc_msg *llc)
770 struct smc_link_group *lgr = link->lgr;
771 struct smc_llc_qentry *qentry;
774 qentry = kmalloc(sizeof(*qentry), GFP_ATOMIC);
778 INIT_LIST_HEAD(&qentry->list);
779 memcpy(&qentry->msg, llc, sizeof(union smc_llc_msg));
781 /* process responses immediately */
782 if (llc->raw.hdr.flags & SMC_LLC_FLAG_RESP) {
783 smc_llc_rx_response(link, qentry);
787 /* add requests to event queue */
788 spin_lock_irqsave(&lgr->llc_event_q_lock, flags);
789 list_add_tail(&qentry->list, &lgr->llc_event_q);
790 spin_unlock_irqrestore(&lgr->llc_event_q_lock, flags);
791 schedule_work(&link->lgr->llc_event_work);
794 /* copy received msg and add it to the event queue */
795 static void smc_llc_rx_handler(struct ib_wc *wc, void *buf)
797 struct smc_link *link = (struct smc_link *)wc->qp->qp_context;
798 union smc_llc_msg *llc = buf;
800 if (wc->byte_len < sizeof(*llc))
801 return; /* short message */
802 if (llc->raw.hdr.length != sizeof(*llc))
803 return; /* invalid message */
805 smc_llc_enqueue(link, llc);
808 /***************************** worker, utils *********************************/
810 static void smc_llc_testlink_work(struct work_struct *work)
812 struct smc_link *link = container_of(to_delayed_work(work),
813 struct smc_link, llc_testlink_wrk);
814 unsigned long next_interval;
815 unsigned long expire_time;
816 u8 user_data[16] = { 0 };
819 if (link->state != SMC_LNK_ACTIVE)
820 return; /* don't reschedule worker */
821 expire_time = link->wr_rx_tstamp + link->llc_testlink_time;
822 if (time_is_after_jiffies(expire_time)) {
823 next_interval = expire_time - jiffies;
826 reinit_completion(&link->llc_testlink_resp);
827 smc_llc_send_test_link(link, user_data);
828 /* receive TEST LINK response over RoCE fabric */
829 rc = wait_for_completion_interruptible_timeout(&link->llc_testlink_resp,
831 if (link->state != SMC_LNK_ACTIVE)
832 return; /* link state changed */
834 smc_lgr_terminate_sched(smc_get_lgr(link));
837 next_interval = link->llc_testlink_time;
839 schedule_delayed_work(&link->llc_testlink_wrk, next_interval);
842 void smc_llc_lgr_init(struct smc_link_group *lgr, struct smc_sock *smc)
844 struct net *net = sock_net(smc->clcsock->sk);
846 INIT_WORK(&lgr->llc_event_work, smc_llc_event_work);
847 INIT_LIST_HEAD(&lgr->llc_event_q);
848 spin_lock_init(&lgr->llc_event_q_lock);
849 spin_lock_init(&lgr->llc_flow_lock);
850 init_waitqueue_head(&lgr->llc_waiter);
851 lgr->llc_testlink_time = net->ipv4.sysctl_tcp_keepalive_time;
854 /* called after lgr was removed from lgr_list */
855 void smc_llc_lgr_clear(struct smc_link_group *lgr)
857 smc_llc_event_flush(lgr);
858 wake_up_interruptible_all(&lgr->llc_waiter);
859 cancel_work_sync(&lgr->llc_event_work);
860 if (lgr->delayed_event) {
861 kfree(lgr->delayed_event);
862 lgr->delayed_event = NULL;
866 int smc_llc_link_init(struct smc_link *link)
868 init_completion(&link->llc_confirm);
869 init_completion(&link->llc_confirm_resp);
870 init_completion(&link->llc_add);
871 init_completion(&link->llc_add_resp);
872 init_completion(&link->llc_confirm_rkey_resp);
873 init_completion(&link->llc_delete_rkey_resp);
874 mutex_init(&link->llc_delete_rkey_mutex);
875 init_completion(&link->llc_testlink_resp);
876 INIT_DELAYED_WORK(&link->llc_testlink_wrk, smc_llc_testlink_work);
880 void smc_llc_link_active(struct smc_link *link)
882 link->state = SMC_LNK_ACTIVE;
883 if (link->lgr->llc_testlink_time) {
884 link->llc_testlink_time = link->lgr->llc_testlink_time * HZ;
885 schedule_delayed_work(&link->llc_testlink_wrk,
886 link->llc_testlink_time);
890 void smc_llc_link_deleting(struct smc_link *link)
892 link->state = SMC_LNK_DELETING;
893 smc_wr_wakeup_tx_wait(link);
896 /* called in worker context */
897 void smc_llc_link_clear(struct smc_link *link)
899 complete(&link->llc_testlink_resp);
900 cancel_delayed_work_sync(&link->llc_testlink_wrk);
901 smc_wr_wakeup_reg_wait(link);
902 smc_wr_wakeup_tx_wait(link);
905 /* register a new rtoken at the remote peer */
906 int smc_llc_do_confirm_rkey(struct smc_link *link,
907 struct smc_buf_desc *rmb_desc)
911 /* protected by mutex smc_create_lgr_pending */
912 reinit_completion(&link->llc_confirm_rkey_resp);
913 rc = smc_llc_send_confirm_rkey(link, rmb_desc);
916 /* receive CONFIRM RKEY response from server over RoCE fabric */
917 rc = wait_for_completion_interruptible_timeout(
918 &link->llc_confirm_rkey_resp, SMC_LLC_WAIT_TIME);
919 if (rc <= 0 || link->llc_confirm_rkey_resp_rc)
924 /* unregister an rtoken at the remote peer */
925 int smc_llc_do_delete_rkey(struct smc_link *link,
926 struct smc_buf_desc *rmb_desc)
930 mutex_lock(&link->llc_delete_rkey_mutex);
931 if (link->state != SMC_LNK_ACTIVE)
933 reinit_completion(&link->llc_delete_rkey_resp);
934 rc = smc_llc_send_delete_rkey(link, rmb_desc);
937 /* receive DELETE RKEY response from server over RoCE fabric */
938 rc = wait_for_completion_interruptible_timeout(
939 &link->llc_delete_rkey_resp, SMC_LLC_WAIT_TIME);
940 if (rc <= 0 || link->llc_delete_rkey_resp_rc)
945 mutex_unlock(&link->llc_delete_rkey_mutex);
949 /***************************** init, exit, misc ******************************/
951 static struct smc_wr_rx_handler smc_llc_rx_handlers[] = {
953 .handler = smc_llc_rx_handler,
954 .type = SMC_LLC_CONFIRM_LINK
957 .handler = smc_llc_rx_handler,
958 .type = SMC_LLC_TEST_LINK
961 .handler = smc_llc_rx_handler,
962 .type = SMC_LLC_ADD_LINK
965 .handler = smc_llc_rx_handler,
966 .type = SMC_LLC_DELETE_LINK
969 .handler = smc_llc_rx_handler,
970 .type = SMC_LLC_CONFIRM_RKEY
973 .handler = smc_llc_rx_handler,
974 .type = SMC_LLC_CONFIRM_RKEY_CONT
977 .handler = smc_llc_rx_handler,
978 .type = SMC_LLC_DELETE_RKEY
985 int __init smc_llc_init(void)
987 struct smc_wr_rx_handler *handler;
990 for (handler = smc_llc_rx_handlers; handler->handler; handler++) {
991 INIT_HLIST_NODE(&handler->list);
992 rc = smc_wr_rx_register_handler(handler);