mirror of
https://mirrors.bfsu.edu.cn/git/linux.git
synced 2024-12-26 04:25:27 +08:00
555da9af82
The new framework allows to start specific types of LLC control flows, protects active flows and makes it possible to wait for flows to finish before starting a new flow. This mechanism is used for the LLC control layer to model flows like 'add link' or 'delete link' which need to send/receive several LLC messages and are not allowed to get interrupted by the wrong type of messages. 'Add link' or 'Delete link' messages arriving in the middle of a flow are delayed and processed when the current flow finished. Signed-off-by: Karsten Graul <kgraul@linux.ibm.com> Reviewed-by: Ursula Braun <ubraun@linux.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net>
986 lines
27 KiB
C
986 lines
27 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Shared Memory Communications over RDMA (SMC-R) and RoCE
|
|
*
|
|
* Link Layer Control (LLC)
|
|
*
|
|
* Copyright IBM Corp. 2016
|
|
*
|
|
* Author(s): Klaus Wacker <Klaus.Wacker@de.ibm.com>
|
|
* Ursula Braun <ubraun@linux.vnet.ibm.com>
|
|
*/
|
|
|
|
#include <net/tcp.h>
|
|
#include <rdma/ib_verbs.h>
|
|
|
|
#include "smc.h"
|
|
#include "smc_core.h"
|
|
#include "smc_clc.h"
|
|
#include "smc_llc.h"
|
|
|
|
#define SMC_LLC_DATA_LEN 40
|
|
|
|
struct smc_llc_hdr {
|
|
struct smc_wr_rx_hdr common;
|
|
u8 length; /* 44 */
|
|
#if defined(__BIG_ENDIAN_BITFIELD)
|
|
u8 reserved:4,
|
|
add_link_rej_rsn:4;
|
|
#elif defined(__LITTLE_ENDIAN_BITFIELD)
|
|
u8 add_link_rej_rsn:4,
|
|
reserved:4;
|
|
#endif
|
|
u8 flags;
|
|
};
|
|
|
|
#define SMC_LLC_FLAG_NO_RMBE_EYEC 0x03
|
|
|
|
struct smc_llc_msg_confirm_link { /* type 0x01 */
|
|
struct smc_llc_hdr hd;
|
|
u8 sender_mac[ETH_ALEN];
|
|
u8 sender_gid[SMC_GID_SIZE];
|
|
u8 sender_qp_num[3];
|
|
u8 link_num;
|
|
u8 link_uid[SMC_LGR_ID_SIZE];
|
|
u8 max_links;
|
|
u8 reserved[9];
|
|
};
|
|
|
|
#define SMC_LLC_FLAG_ADD_LNK_REJ 0x40
|
|
#define SMC_LLC_REJ_RSN_NO_ALT_PATH 1
|
|
|
|
#define SMC_LLC_ADD_LNK_MAX_LINKS 2
|
|
|
|
struct smc_llc_msg_add_link { /* type 0x02 */
|
|
struct smc_llc_hdr hd;
|
|
u8 sender_mac[ETH_ALEN];
|
|
u8 reserved2[2];
|
|
u8 sender_gid[SMC_GID_SIZE];
|
|
u8 sender_qp_num[3];
|
|
u8 link_num;
|
|
u8 flags2; /* QP mtu */
|
|
u8 initial_psn[3];
|
|
u8 reserved[8];
|
|
};
|
|
|
|
#define SMC_LLC_FLAG_DEL_LINK_ALL 0x40
|
|
#define SMC_LLC_FLAG_DEL_LINK_ORDERLY 0x20
|
|
|
|
struct smc_llc_msg_del_link { /* type 0x04 */
|
|
struct smc_llc_hdr hd;
|
|
u8 link_num;
|
|
__be32 reason;
|
|
u8 reserved[35];
|
|
} __packed; /* format defined in RFC7609 */
|
|
|
|
struct smc_llc_msg_test_link { /* type 0x07 */
|
|
struct smc_llc_hdr hd;
|
|
u8 user_data[16];
|
|
u8 reserved[24];
|
|
};
|
|
|
|
struct smc_rmb_rtoken {
|
|
union {
|
|
u8 num_rkeys; /* first rtoken byte of CONFIRM LINK msg */
|
|
/* is actually the num of rtokens, first */
|
|
/* rtoken is always for the current link */
|
|
u8 link_id; /* link id of the rtoken */
|
|
};
|
|
__be32 rmb_key;
|
|
__be64 rmb_vaddr;
|
|
} __packed; /* format defined in RFC7609 */
|
|
|
|
#define SMC_LLC_RKEYS_PER_MSG 3
|
|
|
|
struct smc_llc_msg_confirm_rkey { /* type 0x06 */
|
|
struct smc_llc_hdr hd;
|
|
struct smc_rmb_rtoken rtoken[SMC_LLC_RKEYS_PER_MSG];
|
|
u8 reserved;
|
|
};
|
|
|
|
struct smc_llc_msg_confirm_rkey_cont { /* type 0x08 */
|
|
struct smc_llc_hdr hd;
|
|
u8 num_rkeys;
|
|
struct smc_rmb_rtoken rtoken[SMC_LLC_RKEYS_PER_MSG];
|
|
};
|
|
|
|
#define SMC_LLC_DEL_RKEY_MAX 8
|
|
#define SMC_LLC_FLAG_RKEY_NEG 0x20
|
|
|
|
struct smc_llc_msg_delete_rkey { /* type 0x09 */
|
|
struct smc_llc_hdr hd;
|
|
u8 num_rkeys;
|
|
u8 err_mask;
|
|
u8 reserved[2];
|
|
__be32 rkey[8];
|
|
u8 reserved2[4];
|
|
};
|
|
|
|
union smc_llc_msg {
|
|
struct smc_llc_msg_confirm_link confirm_link;
|
|
struct smc_llc_msg_add_link add_link;
|
|
struct smc_llc_msg_del_link delete_link;
|
|
|
|
struct smc_llc_msg_confirm_rkey confirm_rkey;
|
|
struct smc_llc_msg_confirm_rkey_cont confirm_rkey_cont;
|
|
struct smc_llc_msg_delete_rkey delete_rkey;
|
|
|
|
struct smc_llc_msg_test_link test_link;
|
|
struct {
|
|
struct smc_llc_hdr hdr;
|
|
u8 data[SMC_LLC_DATA_LEN];
|
|
} raw;
|
|
};
|
|
|
|
#define SMC_LLC_FLAG_RESP 0x80
|
|
|
|
struct smc_llc_qentry {
|
|
struct list_head list;
|
|
struct smc_link *link;
|
|
union smc_llc_msg msg;
|
|
};
|
|
|
|
struct smc_llc_qentry *smc_llc_flow_qentry_clr(struct smc_llc_flow *flow)
|
|
{
|
|
struct smc_llc_qentry *qentry = flow->qentry;
|
|
|
|
flow->qentry = NULL;
|
|
return qentry;
|
|
}
|
|
|
|
void smc_llc_flow_qentry_del(struct smc_llc_flow *flow)
|
|
{
|
|
struct smc_llc_qentry *qentry;
|
|
|
|
if (flow->qentry) {
|
|
qentry = flow->qentry;
|
|
flow->qentry = NULL;
|
|
kfree(qentry);
|
|
}
|
|
}
|
|
|
|
static inline void smc_llc_flow_qentry_set(struct smc_llc_flow *flow,
|
|
struct smc_llc_qentry *qentry)
|
|
{
|
|
flow->qentry = qentry;
|
|
}
|
|
|
|
/* try to start a new llc flow, initiated by an incoming llc msg */
|
|
static bool smc_llc_flow_start(struct smc_llc_flow *flow,
|
|
struct smc_llc_qentry *qentry)
|
|
{
|
|
struct smc_link_group *lgr = qentry->link->lgr;
|
|
|
|
spin_lock_bh(&lgr->llc_flow_lock);
|
|
if (flow->type) {
|
|
/* a flow is already active */
|
|
if ((qentry->msg.raw.hdr.common.type == SMC_LLC_ADD_LINK ||
|
|
qentry->msg.raw.hdr.common.type == SMC_LLC_DELETE_LINK) &&
|
|
!lgr->delayed_event) {
|
|
lgr->delayed_event = qentry;
|
|
} else {
|
|
/* forget this llc request */
|
|
kfree(qentry);
|
|
}
|
|
spin_unlock_bh(&lgr->llc_flow_lock);
|
|
return false;
|
|
}
|
|
switch (qentry->msg.raw.hdr.common.type) {
|
|
case SMC_LLC_ADD_LINK:
|
|
flow->type = SMC_LLC_FLOW_ADD_LINK;
|
|
break;
|
|
case SMC_LLC_DELETE_LINK:
|
|
flow->type = SMC_LLC_FLOW_DEL_LINK;
|
|
break;
|
|
case SMC_LLC_CONFIRM_RKEY:
|
|
case SMC_LLC_DELETE_RKEY:
|
|
flow->type = SMC_LLC_FLOW_RKEY;
|
|
break;
|
|
default:
|
|
flow->type = SMC_LLC_FLOW_NONE;
|
|
}
|
|
if (qentry == lgr->delayed_event)
|
|
lgr->delayed_event = NULL;
|
|
spin_unlock_bh(&lgr->llc_flow_lock);
|
|
smc_llc_flow_qentry_set(flow, qentry);
|
|
return true;
|
|
}
|
|
|
|
/* start a new local llc flow, wait till current flow finished */
|
|
int smc_llc_flow_initiate(struct smc_link_group *lgr,
|
|
enum smc_llc_flowtype type)
|
|
{
|
|
enum smc_llc_flowtype allowed_remote = SMC_LLC_FLOW_NONE;
|
|
int rc;
|
|
|
|
/* all flows except confirm_rkey and delete_rkey are exclusive,
|
|
* confirm/delete rkey flows can run concurrently (local and remote)
|
|
*/
|
|
if (type == SMC_LLC_FLOW_RKEY)
|
|
allowed_remote = SMC_LLC_FLOW_RKEY;
|
|
again:
|
|
if (list_empty(&lgr->list))
|
|
return -ENODEV;
|
|
spin_lock_bh(&lgr->llc_flow_lock);
|
|
if (lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
|
|
(lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
|
|
lgr->llc_flow_rmt.type == allowed_remote)) {
|
|
lgr->llc_flow_lcl.type = type;
|
|
spin_unlock_bh(&lgr->llc_flow_lock);
|
|
return 0;
|
|
}
|
|
spin_unlock_bh(&lgr->llc_flow_lock);
|
|
rc = wait_event_interruptible_timeout(lgr->llc_waiter,
|
|
(lgr->llc_flow_lcl.type == SMC_LLC_FLOW_NONE &&
|
|
(lgr->llc_flow_rmt.type == SMC_LLC_FLOW_NONE ||
|
|
lgr->llc_flow_rmt.type == allowed_remote)),
|
|
SMC_LLC_WAIT_TIME);
|
|
if (!rc)
|
|
return -ETIMEDOUT;
|
|
goto again;
|
|
}
|
|
|
|
/* finish the current llc flow */
|
|
void smc_llc_flow_stop(struct smc_link_group *lgr, struct smc_llc_flow *flow)
|
|
{
|
|
spin_lock_bh(&lgr->llc_flow_lock);
|
|
memset(flow, 0, sizeof(*flow));
|
|
flow->type = SMC_LLC_FLOW_NONE;
|
|
spin_unlock_bh(&lgr->llc_flow_lock);
|
|
if (!list_empty(&lgr->list) && lgr->delayed_event &&
|
|
flow == &lgr->llc_flow_lcl)
|
|
schedule_work(&lgr->llc_event_work);
|
|
else
|
|
wake_up_interruptible(&lgr->llc_waiter);
|
|
}
|
|
|
|
/* lnk is optional and used for early wakeup when link goes down, useful in
|
|
* cases where we wait for a response on the link after we sent a request
|
|
*/
|
|
struct smc_llc_qentry *smc_llc_wait(struct smc_link_group *lgr,
|
|
struct smc_link *lnk,
|
|
int time_out, u8 exp_msg)
|
|
{
|
|
struct smc_llc_flow *flow = &lgr->llc_flow_lcl;
|
|
|
|
wait_event_interruptible_timeout(lgr->llc_waiter,
|
|
(flow->qentry ||
|
|
(lnk && !smc_link_usable(lnk)) ||
|
|
list_empty(&lgr->list)),
|
|
time_out);
|
|
if (!flow->qentry ||
|
|
(lnk && !smc_link_usable(lnk)) || list_empty(&lgr->list)) {
|
|
smc_llc_flow_qentry_del(flow);
|
|
goto out;
|
|
}
|
|
if (exp_msg && flow->qentry->msg.raw.hdr.common.type != exp_msg) {
|
|
if (exp_msg == SMC_LLC_ADD_LINK &&
|
|
flow->qentry->msg.raw.hdr.common.type ==
|
|
SMC_LLC_DELETE_LINK) {
|
|
/* flow_start will delay the unexpected msg */
|
|
smc_llc_flow_start(&lgr->llc_flow_lcl,
|
|
smc_llc_flow_qentry_clr(flow));
|
|
return NULL;
|
|
}
|
|
smc_llc_flow_qentry_del(flow);
|
|
}
|
|
out:
|
|
return flow->qentry;
|
|
}
|
|
|
|
/********************************** send *************************************/
|
|
|
|
struct smc_llc_tx_pend {
|
|
};
|
|
|
|
/* handler for send/transmission completion of an LLC msg */
|
|
static void smc_llc_tx_handler(struct smc_wr_tx_pend_priv *pend,
|
|
struct smc_link *link,
|
|
enum ib_wc_status wc_status)
|
|
{
|
|
/* future work: handle wc_status error for recovery and failover */
|
|
}
|
|
|
|
/**
|
|
* smc_llc_add_pending_send() - add LLC control message to pending WQE transmits
|
|
* @link: Pointer to SMC link used for sending LLC control message.
|
|
* @wr_buf: Out variable returning pointer to work request payload buffer.
|
|
* @pend: Out variable returning pointer to private pending WR tracking.
|
|
* It's the context the transmit complete handler will get.
|
|
*
|
|
* Reserves and pre-fills an entry for a pending work request send/tx.
|
|
* Used by mid-level smc_llc_send_msg() to prepare for later actual send/tx.
|
|
* Can sleep due to smc_get_ctrl_buf (if not in softirq context).
|
|
*
|
|
* Return: 0 on success, otherwise an error value.
|
|
*/
|
|
static int smc_llc_add_pending_send(struct smc_link *link,
|
|
struct smc_wr_buf **wr_buf,
|
|
struct smc_wr_tx_pend_priv **pend)
|
|
{
|
|
int rc;
|
|
|
|
rc = smc_wr_tx_get_free_slot(link, smc_llc_tx_handler, wr_buf, NULL,
|
|
pend);
|
|
if (rc < 0)
|
|
return rc;
|
|
BUILD_BUG_ON_MSG(
|
|
sizeof(union smc_llc_msg) > SMC_WR_BUF_SIZE,
|
|
"must increase SMC_WR_BUF_SIZE to at least sizeof(struct smc_llc_msg)");
|
|
BUILD_BUG_ON_MSG(
|
|
sizeof(union smc_llc_msg) != SMC_WR_TX_SIZE,
|
|
"must adapt SMC_WR_TX_SIZE to sizeof(struct smc_llc_msg); if not all smc_wr upper layer protocols use the same message size any more, must start to set link->wr_tx_sges[i].length on each individual smc_wr_tx_send()");
|
|
BUILD_BUG_ON_MSG(
|
|
sizeof(struct smc_llc_tx_pend) > SMC_WR_TX_PEND_PRIV_SIZE,
|
|
"must increase SMC_WR_TX_PEND_PRIV_SIZE to at least sizeof(struct smc_llc_tx_pend)");
|
|
return 0;
|
|
}
|
|
|
|
/* high-level API to send LLC confirm link */
|
|
int smc_llc_send_confirm_link(struct smc_link *link,
|
|
enum smc_llc_reqresp reqresp)
|
|
{
|
|
struct smc_link_group *lgr = smc_get_lgr(link);
|
|
struct smc_llc_msg_confirm_link *confllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
confllc = (struct smc_llc_msg_confirm_link *)wr_buf;
|
|
memset(confllc, 0, sizeof(*confllc));
|
|
confllc->hd.common.type = SMC_LLC_CONFIRM_LINK;
|
|
confllc->hd.length = sizeof(struct smc_llc_msg_confirm_link);
|
|
confllc->hd.flags |= SMC_LLC_FLAG_NO_RMBE_EYEC;
|
|
if (reqresp == SMC_LLC_RESP)
|
|
confllc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
memcpy(confllc->sender_mac, link->smcibdev->mac[link->ibport - 1],
|
|
ETH_ALEN);
|
|
memcpy(confllc->sender_gid, link->gid, SMC_GID_SIZE);
|
|
hton24(confllc->sender_qp_num, link->roce_qp->qp_num);
|
|
confllc->link_num = link->link_id;
|
|
memcpy(confllc->link_uid, lgr->id, SMC_LGR_ID_SIZE);
|
|
confllc->max_links = SMC_LLC_ADD_LNK_MAX_LINKS; /* enforce peer resp. */
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* send LLC confirm rkey request */
|
|
static int smc_llc_send_confirm_rkey(struct smc_link *link,
|
|
struct smc_buf_desc *rmb_desc)
|
|
{
|
|
struct smc_llc_msg_confirm_rkey *rkeyllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
rkeyllc = (struct smc_llc_msg_confirm_rkey *)wr_buf;
|
|
memset(rkeyllc, 0, sizeof(*rkeyllc));
|
|
rkeyllc->hd.common.type = SMC_LLC_CONFIRM_RKEY;
|
|
rkeyllc->hd.length = sizeof(struct smc_llc_msg_confirm_rkey);
|
|
rkeyllc->rtoken[0].rmb_key =
|
|
htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
|
|
rkeyllc->rtoken[0].rmb_vaddr = cpu_to_be64(
|
|
(u64)sg_dma_address(rmb_desc->sgt[link->link_idx].sgl));
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* send LLC delete rkey request */
|
|
static int smc_llc_send_delete_rkey(struct smc_link *link,
|
|
struct smc_buf_desc *rmb_desc)
|
|
{
|
|
struct smc_llc_msg_delete_rkey *rkeyllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
rkeyllc = (struct smc_llc_msg_delete_rkey *)wr_buf;
|
|
memset(rkeyllc, 0, sizeof(*rkeyllc));
|
|
rkeyllc->hd.common.type = SMC_LLC_DELETE_RKEY;
|
|
rkeyllc->hd.length = sizeof(struct smc_llc_msg_delete_rkey);
|
|
rkeyllc->num_rkeys = 1;
|
|
rkeyllc->rkey[0] = htonl(rmb_desc->mr_rx[link->link_idx]->rkey);
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* prepare an add link message */
|
|
static void smc_llc_prep_add_link(struct smc_llc_msg_add_link *addllc,
|
|
struct smc_link *link, u8 mac[], u8 gid[],
|
|
enum smc_llc_reqresp reqresp)
|
|
{
|
|
memset(addllc, 0, sizeof(*addllc));
|
|
addllc->hd.common.type = SMC_LLC_ADD_LINK;
|
|
addllc->hd.length = sizeof(struct smc_llc_msg_add_link);
|
|
if (reqresp == SMC_LLC_RESP) {
|
|
addllc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
/* always reject more links for now */
|
|
addllc->hd.flags |= SMC_LLC_FLAG_ADD_LNK_REJ;
|
|
addllc->hd.add_link_rej_rsn = SMC_LLC_REJ_RSN_NO_ALT_PATH;
|
|
}
|
|
memcpy(addllc->sender_mac, mac, ETH_ALEN);
|
|
memcpy(addllc->sender_gid, gid, SMC_GID_SIZE);
|
|
}
|
|
|
|
/* send ADD LINK request or response */
|
|
int smc_llc_send_add_link(struct smc_link *link, u8 mac[], u8 gid[],
|
|
enum smc_llc_reqresp reqresp)
|
|
{
|
|
struct smc_llc_msg_add_link *addllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
addllc = (struct smc_llc_msg_add_link *)wr_buf;
|
|
smc_llc_prep_add_link(addllc, link, mac, gid, reqresp);
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* prepare a delete link message */
|
|
static void smc_llc_prep_delete_link(struct smc_llc_msg_del_link *delllc,
|
|
struct smc_link *link,
|
|
enum smc_llc_reqresp reqresp, bool orderly)
|
|
{
|
|
memset(delllc, 0, sizeof(*delllc));
|
|
delllc->hd.common.type = SMC_LLC_DELETE_LINK;
|
|
delllc->hd.length = sizeof(struct smc_llc_msg_add_link);
|
|
if (reqresp == SMC_LLC_RESP)
|
|
delllc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
/* DEL_LINK_ALL because only 1 link supported */
|
|
delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ALL;
|
|
if (orderly)
|
|
delllc->hd.flags |= SMC_LLC_FLAG_DEL_LINK_ORDERLY;
|
|
delllc->link_num = link->link_id;
|
|
}
|
|
|
|
/* send DELETE LINK request or response */
|
|
int smc_llc_send_delete_link(struct smc_link *link,
|
|
enum smc_llc_reqresp reqresp, bool orderly)
|
|
{
|
|
struct smc_llc_msg_del_link *delllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
delllc = (struct smc_llc_msg_del_link *)wr_buf;
|
|
smc_llc_prep_delete_link(delllc, link, reqresp, orderly);
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* send LLC test link request */
|
|
static int smc_llc_send_test_link(struct smc_link *link, u8 user_data[16])
|
|
{
|
|
struct smc_llc_msg_test_link *testllc;
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
testllc = (struct smc_llc_msg_test_link *)wr_buf;
|
|
memset(testllc, 0, sizeof(*testllc));
|
|
testllc->hd.common.type = SMC_LLC_TEST_LINK;
|
|
testllc->hd.length = sizeof(struct smc_llc_msg_test_link);
|
|
memcpy(testllc->user_data, user_data, sizeof(testllc->user_data));
|
|
/* send llc message */
|
|
rc = smc_wr_tx_send(link, pend);
|
|
return rc;
|
|
}
|
|
|
|
/* schedule an llc send on link, may wait for buffers */
|
|
static int smc_llc_send_message(struct smc_link *link, void *llcbuf)
|
|
{
|
|
struct smc_wr_tx_pend_priv *pend;
|
|
struct smc_wr_buf *wr_buf;
|
|
int rc;
|
|
|
|
if (!smc_link_usable(link))
|
|
return -ENOLINK;
|
|
rc = smc_llc_add_pending_send(link, &wr_buf, &pend);
|
|
if (rc)
|
|
return rc;
|
|
memcpy(wr_buf, llcbuf, sizeof(union smc_llc_msg));
|
|
return smc_wr_tx_send(link, pend);
|
|
}
|
|
|
|
/********************************* receive ***********************************/
|
|
|
|
static void smc_llc_rx_confirm_link(struct smc_link *link,
|
|
struct smc_llc_msg_confirm_link *llc)
|
|
{
|
|
struct smc_link_group *lgr = smc_get_lgr(link);
|
|
int conf_rc = 0;
|
|
|
|
/* RMBE eyecatchers are not supported */
|
|
if (!(llc->hd.flags & SMC_LLC_FLAG_NO_RMBE_EYEC))
|
|
conf_rc = ENOTSUPP;
|
|
|
|
if (lgr->role == SMC_CLNT &&
|
|
link->state == SMC_LNK_ACTIVATING) {
|
|
link->llc_confirm_rc = conf_rc;
|
|
link->link_id = llc->link_num;
|
|
complete(&link->llc_confirm);
|
|
}
|
|
}
|
|
|
|
static void smc_llc_rx_add_link(struct smc_link *link,
|
|
struct smc_llc_msg_add_link *llc)
|
|
{
|
|
struct smc_link_group *lgr = smc_get_lgr(link);
|
|
|
|
if (link->state == SMC_LNK_ACTIVATING) {
|
|
complete(&link->llc_add);
|
|
return;
|
|
}
|
|
|
|
if (lgr->role == SMC_SERV) {
|
|
smc_llc_prep_add_link(llc, link,
|
|
link->smcibdev->mac[link->ibport - 1],
|
|
link->gid, SMC_LLC_REQ);
|
|
|
|
} else {
|
|
smc_llc_prep_add_link(llc, link,
|
|
link->smcibdev->mac[link->ibport - 1],
|
|
link->gid, SMC_LLC_RESP);
|
|
}
|
|
smc_llc_send_message(link, llc);
|
|
}
|
|
|
|
static void smc_llc_rx_delete_link(struct smc_link *link,
|
|
struct smc_llc_msg_del_link *llc)
|
|
{
|
|
struct smc_link_group *lgr = smc_get_lgr(link);
|
|
|
|
smc_lgr_forget(lgr);
|
|
smc_llc_link_deleting(link);
|
|
if (lgr->role == SMC_SERV) {
|
|
/* client asks to delete this link, send request */
|
|
smc_llc_prep_delete_link(llc, link, SMC_LLC_REQ, true);
|
|
} else {
|
|
/* server requests to delete this link, send response */
|
|
smc_llc_prep_delete_link(llc, link, SMC_LLC_RESP, true);
|
|
}
|
|
smc_llc_send_message(link, llc);
|
|
smc_lgr_terminate_sched(lgr);
|
|
}
|
|
|
|
static void smc_llc_rx_test_link(struct smc_link *link,
|
|
struct smc_llc_msg_test_link *llc)
|
|
{
|
|
llc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
smc_llc_send_message(link, llc);
|
|
}
|
|
|
|
static void smc_llc_rx_confirm_rkey(struct smc_link *link,
|
|
struct smc_llc_msg_confirm_rkey *llc)
|
|
{
|
|
int rc;
|
|
|
|
rc = smc_rtoken_add(link,
|
|
llc->rtoken[0].rmb_vaddr,
|
|
llc->rtoken[0].rmb_key);
|
|
|
|
/* ignore rtokens for other links, we have only one link */
|
|
|
|
llc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
if (rc < 0)
|
|
llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
|
|
smc_llc_send_message(link, llc);
|
|
}
|
|
|
|
static void smc_llc_rx_confirm_rkey_cont(struct smc_link *link,
|
|
struct smc_llc_msg_confirm_rkey_cont *llc)
|
|
{
|
|
/* ignore rtokens for other links, we have only one link */
|
|
llc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
smc_llc_send_message(link, llc);
|
|
}
|
|
|
|
static void smc_llc_rx_delete_rkey(struct smc_link *link,
|
|
struct smc_llc_msg_delete_rkey *llc)
|
|
{
|
|
u8 err_mask = 0;
|
|
int i, max;
|
|
|
|
max = min_t(u8, llc->num_rkeys, SMC_LLC_DEL_RKEY_MAX);
|
|
for (i = 0; i < max; i++) {
|
|
if (smc_rtoken_delete(link, llc->rkey[i]))
|
|
err_mask |= 1 << (SMC_LLC_DEL_RKEY_MAX - 1 - i);
|
|
}
|
|
|
|
if (err_mask) {
|
|
llc->hd.flags |= SMC_LLC_FLAG_RKEY_NEG;
|
|
llc->err_mask = err_mask;
|
|
}
|
|
|
|
llc->hd.flags |= SMC_LLC_FLAG_RESP;
|
|
smc_llc_send_message(link, llc);
|
|
}
|
|
|
|
/* flush the llc event queue */
|
|
static void smc_llc_event_flush(struct smc_link_group *lgr)
|
|
{
|
|
struct smc_llc_qentry *qentry, *q;
|
|
|
|
spin_lock_bh(&lgr->llc_event_q_lock);
|
|
list_for_each_entry_safe(qentry, q, &lgr->llc_event_q, list) {
|
|
list_del_init(&qentry->list);
|
|
kfree(qentry);
|
|
}
|
|
spin_unlock_bh(&lgr->llc_event_q_lock);
|
|
}
|
|
|
|
static void smc_llc_event_handler(struct smc_llc_qentry *qentry)
|
|
{
|
|
union smc_llc_msg *llc = &qentry->msg;
|
|
struct smc_link *link = qentry->link;
|
|
|
|
if (!smc_link_usable(link))
|
|
goto out;
|
|
|
|
switch (llc->raw.hdr.common.type) {
|
|
case SMC_LLC_TEST_LINK:
|
|
smc_llc_rx_test_link(link, &llc->test_link);
|
|
break;
|
|
case SMC_LLC_CONFIRM_LINK:
|
|
smc_llc_rx_confirm_link(link, &llc->confirm_link);
|
|
break;
|
|
case SMC_LLC_ADD_LINK:
|
|
smc_llc_rx_add_link(link, &llc->add_link);
|
|
break;
|
|
case SMC_LLC_DELETE_LINK:
|
|
smc_llc_rx_delete_link(link, &llc->delete_link);
|
|
break;
|
|
case SMC_LLC_CONFIRM_RKEY:
|
|
smc_llc_rx_confirm_rkey(link, &llc->confirm_rkey);
|
|
break;
|
|
case SMC_LLC_CONFIRM_RKEY_CONT:
|
|
smc_llc_rx_confirm_rkey_cont(link, &llc->confirm_rkey_cont);
|
|
break;
|
|
case SMC_LLC_DELETE_RKEY:
|
|
smc_llc_rx_delete_rkey(link, &llc->delete_rkey);
|
|
break;
|
|
}
|
|
out:
|
|
kfree(qentry);
|
|
}
|
|
|
|
/* worker to process llc messages on the event queue */
|
|
static void smc_llc_event_work(struct work_struct *work)
|
|
{
|
|
struct smc_link_group *lgr = container_of(work, struct smc_link_group,
|
|
llc_event_work);
|
|
struct smc_llc_qentry *qentry;
|
|
|
|
if (!lgr->llc_flow_lcl.type && lgr->delayed_event) {
|
|
if (smc_link_usable(lgr->delayed_event->link)) {
|
|
smc_llc_event_handler(lgr->delayed_event);
|
|
} else {
|
|
qentry = lgr->delayed_event;
|
|
lgr->delayed_event = NULL;
|
|
kfree(qentry);
|
|
}
|
|
}
|
|
|
|
again:
|
|
spin_lock_bh(&lgr->llc_event_q_lock);
|
|
if (!list_empty(&lgr->llc_event_q)) {
|
|
qentry = list_first_entry(&lgr->llc_event_q,
|
|
struct smc_llc_qentry, list);
|
|
list_del_init(&qentry->list);
|
|
spin_unlock_bh(&lgr->llc_event_q_lock);
|
|
smc_llc_event_handler(qentry);
|
|
goto again;
|
|
}
|
|
spin_unlock_bh(&lgr->llc_event_q_lock);
|
|
}
|
|
|
|
/* process llc responses in tasklet context */
|
|
static void smc_llc_rx_response(struct smc_link *link, union smc_llc_msg *llc)
|
|
{
|
|
int rc = 0;
|
|
|
|
switch (llc->raw.hdr.common.type) {
|
|
case SMC_LLC_TEST_LINK:
|
|
if (link->state == SMC_LNK_ACTIVE)
|
|
complete(&link->llc_testlink_resp);
|
|
break;
|
|
case SMC_LLC_CONFIRM_LINK:
|
|
if (!(llc->raw.hdr.flags & SMC_LLC_FLAG_NO_RMBE_EYEC))
|
|
rc = ENOTSUPP;
|
|
if (link->lgr->role == SMC_SERV &&
|
|
link->state == SMC_LNK_ACTIVATING) {
|
|
link->llc_confirm_resp_rc = rc;
|
|
complete(&link->llc_confirm_resp);
|
|
}
|
|
break;
|
|
case SMC_LLC_ADD_LINK:
|
|
if (link->state == SMC_LNK_ACTIVATING)
|
|
complete(&link->llc_add_resp);
|
|
break;
|
|
case SMC_LLC_DELETE_LINK:
|
|
if (link->lgr->role == SMC_SERV)
|
|
smc_lgr_schedule_free_work_fast(link->lgr);
|
|
break;
|
|
case SMC_LLC_CONFIRM_RKEY:
|
|
link->llc_confirm_rkey_resp_rc = llc->raw.hdr.flags &
|
|
SMC_LLC_FLAG_RKEY_NEG;
|
|
complete(&link->llc_confirm_rkey_resp);
|
|
break;
|
|
case SMC_LLC_CONFIRM_RKEY_CONT:
|
|
/* unused as long as we don't send this type of msg */
|
|
break;
|
|
case SMC_LLC_DELETE_RKEY:
|
|
link->llc_delete_rkey_resp_rc = llc->raw.hdr.flags &
|
|
SMC_LLC_FLAG_RKEY_NEG;
|
|
complete(&link->llc_delete_rkey_resp);
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* copy received msg and add it to the event queue */
|
|
static void smc_llc_rx_handler(struct ib_wc *wc, void *buf)
|
|
{
|
|
struct smc_link *link = (struct smc_link *)wc->qp->qp_context;
|
|
struct smc_link_group *lgr = link->lgr;
|
|
struct smc_llc_qentry *qentry;
|
|
union smc_llc_msg *llc = buf;
|
|
unsigned long flags;
|
|
|
|
if (wc->byte_len < sizeof(*llc))
|
|
return; /* short message */
|
|
if (llc->raw.hdr.length != sizeof(*llc))
|
|
return; /* invalid message */
|
|
|
|
/* process responses immediately */
|
|
if (llc->raw.hdr.flags & SMC_LLC_FLAG_RESP) {
|
|
smc_llc_rx_response(link, llc);
|
|
return;
|
|
}
|
|
|
|
qentry = kmalloc(sizeof(*qentry), GFP_ATOMIC);
|
|
if (!qentry)
|
|
return;
|
|
qentry->link = link;
|
|
INIT_LIST_HEAD(&qentry->list);
|
|
memcpy(&qentry->msg, llc, sizeof(union smc_llc_msg));
|
|
spin_lock_irqsave(&lgr->llc_event_q_lock, flags);
|
|
list_add_tail(&qentry->list, &lgr->llc_event_q);
|
|
spin_unlock_irqrestore(&lgr->llc_event_q_lock, flags);
|
|
schedule_work(&link->lgr->llc_event_work);
|
|
}
|
|
|
|
/***************************** worker, utils *********************************/
|
|
|
|
static void smc_llc_testlink_work(struct work_struct *work)
|
|
{
|
|
struct smc_link *link = container_of(to_delayed_work(work),
|
|
struct smc_link, llc_testlink_wrk);
|
|
unsigned long next_interval;
|
|
unsigned long expire_time;
|
|
u8 user_data[16] = { 0 };
|
|
int rc;
|
|
|
|
if (link->state != SMC_LNK_ACTIVE)
|
|
return; /* don't reschedule worker */
|
|
expire_time = link->wr_rx_tstamp + link->llc_testlink_time;
|
|
if (time_is_after_jiffies(expire_time)) {
|
|
next_interval = expire_time - jiffies;
|
|
goto out;
|
|
}
|
|
reinit_completion(&link->llc_testlink_resp);
|
|
smc_llc_send_test_link(link, user_data);
|
|
/* receive TEST LINK response over RoCE fabric */
|
|
rc = wait_for_completion_interruptible_timeout(&link->llc_testlink_resp,
|
|
SMC_LLC_WAIT_TIME);
|
|
if (link->state != SMC_LNK_ACTIVE)
|
|
return; /* link state changed */
|
|
if (rc <= 0) {
|
|
smc_lgr_terminate_sched(smc_get_lgr(link));
|
|
return;
|
|
}
|
|
next_interval = link->llc_testlink_time;
|
|
out:
|
|
schedule_delayed_work(&link->llc_testlink_wrk, next_interval);
|
|
}
|
|
|
|
void smc_llc_lgr_init(struct smc_link_group *lgr, struct smc_sock *smc)
|
|
{
|
|
struct net *net = sock_net(smc->clcsock->sk);
|
|
|
|
INIT_WORK(&lgr->llc_event_work, smc_llc_event_work);
|
|
INIT_LIST_HEAD(&lgr->llc_event_q);
|
|
spin_lock_init(&lgr->llc_event_q_lock);
|
|
spin_lock_init(&lgr->llc_flow_lock);
|
|
init_waitqueue_head(&lgr->llc_waiter);
|
|
lgr->llc_testlink_time = net->ipv4.sysctl_tcp_keepalive_time;
|
|
}
|
|
|
|
/* called after lgr was removed from lgr_list */
|
|
void smc_llc_lgr_clear(struct smc_link_group *lgr)
|
|
{
|
|
smc_llc_event_flush(lgr);
|
|
wake_up_interruptible_all(&lgr->llc_waiter);
|
|
cancel_work_sync(&lgr->llc_event_work);
|
|
if (lgr->delayed_event) {
|
|
kfree(lgr->delayed_event);
|
|
lgr->delayed_event = NULL;
|
|
}
|
|
}
|
|
|
|
int smc_llc_link_init(struct smc_link *link)
|
|
{
|
|
init_completion(&link->llc_confirm);
|
|
init_completion(&link->llc_confirm_resp);
|
|
init_completion(&link->llc_add);
|
|
init_completion(&link->llc_add_resp);
|
|
init_completion(&link->llc_confirm_rkey_resp);
|
|
init_completion(&link->llc_delete_rkey_resp);
|
|
mutex_init(&link->llc_delete_rkey_mutex);
|
|
init_completion(&link->llc_testlink_resp);
|
|
INIT_DELAYED_WORK(&link->llc_testlink_wrk, smc_llc_testlink_work);
|
|
return 0;
|
|
}
|
|
|
|
void smc_llc_link_active(struct smc_link *link)
|
|
{
|
|
link->state = SMC_LNK_ACTIVE;
|
|
if (link->lgr->llc_testlink_time) {
|
|
link->llc_testlink_time = link->lgr->llc_testlink_time * HZ;
|
|
schedule_delayed_work(&link->llc_testlink_wrk,
|
|
link->llc_testlink_time);
|
|
}
|
|
}
|
|
|
|
void smc_llc_link_deleting(struct smc_link *link)
|
|
{
|
|
link->state = SMC_LNK_DELETING;
|
|
smc_wr_wakeup_tx_wait(link);
|
|
}
|
|
|
|
/* called in worker context */
|
|
void smc_llc_link_clear(struct smc_link *link)
|
|
{
|
|
complete(&link->llc_testlink_resp);
|
|
cancel_delayed_work_sync(&link->llc_testlink_wrk);
|
|
smc_wr_wakeup_reg_wait(link);
|
|
smc_wr_wakeup_tx_wait(link);
|
|
}
|
|
|
|
/* register a new rtoken at the remote peer */
|
|
int smc_llc_do_confirm_rkey(struct smc_link *link,
|
|
struct smc_buf_desc *rmb_desc)
|
|
{
|
|
int rc;
|
|
|
|
/* protected by mutex smc_create_lgr_pending */
|
|
reinit_completion(&link->llc_confirm_rkey_resp);
|
|
rc = smc_llc_send_confirm_rkey(link, rmb_desc);
|
|
if (rc)
|
|
return rc;
|
|
/* receive CONFIRM RKEY response from server over RoCE fabric */
|
|
rc = wait_for_completion_interruptible_timeout(
|
|
&link->llc_confirm_rkey_resp, SMC_LLC_WAIT_TIME);
|
|
if (rc <= 0 || link->llc_confirm_rkey_resp_rc)
|
|
return -EFAULT;
|
|
return 0;
|
|
}
|
|
|
|
/* unregister an rtoken at the remote peer */
|
|
int smc_llc_do_delete_rkey(struct smc_link *link,
|
|
struct smc_buf_desc *rmb_desc)
|
|
{
|
|
int rc = 0;
|
|
|
|
mutex_lock(&link->llc_delete_rkey_mutex);
|
|
if (link->state != SMC_LNK_ACTIVE)
|
|
goto out;
|
|
reinit_completion(&link->llc_delete_rkey_resp);
|
|
rc = smc_llc_send_delete_rkey(link, rmb_desc);
|
|
if (rc)
|
|
goto out;
|
|
/* receive DELETE RKEY response from server over RoCE fabric */
|
|
rc = wait_for_completion_interruptible_timeout(
|
|
&link->llc_delete_rkey_resp, SMC_LLC_WAIT_TIME);
|
|
if (rc <= 0 || link->llc_delete_rkey_resp_rc)
|
|
rc = -EFAULT;
|
|
else
|
|
rc = 0;
|
|
out:
|
|
mutex_unlock(&link->llc_delete_rkey_mutex);
|
|
return rc;
|
|
}
|
|
|
|
/***************************** init, exit, misc ******************************/
|
|
|
|
static struct smc_wr_rx_handler smc_llc_rx_handlers[] = {
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_CONFIRM_LINK
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_TEST_LINK
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_ADD_LINK
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_DELETE_LINK
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_CONFIRM_RKEY
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_CONFIRM_RKEY_CONT
|
|
},
|
|
{
|
|
.handler = smc_llc_rx_handler,
|
|
.type = SMC_LLC_DELETE_RKEY
|
|
},
|
|
{
|
|
.handler = NULL,
|
|
}
|
|
};
|
|
|
|
int __init smc_llc_init(void)
|
|
{
|
|
struct smc_wr_rx_handler *handler;
|
|
int rc = 0;
|
|
|
|
for (handler = smc_llc_rx_handlers; handler->handler; handler++) {
|
|
INIT_HLIST_NODE(&handler->list);
|
|
rc = smc_wr_rx_register_handler(handler);
|
|
if (rc)
|
|
break;
|
|
}
|
|
return rc;
|
|
}
|