iw_cxgb4: RDMA write with immediate support

Adds iw_cxgb4 functionality to support RDMA_WRITE_WITH_IMMEDATE opcode.

Signed-off-by: Potnuri Bharat Teja <bharat@chelsio.com>
Signed-off-by: Steve Wise <swise@opengridcomputing.com>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
This commit is contained in:
Potnuri Bharat Teja 2018-08-02 11:33:03 +05:30 committed by Jason Gunthorpe
parent 8001b717f0
commit b9855f4ca0
5 changed files with 81 additions and 16 deletions

View File

@ -791,15 +791,32 @@ static int __c4iw_poll_cq_one(struct c4iw_cq *chp, struct c4iw_qp *qhp,
wc->byte_len = CQE_LEN(&cqe); wc->byte_len = CQE_LEN(&cqe);
else else
wc->byte_len = 0; wc->byte_len = 0;
wc->opcode = IB_WC_RECV;
if (CQE_OPCODE(&cqe) == FW_RI_SEND_WITH_INV || switch (CQE_OPCODE(&cqe)) {
CQE_OPCODE(&cqe) == FW_RI_SEND_WITH_SE_INV) { case FW_RI_SEND:
wc->opcode = IB_WC_RECV;
break;
case FW_RI_SEND_WITH_INV:
case FW_RI_SEND_WITH_SE_INV:
wc->opcode = IB_WC_RECV;
wc->ex.invalidate_rkey = CQE_WRID_STAG(&cqe); wc->ex.invalidate_rkey = CQE_WRID_STAG(&cqe);
wc->wc_flags |= IB_WC_WITH_INVALIDATE; wc->wc_flags |= IB_WC_WITH_INVALIDATE;
c4iw_invalidate_mr(qhp->rhp, wc->ex.invalidate_rkey); c4iw_invalidate_mr(qhp->rhp, wc->ex.invalidate_rkey);
break;
case FW_RI_WRITE_IMMEDIATE:
wc->opcode = IB_WC_RECV_RDMA_WITH_IMM;
wc->ex.imm_data = CQE_IMM_DATA(&cqe);
wc->wc_flags |= IB_WC_WITH_IMM;
break;
default:
pr_err("Unexpected opcode %d in the CQE received for QPID=0x%0x\n",
CQE_OPCODE(&cqe), CQE_QPID(&cqe));
ret = -EINVAL;
goto out;
} }
} else { } else {
switch (CQE_OPCODE(&cqe)) { switch (CQE_OPCODE(&cqe)) {
case FW_RI_WRITE_IMMEDIATE:
case FW_RI_RDMA_WRITE: case FW_RI_RDMA_WRITE:
wc->opcode = IB_WC_RDMA_WRITE; wc->opcode = IB_WC_RDMA_WRITE;
break; break;

View File

@ -555,7 +555,15 @@ static int build_rdma_write(struct t4_sq *sq, union t4_wr *wqe,
if (wr->num_sge > T4_MAX_SEND_SGE) if (wr->num_sge > T4_MAX_SEND_SGE)
return -EINVAL; return -EINVAL;
wqe->write.r2 = 0;
/*
* iWARP protocol supports 64 bit immediate data but rdma api
* limits it to 32bit.
*/
if (wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM)
wqe->write.iw_imm_data.ib_imm_data.imm_data32 = wr->ex.imm_data;
else
wqe->write.iw_imm_data.ib_imm_data.imm_data32 = 0;
wqe->write.stag_sink = cpu_to_be32(rdma_wr(wr)->rkey); wqe->write.stag_sink = cpu_to_be32(rdma_wr(wr)->rkey);
wqe->write.to_sink = cpu_to_be64(rdma_wr(wr)->remote_addr); wqe->write.to_sink = cpu_to_be64(rdma_wr(wr)->remote_addr);
if (wr->num_sge) { if (wr->num_sge) {
@ -848,6 +856,9 @@ static int ib_to_fw_opcode(int ib_opcode)
case IB_WR_RDMA_WRITE: case IB_WR_RDMA_WRITE:
opcode = FW_RI_RDMA_WRITE; opcode = FW_RI_RDMA_WRITE;
break; break;
case IB_WR_RDMA_WRITE_WITH_IMM:
opcode = FW_RI_WRITE_IMMEDIATE;
break;
case IB_WR_RDMA_READ: case IB_WR_RDMA_READ:
case IB_WR_RDMA_READ_WITH_INV: case IB_WR_RDMA_READ_WITH_INV:
opcode = FW_RI_READ_REQ; opcode = FW_RI_READ_REQ;
@ -970,6 +981,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
enum fw_wr_opcodes fw_opcode = 0; enum fw_wr_opcodes fw_opcode = 0;
enum fw_ri_wr_flags fw_flags; enum fw_ri_wr_flags fw_flags;
struct c4iw_qp *qhp; struct c4iw_qp *qhp;
struct c4iw_dev *rhp;
union t4_wr *wqe = NULL; union t4_wr *wqe = NULL;
u32 num_wrs; u32 num_wrs;
struct t4_swsqe *swsqe; struct t4_swsqe *swsqe;
@ -977,6 +989,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
u16 idx = 0; u16 idx = 0;
qhp = to_c4iw_qp(ibqp); qhp = to_c4iw_qp(ibqp);
rhp = qhp->rhp;
spin_lock_irqsave(&qhp->lock, flag); spin_lock_irqsave(&qhp->lock, flag);
/* /*
@ -1021,6 +1034,13 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
swsqe->opcode = FW_RI_SEND_WITH_INV; swsqe->opcode = FW_RI_SEND_WITH_INV;
err = build_rdma_send(&qhp->wq.sq, wqe, wr, &len16); err = build_rdma_send(&qhp->wq.sq, wqe, wr, &len16);
break; break;
case IB_WR_RDMA_WRITE_WITH_IMM:
if (unlikely(!rhp->rdev.lldi.write_w_imm_support)) {
err = -EINVAL;
break;
}
fw_flags |= FW_RI_RDMA_WRITE_WITH_IMMEDIATE;
/*FALLTHROUGH*/
case IB_WR_RDMA_WRITE: case IB_WR_RDMA_WRITE:
fw_opcode = FW_RI_RDMA_WRITE_WR; fw_opcode = FW_RI_RDMA_WRITE_WR;
swsqe->opcode = FW_RI_RDMA_WRITE; swsqe->opcode = FW_RI_RDMA_WRITE;
@ -1031,8 +1051,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
fw_opcode = FW_RI_RDMA_READ_WR; fw_opcode = FW_RI_RDMA_READ_WR;
swsqe->opcode = FW_RI_READ_REQ; swsqe->opcode = FW_RI_READ_REQ;
if (wr->opcode == IB_WR_RDMA_READ_WITH_INV) { if (wr->opcode == IB_WR_RDMA_READ_WITH_INV) {
c4iw_invalidate_mr(qhp->rhp, c4iw_invalidate_mr(rhp, wr->sg_list[0].lkey);
wr->sg_list[0].lkey);
fw_flags = FW_RI_RDMA_READ_INVALIDATE; fw_flags = FW_RI_RDMA_READ_INVALIDATE;
} else { } else {
fw_flags = 0; fw_flags = 0;
@ -1048,7 +1067,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
struct c4iw_mr *mhp = to_c4iw_mr(reg_wr(wr)->mr); struct c4iw_mr *mhp = to_c4iw_mr(reg_wr(wr)->mr);
swsqe->opcode = FW_RI_FAST_REGISTER; swsqe->opcode = FW_RI_FAST_REGISTER;
if (qhp->rhp->rdev.lldi.fr_nsmr_tpte_wr_support && if (rhp->rdev.lldi.fr_nsmr_tpte_wr_support &&
!mhp->attr.state && mhp->mpl_len <= 2) { !mhp->attr.state && mhp->mpl_len <= 2) {
fw_opcode = FW_RI_FR_NSMR_TPTE_WR; fw_opcode = FW_RI_FR_NSMR_TPTE_WR;
build_tpte_memreg(&wqe->fr_tpte, reg_wr(wr), build_tpte_memreg(&wqe->fr_tpte, reg_wr(wr),
@ -1057,7 +1076,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
fw_opcode = FW_RI_FR_NSMR_WR; fw_opcode = FW_RI_FR_NSMR_WR;
err = build_memreg(&qhp->wq.sq, wqe, reg_wr(wr), err = build_memreg(&qhp->wq.sq, wqe, reg_wr(wr),
mhp, &len16, mhp, &len16,
qhp->rhp->rdev.lldi.ulptx_memwrite_dsgl); rhp->rdev.lldi.ulptx_memwrite_dsgl);
if (err) if (err)
break; break;
} }
@ -1070,7 +1089,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
fw_opcode = FW_RI_INV_LSTAG_WR; fw_opcode = FW_RI_INV_LSTAG_WR;
swsqe->opcode = FW_RI_LOCAL_INV; swsqe->opcode = FW_RI_LOCAL_INV;
err = build_inv_stag(wqe, wr, &len16); err = build_inv_stag(wqe, wr, &len16);
c4iw_invalidate_mr(qhp->rhp, wr->ex.invalidate_rkey); c4iw_invalidate_mr(rhp, wr->ex.invalidate_rkey);
break; break;
default: default:
pr_warn("%s post of type=%d TBD!\n", __func__, pr_warn("%s post of type=%d TBD!\n", __func__,
@ -1089,7 +1108,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
swsqe->wr_id = wr->wr_id; swsqe->wr_id = wr->wr_id;
if (c4iw_wr_log) { if (c4iw_wr_log) {
swsqe->sge_ts = cxgb4_read_sge_timestamp( swsqe->sge_ts = cxgb4_read_sge_timestamp(
qhp->rhp->rdev.lldi.ports[0]); rhp->rdev.lldi.ports[0]);
swsqe->host_time = ktime_get(); swsqe->host_time = ktime_get();
} }
@ -1103,7 +1122,7 @@ int c4iw_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
t4_sq_produce(&qhp->wq, len16); t4_sq_produce(&qhp->wq, len16);
idx += DIV_ROUND_UP(len16*16, T4_EQ_ENTRY_SIZE); idx += DIV_ROUND_UP(len16*16, T4_EQ_ENTRY_SIZE);
} }
if (!qhp->rhp->rdev.status_page->db_off) { if (!rhp->rdev.status_page->db_off) {
t4_ring_sq_db(&qhp->wq, idx, wqe); t4_ring_sq_db(&qhp->wq, idx, wqe);
spin_unlock_irqrestore(&qhp->lock, flag); spin_unlock_irqrestore(&qhp->lock, flag);
} else { } else {
@ -2098,6 +2117,8 @@ struct ib_qp *c4iw_create_qp(struct ib_pd *pd, struct ib_qp_init_attr *attrs,
} }
uresp.flags = C4IW_QPF_ONCHIP; uresp.flags = C4IW_QPF_ONCHIP;
} }
if (rhp->rdev.lldi.write_w_imm_support)
uresp.flags |= C4IW_QPF_WRITE_W_IMM;
uresp.qid_mask = rhp->rdev.qpmask; uresp.qid_mask = rhp->rdev.qpmask;
uresp.sqid = qhp->wq.sq.qid; uresp.sqid = qhp->wq.sq.qid;
uresp.sq_size = qhp->wq.sq.size; uresp.sq_size = qhp->wq.sq.size;

View File

@ -190,7 +190,19 @@ struct t4_cqe {
__be32 abs_rqe_idx; __be32 abs_rqe_idx;
} srcqe; } srcqe;
struct { struct {
__be64 imm_data; __be32 mo;
__be32 msn;
/*
* Use union for immediate data to be consistent with
* stack's 32 bit data and iWARP spec's 64 bit data.
*/
union {
struct {
__be32 imm_data32;
u32 reserved;
} ib_imm_data;
__be64 imm_data64;
} iw_imm_data;
} imm_data_rcqe; } imm_data_rcqe;
u64 drain_cookie; u64 drain_cookie;
@ -253,6 +265,8 @@ struct t4_cqe {
#define CQE_WRID_STAG(x) (be32_to_cpu((x)->u.rcqe.stag)) #define CQE_WRID_STAG(x) (be32_to_cpu((x)->u.rcqe.stag))
#define CQE_WRID_MSN(x) (be32_to_cpu((x)->u.rcqe.msn)) #define CQE_WRID_MSN(x) (be32_to_cpu((x)->u.rcqe.msn))
#define CQE_ABS_RQE_IDX(x) (be32_to_cpu((x)->u.srcqe.abs_rqe_idx)) #define CQE_ABS_RQE_IDX(x) (be32_to_cpu((x)->u.srcqe.abs_rqe_idx))
#define CQE_IMM_DATA(x)( \
(x)->u.imm_data_rcqe.iw_imm_data.ib_imm_data.imm_data32)
/* used for SQ completion processing */ /* used for SQ completion processing */
#define CQE_WRID_SQ_IDX(x) ((x)->u.scqe.cidx) #define CQE_WRID_SQ_IDX(x) ((x)->u.scqe.cidx)

View File

@ -50,7 +50,8 @@ enum fw_ri_wr_opcode {
FW_RI_BYPASS = 0xd, FW_RI_BYPASS = 0xd,
FW_RI_RECEIVE = 0xe, FW_RI_RECEIVE = 0xe,
FW_RI_SGE_EC_CR_RETURN = 0xf FW_RI_SGE_EC_CR_RETURN = 0xf,
FW_RI_WRITE_IMMEDIATE = FW_RI_RDMA_INIT
}; };
enum fw_ri_wr_flags { enum fw_ri_wr_flags {
@ -59,7 +60,8 @@ enum fw_ri_wr_flags {
FW_RI_SOLICITED_EVENT_FLAG = 0x04, FW_RI_SOLICITED_EVENT_FLAG = 0x04,
FW_RI_READ_FENCE_FLAG = 0x08, FW_RI_READ_FENCE_FLAG = 0x08,
FW_RI_LOCAL_FENCE_FLAG = 0x10, FW_RI_LOCAL_FENCE_FLAG = 0x10,
FW_RI_RDMA_READ_INVALIDATE = 0x20 FW_RI_RDMA_READ_INVALIDATE = 0x20,
FW_RI_RDMA_WRITE_WITH_IMMEDIATE = 0x40
}; };
enum fw_ri_mpa_attrs { enum fw_ri_mpa_attrs {
@ -546,7 +548,17 @@ struct fw_ri_rdma_write_wr {
__u16 wrid; __u16 wrid;
__u8 r1[3]; __u8 r1[3];
__u8 len16; __u8 len16;
__be64 r2; /*
* Use union for immediate data to be consistent with stack's 32 bit
* data and iWARP spec's 64 bit data.
*/
union {
struct {
__be32 imm_data32;
u32 reserved;
} ib_imm_data;
__be64 imm_data64;
} iw_imm_data;
__be32 plen; __be32 plen;
__be32 stag_sink; __be32 stag_sink;
__be64 to_sink; __be64 to_sink;

View File

@ -65,7 +65,8 @@ struct c4iw_create_cq_resp {
}; };
enum { enum {
C4IW_QPF_ONCHIP = (1 << 0) C4IW_QPF_ONCHIP = (1 << 0),
C4IW_QPF_WRITE_W_IMM = (1 << 1)
}; };
struct c4iw_create_qp_resp { struct c4iw_create_qp_resp {