RE: [PATCH rdma-core] libqedr: add support for SRQ's

"Bason, Yuval" <Yuval.Bason@xxxxxxxxxx> · Tue, 10 Jul 2018 09:28:45 +0000



> From: Leon Romanovsky [mailto:leon@xxxxxxxxxx]
> Sent: Monday, July 9, 2018 10:03 AM
> On Sun, Jul 08, 2018 at 03:27:03PM +0300, Yuval Bason wrote:
> > From: Yuval Bason <Yuval.Bason@xxxxxxxxxx>
> >
> > Enable SRQ's for rdma-core.
> >
> 
> This patch will be applied in rdma-core, so there is no need to mention
> "rdma-core" in commit message.
> 
> > SRQ rdma-core implementation is pretty straight forward, except
> > perhaps the Way that the driver udpates FW producers: they are updated
> > using a mapped buffer that FW reads, and not doorbells Like RQ / SQ.
> >
> > Signed-off-by: Yuval Bason <yuval.bason@xxxxxxxxxx>
> > Signed-off-by: Michal Kalderon <michal.kalderon@xxxxxxxxxx>
> > ---
> >  kernel-headers/rdma/qedr-abi.h |  15 ++
> >  providers/qedr/qelr.h          |  43 ++++++
> >  providers/qedr/qelr_abi.h      |   2 +
> >  providers/qedr/qelr_main.c     |   7 +
> >  providers/qedr/qelr_verbs.c    | 337
> +++++++++++++++++++++++++++++++++++++++++
> >  providers/qedr/qelr_verbs.h    |   9 ++
> >  providers/qedr/rdma_common.h   |   1 +
> >  7 files changed, 414 insertions(+)
> >
> > diff --git a/kernel-headers/rdma/qedr-abi.h
> > b/kernel-headers/rdma/qedr-abi.h index 24c658b..9031344 100644
> > --- a/kernel-headers/rdma/qedr-abi.h
> > +++ b/kernel-headers/rdma/qedr-abi.h
> > @@ -111,4 +111,19 @@ struct qedr_create_qp_uresp {
> >  	__u32 reserved;
> >  };
> >
> > +struct qedr_create_srq_ureq {
> > +	/* user space virtual address of producer pair */
> > +	__u64 prod_pair_addr;
> > +
> > +	/* SRQ */
> > +	__u64 srq_addr;		/* user space virtual address of SRQ
> buffer */
> > +	__u64 srq_len;		/* length of SRQ buffer */
> > +};
> > +
> > +struct qedr_create_srq_uresp {
> > +	__u16 srq_id;
> > +	__u16 reserved0;
> > +	__u32 reserved1;
> > +};
> 
> Please provide separate commit in proper format for changes in kernel-
> headers folder. Use kernel-headers/update script for that.
Thanks, wasn't aware of this script.
> 
> > +
> >  #endif /* __QEDR_USER_H__ */
> > diff --git a/providers/qedr/qelr.h b/providers/qedr/qelr.h index
> > 0b2e4a2..eeebfe0 100644
> > --- a/providers/qedr/qelr.h
> > +++ b/providers/qedr/qelr.h
> > @@ -61,6 +61,7 @@ enum DP_MODULE {
> >  	QELR_MSG_QP		= (QELR_MSG_SQ | QELR_MSG_RQ),
> >  	QELR_MSG_MR		= 0x80000,
> >  	QELR_MSG_INIT		= 0x100000,
> > +	QELR_MSG_SRQ		= 0x200000,
> >  	/* to be added...up to 0x8000000 */
> >  };
> >
> > @@ -128,8 +129,10 @@ struct qelr_devctx {
> >
> >  	uint32_t		max_send_wr;
> >  	uint32_t		max_recv_wr;
> > +	uint32_t		max_srq_wr;
> >  	uint32_t		sges_per_send_wr;
> >  	uint32_t		sges_per_recv_wr;
> > +	uint32_t		sges_per_srq_wr;
> >  	int			max_cqes;
> >  };
> >
> > @@ -221,6 +224,27 @@ struct qelr_dpm {
> >  	struct qelr_rdma_ext    *rdma_ext;
> >  };
> >
> > +struct qelr_srq_hwq_info {
> > +	uint32_t max_sges;
> > +	uint32_t max_wr;
> > +	struct qelr_chain chain;
> > +	uint32_t wqe_prod;     /* WQE prod index in HW ring */
> > +	uint32_t sge_prod;     /* SGE prod index in HW ring */
> > +	uint32_t wr_prod_cnt;  /* wr producer count */
> > +	uint32_t wr_cons_cnt;  /* wr consumer count */
> > +	uint32_t num_elems;
> > +
> > +	void  *virt_prod_pair_addr;  /* producer pair virtual address */
> > +	uint64_t phy_prod_pair_addr; /* producer pair physical address */ };
> > +
> > +struct qelr_srq {
> > +	struct ibv_srq ibv_srq;
> > +	struct qelr_srq_hwq_info hw_srq;
> > +	uint16_t srq_id;
> > +	pthread_spinlock_t lock;
> > +};
> > +
> >  struct qelr_qp {
> >  	struct ibv_qp				ibv_qp;
> >  	pthread_spinlock_t			q_lock;
> > @@ -247,6 +271,7 @@ struct qelr_qp {
> >  	int					sq_sig_all;
> >  	int					atomic_supported;
> >  	uint8_t					edpm_disabled;
> > +	struct qelr_srq				*srq;
> >  };
> >
> >  static inline struct qelr_devctx *get_qelr_ctx(struct ibv_context
> > *ibctx) @@ -274,6 +299,11 @@ static inline struct qelr_cq
> *get_qelr_cq(struct ibv_cq *ibcq)
> >  	return container_of(ibcq, struct qelr_cq, ibv_cq);  }
> >
> > +static inline struct qelr_srq *get_qelr_srq(struct ibv_srq *ibsrq) {
> > +	return container_of(ibsrq, struct qelr_srq, ibv_srq); }
> > +
> >  #define SET_FIELD(value, name, flag)				\
> >  	do {							\
> >  		(value) &= ~(name ## _MASK << name ## _SHIFT);	\
> > @@ -308,6 +338,19 @@ static inline struct qelr_cq *get_qelr_cq(struct
> ibv_cq *ibcq)
> >  		(sge)->flags = htole32(vflags);		\
> >  	} while (0)
> >
> > +#define SRQ_HDR_SET(hdr, vwr_id, num_sge)			\
> > +	do {							\
> > +		TYPEPTR_ADDR_SET(hdr, wr_id, vwr_id);		\
> > +		(hdr)->num_sges = num_sge;			\
> > +	} while (0)
> > +
> > +#define SRQ_SGE_SET(sge, vaddr, vlength, vlkey)			\
> > +	do {							\
> > +		TYPEPTR_ADDR_SET(sge, addr, vaddr);		\
> > +		(sge)->length = htole32(vlength);		\
> > +		(sge)->l_key = htole32(vlkey);		\
> > +	} while (0)
> > +
> >  #define U64_HI(val) ((uint32_t)(((uint64_t)(uintptr_t)(val)) >> 32))
> > #define U64_LO(val) ((uint32_t)(((uint64_t)(uintptr_t)(val)) &
> > 0xffffffff))  #define HILO_U64(hi, lo) ((uintptr_t)((((uint64_t)(hi))
> > << 32) + (lo))) diff --git a/providers/qedr/qelr_abi.h
> > b/providers/qedr/qelr_abi.h index 3666845..c674ddc 100644
> > --- a/providers/qedr/qelr_abi.h
> > +++ b/providers/qedr/qelr_abi.h
> > @@ -49,5 +49,7 @@ DECLARE_DRV_CMD(qelr_get_context,
> IB_USER_VERBS_CMD_GET_CONTEXT,
> >  		empty, qedr_alloc_ucontext_resp);
> >  DECLARE_DRV_CMD(qelr_reg_mr, IB_USER_VERBS_CMD_REG_MR,
> >  		empty, empty);
> > +DECLARE_DRV_CMD(qelr_create_srq,
> IB_USER_VERBS_CMD_CREATE_SRQ,
> > +		qedr_create_srq_ureq, qedr_create_srq_uresp);
> >
> >  #endif /* __QELR_ABI_H__ */
> > diff --git a/providers/qedr/qelr_main.c b/providers/qedr/qelr_main.c
> > index e99fc88..40742fb 100644
> > --- a/providers/qedr/qelr_main.c
> > +++ b/providers/qedr/qelr_main.c
> > @@ -96,6 +96,11 @@ static const struct verbs_context_ops qelr_ctx_ops =
> {
> >  	.query_qp = qelr_query_qp,
> >  	.modify_qp = qelr_modify_qp,
> >  	.destroy_qp = qelr_destroy_qp,
> > +	.create_srq = qelr_create_srq,
> > +	.destroy_srq = qelr_destroy_srq,
> > +	.modify_srq = qelr_modify_srq,
> > +	.query_srq = qelr_query_srq,
> > +	.post_srq_recv = qelr_post_srq_recv,
> >  	.post_send = qelr_post_send,
> >  	.post_recv = qelr_post_recv,
> >  	.async_event = qelr_async_event,
> > @@ -183,8 +188,10 @@ static struct verbs_context
> *qelr_alloc_context(struct ibv_device *ibdev,
> >  	ctx->db_size = resp.db_size;
> >  	ctx->max_send_wr = resp.max_send_wr;
> >  	ctx->max_recv_wr = resp.max_recv_wr;
> > +	ctx->max_srq_wr = resp.max_srq_wr;
> >  	ctx->sges_per_send_wr = resp.sges_per_send_wr;
> >  	ctx->sges_per_recv_wr = resp.sges_per_recv_wr;
> > +	ctx->sges_per_srq_wr = resp.sges_per_recv_wr;
> >  	ctx->max_cqes = resp.max_cqes;
> >
> >  	ctx->db_addr = mmap(NULL, ctx->db_size, PROT_WRITE,
> MAP_SHARED, diff
> > --git a/providers/qedr/qelr_verbs.c b/providers/qedr/qelr_verbs.c
> > index 28ea094..4bd155d 100644
> > --- a/providers/qedr/qelr_verbs.c
> > +++ b/providers/qedr/qelr_verbs.c
> > @@ -61,6 +61,7 @@
> >
> >  #define IS_IWARP(_dev)		(_dev->node_type ==
> IBV_NODE_RNIC)
> >  #define IS_ROCE(_dev)		(_dev->node_type ==
> IBV_NODE_CA)
> > +#define HILO_64(hi, lo) ((((uint64_t)(hi)) << 32) + (lo))
> 
> This is one-time-use macro, let's don't obfuscate code without reason.
Will fix.
> 
> >
> >  static void qelr_inc_sw_cons_u16(struct qelr_qp_hwq_info *info)  { @@
> > -313,6 +314,180 @@ int qelr_destroy_cq(struct ibv_cq *ibv_cq)
> >  	return 0;
> >  }
> >
> 
> Please clean both functions below to follow common style, like hfi1,
> mlx4, mlx5, rxe, mthca, ocrdma, rxe and vmw_pvrdma did.
Will fix for this patch and take more notice for next patches.
> 
> > +int qelr_query_srq(struct ibv_srq *ibv_srq, struct ibv_srq_attr *attr)
> > +{
> > +	struct qelr_devctx *cxt = get_qelr_ctx(ibv_srq->context);
> > +	struct qelr_srq *srq = get_qelr_srq(ibv_srq);
> > +	struct ibv_query_srq cmd;
> > +	int rc;
> > +
> > +	rc = ibv_cmd_query_srq(ibv_srq, attr, &cmd, sizeof(cmd));
> > +	if (rc) {
> > +		DP_ERR(cxt->dbg_fp, "query srq: failed to query %p, got
> %d.\n",
> > +		       srq, rc);
> > +		return rc;
> > +	}
> > +
> > +	DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +		   "query srq: successfully queried %p\n", srq);
> > +
> > +	return 0;
> > +}
> > +
> > +int qelr_modify_srq(struct ibv_srq *ibv_srq, struct ibv_srq_attr *attr,
> > +		    int attr_mask)
> > +{
> > +	struct qelr_devctx *cxt = get_qelr_ctx(ibv_srq->context);
> > +	struct qelr_srq *srq = get_qelr_srq(ibv_srq);
> > +	struct ibv_modify_srq cmd;
> > +	int rc;
> > +
> > +	rc = ibv_cmd_modify_srq(ibv_srq, attr, attr_mask, &cmd,
> sizeof(cmd));
> > +	if (rc) {
> > +		DP_ERR(cxt->dbg_fp,
> > +		       "modify srq: failed to modify %p, got %d.\n", srq, rc);
> > +		return rc;
> > +	}
> > +
> > +	DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +		   "modify srq: successfully modified %p\n", srq);
> > +
> > +	return 0;
> > +}
> > +
> > +static void qelr_destroy_srq_buffers(struct ibv_srq *ibv_srq)
> > +{
> > +	struct qelr_srq *srq = get_qelr_srq(ibv_srq);
> > +	uint32_t *virt_prod_pair_addr;
> > +	uint32_t prod_size;
> > +
> > +	qelr_chain_free(&srq->hw_srq.chain);
> > +
> > +	virt_prod_pair_addr = srq->hw_srq.virt_prod_pair_addr;
> > +	prod_size = sizeof(struct rdma_srq_producers);
> > +
> > +	ibv_dofork_range(virt_prod_pair_addr, prod_size);
> > +	munmap(virt_prod_pair_addr, prod_size);
> > +}
> > +
> > +int qelr_destroy_srq(struct ibv_srq *ibv_srq)
> > +{
> > +	struct qelr_devctx *cxt = get_qelr_ctx(ibv_srq->context);
> > +	struct qelr_srq *srq = get_qelr_srq(ibv_srq);
> > +	int rc;
> > +
> > +	rc = ibv_cmd_destroy_srq(ibv_srq);
> > +	if (rc) {
> > +		DP_ERR(cxt->dbg_fp,
> > +		       "destroy srq: failed to destroy %p, got %d.\n", srq, rc);
> > +		return rc;
> > +	}
> > +
> > +	DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +		   "destroy srq: successfully destroyed %p\n", srq);
> > +
> > +	qelr_destroy_srq_buffers(ibv_srq);
> > +	free(srq);
> > +
> > +	return 0;
> > +}
> 
> The same comment as before, please use common style.
> 
> > +
> > +static inline void
> > +qelr_create_srq_configure_req(struct qelr_srq *srq,
> > +			      struct qelr_create_srq *req)
> > +{
> > +	req->srq_addr = (uintptr_t)srq->hw_srq.chain.first_addr;
> > +	req->srq_len = srq->hw_srq.chain.size;
> > +	req->prod_pair_addr = (uintptr_t)srq->hw_srq.virt_prod_pair_addr;
> > +}
> > +
> > +static inline int qelr_create_srq_buffers(struct qelr_devctx *cxt,
> > +					  struct qelr_srq *srq,
> > +					  struct ibv_srq_init_attr *attrs)
> > +{
> > +	uint32_t max_wr, max_sges;
> > +	int chain_size, prod_size;
> > +	void *addr;
> > +	int rc;
> > +
> > +	max_wr = attrs->attr.max_wr;
> > +	if (!max_wr)
> > +		return -EINVAL;
> > +
> > +	max_wr = min_t(uint32_t, max_wr, cxt->max_srq_wr);
> > +	max_sges = max_wr * (cxt->sges_per_srq_wr + 1); /* +1 for header
> */
> > +	chain_size = max_sges * QELR_RQE_ELEMENT_SIZE;
> > +
> > +	rc = qelr_chain_alloc(&srq->hw_srq.chain, chain_size,
> > +			      cxt->kernel_page_size,
> QELR_RQE_ELEMENT_SIZE);
> > +	if (rc) {
> > +		DP_ERR(cxt->dbg_fp,
> > +		       "create srq: failed to map srq, got %d", rc);
> > +		return rc;
> > +	}
> > +
> > +	prod_size = sizeof(struct rdma_srq_producers);
> > +	addr = mmap(NULL, prod_size, PROT_READ | PROT_WRITE,
> > +		    MAP_PRIVATE | MAP_ANONYMOUS, -1,
> > +		    0);
> > +	if (addr == MAP_FAILED) {
> > +		DP_ERR(cxt->dbg_fp,
> > +		       "create srq: failed to map producer, got %d", errno);
> > +		qelr_chain_free(&srq->hw_srq.chain);
> > +		return errno;
> > +	}
> > +
> > +	rc = ibv_dontfork_range(addr, prod_size);
> > +	if (rc) {
> > +		munmap(addr, prod_size);
> > +		qelr_chain_free(&srq->hw_srq.chain);
> > +		return rc;
> > +	}
> > +
> > +	srq->hw_srq.virt_prod_pair_addr = addr;
> > +	srq->hw_srq.max_sges = cxt->sges_per_srq_wr;
> > +	srq->hw_srq.max_wr = max_wr;
> > +
> > +	return 0;
> > +}
> > +
> > +struct ibv_srq *qelr_create_srq(struct ibv_pd *pd,
> > +				struct ibv_srq_init_attr *init_attr)
> > +{
> > +	struct qelr_devctx *cxt = get_qelr_ctx(pd->context);
> > +	struct qelr_create_srq req;
> > +	struct qelr_create_srq_resp resp;
> > +	struct qelr_srq *srq;
> > +	int rc, status = 0;
> > +
> > +	srq = calloc(1, sizeof(*srq));
> > +	if (!srq)
> > +		goto err0;
> > +
> > +	rc = qelr_create_srq_buffers(cxt, srq, init_attr);
> > +	if (rc)
> > +		goto err1;
> > +
> > +	pthread_spin_init(&srq->lock, PTHREAD_PROCESS_PRIVATE);
> > +	qelr_create_srq_configure_req(srq, &req);
> > +	status = ibv_cmd_create_srq(pd, &srq->ibv_srq, init_attr,
> &req.ibv_cmd,
> > +				    sizeof(req), &resp.ibv_resp, sizeof(resp));
> > +	if (status)
> > +		goto err1;
> > +
> > +	DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +		   "create srq: successfully created %p.\n", srq);
> > +	return &srq->ibv_srq;
> > +
> > +err1:
> > +	qelr_destroy_srq_buffers(&srq->ibv_srq);
> > +	free(srq);
> > +err0:
> > +	DP_ERR(cxt->dbg_fp,
> > +	       "create srq: failed to create %p.\n", srq);
> 
> Does this code work? The amount of debug prints is astonishing for
> library which is going to be installed in all modern distributions.
Note taken. Will revisit.
> 
> > +	return NULL;
> > +}
> > +
> >  static void qelr_free_rq(struct qelr_qp *qp)
> >  {
> >  	free(qp->rqe_wr_id);
> > @@ -333,6 +508,11 @@ static void qelr_chain_free_rq(struct qelr_qp *qp)
> >  	qelr_chain_free(&qp->rq.chain);
> >  }
> >
> > +static inline bool qelr_qp_has_srq(struct qelr_qp *qp)
> > +{
> > +	return !!qp->srq;
> > +}
> > +
> 
> Please don't obfuscate code, there is no need to add such trivial check
> as inline function in driver code.
Will fix.
> 
> >  static inline int qelr_create_qp_buffers_sq(struct qelr_devctx *cxt,
> >  					    struct qelr_qp *qp,
> >  					    struct ibv_qp_init_attr *attrs)
> > @@ -531,6 +711,9 @@ struct ibv_qp *qelr_create_qp(struct ibv_pd *pd,
> >  	if (!qp)
> >  		return NULL;
> >
> > +	if (attrs->srq)
> > +		qp->srq = get_qelr_srq(attrs->srq);
> > +
> >  	rc = qelr_create_qp_buffers(cxt, qp, attrs);
> >  	if (rc)
> >  		goto err0;
> > @@ -1485,6 +1668,107 @@ int qelr_post_send(struct ibv_qp *ib_qp, struct
> ibv_send_wr *wr,
> >  	return rc;
> >  }
> >
> > +static uint32_t qelr_srq_elem_left(struct qelr_srq_hwq_info *hw_srq)
> > +{
> > +	uint32_t used;
> > +
> > +	/* Calculate number of elements used based on producer
> > +	 * count and consumer count and subtract it from max
> > +	 * work request supported so that we get elements left.
> > +	 */
> > +	used = (uint32_t)(((uint64_t)((uint64_t)~0U) + 1 +
> > +			  (uint64_t)(hw_srq->wr_prod_cnt)) -
> > +			  (uint64_t)hw_srq->wr_cons_cnt);
> > +
> > +	return hw_srq->max_wr - used;
> > +}
> > +
> > +int qelr_post_srq_recv(struct ibv_srq *ibsrq, struct ibv_recv_wr *wr,
> > +		       struct ibv_recv_wr **bad_wr)
> > +{
> > +	struct qelr_devctx *cxt = get_qelr_ctx(ibsrq->context);
> > +	struct qelr_srq *srq = get_qelr_srq(ibsrq);
> > +	struct qelr_srq_hwq_info *hw_srq = &srq->hw_srq;
> > +	struct qelr_chain *chain;
> > +	int status = 0;
> > +
> > +	pthread_spin_lock(&srq->lock);
> > +
> > +	chain = &srq->hw_srq.chain;
> > +	while (wr) {
> > +		struct rdma_srq_wqe_header *hdr;
> > +		int i;
> > +
> > +		if (!qelr_srq_elem_left(hw_srq) ||
> > +		    wr->num_sge > srq->hw_srq.max_sges) {
> > +			DP_ERR(cxt->dbg_fp,
> > +			       "Can't post WR  (%d,%d) || (%d > %d)\n",
> > +			       hw_srq->wr_prod_cnt, hw_srq->wr_cons_cnt,
> > +			       wr->num_sge,
> > +			       srq->hw_srq.max_sges);
> > +			status = -ENOMEM;
> > +			*bad_wr = wr;
> > +			break;
> > +		}
> > +
> > +		hdr = qelr_chain_produce(chain);
> > +
> > +		/* Set number of sge and work request id in header */
> > +		SRQ_HDR_SET(hdr, wr->wr_id, wr->num_sge);
> > +
> > +		/* PBL is maintained in case of WR granularity.
> > +		 * So increment WR producer in case we post a WR.
> > +		 */
> > +		hw_srq->wr_prod_cnt++;
> > +		hw_srq->wqe_prod++;
> > +		hw_srq->sge_prod++;
> > +
> > +		DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +			   "SRQ WR: SGEs: %d with wr_id[%d] = %lx\n",
> > +			    wr->num_sge, hw_srq->wqe_prod, wr->wr_id);
> > +
> > +		for (i = 0; i < wr->num_sge; i++) {
> > +			struct rdma_srq_sge *srq_sge;
> > +
> > +			srq_sge = qelr_chain_produce(chain);
> > +			/* Set SGE length, lkey and address */
> > +			SRQ_SGE_SET(srq_sge, wr->sg_list[i].addr,
> > +				    wr->sg_list[i].length, wr->sg_list[i].lkey);
> > +
> > +			DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +				   "[%d]: len %d key %x addr %x:%x\n",
> > +				   i, srq_sge->length, srq_sge->l_key,
> > +				   srq_sge->addr.hi, srq_sge->addr.lo);
> > +			hw_srq->sge_prod++;
> > +		}
> > +
> > +		/* Flush WQE and SGE information before updating producer
> */
> > +		mmio_wc_start();
> > +
> > +		/* SRQ producer is 8 bytes. Need to update SGE producer
> index
> > +		 * in first 4 bytes and need to update WQE producer in
> > +		 * next 4 bytes.
> > +		 */
> > +
> > +		struct rdma_srq_producers *virt_prod;
> > +
> > +		virt_prod = srq->hw_srq.virt_prod_pair_addr;
> > +		virt_prod->sge_prod = hw_srq->sge_prod;
> > +		virt_prod->wqe_prod = hw_srq->wqe_prod;
> > +
> > +		/* Flush producer after updating it. */
> > +		mmio_flush_writes();
> > +		wr = wr->next;
> > +	}
> > +
> > +	DP_VERBOSE(cxt->dbg_fp, QELR_MSG_SRQ,
> > +		   "POST: Elements in SRQ: %d\n",
> > +		   qelr_chain_get_elem_left_u32(chain));
> > +	pthread_spin_unlock(&srq->lock);
> > +
> > +	return status;
> > +}
> > +
> >  int qelr_post_recv(struct ibv_qp *ibqp, struct ibv_recv_wr *wr,
> >  		   struct ibv_recv_wr **bad_wr)
> >  {
> > @@ -1494,6 +1778,13 @@ int qelr_post_recv(struct ibv_qp *ibqp, struct
> ibv_recv_wr *wr,
> >  	uint16_t db_val;
> >  	uint8_t iwarp = IS_IWARP(ibqp->context->device);
> >
> > +	if (unlikely(qelr_qp_has_srq(qp))) {
> 
> Does this unlikely gain anything?
I guess performance wise not much, but this is indeed unlikely condition. 
> 
> > +		DP_ERR(cxt->dbg_fp,
> > +		       "QP is associated with SRQ, cannot post RQ buffers\n");
> > +		*bad_wr = wr;
> > +		return -EINVAL;
> > +	}
> > +
> >  	pthread_spin_lock(&qp->q_lock);
> >
> >  	if (!iwarp && qp->state == QELR_QPS_RST) {
> > @@ -1826,6 +2117,32 @@ static void __process_resp_one(struct qelr_qp
> *qp, struct qelr_cq *cq,
> >  	wc->qp_num = qp->qp_id;
> >  }
> >
> > +static int process_resp_one_srq(struct qelr_qp *qp, struct qelr_cq *cq,
> > +				struct ibv_wc *wc,
> > +				struct rdma_cqe_responder *resp)
> > +{
> > +	struct qelr_srq_hwq_info *hw_srq = &qp->srq->hw_srq;
> > +	uint64_t wr_id;
> > +
> > +	wr_id = HILO_64(resp->srq_wr_id.hi, resp->srq_wr_id.lo);
> > +
> > +	if (resp->status ==
> RDMA_CQE_RESP_STS_WORK_REQUEST_FLUSHED_ERR) {
> > +		wc->byte_len = 0;
> > +		wc->status = IBV_WC_WR_FLUSH_ERR;
> > +		wc->qp_num = qp->qp_id;
> > +		wc->wr_id = wr_id;
> > +	} else {
> > +		__process_resp_one(qp, cq, wc, resp, wr_id);
> > +	}
> > +
> > +	/* PBL is maintained in case of WR granularity.
> > +	 * So increment WR consumer after consuming WR
> > +	 */
> > +	hw_srq->wr_cons_cnt++;
> > +
> > +	return 1;
> > +}
> > +
> >  static int process_resp_one(struct qelr_qp *qp, struct qelr_cq *cq,
> >  			    struct ibv_wc *wc, struct rdma_cqe_responder
> *resp)
> >  {
> > @@ -1891,6 +2208,19 @@ static void try_consume_resp_cqe(struct
> qelr_cq *cq, struct qelr_qp *qp,
> >  	}
> >  }
> >
> > +static int qelr_poll_cq_resp_srq(struct qelr_qp *qp, struct qelr_cq *cq,
> > +				 int num_entries, struct ibv_wc *wc,
> > +				 struct rdma_cqe_responder *resp, int
> *update)
> > +{
> > +	int cnt;
> > +
> > +	cnt = process_resp_one_srq(qp, cq, wc, resp);
> > +	consume_cqe(cq);
> > +	*update |= 1;
> > +
> > +	return cnt;
> > +}
> > +
> >  static int qelr_poll_cq_resp(struct qelr_qp *qp, struct qelr_cq *cq,
> >  			     int num_entries, struct ibv_wc *wc,
> >  			     struct rdma_cqe_responder *resp, int *update)
> > @@ -1952,6 +2282,10 @@ int qelr_poll_cq(struct ibv_cq *ibcq, int
> num_entries, struct ibv_wc *wc)
> >  			cnt = qelr_poll_cq_resp(qp, cq, num_entries, wc,
> >  						&cqe->resp, &update);
> >  			break;
> > +		case RDMA_CQE_TYPE_RESPONDER_SRQ:
> > +			cnt = qelr_poll_cq_resp_srq(qp, cq, num_entries,
> wc,
> > +						    &cqe->resp, &update);
> > +			break;
> >  		case RDMA_CQE_TYPE_INVALID:
> >  		default:
> >  			printf("Error: invalid CQE type = %d\n",
> > @@ -2018,6 +2352,9 @@ void qelr_async_event(struct ibv_async_event
> *event)
> >  	case IBV_EVENT_COMM_EST:
> >  	case IBV_EVENT_QP_LAST_WQE_REACHED:
> >  		break;
> > +	case IBV_EVENT_SRQ_LIMIT_REACHED:
> > +	case IBV_EVENT_SRQ_ERR:
> 
> If you are here, please put /* fail through */ comment for gcc-7.
> 
> > +		return;
> >  	case IBV_EVENT_PORT_ACTIVE:
> >  	case IBV_EVENT_PORT_ERR:
> >  		break;
> > diff --git a/providers/qedr/qelr_verbs.h b/providers/qedr/qelr_verbs.h
> > index 50d1182..26802c3 100644
> > --- a/providers/qedr/qelr_verbs.h
> > +++ b/providers/qedr/qelr_verbs.h
> > @@ -73,5 +73,14 @@ int qelr_post_send(struct ibv_qp *ib_qp, struct
> ibv_send_wr *wr,
> >  int qelr_post_recv(struct ibv_qp *ibqp, struct ibv_recv_wr *wr,
> >  		   struct ibv_recv_wr **bad_wr);
> >
> > +int qelr_query_srq(struct ibv_srq *ibv_srq, struct ibv_srq_attr *attr);
> > +int qelr_modify_srq(struct ibv_srq *ibv_srq, struct ibv_srq_attr *attr,
> > +		    int attr_mask);
> > +struct ibv_srq *qelr_create_srq(struct ibv_pd *pd,
> > +				struct ibv_srq_init_attr *init_attr);
> > +int qelr_destroy_srq(struct ibv_srq *ibv_srq);
> > +int qelr_post_srq_recv(struct ibv_srq *ibsrq, struct ibv_recv_wr *wr,
> > +		       struct ibv_recv_wr **bad_wr);
> > +
> >  void qelr_async_event(struct ibv_async_event *event);
> >  #endif /* __QELR_VERBS_H__ */
> > diff --git a/providers/qedr/rdma_common.h
> b/providers/qedr/rdma_common.h
> > index 0707e17..f2d76bb 100644
> > --- a/providers/qedr/rdma_common.h
> > +++ b/providers/qedr/rdma_common.h
> > @@ -53,6 +53,7 @@
> >  #define RDMA_MAX_CQS				(64*1024)
> >  #define RDMA_MAX_TIDS				(128*1024-1)
> >  #define RDMA_MAX_PDS				(64*1024)
> > +#define RDMA_MAX_SRQS				(32*1024)
> >
> >  #define RDMA_NUM_STATISTIC_COUNTERS
> 	MAX_NUM_VPORTS
> >  #define RDMA_NUM_STATISTIC_COUNTERS_K2
> 	MAX_NUM_VPORTS_K2
> > --
> > 2.9.5
> >
> > --
> > To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
> > the body of a message to majordomo@xxxxxxxxxxxxxxx
> > More majordomo info at  http://vger.kernel.org/majordomo-info.html
--
To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html