RE: Re: [PATCH for-next v3 07/12] RDMA/erdma: Add verbs header file

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 




> -----Original Message-----
> From: dust.li <dust.li@xxxxxxxxxxxxxxxxx>
> Sent: Tuesday, 22 February 2022 11:41
> To: Cheng Xu <chengyou.xc@xxxxxxxxxxxxxxx>; jgg@xxxxxxxx;
> dledford@xxxxxxxxxx
> Cc: leon@xxxxxxxxxx; linux-rdma@xxxxxxxxxxxxxxx;
> KaiShen@xxxxxxxxxxxxxxxxx; chengyou@xxxxxxxxxxxxxxxxx;
> tonylu@xxxxxxxxxxxxxxxxx
> Subject: [EXTERNAL] Re: [PATCH for-next v3 07/12] RDMA/erdma: Add verbs
> header file
> 
> On Thu, Feb 17, 2022 at 11:01:11AM +0800, Cheng Xu wrote:
> >From: Cheng Xu <chengyou@xxxxxxxxxxxxxxxxx>
> >
> >This header file defines the main structrues and functions used for RDMA
> >Verbs, including qp, cq, mr ucontext, etc,.
> >
> >Signed-off-by: Cheng Xu <chengyou@xxxxxxxxxxxxxxxxx>
> >---
> > drivers/infiniband/hw/erdma/erdma_verbs.h | 345 ++++++++++++++++++++++
> > 1 file changed, 345 insertions(+)
> > create mode 100644 drivers/infiniband/hw/erdma/erdma_verbs.h
> >
> >diff --git a/drivers/infiniband/hw/erdma/erdma_verbs.h
> b/drivers/infiniband/hw/erdma/erdma_verbs.h
> >new file mode 100644
> >index 000000000000..261f8c0bdff3
> >--- /dev/null
> >+++ b/drivers/infiniband/hw/erdma/erdma_verbs.h
> >@@ -0,0 +1,345 @@
> >+/* SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause */
> >+
> >+/* Authors: Cheng Xu <chengyou@xxxxxxxxxxxxxxxxx> */
> >+/*          Kai Shen <kaishen@xxxxxxxxxxxxxxxxx> */
> >+/* Copyright (c) 2020-2022, Alibaba Group. */
> 
> Maybe it's better to use a single '/**/' for multilines in the comment.
> 
> >+
> >+#ifndef __ERDMA_VERBS_H__
> >+#define __ERDMA_VERBS_H__
> >+
> >+#include <linux/errno.h>
> >+
> >+#include <rdma/iw_cm.h>
> >+#include <rdma/ib_verbs.h>
> >+#include <rdma/ib_user_verbs.h>
> >+
> >+#include "erdma.h"
> >+#include "erdma_cm.h"
> >+#include "erdma_hw.h"
> >+
> >+/* RDMA Capbility. */

Capability

> >+#define ERDMA_MAX_PD (128 * 1024)
> >+#define ERDMA_MAX_SEND_WR 4096
> >+#define ERDMA_MAX_ORD 128
> >+#define ERDMA_MAX_IRD 128
> >+#define ERDMA_MAX_SGE_RD 1
> >+#define ERDMA_MAX_FMR 0
> >+#define ERDMA_MAX_SRQ 0 /* not support srq now. */
> >+#define ERDMA_MAX_SRQ_WR 0 /* not support srq now. */
> >+#define ERDMA_MAX_SRQ_SGE 0 /* not support srq now. */
> >+#define ERDMA_MAX_CONTEXT (128 * 1024)
> >+#define ERDMA_MAX_SEND_SGE 6
> >+#define ERDMA_MAX_RECV_SGE 1
> >+#define ERDMA_MAX_INLINE (sizeof(struct erdma_sge) *
> (ERDMA_MAX_SEND_SGE))

Wouldn't it make sense to define MAX_INLINE in
the abi header file? The user level application
also wants to know about it.

And, is the value correct? I did not check how the
user data are carried over, but (from siw) I assume
data are kept in sge[1] .. sge[n-1], and sge[0]
would carry len information and point to sge[1] for
data? With that it would be (ERDMA_MAX_SEND_SGE - 1)
here.


> >+#define ERDMA_MAX_FRMR_PA 512
> >+
> >+enum {
> >+	ERDMA_MMAP_IO_NC = 0, /* no cache */
> >+};
> >+
> >+struct erdma_user_mmap_entry {
> >+	struct rdma_user_mmap_entry rdma_entry;
> >+	u64 address;
> >+	u8 mmap_flag;
> >+};
> >+
> >+struct erdma_ucontext {
> >+	struct ib_ucontext ibucontext;
> >+	struct erdma_dev *dev;
> >+
> >+	u32 sdb_type;
> >+	u32 sdb_idx;
> >+	u32 sdb_page_idx;
> >+	u32 sdb_page_off;
> >+	u64 sdb;
> >+	u64 rdb;
> >+	u64 cdb;
> >+
> >+	struct rdma_user_mmap_entry *sq_db_mmap_entry;
> >+	struct rdma_user_mmap_entry *rq_db_mmap_entry;
> >+	struct rdma_user_mmap_entry *cq_db_mmap_entry;
> >+
> >+	/* doorbell records */
> >+	struct list_head dbrecords_page_list;
> >+	struct mutex dbrecords_page_mutex;
> >+};
> >+
> >+struct erdma_pd {
> >+	struct ib_pd ibpd;
> >+	u32 pdn;
> >+};
> >+
> >+/*
> >+ * MemoryRegion definition.
> >+ */
> >+#define ERDMA_MAX_INLINE_MTT_ENTRIES 4
> >+#define MTT_SIZE(x) (x << 3) /* per mtt takes 8 Bytes. */
> >+#define ERDMA_MR_MAX_MTT_CNT 524288
> >+#define ERDMA_MTT_ENTRY_SIZE 8
> >+
> >+#define ERDMA_MR_TYPE_NORMAL 0
> >+#define ERDMA_MR_TYPE_FRMR 1
> >+#define ERDMA_MR_TYPE_DMA 2
> >+
> >+#define ERDMA_MR_INLINE_MTT 0
> >+#define ERDMA_MR_INDIRECT_MTT 1
> >+
> >+#define ERDMA_MR_ACC_LR BIT(0)
> >+#define ERDMA_MR_ACC_LW BIT(1)
> >+#define ERDMA_MR_ACC_RR BIT(2)
> >+#define ERDMA_MR_ACC_RW BIT(3)
> >+
> >+struct erdma_mem {
> >+	struct ib_umem *umem;
> >+	void *mtt_buf;
> >+	u32 mtt_type;
> >+	u32 page_size;
> >+	u32 page_offset;
> >+	u32 page_cnt;
> >+	u32 mtt_nents;
> >+
> >+	u64 va;
> >+	u64 len;
> >+
> >+	u64 mtt_entry[ERDMA_MAX_INLINE_MTT_ENTRIES];
> >+};
> >+
> >+struct erdma_mr {
> >+	struct ib_mr ibmr;
> >+	struct erdma_mem mem;
> >+	u8 type;
> >+	u8 access;
> >+	u8 valid;
> >+};
> >+
> >+struct erdma_user_dbrecords_page {
> >+	struct list_head list;
> >+	struct ib_umem *umem;
> >+	u64 va;
> >+	int refcnt;
> >+};
> >+
> >+struct erdma_uqp {
> >+	struct erdma_mem sq_mtt;
> >+	struct erdma_mem rq_mtt;
> >+
> >+	dma_addr_t sq_db_info_dma_addr;
> >+	dma_addr_t rq_db_info_dma_addr;
> >+
> >+	struct erdma_user_dbrecords_page *user_dbr_page;
> >+
> >+	u32 rq_offset;
> >+};
> >+struct erdma_kqp {
> >+	u16 sq_pi;
> >+	u16 sq_ci;
> >+
> >+	u16 rq_pi;
> >+	u16 rq_ci;
> >+
> >+	u64 *swr_tbl;
> >+	u64 *rwr_tbl;
> >+
> >+	void *hw_sq_db;
> >+	void *hw_rq_db;
> >+
> >+	void *sq_buf;
> >+	dma_addr_t sq_buf_dma_addr;
> >+
> >+	void *rq_buf;
> >+	dma_addr_t rq_buf_dma_addr;
> >+
> >+	void *sq_db_info;
> >+	void *rq_db_info;
> >+
> >+	u8 sig_all;
> >+};
> >+
> >+enum erdma_qp_state {
> >+	ERDMA_QP_STATE_IDLE = 0,
> >+	ERDMA_QP_STATE_RTR = 1,
> >+	ERDMA_QP_STATE_RTS = 2,
> >+	ERDMA_QP_STATE_CLOSING = 3,
> >+	ERDMA_QP_STATE_TERMINATE = 4,
> >+	ERDMA_QP_STATE_ERROR = 5,
> 
> Do we reserve 6 here on purpose ?
> 
> >+	ERDMA_QP_STATE_UNDEF = 7,
> >+	ERDMA_QP_STATE_COUNT = 8
> >+};
> >+
> >+enum erdma_qp_attr_mask {
> >+	ERDMA_QP_ATTR_STATE = (1 << 0),
> >+	ERDMA_QP_ATTR_LLP_HANDLE = (1 << 2),
> >+	ERDMA_QP_ATTR_ORD = (1 << 3),
> >+	ERDMA_QP_ATTR_IRD = (1 << 4),
> >+	ERDMA_QP_ATTR_SQ_SIZE = (1 << 5),
> >+	ERDMA_QP_ATTR_RQ_SIZE = (1 << 6),
> >+	ERDMA_QP_ATTR_MPA = (1 << 7)
> >+};
> >+
> >+struct erdma_qp_attrs {
> >+	enum erdma_qp_state state;
> >+	u32 sq_size;
> >+	u32 rq_size;
> >+	u32 orq_size;
> >+	u32 irq_size;
> >+	u32 max_send_sge;
> >+	u32 max_recv_sge;
> >+};
> >+
> >+struct erdma_qp {
> >+	struct ib_qp ibqp;
> >+	struct kref ref;
> >+	struct completion safe_free;
> >+	struct erdma_dev *dev;
> >+	struct erdma_cep *cep;
> >+	struct rw_semaphore state_lock;
> >+
> >+	union {
> >+		struct erdma_kqp kern_qp;
> >+		struct erdma_uqp user_qp;
> >+	};
> >+
> >+	struct erdma_cq *scq;
> >+	struct erdma_cq *rcq;
> >+
> >+	struct erdma_qp_attrs attrs;
> >+	spinlock_t lock;
> >+
> >+	enum erdma_cc_method cc_method;
> >+#define ERDMA_QP_ACTIVE 0
> >+#define ERDMA_QP_PASSIVE 1
> >+	u8 qp_type;
> >+	u8 private_data_len;
> >+};
> >+
> >+struct erdma_kcq_info {
> >+	struct erdma_cqe *qbuf;
> >+	dma_addr_t qbuf_dma_addr;
> >+	u32 ci;
> >+	u32 owner;
> >+	u32 cmdsn;
> >+
> >+	spinlock_t lock;
> >+	u8 __iomem *db;
> >+	u64 *db_record;
> >+};
> >+
> >+struct erdma_ucq_info {
> >+	struct erdma_mem qbuf_mtt;
> >+	struct erdma_user_dbrecords_page *user_dbr_page;
> >+	dma_addr_t db_info_dma_addr;
> >+};
> >+
> >+struct erdma_cq {
> >+	struct ib_cq ibcq;
> >+	u32 cqn;
> >+
> >+	u32 depth;
> >+	u32 assoc_eqn;
> >+
> >+	union {
> >+		struct erdma_kcq_info kern_cq;
> >+		struct erdma_ucq_info user_cq;
> >+	};
> >+};
> >+
> >+#define QP_ID(qp) ((qp)->ibqp.qp_num)
> >+
> >+static inline struct erdma_qp *find_qp_by_qpn(struct erdma_dev *dev, int
> id)
> >+{
> >+	return (struct erdma_qp *)xa_load(&dev->qp_xa, id);
> >+}
> >+
> >+static inline struct erdma_cq *find_cq_by_cqn(struct erdma_dev *dev, int
> id)
> >+{
> >+	return (struct erdma_cq *)xa_load(&dev->cq_xa, id);
> >+}
> >+
> >+void erdma_qp_get(struct erdma_qp *qp);
> >+void erdma_qp_put(struct erdma_qp *qp);
> >+int erdma_modify_qp_internal(struct erdma_qp *qp, struct erdma_qp_attrs
> *attrs,
> >+			     enum erdma_qp_attr_mask mask);
> >+void erdma_qp_llp_close(struct erdma_qp *qp);
> >+void erdma_qp_cm_drop(struct erdma_qp *qp);
> >+
> >+static inline struct erdma_ucontext *to_ectx(struct ib_ucontext *ibctx)
> >+{
> >+	return container_of(ibctx, struct erdma_ucontext, ibucontext);
> >+}
> >+
> >+static inline struct erdma_pd *to_epd(struct ib_pd *pd)
> >+{
> >+	return container_of(pd, struct erdma_pd, ibpd);
> >+}
> >+
> >+static inline struct erdma_mr *to_emr(struct ib_mr *ibmr)
> >+{
> >+	return container_of(ibmr, struct erdma_mr, ibmr);
> >+}
> >+
> >+static inline struct erdma_qp *to_eqp(struct ib_qp *qp)
> >+{
> >+	return container_of(qp, struct erdma_qp, ibqp);
> >+}
> >+
> >+static inline struct erdma_cq *to_ecq(struct ib_cq *ibcq)
> >+{
> >+	return container_of(ibcq, struct erdma_cq, ibcq);
> >+}
> >+
> >+static inline struct erdma_user_mmap_entry *
> >+to_emmap(struct rdma_user_mmap_entry *ibmmap)
> >+{
> >+	return container_of(ibmmap, struct erdma_user_mmap_entry,
> rdma_entry);
> >+}
> >+
> >+static inline void *get_sq_entry(struct erdma_qp *qp, u16 idx)
> >+{
> >+	idx &= (qp->attrs.sq_size - 1);
> >+	return qp->kern_qp.sq_buf + (idx << SQEBB_SHIFT);
> >+}
> >+
> >+int erdma_alloc_ucontext(struct ib_ucontext *ctx, struct ib_udata
> *data);
> >+void erdma_dealloc_ucontext(struct ib_ucontext *ctx);
> >+int erdma_query_device(struct ib_device *dev, struct ib_device_attr
> *attr,
> >+		       struct ib_udata *data);
> >+int erdma_get_port_immutable(struct ib_device *dev, u32 port,
> >+			     struct ib_port_immutable *ib_port_immutable);
> >+int erdma_create_cq(struct ib_cq *cq, const struct ib_cq_init_attr
> *attr,
> >+		    struct ib_udata *data);
> >+int erdma_query_port(struct ib_device *dev, u32 port,
> >+		     struct ib_port_attr *attr);
> >+int erdma_query_gid(struct ib_device *dev, u32 port, int idx,
> >+		    union ib_gid *gid);
> >+int erdma_alloc_pd(struct ib_pd *pd, struct ib_udata *data);
> >+int erdma_dealloc_pd(struct ib_pd *ibpd, struct ib_udata *udata);
> >+int erdma_create_qp(struct ib_qp *ibqp, struct ib_qp_init_attr *attr,
> >+		    struct ib_udata *data);
> >+int erdma_query_qp(struct ib_qp *qp, struct ib_qp_attr *attr, int mask,
> >+		   struct ib_qp_init_attr *init_attr);
> >+int erdma_modify_qp(struct ib_qp *qp, struct ib_qp_attr *attr, int mask,
> >+		    struct ib_udata *data);
> >+int erdma_destroy_qp(struct ib_qp *ibqp, struct ib_udata *udata);
> >+int erdma_destroy_cq(struct ib_cq *ibcq, struct ib_udata *udata);
> >+int erdma_req_notify_cq(struct ib_cq *cq, enum ib_cq_notify_flags
> flags);
> >+struct ib_mr *erdma_reg_user_mr(struct ib_pd *ibpd, u64 start, u64 len,
> >+				u64 virt, int access, struct ib_udata *udata);
> >+struct ib_mr *erdma_get_dma_mr(struct ib_pd *ibpd, int rights);
> >+int erdma_dereg_mr(struct ib_mr *mr, struct ib_udata *data);
> >+int erdma_mmap(struct ib_ucontext *ctx, struct vm_area_struct *vma);
> >+void erdma_qp_get_ref(struct ib_qp *qp);
> >+void erdma_qp_put_ref(struct ib_qp *qp);
> >+struct ib_qp *erdma_get_ibqp(struct ib_device *dev, int id);
> >+int erdma_post_send(struct ib_qp *qp, const struct ib_send_wr *send_wr,
> >+		    const struct ib_send_wr **bad_send_wr);
> >+int erdma_post_recv(struct ib_qp *qp, const struct ib_recv_wr *recv_wr,
> >+		    const struct ib_recv_wr **bad_recv_wr);
> >+int erdma_poll_cq(struct ib_cq *cq, int num_entries, struct ib_wc *wc);
> >+struct ib_mr *erdma_ib_alloc_mr(struct ib_pd *ibpd, enum ib_mr_type
> mr_type,
> >+				u32 max_num_sg);
> >+int erdma_map_mr_sg(struct ib_mr *ibmr, struct scatterlist *sg, int
> sg_nents,
> >+		    unsigned int *sg_offset);
> >+struct net_device *erdma_get_netdev(struct ib_device *device, u32
> port_num);
> >+void erdma_port_event(struct erdma_dev *dev, enum ib_event_type reason);
> >+
> >+#endif
> >--
> >2.27.0




[Index of Archives]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Photo]     [Yosemite News]     [Yosemite Photos]     [Linux Kernel]     [Linux SCSI]     [XFree86]

  Powered by Linux