On Sat, Oct 16, 2021 at 08:06:21PM -0600, Jens Axboe wrote: > Take advantage of struct io_comp_batch, if passed in to the nvme poll > handler. If it's set, rather than complete each request individually > inline, store them in the io_comp_batch list. We only do so for requests > that will complete successfully, anything else will be completed inline as > before. > > Signed-off-by: Jens Axboe <axboe@xxxxxxxxx> > --- > drivers/nvme/host/core.c | 17 ++++++++++++++--- > drivers/nvme/host/nvme.h | 14 ++++++++++++++ > drivers/nvme/host/pci.c | 31 +++++++++++++++++++++++++------ > 3 files changed, 53 insertions(+), 9 deletions(-) > > diff --git a/drivers/nvme/host/core.c b/drivers/nvme/host/core.c > index c2c2e8545292..4eadecc67c91 100644 > --- a/drivers/nvme/host/core.c > +++ b/drivers/nvme/host/core.c > @@ -346,15 +346,19 @@ static inline enum nvme_disposition nvme_decide_disposition(struct request *req) > return RETRY; > } > > -static inline void nvme_end_req(struct request *req) > +static inline void nvme_end_req_zoned(struct request *req) > { > - blk_status_t status = nvme_error_status(nvme_req(req)->status); > - > if (IS_ENABLED(CONFIG_BLK_DEV_ZONED) && > req_op(req) == REQ_OP_ZONE_APPEND) > req->__sector = nvme_lba_to_sect(req->q->queuedata, > le64_to_cpu(nvme_req(req)->result.u64)); > +} > + > +static inline void nvme_end_req(struct request *req) > +{ > + blk_status_t status = nvme_error_status(nvme_req(req)->status); > > + nvme_end_req_zoned(req); > nvme_trace_bio_complete(req); > blk_mq_end_request(req, status); > } > @@ -381,6 +385,13 @@ void nvme_complete_rq(struct request *req) > } > EXPORT_SYMBOL_GPL(nvme_complete_rq); > > +void nvme_complete_batch_req(struct request *req) > +{ > + nvme_cleanup_cmd(req); > + nvme_end_req_zoned(req); > +} > +EXPORT_SYMBOL_GPL(nvme_complete_batch_req); > + > /* > * Called to unwind from ->queue_rq on a failed command submission so that the > * multipathing code gets called to potentially failover to another path. > diff --git a/drivers/nvme/host/nvme.h b/drivers/nvme/host/nvme.h > index ed79a6c7e804..ef2467b93adb 100644 > --- a/drivers/nvme/host/nvme.h > +++ b/drivers/nvme/host/nvme.h > @@ -638,6 +638,20 @@ static inline bool nvme_is_aen_req(u16 qid, __u16 command_id) > } > > void nvme_complete_rq(struct request *req); > +void nvme_complete_batch_req(struct request *req); > + > +static __always_inline void nvme_complete_batch(struct io_comp_batch *iob, > + void (*fn)(struct request *rq)) > +{ > + struct request *req; > + > + rq_list_for_each(&iob->req_list, req) { > + fn(req); > + nvme_complete_batch_req(req); > + } > + blk_mq_end_request_batch(iob); > +} > + > blk_status_t nvme_host_path_error(struct request *req); > bool nvme_cancel_request(struct request *req, void *data, bool reserved); > void nvme_cancel_tagset(struct nvme_ctrl *ctrl); > diff --git a/drivers/nvme/host/pci.c b/drivers/nvme/host/pci.c > index d1ab9250101a..e916d5e167c1 100644 > --- a/drivers/nvme/host/pci.c > +++ b/drivers/nvme/host/pci.c > @@ -959,7 +959,7 @@ static blk_status_t nvme_queue_rq(struct blk_mq_hw_ctx *hctx, > return ret; > } > > -static void nvme_pci_complete_rq(struct request *req) > +static __always_inline void nvme_pci_unmap_rq(struct request *req) > { > struct nvme_iod *iod = blk_mq_rq_to_pdu(req); > struct nvme_dev *dev = iod->nvmeq->dev; > @@ -969,9 +969,19 @@ static void nvme_pci_complete_rq(struct request *req) > rq_integrity_vec(req)->bv_len, rq_data_dir(req)); > if (blk_rq_nr_phys_segments(req)) > nvme_unmap_data(dev, req); > +} > + > +static void nvme_pci_complete_rq(struct request *req) > +{ > + nvme_pci_unmap_rq(req); > nvme_complete_rq(req); > } > > +static void nvme_pci_complete_batch(struct io_comp_batch *iob) > +{ > + nvme_complete_batch(iob, nvme_pci_unmap_rq); > +} > + > /* We read the CQE phase first to check if the rest of the entry is valid */ > static inline bool nvme_cqe_pending(struct nvme_queue *nvmeq) > { > @@ -996,7 +1006,8 @@ static inline struct blk_mq_tags *nvme_queue_tagset(struct nvme_queue *nvmeq) > return nvmeq->dev->tagset.tags[nvmeq->qid - 1]; > } > > -static inline void nvme_handle_cqe(struct nvme_queue *nvmeq, u16 idx) > +static inline void nvme_handle_cqe(struct nvme_queue *nvmeq, > + struct io_comp_batch *iob, u16 idx) > { > struct nvme_completion *cqe = &nvmeq->cqes[idx]; > __u16 command_id = READ_ONCE(cqe->command_id); > @@ -1023,7 +1034,9 @@ static inline void nvme_handle_cqe(struct nvme_queue *nvmeq, u16 idx) > } > > trace_nvme_sq(req, cqe->sq_head, nvmeq->sq_tail); > - if (!nvme_try_complete_req(req, cqe->status, cqe->result)) > + if (!nvme_try_complete_req(req, cqe->status, cqe->result) && > + !blk_mq_add_to_batch(req, iob, nvme_req(req)->status, > + nvme_pci_complete_batch)) > nvme_pci_complete_rq(req); > } > > @@ -1039,7 +1052,8 @@ static inline void nvme_update_cq_head(struct nvme_queue *nvmeq) > } > } > > -static inline int nvme_process_cq(struct nvme_queue *nvmeq) > +static inline int nvme_poll_cq(struct nvme_queue *nvmeq, > + struct io_comp_batch *iob) > { > int found = 0; > > @@ -1050,7 +1064,7 @@ static inline int nvme_process_cq(struct nvme_queue *nvmeq) > * the cqe requires a full read memory barrier > */ > dma_rmb(); > - nvme_handle_cqe(nvmeq, nvmeq->cq_head); > + nvme_handle_cqe(nvmeq, iob, nvmeq->cq_head); > nvme_update_cq_head(nvmeq); > } > > @@ -1059,6 +1073,11 @@ static inline int nvme_process_cq(struct nvme_queue *nvmeq) > return found; > } > > +static inline int nvme_process_cq(struct nvme_queue *nvmeq) > +{ > + return nvme_poll_cq(nvmeq, NULL); > + } Extra whitespace here. But I'd prefer to just drop this wrapping, and just add the io_comp_batch argument to nvme_process_cq.