On 3 April 2015 at 13:26, Chuanxiao Dong <chuanxiao.dong@xxxxxxxxx> wrote:
> Use qdepth for mmc request fetching. Currently the request fetching
> mechanism indicate the qdepth is only 2.

This patch certainly needs some more information. Please start by
explaining what the patch does, and then why. That will help me
understand it better.

>
> Signed-off-by: Chuanxiao Dong <chuanxiao.dong@xxxxxxxxx>
> ---
>  drivers/mmc/card/block.c |  43 ++++++----
>  drivers/mmc/card/queue.c | 209 +++++++++++++++++++++++-----------------------
>  drivers/mmc/card/queue.h |   8 +-
>  3 files changed, 139 insertions(+), 121 deletions(-)
>
> diff --git a/drivers/mmc/card/block.c b/drivers/mmc/card/block.c
> index ed62d6b..2407f52 100644
> --- a/drivers/mmc/card/block.c
> +++ b/drivers/mmc/card/block.c
> @@ -122,6 +122,7 @@ struct mmc_blk_data {
>          struct device_attribute force_ro;
>          struct device_attribute power_ro_lock;
>          int area_type;
> +        struct mmc_queue *mq_curr;
>  };
>
>  static DEFINE_MUTEX(open_lock);
> @@ -138,6 +139,7 @@ MODULE_PARM_DESC(perdev_minors, "Minors numbers to allocate per device");
>  static inline int mmc_blk_part_switch(struct mmc_card *card,
>                                        struct mmc_blk_data *md);
>  static int get_card_status(struct mmc_card *card, u32 *status, int retries);
> +static int mmc_blk_issue_rw_rq(struct mmc_queue *mq, struct request *rqc);
>
>  static inline void mmc_blk_clear_packed(struct mmc_queue_req *mqrq)
>  {
> @@ -653,6 +655,13 @@ static inline int mmc_blk_part_switch(struct mmc_card *card,
>          if (mmc_card_mmc(card)) {
>                  u8 part_config = card->ext_csd.part_config;
>
> +                /*
> +                 * before switching partition, needs to make
> +                 * sure there is no active transferring in previous
> +                 * queue
> +                 */
> +                mmc_blk_issue_rw_rq(main_md->mq_curr, NULL);
> +
>                  part_config &= ~EXT_CSD_PART_CONFIG_ACC_MASK;
>                  part_config |= md->part_type;
>
> @@ -666,6 +675,7 @@ static inline int mmc_blk_part_switch(struct mmc_card *card,
>          }
>
>          main_md->part_curr = md->part_type;
> +        main_md->mq_curr = &md->queue;
>          return 0;
>  }
>
> @@ -1827,11 +1837,13 @@ static int mmc_blk_issue_rw_rq(struct mmc_queue *mq, struct request *rqc)
>          const u8 packed_nr = 2;
>          u8 reqs = 0;
>
> -        if (!rqc && !mq->mqrq_prev->req)
> +        if (!rqc && !atomic_read(&mq->active_slots))
>                  return 0;
>
> -        if (rqc)
> +        if (rqc) {
>                  reqs = mmc_blk_prep_packed_list(mq, rqc);
> +                atomic_inc(&mq->active_slots);

"active_slots" - could we try to find a better name for this variable?
It makes me think of HW mmc slots. :-)

> +        }
>
>          do {
>                  if (rqc) {
> @@ -1856,11 +1868,8 @@ static int mmc_blk_issue_rw_rq(struct mmc_queue *mq, struct request *rqc)
>                  } else
>                          areq = NULL;
>                  areq = mmc_start_req(card->host, areq, (int *) &status);
> -                if (!areq) {
> -                        if (status == MMC_BLK_NEW_REQUEST)
> -                                mq->flags |= MMC_QUEUE_NEW_REQUEST;
> +                if (!areq)
>                          return 0;
> -                }
>
>                  mq_rq = container_of(areq, struct mmc_queue_req, mmc_active);
>                  brq = &mq_rq->brq;
> @@ -1968,6 +1977,9 @@ static int mmc_blk_issue_rw_rq(struct mmc_queue *mq, struct request *rqc)
>                          }
>                  }
>          } while (ret);
>
> +        clear_bit_unlock(mq_rq->task_id, &mq->cmdqslot);
> +        atomic_dec(&mq->active_slots);

I noticed that you are using atomic_* to manage the counts for active
slots. Could you elaborate on why this is needed?
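To make the question concrete, the pattern I read out of the patch is
roughly the sketch below: claim a bit in the bitmap with
test_and_set_bit_lock(), bump a counter, and drop both when the request
completes. The names here (slot_ctx, slot_claim, slot_release) are mine,
purely for illustration - they are not part of the patch - and the sketch
assumes the counter really is read from a context other than the queue
thread, as mmc_request_fn() appears to do:

#include <linux/atomic.h>
#include <linux/bitops.h>

/* Illustrative only - mirrors the fields the patch adds to struct mmc_queue. */
struct slot_ctx {
        unsigned long cmdqslot;   /* one bit per outstanding request */
        unsigned long qdepth;     /* number of usable bits */
        atomic_t active;          /* how many bits are currently set */
};

/*
 * Claim a free slot. test_and_set_bit_lock() makes the claim atomic, so
 * two contexts racing for the same bit cannot both win; the loser simply
 * retries with the next free bit.
 */
static bool slot_claim(struct slot_ctx *ctx, unsigned long *slot)
{
        unsigned long bit;

        do {
                bit = find_first_zero_bit(&ctx->cmdqslot, ctx->qdepth);
                if (bit >= ctx->qdepth)
                        return false;   /* all slots busy */
        } while (test_and_set_bit_lock(bit, &ctx->cmdqslot));

        atomic_inc(&ctx->active);
        *slot = bit;
        return true;
}

/* Release a slot once its request has completed. */
static void slot_release(struct slot_ctx *ctx, unsigned long slot)
{
        clear_bit_unlock(slot, &ctx->cmdqslot);
        atomic_dec(&ctx->active);
}

If the count were only ever touched from the mmc queue thread, a plain
int under the queue lock might do; the atomic presumably only pays off
because mmc_request_fn() also reads it. That is the kind of reasoning I
would like to see spelled out in the commit message.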
> +
>          return 1;
>
>  cmd_abort:
> @@ -1982,10 +1994,14 @@ static int mmc_blk_issue_rw_rq(struct mmc_queue *mq, struct request *rqc)
>          }
>
>  start_new_req:
> +        clear_bit_unlock(mq_rq->task_id, &mq->cmdqslot);
> +        atomic_dec(&mq->active_slots);
>          if (rqc) {
>                  if (mmc_card_removed(card)) {
>                          rqc->cmd_flags |= REQ_QUIET;
>                          blk_end_request_all(rqc, -EIO);
> +                        clear_bit_unlock(mq->mqrq_cur->task_id, &mq->cmdqslot);
> +                        atomic_dec(&mq->active_slots);
>                  } else {
>                          /*
>                           * If current request is packed, it needs to put back.
> @@ -2011,7 +2027,7 @@ static int mmc_blk_issue_rq(struct mmc_queue *mq, struct request *req)
>          unsigned long flags;
>          unsigned int cmd_flags = req ? req->cmd_flags : 0;
>
> -        if (req && !mq->mqrq_prev->req)
> +        if (!atomic_read(&mq->active_slots))
>                  /* claim host only for the first request */
>                  mmc_get_card(card);
>
> @@ -2024,10 +2040,9 @@ static int mmc_blk_issue_rq(struct mmc_queue *mq, struct request *req)
>                  goto out;
>          }
>
> -        mq->flags &= ~MMC_QUEUE_NEW_REQUEST;
>          if (cmd_flags & REQ_DISCARD) {
>                  /* complete ongoing async transfer before issuing discard */
> -                if (card->host->areq)
> +                if (atomic_read(&mq->active_slots))
>                          mmc_blk_issue_rw_rq(mq, NULL);
>                  if (req->cmd_flags & REQ_SECURE)
>                          ret = mmc_blk_issue_secdiscard_rq(mq, req);
> @@ -2035,11 +2050,11 @@ static int mmc_blk_issue_rq(struct mmc_queue *mq, struct request *req)
>                          ret = mmc_blk_issue_discard_rq(mq, req);
>          } else if (cmd_flags & REQ_FLUSH) {
>                  /* complete ongoing async transfer before issuing flush */
> -                if (card->host->areq)
> +                if (atomic_read(&mq->active_slots))
>                          mmc_blk_issue_rw_rq(mq, NULL);
>                  ret = mmc_blk_issue_flush(mq, req);
>          } else {
> -                if (!req && host->areq) {
> +                if (!req && (atomic_read(&mq->active_slots) == 1)) {
>                          spin_lock_irqsave(&host->context_info.lock, flags);
>                          host->context_info.is_waiting_last_req = true;
>                          spin_unlock_irqrestore(&host->context_info.lock, flags);
> @@ -2048,13 +2063,12 @@ static int mmc_blk_issue_rq(struct mmc_queue *mq, struct request *req)
>          }
>
>  out:
> -        if ((!req && !(mq->flags & MMC_QUEUE_NEW_REQUEST)) ||
> -            (cmd_flags & MMC_REQ_SPECIAL_MASK))
> +        if (!atomic_read(&mq->active_slots))
>                  /*
>                   * Release host when there are no more requests
>                   * and after special request(discard, flush) is done.
>                   * In case sepecial request, there is no reentry to
> -                 * the 'mmc_blk_issue_rq' with 'mqrq_prev->req'.
> +                 * the 'mmc_blk_issue_rq'.
>                   */
>                  mmc_put_card(card);
>          return ret;
> @@ -2436,6 +2450,7 @@ static int mmc_blk_probe(struct device *dev)
>          md = mmc_blk_alloc(card);
>          if (IS_ERR(md))
>                  return PTR_ERR(md);
> +        md->mq_curr = &md->queue;
>
>          string_get_size((u64)get_capacity(md->disk) << 9, STRING_UNITS_2,
>                          cap_str, sizeof(cap_str));
> diff --git a/drivers/mmc/card/queue.c b/drivers/mmc/card/queue.c
> index 236d194..c2d32e2 100644
> --- a/drivers/mmc/card/queue.c
> +++ b/drivers/mmc/card/queue.c
> @@ -46,6 +46,27 @@ static int mmc_prep_request(struct request_queue *q, struct request *req)
>          return BLKPREP_OK;
>  }
>
> +static bool mmc_queue_get_free_slot(struct mmc_queue *mq,
> +                                    unsigned long *free_slot)
> +{
> +        unsigned long slot;
> +        int i;
> +
> +        if (!mq || !free_slot)
> +                return false;
> +
> +        do {
> +                slot = find_first_zero_bit(&mq->cmdqslot, mq->qdepth);
> +                if (slot >= mq->qdepth)
> +                        return false;
> +
> +                i = test_and_set_bit_lock(slot, &mq->cmdqslot);
> +        } while (i);
> +
> +        *free_slot = slot;
> +        return true;
> +}
> +
>  static int mmc_queue_thread(void *d)
>  {
>          struct mmc_queue *mq = d;
> @@ -56,39 +77,23 @@ static int mmc_queue_thread(void *d)
>          down(&mq->thread_sem);
>          do {
>                  struct request *req = NULL;
> -                struct mmc_queue_req *tmp;
> -                unsigned int cmd_flags = 0;
> +                unsigned long i;
>
>                  spin_lock_irq(q->queue_lock);
>                  set_current_state(TASK_INTERRUPTIBLE);
>                  req = blk_fetch_request(q);
> -                mq->mqrq_cur->req = req;
>                  spin_unlock_irq(q->queue_lock);
>
> -                if (req || mq->mqrq_prev->req) {
> +                if (req && !(req->cmd_flags & (REQ_DISCARD | REQ_FLUSH))) {
> +                        while (!mmc_queue_get_free_slot(mq, &i))
> +                                mq->issue_fn(mq, NULL);
> +                        mq->mqrq_cur = &mq->mqrq[i];
> +                        mq->mqrq_cur->req = req;
> +                }
> +
> +                if (req || atomic_read(&mq->active_slots)) {
>                          set_current_state(TASK_RUNNING);
> -                        cmd_flags = req ? req->cmd_flags : 0;
>                          mq->issue_fn(mq, req);
> -                        if (mq->flags & MMC_QUEUE_NEW_REQUEST) {
> -                                mq->flags &= ~MMC_QUEUE_NEW_REQUEST;
> -                                continue; /* fetch again */
> -                        }
> -
> -                        /*
> -                         * Current request becomes previous request
> -                         * and vice versa.
> -                         * In case of special requests, current request
> -                         * has been finished. Do not assign it to previous
> -                         * request.
> -                         */
> -                        if (cmd_flags & MMC_REQ_SPECIAL_MASK)
> -                                mq->mqrq_cur->req = NULL;
> -
> -                        mq->mqrq_prev->brq.mrq.data = NULL;
> -                        mq->mqrq_prev->req = NULL;
> -                        tmp = mq->mqrq_prev;
> -                        mq->mqrq_prev = mq->mqrq_cur;
> -                        mq->mqrq_cur = tmp;
>                  } else {
>                          if (kthread_should_stop()) {
>                                  set_current_state(TASK_RUNNING);
> @@ -126,7 +131,7 @@ static void mmc_request_fn(struct request_queue *q)
>          }
>
>          cntx = &mq->card->host->context_info;
> -        if (!mq->mqrq_cur->req && mq->mqrq_prev->req) {
> +        if (atomic_read(&mq->active_slots)) {
>                  /*
>                   * New MMC request arrived when MMC thread may be
>                   * blocked on the previous request to be complete
> @@ -138,7 +143,7 @@ static void mmc_request_fn(struct request_queue *q)
>                          wake_up_interruptible(&cntx->wait);
>                  }
>                  spin_unlock_irqrestore(&cntx->lock, flags);
> -        } else if (!mq->mqrq_cur->req && !mq->mqrq_prev->req)
> +        } else
>                  wake_up_process(mq->thread);
>  }
>
> @@ -192,9 +197,9 @@ int mmc_init_queue(struct mmc_queue *mq, struct mmc_card *card,
>  {
>          struct mmc_host *host = card->host;
>          u64 limit = BLK_BOUNCE_HIGH;
> -        int ret;
> -        struct mmc_queue_req *mqrq_cur = &mq->mqrq[0];
> -        struct mmc_queue_req *mqrq_prev = &mq->mqrq[1];
> +        int ret, i = 0;
> +        struct mmc_queue_req *mqrq = mq->mqrq;
> +        bool sg_allocated = false;
>
>          if (mmc_dev(host)->dma_mask && *mmc_dev(host)->dma_mask)
>                  limit = (u64)dma_max_pfn(mmc_dev(host)) << PAGE_SHIFT;
> @@ -204,8 +209,16 @@ int mmc_init_queue(struct mmc_queue *mq, struct mmc_card *card,
>          if (!mq->queue)
>                  return -ENOMEM;
>
> -        mq->mqrq_cur = mqrq_cur;
> -        mq->mqrq_prev = mqrq_prev;
> +        mq->qdepth = 2;
> +        mq->mqrq = kcalloc(mq->qdepth, sizeof(struct mmc_queue_req),
> +                           GFP_KERNEL);
> +        if (!mq->mqrq)
> +                return -ENOMEM;
> +
> +        mqrq = mq->mqrq;
> +        for (i = 0; i < mq->qdepth; i++)
> +                mqrq[i].task_id = i;
> +
>          mq->queue->queuedata = mq;
>
>          blk_queue_prep_rq(mq->queue, mmc_prep_request);
> @@ -227,65 +240,61 @@ int mmc_init_queue(struct mmc_queue *mq, struct mmc_card *card,
>                  if (bouncesz > (host->max_blk_count * 512))
>                          bouncesz = host->max_blk_count * 512;
>
> +                /*
> +                 * init i to be -1 so if bounce_buf is not allcated
> +                 * at all, then we don't need to free it for errors
> +                 */

Possibly the part below could be split out into a refactoring patch that
precedes the $subject patch. What do you think?
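To make that concrete, such a preceding refactoring patch could, for
example, move the per-slot bounce buffer allocation into a small helper
along these lines. The helper name mmc_queue_alloc_bounce_bufs() and its
exact shape are only a sketch of mine, not something this patch defines;
it builds on struct mmc_queue_req from queue.h:

#include <linux/slab.h>

/*
 * Sketch of a helper the refactoring patch could introduce: allocate one
 * bounce buffer per queue slot, all-or-nothing, so the caller never has
 * to track how far the allocation got.
 */
static bool mmc_queue_alloc_bounce_bufs(struct mmc_queue_req *mqrq,
                                        unsigned long qdepth,
                                        unsigned int bouncesz)
{
        unsigned long i;

        for (i = 0; i < qdepth; i++) {
                mqrq[i].bounce_buf = kmalloc(bouncesz, GFP_KERNEL);
                if (!mqrq[i].bounce_buf)
                        goto free_bufs;
        }
        return true;

free_bufs:
        /* Undo the partial allocation; the failed index already holds NULL. */
        while (i--) {
                kfree(mqrq[i].bounce_buf);
                mqrq[i].bounce_buf = NULL;
        }
        return false;
}

Something along those lines would also get rid of the slightly awkward
"i = -1" sentinel below.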
> +                i = -1;
>                  if (bouncesz > 512) {
> -                        mqrq_cur->bounce_buf = kmalloc(bouncesz, GFP_KERNEL);
> -                        if (!mqrq_cur->bounce_buf) {
> -                                pr_warn("%s: unable to allocate bounce cur buffer\n",
> -                                        mmc_card_name(card));
> -                        } else {
> -                                mqrq_prev->bounce_buf =
> -                                        kmalloc(bouncesz, GFP_KERNEL);
> -                                if (!mqrq_prev->bounce_buf) {
> -                                        pr_warn("%s: unable to allocate bounce prev buffer\n",
> -                                                mmc_card_name(card));
> -                                        kfree(mqrq_cur->bounce_buf);
> -                                        mqrq_cur->bounce_buf = NULL;
> -                                }
> +                        for (i = 0; i < mq->qdepth; i++) {
> +                                mqrq[i].bounce_buf =
> +                                        kmalloc(bouncesz, GFP_KERNEL);
> +                                if (!mqrq[i].bounce_buf)
> +                                        break;
>                          }
>                  }
>
> -                if (mqrq_cur->bounce_buf && mqrq_prev->bounce_buf) {
> +                /*
> +                 * if i is not equal to mq->qdept,
> +                 * then means there is no bounce_buf
> +                 */
> +                if (i != mq->qdepth) {
> +                        for (; i >= 0; i--) {
> +                                kfree(mqrq[i].bounce_buf);
> +                                mqrq[i].bounce_buf = NULL;
> +                        }
> +                } else {
>                          blk_queue_bounce_limit(mq->queue, BLK_BOUNCE_ANY);
>                          blk_queue_max_hw_sectors(mq->queue, bouncesz / 512);
>                          blk_queue_max_segments(mq->queue, bouncesz / 512);
>                          blk_queue_max_segment_size(mq->queue, bouncesz);
>
> -                        mqrq_cur->sg = mmc_alloc_sg(1, &ret);
> -                        if (ret)
> -                                goto cleanup_queue;
> -
> -                        mqrq_cur->bounce_sg =
> -                                mmc_alloc_sg(bouncesz / 512, &ret);
> -                        if (ret)
> -                                goto cleanup_queue;
> -
> -                        mqrq_prev->sg = mmc_alloc_sg(1, &ret);
> -                        if (ret)
> -                                goto cleanup_queue;
> -
> -                        mqrq_prev->bounce_sg =
> -                                mmc_alloc_sg(bouncesz / 512, &ret);
> -                        if (ret)
> -                                goto cleanup_queue;
> +                        for (i = 0; i < mq->qdepth; i++) {
> +                                mqrq[i].sg = mmc_alloc_sg(1, &ret);
> +                                if (ret)
> +                                        goto cleanup_queue;
> +                                mqrq[i].bounce_sg =
> +                                        mmc_alloc_sg(bouncesz / 512, &ret);
> +                                if (ret)
> +                                        goto cleanup_queue;
> +                        }
> +                        sg_allocated = true;
>                  }
>          }
>  #endif
>
> -        if (!mqrq_cur->bounce_buf && !mqrq_prev->bounce_buf) {
> +        if (!sg_allocated) {
>                  blk_queue_bounce_limit(mq->queue, limit);
>                  blk_queue_max_hw_sectors(mq->queue,
>                          min(host->max_blk_count, host->max_req_size / 512));
>                  blk_queue_max_segments(mq->queue, host->max_segs);
>                  blk_queue_max_segment_size(mq->queue, host->max_seg_size);
>
> -                mqrq_cur->sg = mmc_alloc_sg(host->max_segs, &ret);
> -                if (ret)
> -                        goto cleanup_queue;
>
>
> -                mqrq_prev->sg = mmc_alloc_sg(host->max_segs, &ret);
> -                if (ret)
> -                        goto cleanup_queue;
> +                for (i = 0; i < mq->qdepth; i++) {
> +                        mqrq[i].sg = mmc_alloc_sg(host->max_segs, &ret);
> +                        if (ret)
> +                                goto cleanup_queue;
> +                }
>          }
>
>          sema_init(&mq->thread_sem, 1);
> @@ -300,21 +309,18 @@ int mmc_init_queue(struct mmc_queue *mq, struct mmc_card *card,
>
>          return 0;
>  free_bounce_sg:
> -        kfree(mqrq_cur->bounce_sg);
> -        mqrq_cur->bounce_sg = NULL;
> -        kfree(mqrq_prev->bounce_sg);
> -        mqrq_prev->bounce_sg = NULL;
> +        for (i = 0; i < mq->qdepth; i++) {
> +                kfree(mqrq[i].bounce_sg);
> +                mqrq[i].bounce_sg = NULL;
> +        }
>
>  cleanup_queue:
> -        kfree(mqrq_cur->sg);
> -        mqrq_cur->sg = NULL;
> -        kfree(mqrq_cur->bounce_buf);
> -        mqrq_cur->bounce_buf = NULL;
> -
> -        kfree(mqrq_prev->sg);
> -        mqrq_prev->sg = NULL;
> -        kfree(mqrq_prev->bounce_buf);
> -        mqrq_prev->bounce_buf = NULL;
> +        for (i = 0; i < mq->qdepth; i++) {
> +                kfree(mqrq[i].sg);
> +                mqrq[i].sg = NULL;
> +                kfree(mqrq[i].bounce_buf);
> +                mqrq[i].bounce_buf = NULL;
> +        }
>
>          blk_cleanup_queue(mq->queue);
>          return ret;
> @@ -324,8 +330,7 @@ void mmc_cleanup_queue(struct mmc_queue *mq)
>  {
>          struct request_queue *q = mq->queue;
>          unsigned long flags;
> -        struct mmc_queue_req *mqrq_cur = mq->mqrq_cur;
> -        struct mmc_queue_req *mqrq_prev = mq->mqrq_prev;
> +        int i;
>
>          /* Make sure the queue isn't suspended, as that will deadlock */
>          mmc_queue_resume(mq);
> @@ -339,23 +344,14 @@ void mmc_cleanup_queue(struct mmc_queue *mq)
>          blk_start_queue(q);
>          spin_unlock_irqrestore(q->queue_lock, flags);
>
> -        kfree(mqrq_cur->bounce_sg);
> -        mqrq_cur->bounce_sg = NULL;
> -
> -        kfree(mqrq_cur->sg);
> -        mqrq_cur->sg = NULL;
> -
> -        kfree(mqrq_cur->bounce_buf);
> -        mqrq_cur->bounce_buf = NULL;
> -
> -        kfree(mqrq_prev->bounce_sg);
> -        mqrq_prev->bounce_sg = NULL;
> -
> -        kfree(mqrq_prev->sg);
> -        mqrq_prev->sg = NULL;
> -
> -        kfree(mqrq_prev->bounce_buf);
> -        mqrq_prev->bounce_buf = NULL;
> +        for (i = 0; i < mq->qdepth; i++) {
> +                kfree(mq->mqrq[i].bounce_sg);
> +                mq->mqrq[i].bounce_sg = NULL;
> +                kfree(mq->mqrq[i].sg);
> +                mq->mqrq[i].sg = NULL;
> +                kfree(mq->mqrq[i].bounce_buf);
> +                mq->mqrq[i].bounce_buf = NULL;
> +        }
>
>          mq->card = NULL;
>  }
> @@ -367,6 +363,11 @@ int mmc_packed_init(struct mmc_queue *mq, struct mmc_card *card)
>          struct mmc_queue_req *mqrq_prev = &mq->mqrq[1];
>          int ret = 0;
>
> +        /*
> +         * the qdepth for PACK CMD is 2
> +         */
> +        if (!mqrq_cur || !mqrq_prev)
> +                return -ENOMEM;
>
>          mqrq_cur->packed = kzalloc(sizeof(struct mmc_packed), GFP_KERNEL);
>          if (!mqrq_cur->packed) {
> diff --git a/drivers/mmc/card/queue.h b/drivers/mmc/card/queue.h
> index b129ddc..4f590bc 100644
> --- a/drivers/mmc/card/queue.h
> +++ b/drivers/mmc/card/queue.h
> @@ -42,6 +42,7 @@ struct mmc_queue_req {
>          struct mmc_async_req mmc_active;
>          enum mmc_packed_type cmd_type;
>          struct mmc_packed *packed;
> +        int task_id; /* mmc slot number */

The variable is named "task_id", but the comment says "mmc slot number".
That's a bit confusing.

>  };
>
>  struct mmc_queue {
> @@ -50,14 +51,15 @@ struct mmc_queue {
>          struct semaphore thread_sem;
>          unsigned int flags;
>  #define MMC_QUEUE_SUSPENDED (1 << 0)
> -#define MMC_QUEUE_NEW_REQUEST (1 << 1)
>
>          int (*issue_fn)(struct mmc_queue *, struct request *);
>          void *data;
>          struct request_queue *queue;
> -        struct mmc_queue_req mqrq[2];
> +        struct mmc_queue_req *mqrq;
>          struct mmc_queue_req *mqrq_cur;
> -        struct mmc_queue_req *mqrq_prev;
> +        unsigned long cmdqslot;
> +        unsigned long qdepth;
> +        atomic_t active_slots;
>  };
>
>  extern int mmc_init_queue(struct mmc_queue *, struct mmc_card *, spinlock_t *,
> --

Kind regards
Uffe