There is no reliable way to submit and wait in a single syscall, as io_submit_sqes() may under-consume sqes (in case of an early error). io_uring_enter() would then wait for completions of not-yet-submitted requests, deadlocking the user in most cases. If not all sqes could be submitted, don't wait/poll for more completions than were actually submitted, and return -EAGAIN if nothing was submitted at all. Signed-off-by: Pavel Begunkov <asml.silence@xxxxxxxxx> --- v2: cap min_complete if submitted partially (Jens Axboe) fs/io_uring.c | 15 ++++++++++----- 1 file changed, 10 insertions(+), 5 deletions(-) diff --git a/fs/io_uring.c b/fs/io_uring.c index c2f66e30a812..4c281f382bec 100644 --- a/fs/io_uring.c +++ b/fs/io_uring.c @@ -3526,11 +3526,8 @@ static int io_submit_sqes(struct io_ring_ctx *ctx, unsigned int nr, unsigned int sqe_flags; req = io_get_req(ctx, statep); - if (unlikely(!req)) { - if (!submitted) - submitted = -EAGAIN; + if (unlikely(!req)) break; - } if (!io_get_sqring(ctx, req)) { __io_free_req(req); break; @@ -4910,6 +4907,14 @@ SYSCALL_DEFINE6(io_uring_enter, unsigned int, fd, u32, to_submit, submitted = io_submit_sqes(ctx, to_submit, f.file, fd, &cur_mm, false); mutex_unlock(&ctx->uring_lock); + + if (submitted != to_submit) { + if (!submitted) { + submitted = -EAGAIN; + goto done; + } + min_complete = min(min_complete, (u32)submitted); + } } if (flags & IORING_ENTER_GETEVENTS) { unsigned nr_events = 0; @@ -4922,7 +4927,7 @@ SYSCALL_DEFINE6(io_uring_enter, unsigned int, fd, u32, to_submit, ret = io_cqring_wait(ctx, min_complete, sig, sigsz); } } - +done: percpu_ref_put(&ctx->refs); out_fput: fdput(f); -- 2.24.0