[20/22] aio: enable polling for IOCTX_FLAG_SQTHREAD

Message ID	20181221192236.12866-21-axboe@kernel.dk (mailing list archive)
State	New, archived
Headers	show Return-Path: <linux-block-owner@kernel.org> From: Jens Axboe <axboe@kernel.dk> To: linux-fsdevel@vger.kernel.org, linux-aio@kvack.org, linux-block@vger.kernel.org Cc: hch@lst.de, viro@zeniv.linux.org.uk, Jens Axboe <axboe@kernel.dk> Subject: [PATCH 20/22] aio: enable polling for IOCTX_FLAG_SQTHREAD Date: Fri, 21 Dec 2018 12:22:34 -0700 Message-Id: <20181221192236.12866-21-axboe@kernel.dk> In-Reply-To: <20181221192236.12866-1-axboe@kernel.dk> References: <20181221192236.12866-1-axboe@kernel.dk> Sender: linux-block-owner@vger.kernel.org Precedence: bulk
Series	[01/22] fs: add an iopoll method to struct file_operations | expand [01/22] fs: add an iopoll method to struct file_operations [02/22] block: add bio_set_polled() helper [03/22] block: wire up block device iopoll method [04/22] block: use REQ_HIPRI_ASYNC for non-sync polled IO [05/22] block: use bio_set_polled() helper for O_DIRECT [06/22] iomap: wire up the iopoll method [07/22] aio: add io_setup2() system call [08/22] aio: support for IO polling [09/22] aio: add submission side request cache [10/22] fs: add fget_many() and fput_many() [11/22] aio: use fget/fput_many() for file references [12/22] aio: split iocb init from allocation [13/22] aio: batch aio_kiocb allocation [14/22] aio: split old ring complete out from aio_complete() [15/22] aio: pass in user index to __io_submit_one() [16/22] aio: add support for submission/completion rings [17/22] block: implement bio helper to add iter bvec pages to bio [18/22] aio: add support for pre-mapped user IO buffers [19/22] aio: support kernel side submission for aio with SCQRING [20/22] aio: enable polling for IOCTX_FLAG_SQTHREAD [21/22] aio: utilize io_event->res2 for CQ ring [22/22] aio: add my copyright

diff --git a/fs/aio.c b/fs/aio.c index cd4a61642b46..8894c9299b39 100644 --- a/fs/aio.c +++ b/fs/aio.c @@ -120,6 +120,7 @@ struct aio_mapped_ubuf { struct aio_sq_offload { struct task_struct *thread; /* if using a thread */ + bool thread_poll; struct workqueue_struct *wq; /* wq offload */ struct mm_struct *mm; struct files_struct *files; @@ -340,6 +341,7 @@ static void aio_iocb_buffer_unmap(struct kioctx *); static void aio_scqring_unmap(struct kioctx *); static void aio_iopoll_reap_events(struct kioctx *); static const struct iocb *aio_iocb_from_index(struct kioctx *ctx, unsigned idx); +static void aio_sq_wq_submit_work(struct work_struct *work); static struct file *aio_private_file(struct kioctx *ctx, loff_t nr_pages) { @@ -1773,6 +1775,9 @@ static int aio_sq_thread_start(struct kioctx *ctx) if (!aso->files) goto err; + if (ctx->flags & IOCTX_FLAG_SQPOLL) + aso->thread_poll = true; + if (ctx->flags & IOCTX_FLAG_SQTHREAD) { char name[32]; @@ -1786,7 +1791,8 @@ static int aio_sq_thread_start(struct kioctx *ctx) goto err; } wake_up_process(aso->thread); - } else if (ctx->flags & IOCTX_FLAG_SQWQ) { + } + if (ctx->flags & IOCTX_FLAG_SQWQ) { int concurrency; /* Do QD, or 2 * CPUS, whatever is smallest */ @@ -1862,7 +1868,8 @@ static void aio_scqring_unmap(struct kioctx *ctx) kthread_park(aso->thread); kthread_stop(aso->thread); aso->thread = NULL; - } else if (aso->wq) { + } + if (aso->wq) { destroy_workqueue(aso->wq); aso->wq = NULL; } @@ -2080,7 +2087,7 @@ SYSCALL_DEFINE5(io_setup2, u32, nr_events, u32, flags, if (flags & ~(IOCTX_FLAG_IOPOLL | IOCTX_FLAG_SCQRING | IOCTX_FLAG_FIXEDBUFS | IOCTX_FLAG_SQTHREAD | - IOCTX_FLAG_SQWQ)) + IOCTX_FLAG_SQWQ | IOCTX_FLAG_SQPOLL)) return -EINVAL; ret = get_user(ctx, ctxp); @@ -3153,28 +3160,69 @@ struct iocb_submit { unsigned int index; }; +struct aio_io_work { + struct work_struct work; + struct kioctx *ctx; + struct iocb iocb; + unsigned iocb_index; +}; + +static int aio_queue_async_work(struct kioctx *ctx, struct iocb_submit 
*is) +{ + struct aio_io_work *work; + + work = kmalloc(sizeof(*work), GFP_KERNEL); + if (work) { + memcpy(&work->iocb, is->iocb, sizeof(*is->iocb)); + work->iocb_index = is->index; + INIT_WORK(&work->work, aio_sq_wq_submit_work); + work->ctx = ctx; + queue_work(ctx->sq_offload.wq, &work->work); + return 0; + } + + return -ENOMEM; +} + static int aio_submit_iocbs(struct kioctx *ctx, struct iocb_submit *iocbs, unsigned int nr, struct mm_struct *cur_mm, bool mm_fault) { struct aio_submit_state state, *statep = NULL; int ret, i, submitted = 0; + bool force_nonblock; if (nr > AIO_PLUG_THRESHOLD) { aio_submit_state_start(&state, ctx, nr); statep = &state; } + /* + * Having both a thread and a workqueue only makes sense for buffered + * IO, where we can't submit in an async fashion. Use the NOWAIT + * trick from the SQ thread, and punt to the workqueue if we can't + * satisfy this iocb without blocking. This is only necessary + * for buffered IO with sqthread polled submission. + */ + force_nonblock = (ctx->flags & IOCTX_FLAG_SQWQ) != 0; + for (i = 0; i < nr; i++) { - if (unlikely(mm_fault)) + if (unlikely(mm_fault)) { ret = -EFAULT; - else + } else { ret = __io_submit_one(ctx, iocbs[i].iocb, iocbs[i].index, statep, false, - !cur_mm, false); - if (!ret) { - submitted++; - continue; + !cur_mm, force_nonblock); + /* nogo, submit to workqueue */ + if (force_nonblock && + (ret == -EAGAIN || ctx->submit_eagain)) { + ctx->submit_eagain = 0; + ret = aio_queue_async_work(ctx, &iocbs[i]); + } + if (!ret) { + submitted++; + continue; + } } aio_fill_cq_error(ctx, iocbs[i].iocb, ret); @@ -3187,17 +3235,23 @@ static int aio_submit_iocbs(struct kioctx *ctx, struct iocb_submit *iocbs, } /* - * sq thread only supports O_DIRECT or FIXEDBUFS IO + * SQ thread is woken if the app asked for offloaded submission. This can + * be either O_DIRECT, in which case we do submissions directly, or it can + * be buffered IO, in which case we do them inline if we can do so without + * blocking. 
If we can't, then we punt to a workqueue. */ static int aio_sq_thread(void *data) { struct iocb_submit iocbs[AIO_IOPOLL_BATCH]; struct kioctx *ctx = data; + struct aio_sq_ring *ring = ctx->sq_ring.ring; struct aio_sq_offload *aso = &ctx->sq_offload; struct mm_struct *cur_mm = NULL; struct files_struct *old_files; mm_segment_t old_fs; DEFINE_WAIT(wait); + unsigned inflight; + unsigned long timeout; old_files = current->files; current->files = aso->files; @@ -3205,15 +3259,50 @@ static int aio_sq_thread(void *data) old_fs = get_fs(); set_fs(USER_DS); + timeout = inflight = 0; while (!kthread_should_stop()) { const struct iocb *iocb; bool mm_fault = false; unsigned nhead, index; int i; + if (aso->thread_poll && inflight) { + unsigned int nr_events = 0; + + /* + * Buffered IO, just pretend everything completed. + * We don't have to poll completions for that. + */ + if (ctx->flags & IOCTX_FLAG_IOPOLL) + __aio_iopoll_check(ctx, NULL, &nr_events, 0, -1U); + else + nr_events = inflight; + + inflight -= nr_events; + if (!inflight) + timeout = jiffies + HZ; + } + iocb = aio_peek_sqring(ctx, &index, &nhead); if (!iocb) { + /* + * If we're polling, let us spin for a second without + * work before going to sleep. 
+ */ + if (aso->thread_poll) { + if (inflight || !time_after(jiffies, timeout)) { + cpu_relax(); + continue; + } + } prepare_to_wait(&aso->wait, &wait, TASK_INTERRUPTIBLE); + + /* Tell userspace we may need a wakeup call */ + if (aso->thread_poll) { + ring->kflags |= IORING_SQ_NEED_WAKEUP; + smp_wmb(); + } + iocb = aio_peek_sqring(ctx, &index, &nhead); if (!iocb) { /* @@ -3235,6 +3324,9 @@ static int aio_sq_thread(void *data) if (signal_pending(current)) flush_signals(current); schedule(); + + if (aso->thread_poll) + ring->kflags &= ~IORING_SQ_NEED_WAKEUP; } finish_wait(&aso->wait, &wait); if (!iocb) @@ -3260,7 +3352,7 @@ static int aio_sq_thread(void *data) aio_commit_sqring(ctx, nhead); } while ((iocb = aio_peek_sqring(ctx, &index, &nhead)) != NULL); - aio_submit_iocbs(ctx, iocbs, i, cur_mm, mm_fault); + inflight += aio_submit_iocbs(ctx, iocbs, i, cur_mm, mm_fault); } current->files = old_files; set_fs(old_fs); @@ -3271,13 +3363,6 @@ static int aio_sq_thread(void *data) return 0; } -struct aio_io_work { - struct work_struct work; - struct kioctx *ctx; - struct iocb iocb; - unsigned iocb_index; -}; - static void aio_sq_wq_submit_work(struct work_struct *work) { struct aio_io_work *aiw = container_of(work, struct aio_io_work, work); @@ -3347,7 +3432,6 @@ static bool aio_sq_try_inline(struct kioctx *ctx, const struct iocb *iocb, static int aio_sq_wq_submit(struct kioctx *ctx, unsigned int to_submit) { - struct aio_io_work *work; const struct iocb *iocb; unsigned nhead, index; int ret, queued; @@ -3356,18 +3440,17 @@ static int aio_sq_wq_submit(struct kioctx *ctx, unsigned int to_submit) while ((iocb = aio_peek_sqring(ctx, &index, &nhead)) != NULL) { ret = aio_sq_try_inline(ctx, iocb, index); if (!ret) { - work = kmalloc(sizeof(*work), GFP_KERNEL); - if (!work) { - ret = -ENOMEM; + struct iocb_submit is = { + .iocb = iocb, + .index = index + }; + + ret = aio_queue_async_work(ctx, &is); + if (ret) break; - } - memcpy(&work->iocb, iocb, sizeof(*iocb)); - 
aio_commit_sqring(ctx, nhead); - work->iocb_index = index; - INIT_WORK(&work->work, aio_sq_wq_submit_work); - work->ctx = ctx; - queue_work(ctx->sq_offload.wq, &work->work); } + + aio_commit_sqring(ctx, nhead); queued++; if (queued == to_submit) break; diff --git a/include/uapi/linux/aio_abi.h b/include/uapi/linux/aio_abi.h index b09b1976e038..26173de01fee 100644 --- a/include/uapi/linux/aio_abi.h +++ b/include/uapi/linux/aio_abi.h @@ -113,6 +113,9 @@ struct iocb { #define IOCTX_FLAG_FIXEDBUFS (1 << 2) /* IO buffers are fixed */ #define IOCTX_FLAG_SQTHREAD (1 << 3) /* Use SQ thread */ #define IOCTX_FLAG_SQWQ (1 << 4) /* Use SQ workqueue */ +#define IOCTX_FLAG_SQPOLL (1 << 5) /* SQ thread polls */ + +#define IORING_SQ_NEED_WAKEUP (1 << 0) /* needs io_ring_enter wakeup */ struct aio_sq_ring { union { @@ -121,6 +124,7 @@ struct aio_sq_ring { u32 tail; /* app producer tail */ u32 nr_events; /* max events in ring */ u16 sq_thread_cpu; + u16 kflags; /* kernel info to app */ u64 iocbs; /* setup pointer to app iocbs */ }; u32 pad[16];

[20/22] aio: enable polling for IOCTX_FLAG_SQTHREAD

Commit Message

Patch