From: Suparna Bhattacharya <suparna@in.ibm.com> This patch tries to be a little fairer across multiple io contexts in handling retries, helping make sure progress happens uniformly across different io contexts (especially if they are acting on independent queues). It splices the ioctx runlist before processing it in __aio_run_iocbs. If new iocbs get added to the ctx in the meantime, it queues a fresh workqueue entry instead of handling them right away, so that other ioctxs' retries get a chance to be processed before the newer entries in the queue. This might make a difference in a situation where retries are getting queued very fast on one ioctx, while the workqueue entry for another ioctx is stuck behind it. I've only seen this occasionally earlier and can't recreate it consistently, but it may be worth trying out. fs/aio.c | 22 +++++++++++++++++----- 1 files changed, 17 insertions(+), 5 deletions(-) diff -puN fs/aio.c~aio-splice-runlist fs/aio.c --- 25/fs/aio.c~aio-splice-runlist 2003-11-11 10:15:20.000000000 -0800 +++ 25-akpm/fs/aio.c 2003-11-11 10:15:20.000000000 -0800 @@ -767,13 +767,15 @@ out: * Assumes it is operating within the aio issuer's mm * context. 
Expects to be called with ctx->ctx_lock held */ -static void __aio_run_iocbs(struct kioctx *ctx) +static int __aio_run_iocbs(struct kioctx *ctx) { struct kiocb *iocb; int count = 0; + LIST_HEAD(run_list); - while (!list_empty(&ctx->run_list)) { - iocb = list_entry(ctx->run_list.next, struct kiocb, + list_splice_init(&ctx->run_list, &run_list); + while (!list_empty(&run_list)) { + iocb = list_entry(run_list.next, struct kiocb, ki_run_list); list_del(&iocb->ki_run_list); /* @@ -786,6 +788,9 @@ static void __aio_run_iocbs(struct kioct count++; } aio_run++; + if (!list_empty(&ctx->run_list)) + return 1; + return 0; } /* @@ -797,9 +802,13 @@ static void __aio_run_iocbs(struct kioct */ static inline void aio_run_iocbs(struct kioctx *ctx) { + int requeue; + spin_lock_irq(&ctx->ctx_lock); - __aio_run_iocbs(ctx); + requeue = __aio_run_iocbs(ctx); spin_unlock_irq(&ctx->ctx_lock); + if (requeue) + queue_work(aio_wq, &ctx->wq); } /* @@ -815,14 +824,17 @@ static void aio_kick_handler(void *data) { struct kioctx *ctx = data; mm_segment_t oldfs = get_fs(); + int requeue; set_fs(USER_DS); use_mm(ctx->mm); spin_lock_irq(&ctx->ctx_lock); - __aio_run_iocbs(ctx); + requeue = __aio_run_iocbs(ctx); unuse_mm(ctx->mm); spin_unlock_irq(&ctx->ctx_lock); set_fs(oldfs); + if (requeue) + queue_work(aio_wq, &ctx->wq); } _