aio: use xchg() instead of completion_lock

author    Kent Overstreet <koverstreet@google.com>
          Sun, 10 Mar 2013 10:55:42 +0000 (21:55 +1100)
committer Stephen Rothwell <sfr@canb.auug.org.au>
          Tue, 12 Mar 2013 03:57:43 +0000 (14:57 +1100)

diff --git a/fs/aio.c b/fs/aio.c
index 89fa4dbf1f8a77e6a5cd90b99937046d1a38bae6..51ebd2dcd632f48438348b4b8776109e5ca1d2c0 100644
--- a/fs/aio.c
+++ b/fs/aio.c
@@ -102,11 +102,11 @@ struct kioctx {
         struct {
                 struct mutex    ring_lock;
                 wait_queue_head_t wait;
+               unsigned        shadow_tail;
         } ____cacheline_aligned_in_smp;
  
         struct {
                 unsigned        tail;
-               spinlock_t      completion_lock;
         } ____cacheline_aligned_in_smp;
  
         struct page             *internal_pages[AIO_RING_PAGES];
@@ -321,9 +321,9 @@ static void free_ioctx(struct kioctx *ctx)
         kunmap_atomic(ring);
  
         while (atomic_read(&ctx->reqs_available) < ctx->nr) {
-               wait_event(ctx->wait, head != ctx->tail);
+               wait_event(ctx->wait, head != ctx->shadow_tail);
  
-               avail = (head < ctx->tail ? ctx->tail : ctx->nr) - head;
+               avail = (head < ctx->shadow_tail ? ctx->shadow_tail : ctx->nr) - head;
  
                 atomic_add(avail, &ctx->reqs_available);
                 head += avail;
@@ -388,7 +388,6 @@ static struct kioctx *ioctx_alloc(unsigned nr_events)
         rcu_read_unlock();
  
         spin_lock_init(&ctx->ctx_lock);
-       spin_lock_init(&ctx->completion_lock);
         mutex_init(&ctx->ring_lock);
         init_waitqueue_head(&ctx->wait);
  
@@ -686,18 +685,19 @@ void aio_complete(struct kiocb *iocb, long res, long res2)
                  * free_ioctx()
                  */
                 atomic_inc(&ctx->reqs_available);
+               smp_mb__after_atomic_inc();
                 /* Still need the wake_up in case free_ioctx is waiting */
                 goto put_rq;
         }
  
         /*
-        * Add a completion event to the ring buffer. Must be done holding
-        * ctx->ctx_lock to prevent other code from messing with the tail
-        * pointer since we might be called from irq context.
+        * Add a completion event to the ring buffer; ctx->tail is both our lock
+        * and the canonical version of the tail pointer.
          */
-       spin_lock_irqsave(&ctx->completion_lock, flags);
+       local_irq_save(flags);
+       while ((tail = xchg(&ctx->tail, UINT_MAX)) == UINT_MAX)
+               cpu_relax();
  
-       tail = ctx->tail;
         pos = tail + AIO_EVENTS_OFFSET;
  
         if (++tail >= ctx->nr)
@@ -723,14 +723,18 @@ void aio_complete(struct kiocb *iocb, long res, long res2)
          */
         smp_wmb();      /* make event visible before updating tail */
  
-       ctx->tail = tail;
+       ctx->shadow_tail = tail;
  
         ring = kmap_atomic(ctx->ring_pages[0]);
         ring->tail = tail;
         kunmap_atomic(ring);
         flush_dcache_page(ctx->ring_pages[0]);
  
-       spin_unlock_irqrestore(&ctx->completion_lock, flags);
+       /* unlock, make new tail visible before checking waitlist */
+       smp_mb();
+
+       ctx->tail = tail;
+       local_irq_restore(flags);
  
         pr_debug("added to ring %p at [%u]\n", iocb, tail);
  
@@ -746,14 +750,6 @@ put_rq:
         /* everything turned out well, dispose of the aiocb. */
         aio_put_req(iocb);
  
-       /*
-        * We have to order our ring_info tail store above and test
-        * of the wait list below outside the wait lock.  This is
-        * like in wake_up_bit() where clearing a bit has to be
-        * ordered with the unlocked test.
-        */
-       smp_mb();
-
         if (waitqueue_active(&ctx->wait))
                 wake_up(&ctx->wait);
  
@@ -781,19 +777,19 @@ static int aio_read_events_ring(struct kioctx *ctx,
         head = ring->head;
         kunmap_atomic(ring);
  
-       pr_debug("h%u t%u m%u\n", head, ctx->tail, ctx->nr);
+       pr_debug("h%u t%u m%u\n", head, ctx->shadow_tail, ctx->nr);
  
-       if (head == ctx->tail)
+       if (head == ctx->shadow_tail)
                 goto out;
  
         __set_current_state(TASK_RUNNING);
  
         while (ret < nr) {
-               unsigned i = (head < ctx->tail ? ctx->tail : ctx->nr) - head;
+               unsigned i = (head < ctx->shadow_tail ? ctx->shadow_tail : ctx->nr) - head;
                 struct io_event *ev;
                 struct page *page;
  
-               if (head == ctx->tail)
+               if (head == ctx->shadow_tail)
                         break;
  
                 i = min_t(int, i, nr - ret);
@@ -823,7 +819,7 @@ static int aio_read_events_ring(struct kioctx *ctx,
         kunmap_atomic(ring);
         flush_dcache_page(ctx->ring_pages[0]);
  
-       pr_debug("%d  h%u t%u\n", ret, head, ctx->tail);
+       pr_debug("%d  h%u t%u\n", ret, head, ctx->shadow_tail);
  
         put_reqs_available(ctx, ret);
  out:
author	Kent Overstreet <koverstreet@google.com>
	Sun, 10 Mar 2013 10:55:42 +0000 (21:55 +1100)
committer	Stephen Rothwell <sfr@canb.auug.org.au>
	Tue, 12 Mar 2013 03:57:43 +0000 (14:57 +1100)