pnfsblock: bl_write_pagelist

author Fred Isaman <iisaman@citi.umich.edu>

Sun, 31 Jul 2011 00:52:54 +0000 (20:52 -0400)

committer Trond Myklebust <Trond.Myklebust@netapp.com>

Sun, 31 Jul 2011 16:18:17 +0000 (12:18 -0400)
author Fred Isaman <iisaman@citi.umich.edu>
Sun, 31 Jul 2011 00:52:54 +0000 (20:52 -0400)
committer Trond Myklebust <Trond.Myklebust@netapp.com>
Sun, 31 Jul 2011 16:18:17 +0000 (12:18 -0400)
diff --git a/fs/nfs/blocklayout/blocklayout.c b/fs/nfs/blocklayout/blocklayout.c

index facb5ba2120484b866c74888f6d5da2ed730f9fd..2e373826db802907313ecb21214e5d698b824337 100644 (file)
--- a/fs/nfs/blocklayout/blocklayout.c
+++ b/fs/nfs/blocklayout/blocklayout.c
@@ -74,6 +74,19 @@ static int is_hole(struct pnfs_block_extent *be, sector_t isect)
                 return !bl_is_sector_init(be->be_inval, isect);
  }
  
+/* Report whether page data may be written to disk at isect, where be
+ * is the extent associated with that sector.
+ */
+static int is_writable(struct pnfs_block_extent *be, sector_t isect)
+{
+       if (be->be_state == PNFS_BLOCK_READWRITE_DATA)
+               return 1;
+       /* For an INVALID_DATA extent, bl_is_sector_init() decides */
+       if (be->be_state == PNFS_BLOCK_INVALID_DATA)
+               return bl_is_sector_init(be->be_inval, isect);
+       return 0;
+}
+
  /* The data we are handed might be spread across several bios.  We need
   * to track when the last one is finished.
   */
@@ -316,11 +329,121 @@ out:
         return PNFS_NOT_ATTEMPTED;
  }
  
+/* Per-bio write completion: note a failed bio, then release bio and par */
+static void bl_end_io_write(struct bio *bio, int err)
+{
+       struct parallel_io *par = bio->bi_private;
+       struct nfs_write_data *wdata = (struct nfs_write_data *)par->data;
+
+       if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) {
+               /* Keep an error that is already recorded; else use -EIO */
+               if (wdata->pnfs_error == 0)
+                       wdata->pnfs_error = -EIO;
+               bl_set_lo_fail(wdata->lseg);
+       }
+       bio_put(bio);
+       put_parallel(par);
+}
+
+/* Work function queued by bl_end_par_io_write: recover the
+ * nfs_write_data embedding this work item, then pnfs_ld_write_done() it.
+ */
+static void bl_write_cleanup(struct work_struct *work)
+{
+       struct rpc_task *task = container_of(work, struct rpc_task, u.tk_work);
+       struct nfs_write_data *wdata;
+
+       dprintk("%s enter\n", __func__);
+       wdata = container_of(task, struct nfs_write_data, task);
+       pnfs_ld_write_done(wdata);
+}
+
+/* Runs after the last bio of a bl_write_pagelist call has finished */
+static void
+bl_end_par_io_write(void *data)
+{
+       struct nfs_write_data *wd = data;
+
+       /* STUB - tk_status is forced to 0; bio errors are not reported here */
+       wd->verf.committed = NFS_FILE_SYNC;
+       wd->task.tk_status = 0;
+       INIT_WORK(&wd->task.u.tk_work, bl_write_cleanup);
+       schedule_work(&wd->task.u.tk_work);
+}
+
  static enum pnfs_try_status
-bl_write_pagelist(struct nfs_write_data *wdata,
-                 int sync)
+bl_write_pagelist(struct nfs_write_data *wdata, int sync)
  {
-       return PNFS_NOT_ATTEMPTED;
+       int i;
+       struct bio *bio = NULL;
+       struct pnfs_block_extent *be = NULL;
+       sector_t isect, extent_length = 0;
+       struct parallel_io *par;
+       loff_t offset = wdata->args.offset;
+       size_t count = wdata->args.count;
+       struct page **pages = wdata->args.pages;
+       int pg_index = wdata->args.pgbase >> PAGE_CACHE_SHIFT;
+
+       dprintk("%s enter, %Zu@%lld\n", __func__, count, offset);
+       /* At this point, wdata->pages is a (sequential) list of nfs_pages.
+        * We want to write each, and if there is an error remove it from
+        * list and call
+        * nfs_retry_request(req) to have it redone using nfs.
+        * QUEST? Do as block or per req?  Think have to do per block
+        * as part of end_bio
+        */
+       par = alloc_parallel(wdata);
+       if (!par)
+               return PNFS_NOT_ATTEMPTED;
+       par->call_ops = *wdata->mds_ops;
+       par->call_ops.rpc_call_done = bl_rpc_do_nothing;
+       par->pnfs_callback = bl_end_par_io_write;
+       /* At this point, have to be more careful with error handling */
+
+       isect = (sector_t) ((offset & (long)PAGE_CACHE_MASK) >> SECTOR_SHIFT);
+       for (i = pg_index; i < wdata->npages ; i++) {
+               if (!extent_length) {
+                       /* We've used up the previous extent */
+                       bl_put_extent(be);
+                       bio = bl_submit_bio(WRITE, bio);
+                       /* Get the next one */
+                       be = bl_find_get_extent(BLK_LSEG2EXT(wdata->lseg),
+                                            isect, NULL);
+                       if (!be || !is_writable(be, isect)) {
+                               wdata->pnfs_error = -ENOMEM;
+                               goto out;
+                       }
+                       extent_length = be->be_length -
+                               (isect - be->be_f_offset);
+               }
+               for (;;) {
+                       if (!bio) {
+                               bio = bio_alloc(GFP_NOIO, wdata->npages - i);
+                               if (!bio) {
+                                       wdata->pnfs_error = -ENOMEM;
+                                       goto out;
+                               }
+                               bio->bi_sector = isect - be->be_f_offset +
+                                       be->be_v_offset;
+                               bio->bi_bdev = be->be_mdev;
+                               bio->bi_end_io = bl_end_io_write;
+                               bio->bi_private = par;
+                       }
+                       if (bio_add_page(bio, pages[i], PAGE_SIZE, 0))
+                               break;
+                       bio = bl_submit_bio(WRITE, bio);
+               }
+               isect += PAGE_CACHE_SECTORS;
+               extent_length -= PAGE_CACHE_SECTORS;
+       }
+       wdata->res.count = (isect << SECTOR_SHIFT) - (offset);
+       if (count < wdata->res.count)
+               wdata->res.count = count;
+out:
+       bl_put_extent(be);
+       bl_submit_bio(WRITE, bio);
+       put_parallel(par);
+       return PNFS_ATTEMPTED;
  }
  
  /* FIXME - range ignored */
author	Fred Isaman <iisaman@citi.umich.edu>
	Sun, 31 Jul 2011 00:52:54 +0000 (20:52 -0400)
committer	Trond Myklebust <Trond.Myklebust@netapp.com>
	Sun, 31 Jul 2011 16:18:17 +0000 (12:18 -0400)