Whamcloud - gitweb
LU-4198 clio: AIO support for direct IO
[fs/lustre-release.git] / lustre / llite / vvp_page.c
index f6ff571..0c9d552 100644 (file)
  *
  * You should have received a copy of the GNU General Public License
  * version 2 along with this program; If not, see
- * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
- *
- * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
- * CA 95054 USA or visit www.sun.com if you need additional information or
- * have any questions.
+ * http://www.gnu.org/licenses/gpl-2.0.html
  *
  * GPL HEADER END
  */
@@ -27,7 +23,7 @@
  * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
  * Use is subject to license terms.
  *
- * Copyright (c) 2011, 2014, Intel Corporation.
+ * Copyright (c) 2011, 2017, Intel Corporation.
  */
 /*
  * This file is part of Lustre, http://www.lustre.org/
  *
  */
 
-static void vvp_page_fini_common(struct vvp_page *vpg)
+static void vvp_page_fini_common(struct vvp_page *vpg, struct pagevec *pvec)
 {
        struct page *vmpage = vpg->vpg_page;
 
        LASSERT(vmpage != NULL);
-       page_cache_release(vmpage);
+       if (pvec) {
+               if (!pagevec_add(pvec, vmpage))
+                       pagevec_release(pvec);
+       } else {
+               put_page(vmpage);
+       }
 }
 
 static void vvp_page_fini(const struct lu_env *env,
-                         struct cl_page_slice *slice)
+                         struct cl_page_slice *slice,
+                         struct pagevec *pvec)
 {
        struct vvp_page *vpg     = cl2vvp_page(slice);
        struct page     *vmpage  = vpg->vpg_page;
@@ -77,7 +79,7 @@ static void vvp_page_fini(const struct lu_env *env,
         * VPG_FREEING state.
         */
        LASSERT((struct cl_page *)vmpage->private != slice->cpl_page);
-       vvp_page_fini_common(vpg);
+       vvp_page_fini_common(vpg, pvec);
 }
 
 static int vvp_page_own(const struct lu_env *env,
@@ -87,6 +89,8 @@ static int vvp_page_own(const struct lu_env *env,
        struct vvp_page *vpg    = cl2vvp_page(slice);
        struct page     *vmpage = vpg->vpg_page;
 
+       ENTRY;
+
        LASSERT(vmpage != NULL);
        if (nonblock) {
                if (!trylock_page(vmpage))
@@ -103,7 +107,7 @@ static int vvp_page_own(const struct lu_env *env,
        lock_page(vmpage);
        wait_on_page_writeback(vmpage);
 
-       return 0;
+       RETURN(0);
 }
 
 static void vvp_page_assume(const struct lu_env *env,
@@ -132,10 +136,14 @@ static void vvp_page_disown(const struct lu_env *env,
 {
        struct page *vmpage = cl2vm_page(slice);
 
+       ENTRY;
+
        LASSERT(vmpage != NULL);
        LASSERT(PageLocked(vmpage));
 
        unlock_page(cl2vm_page(slice));
+
+       EXIT;
 }
 
 static void vvp_page_discard(const struct lu_env *env,
@@ -151,7 +159,7 @@ static void vvp_page_discard(const struct lu_env *env,
        if (vpg->vpg_defer_uptodate && !vpg->vpg_ra_used)
                ll_ra_stats_inc(vmpage->mapping->host, RA_STAT_DISCARDED);
 
-       ll_invalidate_page(vmpage);
+       generic_error_remove_page(vmpage->mapping, vmpage);
 }
 
 static void vvp_page_delete(const struct lu_env *env,
@@ -167,13 +175,10 @@ static void vvp_page_delete(const struct lu_env *env,
        LASSERT((struct cl_page *)vmpage->private == page);
        LASSERT(inode == vvp_object_inode(obj));
 
-       vvp_write_complete(cl2vvp(obj), cl2vvp_page(slice));
-
        /* Drop the reference count held in vvp_page_init */
        refc = atomic_dec_return(&page->cp_ref);
        LASSERTF(refc >= 1, "page = %p, refc = %d\n", page, refc);
 
-       ClearPageUptodate(vmpage);
        ClearPagePrivate(vmpage);
        vmpage->private = 0;
        /*
@@ -216,12 +221,15 @@ static int vvp_page_prep_write(const struct lu_env *env,
                                struct cl_io *unused)
 {
        struct page *vmpage = cl2vm_page(slice);
+       struct cl_page *pg = slice->cpl_page;
 
        LASSERT(PageLocked(vmpage));
        LASSERT(!PageDirty(vmpage));
 
-       set_page_writeback(vmpage);
-       vvp_write_pending(cl2vvp(slice->cpl_obj), cl2vvp_page(slice));
+       /* The ll_writepage path is not a sync write, so the page writeback
+        * flag must be set here. */
+       if (pg->cp_sync_io == NULL)
+               set_page_writeback(vmpage);
 
        return 0;
 }
@@ -246,8 +254,8 @@ static void vvp_vmpage_error(struct inode *inode, struct page *vmpage, int ioret
                else
                        set_bit(AS_EIO, &inode->i_mapping->flags);
 
-               if ((ioret == -ESHUTDOWN || ioret == -EINTR) &&
-                    obj->vob_discard_page_warned == 0) {
+               if ((ioret == -ESHUTDOWN || ioret == -EINTR ||
+                    ioret == -EIO) && obj->vob_discard_page_warned == 0) {
                        obj->vob_discard_page_warned = 1;
                        ll_dirty_page_discard_warn(vmpage, ioret);
                }
@@ -273,8 +281,14 @@ static void vvp_page_completion_read(const struct lu_env *env,
        if (ioret == 0)  {
                if (!vpg->vpg_defer_uptodate)
                        cl_page_export(env, page, 1);
-       } else {
+       } else if (vpg->vpg_defer_uptodate) {
                vpg->vpg_defer_uptodate = 0;
+               if (ioret == -EWOULDBLOCK) {
+                       /* The mirror read failed; destroy the page because
+                        * its subpage would come from the wrong osc when
+                        * trying to read from a new mirror. */
+                       generic_error_remove_page(vmpage->mapping, vmpage);
+               }
        }
 
        if (page->cp_sync_io == NULL)
@@ -292,32 +306,21 @@ static void vvp_page_completion_write(const struct lu_env *env,
        struct page     *vmpage = vpg->vpg_page;
        ENTRY;
 
-       LASSERT(ergo(pg->cp_sync_io != NULL, PageLocked(vmpage)));
-       LASSERT(PageWriteback(vmpage));
-
        CL_PAGE_HEADER(D_PAGE, env, pg, "completing WRITE with %d\n", ioret);
 
-       /*
-        * TODO: Actually it makes sense to add the page into oap pending
-        * list again and so that we don't need to take the page out from
-        * SoM write pending list, if we just meet a recoverable error,
-        * -ENOMEM, etc.
-        * To implement this, we just need to return a non zero value in
-        * ->cpo_completion method. The underlying transfer should be notified
-        * and then re-add the page into pending transfer queue.  -jay
-        */
-
-       vpg->vpg_write_queued = 0;
-       vvp_write_complete(cl2vvp(slice->cpl_obj), vpg);
-
-       /*
-        * Only mark the page error only when it's an async write because
-        * applications won't wait for IO to finish.
-        */
-       if (pg->cp_sync_io == NULL)
+       if (pg->cp_sync_io != NULL) {
+               LASSERT(PageLocked(vmpage));
+               LASSERT(!PageWriteback(vmpage));
+       } else {
+               LASSERT(PageWriteback(vmpage));
+               /*
+                * Mark the page error only when it's an async write,
+                * because applications won't wait for IO to finish.
+                */
                vvp_vmpage_error(vvp_object_inode(pg->cp_obj), vmpage, ioret);
 
-       end_page_writeback(vmpage);
+               end_page_writeback(vmpage);
+       }
        EXIT;
 }
 
@@ -348,8 +351,6 @@ static int vvp_page_make_ready(const struct lu_env *env,
                /* This actually clears the dirty bit in the radix
                 * tree. */
                set_page_writeback(vmpage);
-               vvp_write_pending(cl2vvp(slice->cpl_obj),
-                               cl2vvp_page(slice));
                CL_PAGE_HEADER(D_PAGE, env, pg, "readied\n");
        } else if (pg->cp_state == CPS_PAGEOUT) {
                /* is it possible for osc_flush_async_page() to already
@@ -364,23 +365,6 @@ static int vvp_page_make_ready(const struct lu_env *env,
        RETURN(result);
 }
 
-static int vvp_page_is_under_lock(const struct lu_env *env,
-                                 const struct cl_page_slice *slice,
-                                 struct cl_io *io, pgoff_t *max_index)
-{
-       ENTRY;
-
-       if (io->ci_type == CIT_READ || io->ci_type == CIT_WRITE ||
-           io->ci_type == CIT_FAULT) {
-               struct vvp_io *cio = vvp_env_io(env);
-
-               if (unlikely(cio->cui_fd->fd_flags & LL_FILE_GROUP_LOCKED))
-                       *max_index = CL_PAGE_EOF;
-       }
-       RETURN(0);
-}
-
-
 static int vvp_page_print(const struct lu_env *env,
                          const struct cl_page_slice *slice,
                          void *cookie, lu_printer_t printer)
@@ -388,10 +372,9 @@ static int vvp_page_print(const struct lu_env *env,
        struct vvp_page *vpg    = cl2vvp_page(slice);
        struct page     *vmpage = vpg->vpg_page;
 
-       (*printer)(env, cookie, LUSTRE_VVP_NAME"-page@%p(%d:%d:%d) "
+       (*printer)(env, cookie, LUSTRE_VVP_NAME"-page@%p(%d:%d) "
                   "vm@%p ",
-                  vpg, vpg->vpg_defer_uptodate, vpg->vpg_ra_used,
-                  vpg->vpg_write_queued, vmpage);
+                  vpg, vpg->vpg_defer_uptodate, vpg->vpg_ra_used, vmpage);
 
        if (vmpage != NULL) {
                (*printer)(env, cookie, "%lx %d:%d %lx %lu %slru",
@@ -428,7 +411,6 @@ static const struct cl_page_operations vvp_page_ops = {
        .cpo_is_vmlocked   = vvp_page_is_vmlocked,
        .cpo_fini          = vvp_page_fini,
        .cpo_print         = vvp_page_print,
-       .cpo_is_under_lock = vvp_page_is_under_lock,
        .io = {
                [CRT_READ] = {
                        .cpo_prep       = vvp_page_prep_read,
@@ -443,56 +425,12 @@ static const struct cl_page_operations vvp_page_ops = {
        },
 };
 
-static int vvp_transient_page_prep(const struct lu_env *env,
-                                  const struct cl_page_slice *slice,
-                                  struct cl_io *unused)
-{
-       ENTRY;
-       /* transient page should always be sent. */
-       RETURN(0);
-}
-
-static void vvp_transient_page_verify(const struct cl_page *page)
-{
-}
-
-static int vvp_transient_page_own(const struct lu_env *env,
-                                  const struct cl_page_slice *slice,
-                                  struct cl_io *unused, int nonblock)
-{
-        vvp_transient_page_verify(slice->cpl_page);
-        return 0;
-}
-
-static void vvp_transient_page_assume(const struct lu_env *env,
-                                      const struct cl_page_slice *slice,
-                                      struct cl_io *unused)
-{
-        vvp_transient_page_verify(slice->cpl_page);
-}
-
-static void vvp_transient_page_unassume(const struct lu_env *env,
-                                        const struct cl_page_slice *slice,
-                                        struct cl_io *unused)
-{
-        vvp_transient_page_verify(slice->cpl_page);
-}
-
-static void vvp_transient_page_disown(const struct lu_env *env,
-                                      const struct cl_page_slice *slice,
-                                      struct cl_io *unused)
-{
-        vvp_transient_page_verify(slice->cpl_page);
-}
-
 static void vvp_transient_page_discard(const struct lu_env *env,
                                        const struct cl_page_slice *slice,
                                        struct cl_io *unused)
 {
         struct cl_page *page = slice->cpl_page;
 
-        vvp_transient_page_verify(slice->cpl_page);
-
         /*
          * For transient pages, remove it from the radix tree.
          */
@@ -502,54 +440,25 @@ static void vvp_transient_page_discard(const struct lu_env *env,
 static int vvp_transient_page_is_vmlocked(const struct lu_env *env,
                                          const struct cl_page_slice *slice)
 {
-       struct inode    *inode = vvp_object_inode(slice->cpl_obj);
-       int     locked;
-
-       locked = !mutex_trylock(&inode->i_mutex);
-       if (!locked)
-               mutex_unlock(&inode->i_mutex);
-       return locked ? -EBUSY : -ENODATA;
-}
-
-static void
-vvp_transient_page_completion(const struct lu_env *env,
-                              const struct cl_page_slice *slice,
-                              int ioret)
-{
-        vvp_transient_page_verify(slice->cpl_page);
+       return -EBUSY;
 }
 
 static void vvp_transient_page_fini(const struct lu_env *env,
-                                   struct cl_page_slice *slice)
+                                   struct cl_page_slice *slice,
+                                   struct pagevec *pvec)
 {
        struct vvp_page *vpg = cl2vvp_page(slice);
-       struct cl_page *clp = slice->cpl_page;
-       struct vvp_object *clobj = cl2vvp(clp->cp_obj);
+       struct vvp_object *clobj = cl2vvp(slice->cpl_obj);
 
-       vvp_page_fini_common(vpg);
+       vvp_page_fini_common(vpg, pvec);
        atomic_dec(&clobj->vob_transient_pages);
 }
 
 static const struct cl_page_operations vvp_transient_page_ops = {
-       .cpo_own                = vvp_transient_page_own,
-       .cpo_assume             = vvp_transient_page_assume,
-       .cpo_unassume           = vvp_transient_page_unassume,
-       .cpo_disown             = vvp_transient_page_disown,
        .cpo_discard            = vvp_transient_page_discard,
        .cpo_fini               = vvp_transient_page_fini,
        .cpo_is_vmlocked        = vvp_transient_page_is_vmlocked,
        .cpo_print              = vvp_page_print,
-       .cpo_is_under_lock      = vvp_page_is_under_lock,
-       .io = {
-               [CRT_READ] = {
-                       .cpo_prep       = vvp_transient_page_prep,
-                       .cpo_completion = vvp_transient_page_completion,
-               },
-               [CRT_WRITE] = {
-                       .cpo_prep       = vvp_transient_page_prep,
-                       .cpo_completion = vvp_transient_page_completion,
-               }
-       }
 };
 
 int vvp_page_init(const struct lu_env *env, struct cl_object *obj,
@@ -561,9 +470,8 @@ int vvp_page_init(const struct lu_env *env, struct cl_object *obj,
        CLOBINVRNT(env, obj, vvp_object_invariant(obj));
 
        vpg->vpg_page = vmpage;
-       page_cache_get(vmpage);
+       get_page(vmpage);
 
-       INIT_LIST_HEAD(&vpg->vpg_pending_linkage);
        if (page->cp_type == CPT_CACHEABLE) {
                /* in cache, decref in vvp_page_delete */
                atomic_inc(&page->cp_ref);