Whamcloud - gitweb
LU-1669 vvp: Use lockless __generic_file_aio_write 72/6672/12
authorPrakash Surya <surya1@llnl.gov>
Thu, 3 Oct 2013 00:16:51 +0000 (17:16 -0700)
committerOleg Drokin <oleg.drokin@intel.com>
Fri, 12 Sep 2014 17:38:37 +0000 (17:38 +0000)
Testing multi-threaded single shard file write performance has shown
the inode mutex to be a limiting factor when using the
generic_file_aio_write function. To work around this bottleneck, this
change replaces the locked version of that call with the lockless
version, specifically, __generic_file_aio_write.

In order to maintain POSIX consistency, Lustre must now employ its
own locking mechanism in the higher layers. Currently writes are
protected using the lli_write_mutex in the ll_inode_info structure.
To protect against simultaneous write and truncate operations, since
we no longer take the inode mutex during writes, we must down the
lli_trunc_sem semaphore.

Unfortunately, this change by itself does not garner any performance
benefits. Using FIO on a single machine with 32 GB of RAM, write
performance tests were run with and without this change applied; the
results are below:

    +---------+-----------+---------+--------+--------+
    |     fio v2.0.13     |   Write Bandwidth (KB/s)  |
    +---------+-----------+---------+--------+--------+
    | # Tasks | GB / Task | Test 1  | Test 2 | Test 3 |
    +---------+-----------+---------+--------+--------+
    |    1    |    64     |  452446 | 454623 | 457653 |
    |    2    |    32     |  850318 | 565373 | 602498 |
    |    4    |    16     | 1058900 | 463546 | 529107 |
    |    8    |     8     | 1026300 | 468190 | 576451 |
    |   16    |     4     | 1065500 | 503160 | 462902 |
    |   32    |     2     | 1068600 | 462228 | 466963 |
    |   64    |     1     |  991830 | 556618 | 557863 |
    +---------+-----------+---------+--------+--------+

 * Test 1: Lustre client running 04ec54f. File per process write
           workload. This test was used as a baseline for what we
           _could_ achieve in the single shared file tests if the
           bottlenecks were removed.

 * Test 2: Lustre client running 04ec54f. Single shared file
           workload, each task writing to a unique region.

 * Test 3: Lustre client running 04ec54f + this patch. Single shared
           file workload, each task writing to a unique region.

In order to garner any real performance benefits out of a single
shared file workload, the lli_write_mutex needs to be broken up into a
range lock. That would allow write operations to unique regions of a
file to be executed concurrently. This work is left to be done in a
follow up patch.

Signed-off-by: Prakash Surya <surya1@llnl.gov>
Change-Id: I0023132b5d941b3304f39f015f95106542998072
Reviewed-on: http://review.whamcloud.com/6672
Tested-by: Jenkins
Tested-by: Maloo <hpdd-maloo@intel.com>
Reviewed-by: Lai Siyao <lai.siyao@intel.com>
Reviewed-by: Andreas Dilger <andreas.dilger@intel.com>
Reviewed-by: Jinshan Xiong <jinshan.xiong@intel.com>
Reviewed-by: Oleg Drokin <oleg.drokin@intel.com>
lustre/llite/rw26.c
lustre/llite/vvp_io.c
lustre/llite/vvp_page.c
lustre/obdclass/cl_page.c

index b605fa4..b9c8293 100644 (file)
@@ -412,13 +412,6 @@ static ssize_t ll_direct_IO_26(int rw, struct kiocb *iocb,
         io = ccc_env_io(env)->cui_cl.cis_io;
         LASSERT(io != NULL);
 
-       /* 0. Need locking between buffered and direct access. and race with
-        *    size changing by concurrent truncates and writes.
-        * 1. Need inode mutex to operate transient pages.
-        */
-       if (rw == READ)
-               mutex_lock(&inode->i_mutex);
-
         LASSERT(obj->cob_transient_pages == 0);
         for (seg = 0; seg < nr_segs; seg++) {
                 long iov_left = iov[seg].iov_len;
@@ -480,8 +473,6 @@ static ssize_t ll_direct_IO_26(int rw, struct kiocb *iocb,
         }
 out:
        LASSERT(obj->cob_transient_pages == 0);
-       if (rw == READ)
-               mutex_unlock(&inode->i_mutex);
 
         if (tot_bytes > 0) {
                struct ccc_io *cio = ccc_env_io(env);
index df42e28..728f802 100644 (file)
@@ -800,14 +800,33 @@ static int vvp_io_write_start(const struct lu_env *env,
                LASSERT(cio->cui_iocb->ki_pos == pos);
        }
 
-        CDEBUG(D_VFSTRACE, "write: [%lli, %lli)\n", pos, pos + (long long)cnt);
+       CDEBUG(D_VFSTRACE, "write: [%lli, %lli)\n", pos, pos + (long long)cnt);
 
-        if (cio->cui_iov == NULL) /* from a temp io in ll_cl_init(). */
-                result = 0;
-        else
-               result = generic_file_aio_write(cio->cui_iocb,
-                                               cio->cui_iov, cio->cui_nrsegs,
-                                               cio->cui_iocb->ki_pos);
+       if (cio->cui_iov == NULL) {
+               /* from a temp io in ll_cl_init(). */
+               result = 0;
+       } else {
+               /*
+                * When using the locked AIO function (generic_file_aio_write())
+                * testing has shown the inode mutex to be a limiting factor
+                * with multi-threaded single shared file performance. To get
+                * around this, we now use the lockless version. To maintain
+                * consistency, proper locking to protect against writes,
+                * truncates, etc. is handled in the higher layers of lustre.
+                */
+               result = __generic_file_aio_write(cio->cui_iocb,
+                                                 cio->cui_iov, cio->cui_nrsegs,
+                                                 &cio->cui_iocb->ki_pos);
+               if (result > 0 || result == -EIOCBQUEUED) {
+                       ssize_t err;
+
+                       err = generic_write_sync(cio->cui_iocb->ki_filp,
+                                                pos, result);
+                       if (err < 0 && result > 0)
+                               result = err;
+               }
+
+       }
        if (result > 0) {
                result = vvp_io_write_commit(env, io);
                if (cio->u.write.cui_written > 0) {
index d031f8b..158b7fe 100644 (file)
@@ -424,9 +424,6 @@ static const struct cl_page_operations vvp_page_ops = {
 
 static void vvp_transient_page_verify(const struct cl_page *page)
 {
-       struct inode *inode = ccc_object_inode(page->cp_obj);
-
-       LASSERT(!mutex_trylock(&inode->i_mutex));
 }
 
 static int vvp_transient_page_own(const struct lu_env *env,
@@ -500,7 +497,6 @@ static void vvp_transient_page_fini(const struct lu_env *env,
        struct ccc_object *clobj = cl2ccc(clp->cp_obj);
 
        vvp_page_fini_common(cp);
-       LASSERT(!mutex_trylock(&clobj->cob_inode->i_mutex));
        clobj->cob_transient_pages--;
 }
 
@@ -548,7 +544,6 @@ int vvp_page_init(const struct lu_env *env, struct cl_object *obj,
        } else {
                struct ccc_object *clobj = cl2ccc(obj);
 
-               LASSERT(!mutex_trylock(&clobj->cob_inode->i_mutex));
                cl_page_slice_add(page, &cpg->cpg_cl, obj, index,
                                &vvp_transient_page_ops);
                clobj->cob_transient_pages++;
index 6e70d46..7badb8b 100644 (file)
@@ -278,11 +278,6 @@ EXPORT_SYMBOL(cl_page_find);
 
 static inline int cl_page_invariant(const struct cl_page *pg)
 {
-       /*
-        * Page invariant is protected by a VM lock.
-        */
-       LINVRNT(cl_page_is_vmlocked(NULL, pg));
-
        return cl_page_in_use_noref(pg);
 }
 
@@ -958,7 +953,6 @@ void cl_page_completion(const struct lu_env *env,
                                (const struct lu_env *,
                                 const struct cl_page_slice *, int), ioret);
         if (anchor) {
-                LASSERT(cl_page_is_vmlocked(env, pg));
                 LASSERT(pg->cp_sync_io == anchor);
                 pg->cp_sync_io = NULL;
        }