Whamcloud - gitweb
LU-6271 osc: handle osc eviction correctly
[fs/lustre-release.git] / lustre / osc / osc_object.c
index 728b758..16bb564 100644 (file)
@@ -75,16 +75,11 @@ static int osc_object_init(const struct lu_env *env, struct lu_object *obj,
 {
         struct osc_object           *osc   = lu2osc(obj);
         const struct cl_object_conf *cconf = lu2cl_conf(conf);
-        int i;
 
         osc->oo_oinfo = cconf->u.coc_oinfo;
 #ifdef CONFIG_LUSTRE_DEBUG_EXPENSIVE_CHECK
        mutex_init(&osc->oo_debug_mutex);
 #endif
-       spin_lock_init(&osc->oo_seatbelt);
-        for (i = 0; i < CRT_NR; ++i)
-               INIT_LIST_HEAD(&osc->oo_inflight[i]);
-
        INIT_LIST_HEAD(&osc->oo_ready_item);
        INIT_LIST_HEAD(&osc->oo_hp_ready_item);
        INIT_LIST_HEAD(&osc->oo_write_item);
@@ -102,6 +97,9 @@ static int osc_object_init(const struct lu_env *env, struct lu_object *obj,
        spin_lock_init(&osc->oo_ol_spin);
        INIT_LIST_HEAD(&osc->oo_ol_list);
 
+       atomic_set(&osc->oo_nr_ios, 0);
+       init_waitqueue_head(&osc->oo_io_waitq);
+
        cl_object_page_init(lu2cl(obj), sizeof(struct osc_page));
 
        return 0;
@@ -110,10 +108,6 @@ static int osc_object_init(const struct lu_env *env, struct lu_object *obj,
 static void osc_object_free(const struct lu_env *env, struct lu_object *obj)
 {
        struct osc_object *osc = lu2osc(obj);
-       int i;
-
-       for (i = 0; i < CRT_NR; ++i)
-               LASSERT(list_empty(&osc->oo_inflight[i]));
 
        LASSERT(list_empty(&osc->oo_ready_item));
        LASSERT(list_empty(&osc->oo_hp_ready_item));
@@ -128,6 +122,7 @@ static void osc_object_free(const struct lu_env *env, struct lu_object *obj)
        LASSERT(atomic_read(&osc->oo_nr_reads) == 0);
        LASSERT(atomic_read(&osc->oo_nr_writes) == 0);
        LASSERT(list_empty(&osc->oo_ol_list));
+       LASSERT(atomic_read(&osc->oo_nr_ios) == 0);
 
        lu_object_fini(obj);
        OBD_SLAB_FREE_PTR(osc, osc_object_kmem);
@@ -230,6 +225,116 @@ static int osc_object_prune(const struct lu_env *env, struct cl_object *obj)
                              osc_object_ast_clear, osc);
        return 0;
 }
+/**
+ * Find any ldlm lock that covers the osc object.
+ *
+ * Builds the ldlm resource name from the object's loi_oi and hands \a iter
+ * and \a data to ldlm_resource_iterate() for that resource, using the
+ * namespace of the obd device reached through \a obj.
+ *
+ * \param[in] env      execution environment (not referenced in this function)
+ * \param[in] obj      cl_object whose osc object id names the resource
+ * \param[in] iter     callback passed through to ldlm_resource_iterate()
+ * \param[in] data     opaque argument passed through along with \a iter
+ *
+ * \retval 0   not found (ldlm_resource_iterate() returned LDLM_ITER_CONTINUE)
+ * \retval 1   found one (ldlm_resource_iterate() returned LDLM_ITER_STOP)
+ * \retval < 0 error (any other ldlm_resource_iterate() result is returned
+ *             unchanged)
+ */
+static int osc_object_find_cbdata(const struct lu_env *env,
+                                 struct cl_object *obj, ldlm_iterator_t iter,
+                                 void *data)
+{
+       struct ldlm_res_id              res_id;
+       struct obd_device               *obd;
+       int                             rc = 0;
+
+       ostid_build_res_name(&cl2osc(obj)->oo_oinfo->loi_oi, &res_id);
+       obd = obj->co_lu.lo_dev->ld_obd;
+       rc = ldlm_resource_iterate(obd->obd_namespace, &res_id, iter, data);
+       if (rc == LDLM_ITER_STOP)
+               return 1;
+
+       if (rc == LDLM_ITER_CONTINUE)
+               return 0;
+
+       return rc;
+}
+/**
+ * Fetch the FIEMAP extent mapping of an osc object from its OST.
+ *
+ * Packs \a fmkey and \a fiemap into an OST_GET_INFO request (format
+ * RQF_OST_GET_INFO_FIEMAP), submits it with ptlrpc_queue_wait() and copies
+ * *\a buflen bytes of the RMF_FIEMAP_VAL reply field back into \a fiemap.
+ *
+ * When FIEMAP_FLAG_SYNC is set in the key, a cached PR or PW extent lock
+ * covering the requested range is looked up first and held (as PR) for the
+ * duration of the call; if none matches, OBD_FL_SRVLOCK is set in the key's
+ * obdo instead. Without FIEMAP_FLAG_SYNC no lock is looked up at all.
+ *
+ * \param[in]     env     execution environment (not referenced here)
+ * \param[in]     obj     object whose mapping is requested
+ * \param[in,out] fmkey   fiemap key; lfik_oa.o_oi is overwritten with the
+ *                        object id, and lfik_oa.o_valid / o_flags may gain
+ *                        OBD_MD_FLFLAGS / OBD_FL_SRVLOCK
+ * \param[in,out] fiemap  request payload on entry, overwritten with the
+ *                        reply on success
+ * \param[in]     buflen  size in bytes of \a fiemap; only read here
+ *
+ * \retval 0        success
+ * \retval -ENOMEM  request allocation failed
+ * \retval -EPROTO  reply carries no RMF_FIEMAP_VAL field
+ * \retval other    nonzero result of ptlrpc_request_pack() or
+ *                  ptlrpc_queue_wait(), returned unchanged
+ */
+static int osc_object_fiemap(const struct lu_env *env, struct cl_object *obj,
+                            struct ll_fiemap_info_key *fmkey,
+                            struct fiemap *fiemap, size_t *buflen)
+{
+       struct obd_export *exp = osc_export(cl2osc(obj));
+       struct ldlm_res_id resid;
+       union ldlm_policy_data policy;
+       struct lustre_handle lockh;
+       enum ldlm_mode mode = LCK_MINMODE; /* tested at drop_lock; stays
+                                           * LCK_MINMODE unless a cached
+                                           * lock is matched below */
+       struct ptlrpc_request *req;
+       struct fiemap *reply;
+       char *tmp;
+       int rc;
+       ENTRY;
+
+       fmkey->lfik_oa.o_oi = cl2osc(obj)->oo_oinfo->loi_oi;
+       if (!(fmkey->lfik_fiemap.fm_flags & FIEMAP_FLAG_SYNC))
+               goto skip_locking;
+       /* Lock extent start: fm_start masked with PAGE_CACHE_MASK. */
+       policy.l_extent.start = fmkey->lfik_fiemap.fm_start & PAGE_CACHE_MASK;
+       /*
+        * Lock extent end: fm_start + fm_length, plus PAGE_CACHE_SIZE - 1,
+        * masked with PAGE_CACHE_MASK. The test below is the comparison
+        * "OBD_OBJECT_EOF <= that sum" rearranged as a subtraction; when it
+        * holds, the end is set to OBD_OBJECT_EOF and the sum is never
+        * computed (presumably to avoid wrapping -- confirm).
+        */
+       if (OBD_OBJECT_EOF - fmkey->lfik_fiemap.fm_length <=
+           fmkey->lfik_fiemap.fm_start + PAGE_CACHE_SIZE - 1)
+               policy.l_extent.end = OBD_OBJECT_EOF;
+       else
+               policy.l_extent.end = (fmkey->lfik_fiemap.fm_start +
+                                      fmkey->lfik_fiemap.fm_length +
+                                      PAGE_CACHE_SIZE - 1) & PAGE_CACHE_MASK;
+
+       ostid_build_res_name(&fmkey->lfik_oa.o_oi, &resid);
+       mode = ldlm_lock_match(exp->exp_obd->obd_namespace,
+                              LDLM_FL_BLOCK_GRANTED | LDLM_FL_LVB_READY,
+                              &resid, LDLM_EXTENT, &policy,
+                              LCK_PR | LCK_PW, &lockh, 0);
+       if (mode) { /* lock is cached on client */
+               if (mode != LCK_PR) { /* trade the matched reference for a PR
+                                      * one, the mode dropped at drop_lock */
+                       ldlm_lock_addref(&lockh, LCK_PR);
+                       ldlm_lock_decref(&lockh, LCK_PW);
+               }
+       } else { /* no cached lock, needs acquire lock on server side */
+               fmkey->lfik_oa.o_valid |= OBD_MD_FLFLAGS;
+               fmkey->lfik_oa.o_flags |= OBD_FL_SRVLOCK;
+       }
+
+skip_locking:
+       req = ptlrpc_request_alloc(class_exp2cliimp(exp),
+                                  &RQF_OST_GET_INFO_FIEMAP);
+       if (req == NULL)
+               GOTO(drop_lock, rc = -ENOMEM);
+       /*
+        * RMF_FIEMAP_VAL is sized to *buflen for both the client (request)
+        * and the server (reply) side of the capsule.
+        */
+       req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_KEY, RCL_CLIENT,
+                            sizeof(*fmkey));
+       req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_VAL, RCL_CLIENT,
+                            *buflen);
+       req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_VAL, RCL_SERVER,
+                            *buflen);
+
+       rc = ptlrpc_request_pack(req, LUSTRE_OST_VERSION, OST_GET_INFO);
+       if (rc != 0) {
+               ptlrpc_request_free(req);
+               GOTO(drop_lock, rc);
+       }
+       tmp = req_capsule_client_get(&req->rq_pill, &RMF_FIEMAP_KEY);
+       memcpy(tmp, fmkey, sizeof(*fmkey));
+       tmp = req_capsule_client_get(&req->rq_pill, &RMF_FIEMAP_VAL);
+       memcpy(tmp, fiemap, *buflen);
+       ptlrpc_request_set_replen(req);
+
+       rc = ptlrpc_queue_wait(req);
+       if (rc != 0)
+               GOTO(fini_req, rc);
+
+       reply = req_capsule_server_get(&req->rq_pill, &RMF_FIEMAP_VAL);
+       if (reply == NULL)
+               GOTO(fini_req, rc = -EPROTO);
+
+       memcpy(fiemap, reply, *buflen);
+fini_req:
+       ptlrpc_req_finished(req);
+drop_lock:
+       if (mode) /* nonzero only when a cached lock was matched above */
+               ldlm_lock_decref(&lockh, LCK_PR);
+       RETURN(rc);
+}
 
 void osc_object_set_contended(struct osc_object *obj)
 {
@@ -276,7 +381,9 @@ static const struct cl_object_operations osc_ops = {
        .coo_attr_get     = osc_attr_get,
        .coo_attr_update  = osc_attr_update,
        .coo_glimpse      = osc_object_glimpse,
-       .coo_prune        = osc_object_prune
+       .coo_prune        = osc_object_prune,
+       .coo_find_cbdata  = osc_object_find_cbdata,
+       .coo_fiemap       = osc_object_fiemap,
 };
 
 static const struct lu_object_operations osc_lu_obj_ops = {
@@ -305,4 +412,20 @@ struct lu_object *osc_object_alloc(const struct lu_env *env,
        return obj;
 }
 
+int osc_object_invalidate(const struct lu_env *env, struct osc_object *osc)
+{
+       struct l_wait_info lwi = { 0 }; /* NOTE(review): zeroed wait info --
+                                        * presumably "no timeout"; confirm
+                                        * against l_wait_event() */
+       ENTRY;
+       /*
+        * Invalidate \a osc: log the current oo_nr_ios count, wait until it
+        * reads zero, then discard the object's pages. Always returns 0; the
+        * result of osc_cache_truncate_start() is not checked.
+        */
+       CDEBUG(D_INODE, "Invalidate osc object: %p, # of active IOs: %d\n",
+              osc, atomic_read(&osc->oo_nr_ios));
+       /* Sleep on oo_io_waitq until oo_nr_ios is observed to be zero. */
+       l_wait_event(osc->oo_io_waitq, atomic_read(&osc->oo_nr_ios) == 0, &lwi);
+
+       /* Discard all pages of this object.
+        * The truncate is started from offset 0, with NULL passed as the
+        * last argument. */
+       osc_cache_truncate_start(env, osc, 0, NULL);
+
+       RETURN(0);
+}
+
 /** @} osc */