Whamcloud - gitweb
LU-12681 osc: wrong cache of LVB attrs
[fs/lustre-release.git] / lustre / osc / osc_object.c
1 /*
2  * GPL HEADER START
3  *
4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 only,
8  * as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope that it will be useful, but
11  * WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * General Public License version 2 for more details (a copy is included
14  * in the LICENSE file that accompanied this code).
15  *
16  * You should have received a copy of the GNU General Public License
17  * version 2 along with this program; If not, see
18  * http://www.gnu.org/licenses/gpl-2.0.html
19  *
20  * GPL HEADER END
21  */
22 /*
23  * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
24  * Use is subject to license terms.
25  *
26  * Copyright (c) 2011, 2017, Intel Corporation.
27  */
28 /*
29  * This file is part of Lustre, http://www.lustre.org/
30  * Lustre is a trademark of Sun Microsystems, Inc.
31  *
32  * Implementation of cl_object for OSC layer.
33  *
34  *   Author: Nikita Danilov <nikita.danilov@sun.com>
35  *   Author: Jinshan Xiong <jinshan.xiong@intel.com>
36  */
37
38 #define DEBUG_SUBSYSTEM S_OSC
39 #include <lustre_osc.h>
40
41 #include "osc_internal.h"
42
43 /** \addtogroup osc
44  *  @{
45  */
46
47 /*****************************************************************************
48  *
49  * Object operations.
50  *
51  */
52 static void osc_obj_build_res_name(struct osc_object *osc,
53                                    struct ldlm_res_id *resname)
54 {
55         ostid_build_res_name(&osc->oo_oinfo->loi_oi, resname);
56 }
57
58 static const struct osc_object_operations osc_object_ops = {
59         .oto_build_res_name = osc_obj_build_res_name,
60         .oto_dlmlock_at_pgoff = osc_obj_dlmlock_at_pgoff,
61 };
62
63 int osc_object_init(const struct lu_env *env, struct lu_object *obj,
64                     const struct lu_object_conf *conf)
65 {
66         struct osc_object           *osc   = lu2osc(obj);
67         const struct cl_object_conf *cconf = lu2cl_conf(conf);
68
69         osc->oo_oinfo = cconf->u.coc_oinfo;
70 #ifdef CONFIG_LUSTRE_DEBUG_EXPENSIVE_CHECK
71         mutex_init(&osc->oo_debug_mutex);
72 #endif
73         INIT_LIST_HEAD(&osc->oo_ready_item);
74         INIT_LIST_HEAD(&osc->oo_hp_ready_item);
75         INIT_LIST_HEAD(&osc->oo_write_item);
76         INIT_LIST_HEAD(&osc->oo_read_item);
77
78         osc->oo_root.rb_node = NULL;
79         INIT_LIST_HEAD(&osc->oo_hp_exts);
80         INIT_LIST_HEAD(&osc->oo_urgent_exts);
81         INIT_LIST_HEAD(&osc->oo_full_exts);
82         INIT_LIST_HEAD(&osc->oo_reading_exts);
83         atomic_set(&osc->oo_nr_reads, 0);
84         atomic_set(&osc->oo_nr_writes, 0);
85         spin_lock_init(&osc->oo_lock);
86         spin_lock_init(&osc->oo_tree_lock);
87         spin_lock_init(&osc->oo_ol_spin);
88         INIT_LIST_HEAD(&osc->oo_ol_list);
89
90         atomic_set(&osc->oo_nr_ios, 0);
91         init_waitqueue_head(&osc->oo_io_waitq);
92
93         LASSERT(osc->oo_obj_ops != NULL);
94
95         cl_object_page_init(lu2cl(obj), sizeof(struct osc_page));
96
97         return 0;
98 }
99 EXPORT_SYMBOL(osc_object_init);
100
101 void osc_object_free(const struct lu_env *env, struct lu_object *obj)
102 {
103         struct osc_object *osc = lu2osc(obj);
104
105         LASSERT(list_empty(&osc->oo_ready_item));
106         LASSERT(list_empty(&osc->oo_hp_ready_item));
107         LASSERT(list_empty(&osc->oo_write_item));
108         LASSERT(list_empty(&osc->oo_read_item));
109
110         LASSERT(osc->oo_root.rb_node == NULL);
111         LASSERT(list_empty(&osc->oo_hp_exts));
112         LASSERT(list_empty(&osc->oo_urgent_exts));
113         LASSERT(list_empty(&osc->oo_full_exts));
114         LASSERT(list_empty(&osc->oo_reading_exts));
115         LASSERT(atomic_read(&osc->oo_nr_reads) == 0);
116         LASSERT(atomic_read(&osc->oo_nr_writes) == 0);
117         LASSERT(list_empty(&osc->oo_ol_list));
118         LASSERT(atomic_read(&osc->oo_nr_ios) == 0);
119
120         lu_object_fini(obj);
121         OBD_SLAB_FREE_PTR(osc, osc_object_kmem);
122 }
123 EXPORT_SYMBOL(osc_object_free);
124
125 int osc_lvb_print(const struct lu_env *env, void *cookie,
126                   lu_printer_t p, const struct ost_lvb *lvb)
127 {
128         return (*p)(env, cookie, "size: %llu mtime: %llu atime: %llu "
129                     "ctime: %llu blocks: %llu",
130                     lvb->lvb_size, lvb->lvb_mtime, lvb->lvb_atime,
131                     lvb->lvb_ctime, lvb->lvb_blocks);
132 }
133 EXPORT_SYMBOL(osc_lvb_print);
134
135 int osc_object_print(const struct lu_env *env, void *cookie,
136                      lu_printer_t p, const struct lu_object *obj)
137 {
138         struct osc_object *osc = lu2osc(obj);
139         struct lov_oinfo *oinfo = osc->oo_oinfo;
140         struct osc_async_rc *ar = &oinfo->loi_ar;
141
142         (*p)(env, cookie, "id: "DOSTID" "
143              "idx: %d gen: %d kms_valid: %u kms %llu "
144              "rc: %d force_sync: %d min_xid: %llu ",
145              POSTID(&oinfo->loi_oi), oinfo->loi_ost_idx,
146              oinfo->loi_ost_gen, oinfo->loi_kms_valid, oinfo->loi_kms,
147              ar->ar_rc, ar->ar_force_sync, ar->ar_min_xid);
148         osc_lvb_print(env, cookie, p, &oinfo->loi_lvb);
149         return 0;
150 }
151 EXPORT_SYMBOL(osc_object_print);
152
153
154 int osc_attr_get(const struct lu_env *env, struct cl_object *obj,
155                  struct cl_attr *attr)
156 {
157         struct lov_oinfo *oinfo = cl2osc(obj)->oo_oinfo;
158
159         cl_lvb2attr(attr, &oinfo->loi_lvb);
160         attr->cat_kms = oinfo->loi_kms_valid ? oinfo->loi_kms : 0;
161         return 0;
162 }
163 EXPORT_SYMBOL(osc_attr_get);
164
165 int osc_attr_update(const struct lu_env *env, struct cl_object *obj,
166                     const struct cl_attr *attr, unsigned valid)
167 {
168         struct lov_oinfo *oinfo = cl2osc(obj)->oo_oinfo;
169         struct ost_lvb   *lvb   = &oinfo->loi_lvb;
170
171         if (valid & CAT_SIZE)
172                 lvb->lvb_size = attr->cat_size;
173         if (valid & CAT_MTIME)
174                 lvb->lvb_mtime = attr->cat_mtime;
175         if (valid & CAT_ATIME)
176                 lvb->lvb_atime = attr->cat_atime;
177         if (valid & CAT_CTIME)
178                 lvb->lvb_ctime = attr->cat_ctime;
179         if (valid & CAT_BLOCKS)
180                 lvb->lvb_blocks = attr->cat_blocks;
181         if (valid & CAT_KMS) {
182                 CDEBUG(D_CACHE, "set kms from %lluto %llu\n",
183                        oinfo->loi_kms, (__u64)attr->cat_kms);
184                 loi_kms_set(oinfo, attr->cat_kms);
185         }
186         return 0;
187 }
188 EXPORT_SYMBOL(osc_attr_update);
189
190 int osc_object_glimpse(const struct lu_env *env, const struct cl_object *obj,
191                        struct ost_lvb *lvb)
192 {
193         struct lov_oinfo *oinfo = cl2osc(obj)->oo_oinfo;
194
195         lvb->lvb_size = oinfo->loi_kms;
196         lvb->lvb_blocks = oinfo->loi_lvb.lvb_blocks;
197         return 0;
198 }
199 EXPORT_SYMBOL(osc_object_glimpse);
200
201 static int osc_object_ast_clear(struct ldlm_lock *lock, void *data)
202 {
203         struct osc_object *osc = (struct osc_object *)data;
204         struct ost_lvb *lvb = lock->l_lvb_data;
205         struct lov_oinfo *oinfo;
206         ENTRY;
207
208         if (lock->l_ast_data == data) {
209                 lock->l_ast_data = NULL;
210
211                 LASSERT(osc != NULL);
212                 LASSERT(osc->oo_oinfo != NULL);
213                 LASSERT(lvb != NULL);
214
215                 /* Updates lvb in lock by the cached oinfo */
216                 oinfo = osc->oo_oinfo;
217                 cl_object_attr_lock(&osc->oo_cl);
218                 memcpy(lvb, &oinfo->loi_lvb, sizeof(oinfo->loi_lvb));
219                 cl_object_attr_unlock(&osc->oo_cl);
220
221                 LDLM_DEBUG(lock, "update lvb size %llu blocks %llu [cma]time: "
222                            "%llu %llu %llu", lvb->lvb_size, lvb->lvb_blocks,
223                            lvb->lvb_ctime, lvb->lvb_mtime, lvb->lvb_atime);
224
225                 ldlm_clear_lvb_cached(lock);
226         }
227         RETURN(LDLM_ITER_CONTINUE);
228 }
229
230 int osc_object_prune(const struct lu_env *env, struct cl_object *obj)
231 {
232         struct osc_object  *osc = cl2osc(obj);
233         struct ldlm_res_id *resname = &osc_env_info(env)->oti_resname;
234
235         /* DLM locks don't hold a reference of osc_object so we have to
236          * clear it before the object is being destroyed. */
237         osc_build_res_name(osc, resname);
238         ldlm_resource_iterate(osc_export(osc)->exp_obd->obd_namespace, resname,
239                               osc_object_ast_clear, osc);
240         return 0;
241 }
242 EXPORT_SYMBOL(osc_object_prune);
243
244 static int osc_object_fiemap(const struct lu_env *env, struct cl_object *obj,
245                              struct ll_fiemap_info_key *fmkey,
246                              struct fiemap *fiemap, size_t *buflen)
247 {
248         struct obd_export *exp = osc_export(cl2osc(obj));
249         struct ldlm_res_id resid;
250         union ldlm_policy_data policy;
251         struct lustre_handle lockh;
252         enum ldlm_mode mode = LCK_MINMODE;
253         struct ptlrpc_request *req;
254         struct fiemap *reply;
255         char *tmp;
256         int rc;
257         ENTRY;
258
259         fmkey->lfik_oa.o_oi = cl2osc(obj)->oo_oinfo->loi_oi;
260         if (!(fmkey->lfik_fiemap.fm_flags & FIEMAP_FLAG_SYNC))
261                 goto skip_locking;
262
263         policy.l_extent.start = fmkey->lfik_fiemap.fm_start & PAGE_MASK;
264
265         if (OBD_OBJECT_EOF - fmkey->lfik_fiemap.fm_length <=
266             fmkey->lfik_fiemap.fm_start + PAGE_SIZE - 1)
267                 policy.l_extent.end = OBD_OBJECT_EOF;
268         else
269                 policy.l_extent.end = (fmkey->lfik_fiemap.fm_start +
270                                        fmkey->lfik_fiemap.fm_length +
271                                        PAGE_SIZE - 1) & PAGE_MASK;
272
273         ostid_build_res_name(&fmkey->lfik_oa.o_oi, &resid);
274         mode = ldlm_lock_match(exp->exp_obd->obd_namespace,
275                                LDLM_FL_BLOCK_GRANTED | LDLM_FL_LVB_READY,
276                                &resid, LDLM_EXTENT, &policy,
277                                LCK_PR | LCK_PW, &lockh, 0);
278         if (mode) { /* lock is cached on client */
279                 if (mode != LCK_PR) {
280                         ldlm_lock_addref(&lockh, LCK_PR);
281                         ldlm_lock_decref(&lockh, LCK_PW);
282                 }
283         } else { /* no cached lock, needs acquire lock on server side */
284                 fmkey->lfik_oa.o_valid |= OBD_MD_FLFLAGS;
285                 fmkey->lfik_oa.o_flags |= OBD_FL_SRVLOCK;
286         }
287
288 skip_locking:
289         req = ptlrpc_request_alloc(class_exp2cliimp(exp),
290                                    &RQF_OST_GET_INFO_FIEMAP);
291         if (req == NULL)
292                 GOTO(drop_lock, rc = -ENOMEM);
293
294         req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_KEY, RCL_CLIENT,
295                              sizeof(*fmkey));
296         req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_VAL, RCL_CLIENT,
297                              *buflen);
298         req_capsule_set_size(&req->rq_pill, &RMF_FIEMAP_VAL, RCL_SERVER,
299                              *buflen);
300
301         rc = ptlrpc_request_pack(req, LUSTRE_OST_VERSION, OST_GET_INFO);
302         if (rc != 0) {
303                 ptlrpc_request_free(req);
304                 GOTO(drop_lock, rc);
305         }
306         tmp = req_capsule_client_get(&req->rq_pill, &RMF_FIEMAP_KEY);
307         memcpy(tmp, fmkey, sizeof(*fmkey));
308         tmp = req_capsule_client_get(&req->rq_pill, &RMF_FIEMAP_VAL);
309         memcpy(tmp, fiemap, *buflen);
310         ptlrpc_request_set_replen(req);
311
312         rc = ptlrpc_queue_wait(req);
313         if (rc != 0)
314                 GOTO(fini_req, rc);
315
316         reply = req_capsule_server_get(&req->rq_pill, &RMF_FIEMAP_VAL);
317         if (reply == NULL)
318                 GOTO(fini_req, rc = -EPROTO);
319
320         memcpy(fiemap, reply, *buflen);
321 fini_req:
322         ptlrpc_req_finished(req);
323 drop_lock:
324         if (mode)
325                 ldlm_lock_decref(&lockh, LCK_PR);
326         RETURN(rc);
327 }
328
329 int osc_object_is_contended(struct osc_object *obj)
330 {
331         struct osc_device *dev = lu2osc_dev(obj->oo_cl.co_lu.lo_dev);
332         time64_t osc_contention_time = dev->od_contention_time;
333         ktime_t retry_time;
334
335         if (OBD_FAIL_CHECK(OBD_FAIL_OSC_OBJECT_CONTENTION))
336                 return 1;
337
338         if (!obj->oo_contended)
339                 return 0;
340
341         /*
342          * I like copy-paste. the code is copied from
343          * ll_file_is_contended.
344          */
345         retry_time = ktime_add_ns(obj->oo_contention_time,
346                                   osc_contention_time * NSEC_PER_SEC);
347         if (ktime_after(ktime_get(), retry_time)) {
348                 osc_object_clear_contended(obj);
349                 return 0;
350         }
351         return 1;
352 }
353 EXPORT_SYMBOL(osc_object_is_contended);
354
355 /**
356  * Implementation of struct cl_object_operations::coo_req_attr_set() for osc
357  * layer. osc is responsible for struct obdo::o_id and struct obdo::o_seq
358  * fields.
359  */
360 static void osc_req_attr_set(const struct lu_env *env, struct cl_object *obj,
361                              struct cl_req_attr *attr)
362 {
363         struct lov_oinfo *oinfo;
364         struct obdo      *oa;
365         struct ost_lvb   *lvb;
366         u64               flags = attr->cra_flags;
367
368         oinfo   = cl2osc(obj)->oo_oinfo;
369         lvb     = &oinfo->loi_lvb;
370         oa      = attr->cra_oa;
371
372         if ((flags & OBD_MD_FLMTIME) != 0) {
373                 oa->o_mtime = lvb->lvb_mtime;
374                 oa->o_valid |= OBD_MD_FLMTIME;
375         }
376         if ((flags & OBD_MD_FLATIME) != 0) {
377                 oa->o_atime = lvb->lvb_atime;
378                 oa->o_valid |= OBD_MD_FLATIME;
379         }
380         if ((flags & OBD_MD_FLCTIME) != 0) {
381                 oa->o_ctime = lvb->lvb_ctime;
382                 oa->o_valid |= OBD_MD_FLCTIME;
383         }
384         if (flags & OBD_MD_FLGROUP) {
385                 ostid_set_seq(&oa->o_oi, ostid_seq(&oinfo->loi_oi));
386                 oa->o_valid |= OBD_MD_FLGROUP;
387         }
388         if (flags & OBD_MD_FLID) {
389                 int rc;
390
391                 rc = ostid_set_id(&oa->o_oi, ostid_id(&oinfo->loi_oi));
392                 if (rc) {
393                         CERROR("Bad %llu to set " DOSTID " : rc %d\n",
394                                (unsigned long long)ostid_id(&oinfo->loi_oi),
395                                POSTID(&oa->o_oi), rc);
396                 }
397                 oa->o_valid |= OBD_MD_FLID;
398         }
399         if (flags & OBD_MD_FLHANDLE) {
400                 struct ldlm_lock *lock;
401                 struct osc_page *opg;
402
403                 opg = osc_cl_page_osc(attr->cra_page, cl2osc(obj));
404                 lock = osc_dlmlock_at_pgoff(env, cl2osc(obj), osc_index(opg),
405                                 OSC_DAP_FL_TEST_LOCK | OSC_DAP_FL_CANCELING);
406                 if (lock == NULL && !opg->ops_srvlock) {
407                         struct ldlm_resource *res;
408                         struct ldlm_res_id *resname;
409
410                         CL_PAGE_DEBUG(D_ERROR, env, attr->cra_page,
411                                       "uncovered page!\n");
412
413                         resname = &osc_env_info(env)->oti_resname;
414                         ostid_build_res_name(&oinfo->loi_oi, resname);
415                         res = ldlm_resource_get(
416                                 osc_export(cl2osc(obj))->exp_obd->obd_namespace,
417                                 NULL, resname, LDLM_EXTENT, 0);
418                         ldlm_resource_dump(D_ERROR, res);
419
420                         libcfs_debug_dumpstack(NULL);
421                         LBUG();
422                 }
423
424                 /* check for lockless io. */
425                 if (lock != NULL) {
426                         oa->o_handle = lock->l_remote_handle;
427                         oa->o_valid |= OBD_MD_FLHANDLE;
428                         LDLM_LOCK_PUT(lock);
429                 }
430         }
431 }
432
433 static const struct cl_object_operations osc_ops = {
434         .coo_page_init    = osc_page_init,
435         .coo_lock_init    = osc_lock_init,
436         .coo_io_init      = osc_io_init,
437         .coo_attr_get     = osc_attr_get,
438         .coo_attr_update  = osc_attr_update,
439         .coo_glimpse      = osc_object_glimpse,
440         .coo_prune        = osc_object_prune,
441         .coo_fiemap       = osc_object_fiemap,
442         .coo_req_attr_set = osc_req_attr_set
443 };
444
445 static const struct lu_object_operations osc_lu_obj_ops = {
446         .loo_object_init      = osc_object_init,
447         .loo_object_release   = NULL,
448         .loo_object_free      = osc_object_free,
449         .loo_object_print     = osc_object_print,
450         .loo_object_invariant = NULL
451 };
452
453 struct lu_object *osc_object_alloc(const struct lu_env *env,
454                                    const struct lu_object_header *unused,
455                                    struct lu_device *dev)
456 {
457         struct osc_object *osc;
458         struct lu_object  *obj;
459
460         OBD_SLAB_ALLOC_PTR_GFP(osc, osc_object_kmem, GFP_NOFS);
461         if (osc != NULL) {
462                 obj = osc2lu(osc);
463                 lu_object_init(obj, NULL, dev);
464                 osc->oo_cl.co_ops = &osc_ops;
465                 obj->lo_ops = &osc_lu_obj_ops;
466                 osc->oo_obj_ops = &osc_object_ops;
467         } else
468                 obj = NULL;
469         return obj;
470 }
471
472 int osc_object_invalidate(const struct lu_env *env, struct osc_object *osc)
473 {
474         struct l_wait_info lwi = { 0 };
475         ENTRY;
476
477         CDEBUG(D_INODE, "Invalidate osc object: %p, # of active IOs: %d\n",
478                osc, atomic_read(&osc->oo_nr_ios));
479
480         l_wait_event(osc->oo_io_waitq, atomic_read(&osc->oo_nr_ios) == 0, &lwi);
481
482         /* Discard all dirty pages of this object. */
483         osc_cache_truncate_start(env, osc, 0, NULL);
484
485         /* Discard all caching pages */
486         osc_lock_discard_pages(env, osc, 0, CL_PAGE_EOF, true);
487
488         /* Clear ast data of dlm lock. Do this after discarding all pages */
489         osc_object_prune(env, osc2cl(osc));
490
491         RETURN(0);
492 }
493 EXPORT_SYMBOL(osc_object_invalidate);
494 /** @} osc */