Whamcloud - gitweb
b=20595
[fs/lustre-release.git] / lustre / lmv / lmv_object.c
1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2  * vim:expandtab:shiftwidth=8:tabstop=8:
3  *
4  * GPL HEADER START
5  *
6  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License version 2 only,
10  * as published by the Free Software Foundation.
11  *
12  * This program is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License version 2 for more details (a copy is included
16  * in the LICENSE file that accompanied this code).
17  *
18  * You should have received a copy of the GNU General Public License
19  * version 2 along with this program; If not, see
20  * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
21  *
22  * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
23  * CA 95054 USA or visit www.sun.com if you need additional information or
24  * have any questions.
25  *
26  * GPL HEADER END
27  */
28 /*
29  * Copyright  2008 Sun Microsystems, Inc. All rights reserved
30  * Use is subject to license terms.
31  */
32 /*
33  * This file is part of Lustre, http://www.lustre.org/
34  * Lustre is a trademark of Sun Microsystems, Inc.
35  */
36
37 #ifndef EXPORT_SYMTAB
38 # define EXPORT_SYMTAB
39 #endif
40 #define DEBUG_SUBSYSTEM S_LMV
41 #ifdef __KERNEL__
42 #include <linux/slab.h>
43 #include <linux/module.h>
44 #include <linux/init.h>
45 #include <linux/slab.h>
46 #include <linux/pagemap.h>
47 #include <asm/div64.h>
48 #include <linux/seq_file.h>
49 #else
50 #include <liblustre.h>
51 #endif
52
53 #include <lustre/lustre_idl.h>
54 #include <obd_support.h>
55 #include <lustre_lib.h>
56 #include <lustre_net.h>
57 #include <lustre_dlm.h>
58 #include <obd_class.h>
59 #include <lprocfs_status.h>
60 #include "lmv_internal.h"
61
62 extern cfs_mem_cache_t *lmv_object_cache;
63 extern atomic_t lmv_object_count;
64
65 static CFS_LIST_HEAD(obj_list);
66 static spinlock_t obj_list_lock = SPIN_LOCK_UNLOCKED;
67
68 struct lmv_object *lmv_object_alloc(struct obd_device *obd,
69                                     const struct lu_fid *fid,
70                                     struct lmv_stripe_md *mea)
71 {
72         struct lmv_obd          *lmv = &obd->u.lmv;
73         unsigned int             obj_size;
74         struct lmv_object       *obj;
75         int                      i;
76
77         LASSERT(mea->mea_magic == MEA_MAGIC_LAST_CHAR
78                 || mea->mea_magic == MEA_MAGIC_ALL_CHARS
79                 || mea->mea_magic == MEA_MAGIC_HASH_SEGMENT);
80
81         OBD_SLAB_ALLOC_PTR(obj, lmv_object_cache);
82         if (!obj)
83                 return NULL;
84
85         atomic_inc(&lmv_object_count);
86
87         obj->lo_fid = *fid;
88         obj->lo_obd = obd;
89         obj->lo_state = 0;
90         obj->lo_hashtype = mea->mea_magic;
91
92         init_MUTEX(&obj->lo_guard);
93         atomic_set(&obj->lo_count, 0);
94         obj->lo_objcount = mea->mea_count;
95
96         obj_size = sizeof(struct lmv_stripe) * 
97                 lmv->desc.ld_tgt_count;
98
99         OBD_ALLOC(obj->lo_stripes, obj_size);
100         if (!obj->lo_stripes)
101                 goto err_obj;
102
103         memset(obj->lo_stripes, 0, obj_size);
104
105         CDEBUG(D_INODE, "Allocate object for "DFID"\n", 
106                PFID(fid));
107         for (i = 0; i < mea->mea_count; i++) {
108                 int rc;
109
110                 CDEBUG(D_INODE, "Process subobject "DFID"\n", 
111                        PFID(&mea->mea_ids[i]));
112                 obj->lo_stripes[i].ls_fid = mea->mea_ids[i];
113                 LASSERT(fid_is_sane(&obj->lo_stripes[i].ls_fid));
114
115                 /*
116                  * Cache slave mds number to use it in all cases it is needed
117                  * instead of constant lookup.
118                  */
119                 rc = lmv_fld_lookup(lmv, &obj->lo_stripes[i].ls_fid,
120                                     &obj->lo_stripes[i].ls_mds);
121                 if (rc)
122                         goto err_obj;
123         }
124
125         return obj;
126 err_obj:
127         OBD_FREE(obj, sizeof(*obj));
128         return NULL;
129 }
130
131 void lmv_object_free(struct lmv_object *obj)
132 {
133         struct lmv_obd          *lmv = &obj->lo_obd->u.lmv;
134         unsigned int             obj_size;
135
136         LASSERT(!atomic_read(&obj->lo_count));
137
138         obj_size = sizeof(struct lmv_stripe) *
139                 lmv->desc.ld_tgt_count;
140
141         OBD_FREE(obj->lo_stripes, obj_size);
142         OBD_SLAB_FREE(obj, lmv_object_cache, sizeof(*obj));
143         atomic_dec(&lmv_object_count);
144 }
145
146 static void __lmv_object_add(struct lmv_object *obj)
147 {
148         atomic_inc(&obj->lo_count);
149         list_add(&obj->lo_list, &obj_list);
150 }
151
152 void lmv_object_add(struct lmv_object *obj)
153 {
154         spin_lock(&obj_list_lock);
155         __lmv_object_add(obj);
156         spin_unlock(&obj_list_lock);
157 }
158
159 static void __lmv_object_del(struct lmv_object *obj)
160 {
161         list_del(&obj->lo_list);
162         lmv_object_free(obj);
163 }
164
165 void lmv_object_del(struct lmv_object *obj)
166 {
167         spin_lock(&obj_list_lock);
168         __lmv_object_del(obj);
169         spin_unlock(&obj_list_lock);
170 }
171
172 static struct lmv_object *__lmv_object_get(struct lmv_object *obj)
173 {
174         LASSERT(obj != NULL);
175         atomic_inc(&obj->lo_count);
176         return obj;
177 }
178
179 struct lmv_object *lmv_object_get(struct lmv_object *obj)
180 {
181         spin_lock(&obj_list_lock);
182         __lmv_object_get(obj);
183         spin_unlock(&obj_list_lock);
184         return obj;
185 }
186
187 static void __lmv_object_put(struct lmv_object *obj)
188 {
189         LASSERT(obj);
190
191         if (atomic_dec_and_test(&obj->lo_count)) {
192                 CDEBUG(D_INODE, "Last reference to "DFID" - "
193                        "destroying\n", PFID(&obj->lo_fid));
194                 __lmv_object_del(obj);
195         }
196 }
197
198 void lmv_object_put(struct lmv_object *obj)
199 {
200         spin_lock(&obj_list_lock);
201         __lmv_object_put(obj);
202         spin_unlock(&obj_list_lock);
203 }
204
205 void lmv_object_put_unlock(struct lmv_object *obj)
206 {
207         lmv_object_unlock(obj);
208         lmv_object_put(obj);
209 }
210
211 static struct lmv_object *__lmv_object_find(struct obd_device *obd, const struct lu_fid *fid)
212 {
213         struct lmv_object       *obj;
214         struct list_head        *cur;
215
216         list_for_each(cur, &obj_list) {
217                 obj = list_entry(cur, struct lmv_object, lo_list);
218
219                 /* 
220                  * Check if object is in destroying phase. If so - skip
221                  * it. 
222                  */
223                 if (obj->lo_state & O_FREEING)
224                         continue;
225
226                 /*
227                  * We should make sure, that we have found object belong to
228                  * passed obd. It is possible that, object manager will have two
229                  * objects with the same fid belong to different obds, if client
230                  * and mds runs on the same host. May be it is good idea to have
231                  * objects list associated with obd.
232                  */
233                 if (obj->lo_obd != obd)
234                         continue;
235
236                 /* 
237                  * Check if this is what we're looking for. 
238                  */
239                 if (lu_fid_eq(&obj->lo_fid, fid))
240                         return __lmv_object_get(obj);
241         }
242
243         return NULL;
244 }
245
246 struct lmv_object *lmv_object_find(struct obd_device *obd, 
247                                    const struct lu_fid *fid)
248 {
249         struct lmv_object       *obj;
250         ENTRY;
251
252         spin_lock(&obj_list_lock);
253         obj = __lmv_object_find(obd, fid);
254         spin_unlock(&obj_list_lock);
255
256         RETURN(obj);
257 }
258
259 struct lmv_object *lmv_object_find_lock(struct obd_device *obd, 
260                                         const struct lu_fid *fid)
261 {
262         struct lmv_object       *obj;
263         ENTRY;
264
265         obj = lmv_object_find(obd, fid);
266         if (obj)
267                 lmv_object_lock(obj);
268
269         RETURN(obj);
270 }
271
272 static struct lmv_object *__lmv_object_create(struct obd_device *obd, 
273                                               const struct lu_fid *fid,
274                                               struct lmv_stripe_md *mea)
275 {
276         struct lmv_object       *new;
277         struct lmv_object       *obj;
278         ENTRY;
279
280         obj = lmv_object_find(obd, fid);
281         if (obj)
282                 RETURN(obj);
283
284         new = lmv_object_alloc(obd, fid, mea);
285         if (!new)
286                 RETURN(NULL);
287
288         /* 
289          * Check if someone created it already while we were dealing with
290          * allocating @obj. 
291          */
292         spin_lock(&obj_list_lock);
293         obj = __lmv_object_find(obd, fid);
294         if (obj) {
295                 /* 
296                  * Someone created it already - put @obj and getting out. 
297                  */
298                 spin_unlock(&obj_list_lock);
299                 lmv_object_free(new);
300                 RETURN(obj);
301         }
302
303         __lmv_object_add(new);
304         __lmv_object_get(new);
305
306         spin_unlock(&obj_list_lock);
307
308         CDEBUG(D_INODE, "New obj in lmv cache: "DFID"\n",
309                PFID(fid));
310
311         RETURN(new);
312 }
313
314 struct lmv_object *lmv_object_create(struct obd_export *exp, 
315                                      const struct lu_fid *fid,
316                                      struct lmv_stripe_md *mea)
317 {
318         struct obd_device       *obd = exp->exp_obd;
319         struct lmv_obd          *lmv = &obd->u.lmv;
320         struct ptlrpc_request   *req = NULL;
321         struct lmv_tgt_desc     *tgt;
322         struct lmv_object       *obj;
323         struct lustre_md         md;
324         int                      mealen;
325         int                      rc;
326         ENTRY;
327
328         CDEBUG(D_INODE, "Get mea for "DFID" and create lmv obj\n",
329                PFID(fid));
330
331         md.mea = NULL;
332         
333         if (mea == NULL) {
334                 __u64 valid;
335
336                 CDEBUG(D_INODE, "Mea isn't passed in, get it now\n");
337                 mealen = lmv_get_easize(lmv);
338
339                 /* 
340                  * Time to update mea of parent fid. 
341                  */
342                 md.mea = NULL;
343                 valid = OBD_MD_FLEASIZE | OBD_MD_FLDIREA | OBD_MD_MEA;
344
345                 tgt = lmv_find_target(lmv, fid);
346                 if (IS_ERR(tgt))
347                         GOTO(cleanup, obj = (void *)tgt);
348
349                 rc = md_getattr(tgt->ltd_exp, fid, NULL, valid, mealen, &req);
350                 if (rc) {
351                         CERROR("md_getattr() failed, error %d\n", rc);
352                         GOTO(cleanup, obj = ERR_PTR(rc));
353                 }
354
355                 rc = md_get_lustre_md(exp, req, NULL, exp, &md);
356                 if (rc) {
357                         CERROR("md_get_lustre_md() failed, error %d\n", rc);
358                         GOTO(cleanup, obj = ERR_PTR(rc));
359                 }
360
361                 if (md.mea == NULL)
362                         GOTO(cleanup, obj = ERR_PTR(-ENODATA));
363
364                 mea = md.mea;
365         }
366
367         /* 
368          * Got mea, now create obj for it. 
369          */
370         obj = __lmv_object_create(obd, fid, mea);
371         if (!obj) {
372                 CERROR("Can't create new object "DFID"\n",
373                        PFID(fid));
374                 GOTO(cleanup, obj = ERR_PTR(-ENOMEM));
375         }
376
377         if (md.mea != NULL)
378                 obd_free_memmd(exp, (void *)&md.mea);
379
380         EXIT;
381 cleanup:
382         if (req)
383                 ptlrpc_req_finished(req);
384         return obj;
385 }
386
387 int lmv_object_delete(struct obd_export *exp, const struct lu_fid *fid)
388 {
389         struct obd_device       *obd = exp->exp_obd;
390         struct lmv_object       *obj;
391         int                      rc = 0;
392         ENTRY;
393
394         spin_lock(&obj_list_lock);
395         obj = __lmv_object_find(obd, fid);
396         if (obj) {
397                 obj->lo_state |= O_FREEING;
398                 __lmv_object_put(obj);
399                 __lmv_object_put(obj);
400                 rc = 1;
401         }
402         spin_unlock(&obj_list_lock);
403         RETURN(rc);
404 }
405
406 int lmv_object_setup(struct obd_device *obd)
407 {
408         ENTRY;
409         LASSERT(obd != NULL);
410
411         CDEBUG(D_INFO, "LMV object manager setup (%s)\n",
412                obd->obd_uuid.uuid);
413
414         RETURN(0);
415 }
416
417 void lmv_object_cleanup(struct obd_device *obd)
418 {
419         struct list_head        *cur;
420         struct list_head        *tmp;
421         struct lmv_object       *obj;
422         ENTRY;
423
424         CDEBUG(D_INFO, "LMV object manager cleanup (%s)\n",
425                obd->obd_uuid.uuid);
426
427         spin_lock(&obj_list_lock);
428         list_for_each_safe(cur, tmp, &obj_list) {
429                 obj = list_entry(cur, struct lmv_object, lo_list);
430
431                 if (obj->lo_obd != obd)
432                         continue;
433
434                 obj->lo_state |= O_FREEING;
435                 if (atomic_read(&obj->lo_count) > 1) {
436                         CERROR("Object "DFID" has count (%d)\n", 
437                                PFID(&obj->lo_fid), atomic_read(&obj->lo_count));
438                 }
439                 __lmv_object_put(obj);
440         }
441         spin_unlock(&obj_list_lock);
442         EXIT;
443 }