Whamcloud - gitweb
Branch HEAD
[fs/lustre-release.git] / lustre / obdclass / llog_obd.c
index 9c9abb7..cc27ba9 100644 (file)
@@ -1,10 +1,25 @@
-
 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
  * vim:expandtab:shiftwidth=8:tabstop=8:
  *
- *   You should have received a copy of the GNU General Public License
- *   along with Lustre; if not, write to the Free Software
- *   Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+ *  Copyright (C) 2005 Cluster File Systems, Inc.
+ *
+ *   This file is part of the Lustre file system, http://www.lustre.org
+ *   Lustre is a trademark of Cluster File Systems, Inc.
+ *
+ *   You may have signed or agreed to another license before downloading
+ *   this software.  If so, you are bound by the terms and conditions
+ *   of that agreement, and the following does not apply to you.  See the
+ *   LICENSE file included with this distribution for more information.
+ *
+ *   If you did not agree to a different license, then this copy of Lustre
+ *   is open source software; you can redistribute it and/or modify it
+ *   under the terms of version 2 of the GNU General Public License as
+ *   published by the Free Software Foundation.
+ *
+ *   In either case, Lustre is distributed in the hope that it will be
+ *   useful, but WITHOUT ANY WARRANTY; without even the implied warranty
+ *   of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *   license text for more details.
  */
 
 #define DEBUG_SUBSYSTEM S_LOG
 #define EXPORT_SYMTAB
 #endif
 
-#ifdef __KERNEL__
-#include <linux/fs.h>
-#else
+#ifndef __KERNEL__
 #include <liblustre.h>
 #endif
 
-#include <linux/obd_class.h>
-#include <linux/lustre_log.h>
-#include <portals/list.h>
+#include <obd_class.h>
+#include <lustre_log.h>
+#include <libcfs/list.h>
 #include "llog_internal.h"
 
 /* helper functions for calling the llog obd methods */
+/*
+ * Allocate a new llog context for @obd.
+ *
+ * On success the context's loc_obd is set to @obd and its reference count
+ * (loc_refcount) is initialised to 1.
+ *
+ * Returns the new context, or NULL if the allocation failed.
+ */
+static struct llog_ctxt* llog_new_ctxt(struct obd_device *obd)
+{
+        struct llog_ctxt *ctxt;
+
+        OBD_ALLOC_PTR(ctxt);
+        if (!ctxt)
+                return NULL;
 
-int llog_setup(struct obd_device *obd, int index, struct obd_device *disk_obd, 
-               int count, struct llog_logid *logid, struct llog_operations *op)
+        ctxt->loc_obd = obd;
+        /* the creator holds the initial reference */
+        atomic_set(&ctxt->loc_refcount, 1);
+
+        return ctxt;
+}
+
+/*
+ * Release the references held by @ctxt and free the context.
+ *
+ * Drops the export reference when loc_exp is set and the import reference
+ * when loc_imp is set, then frees @ctxt itself.  The reference count is not
+ * consulted and the owning group's olg_ctxts[] table is not touched here.
+ * @ctxt must not be used after this returns.
+ */
+static void llog_ctxt_destroy(struct llog_ctxt *ctxt)
+{
+        if (ctxt->loc_exp)
+                class_export_put(ctxt->loc_exp);
+        if (ctxt->loc_imp) {
+                class_import_put(ctxt->loc_imp);
+                ctxt->loc_imp = NULL;
+        }
+
+        OBD_FREE_PTR(ctxt);
+        return;
+}
+
+/*
+ * Drop one reference on @ctxt and tear the context down if it was the last.
+ *
+ * The decrement is performed under the owning group's olg_lock.  If other
+ * references remain, 0 is returned and nothing else happens.  Otherwise the
+ * context's slot in olg_ctxts[] is cleared, the context's cleanup method
+ * (if CTXTP(ctxt, cleanup) is non-NULL) is called, the context is destroyed
+ * and waiters on olg_waitq are woken.
+ *
+ * Returns 0, or the cleanup method's return value when it was invoked.
+ */
+int __llog_ctxt_put(struct llog_ctxt *ctxt)
+{
+        /* fetched up front: olg is still needed after ctxt has been freed */
+        struct obd_llog_group *olg = ctxt->loc_olg;
+        struct obd_device *obd;
+        int rc = 0;
+
+        spin_lock(&olg->olg_lock);
+        if (!atomic_dec_and_test(&ctxt->loc_refcount)) {
+                /* not the last reference: nothing to tear down */
+                spin_unlock(&olg->olg_lock);
+                return rc;
+        }
+        /* last reference: unpublish the ctxt while still holding olg_lock */
+        olg->olg_ctxts[ctxt->loc_idx] = NULL;
+        spin_unlock(&olg->olg_lock);
+
+        obd = ctxt->loc_obd;
+        spin_lock(&obd->obd_dev_lock);
+        spin_unlock(&obd->obd_dev_lock); /* sync with llog ctxt user thread */
+        /* the final put is only expected on a stopping or not-set-up obd */
+        LASSERT(obd->obd_stopping == 1 || obd->obd_set_up == 0);
+        /* cleanup the llog ctxt here */
+        if (CTXTP(ctxt, cleanup))
+                rc = CTXTP(ctxt, cleanup)(ctxt);
+
+        llog_ctxt_destroy(ctxt);
+        /* llog_cleanup() sleeps on this queue until the slot is released */
+        wake_up(&olg->olg_waitq);
+        return rc;
+}
+EXPORT_SYMBOL(__llog_ctxt_put);
+
+/*
+ * Clean up an llog context.
+ *
+ * The caller is expected to hold its own reference on @ctxt in addition to
+ * at least one other (asserted below).  The caller's reference is dropped
+ * first, then a further reference is dropped through __llog_ctxt_put().
+ * Finally the function sleeps on the group's olg_waitq until
+ * llog_group_ctxt_null(olg, idx) holds (presumably: the slot for this
+ * context in the group is NULL -- helper not visible here).
+ *
+ * Returns -ENODEV if @ctxt is NULL, otherwise the value returned by
+ * __llog_ctxt_put().
+ */
+int llog_cleanup(struct llog_ctxt *ctxt)
+{
+        struct l_wait_info lwi = LWI_INTR(LWI_ON_SIGNAL_NOOP, NULL);
+        struct obd_llog_group *olg;
+        int rc, idx;
+        ENTRY;
+
+        if (!ctxt) {
+                CERROR("No ctxt\n");
+                RETURN(-ENODEV);
+        }
+
+        /* remember group and index now: ctxt may be freed by the puts below */
+        olg = ctxt->loc_olg;
+        idx = ctxt->loc_idx;
+
+        /* balance the ctxt get done by the caller of llog_cleanup */
+        LASSERT(atomic_read(&ctxt->loc_refcount) > 1);
+        llog_ctxt_put(ctxt);
+
+        /* try to free the ctxt */
+        rc = __llog_ctxt_put(ctxt);
+
+        /* ctxt must not be dereferenced from here on; use olg/idx only */
+        l_wait_event(olg->olg_waitq,
+                     llog_group_ctxt_null(olg, idx), &lwi);
+
+        RETURN(rc);
+}
+EXPORT_SYMBOL(llog_cleanup);
+
+int llog_setup(struct obd_device *obd,  struct obd_llog_group *olg, int index,
+               struct obd_device *disk_obd, int count, struct llog_logid *logid,
+               struct llog_operations *op)
 {
         int rc = 0;
         struct llog_ctxt *ctxt;
@@ -36,47 +133,52 @@ int llog_setup(struct obd_device *obd, int index, struct obd_device *disk_obd,
         if (index < 0 || index >= LLOG_MAX_CTXTS)
                 RETURN(-EFAULT);
 
-        OBD_ALLOC(ctxt, sizeof(*ctxt));
+        LASSERT(olg != NULL);
+        ctxt = llog_group_get_ctxt(olg, index);
+
+        /* in some recovery cases, obd_llog_ctxt might already be set,
+         * but llogs might still be zero, for example in obd_filter recovery */
+        if (ctxt) {
+                /* mds_lov_update_mds might call here multiple times. So if the
+                   llog is already set up then don't do it again. */
+                CDEBUG(D_CONFIG, "obd %s ctxt %d already set up\n",
+                       obd->obd_name, index);
+                LASSERT(ctxt->loc_olg == olg);
+                LASSERT(ctxt->loc_obd == obd);
+                LASSERT(ctxt->loc_exp == disk_obd->obd_self_export);
+                LASSERT(ctxt->loc_logops == op);
+                llog_ctxt_put(ctxt);
+                GOTO(out, rc = 0);
+        }
+        ctxt = llog_new_ctxt(obd);
         if (!ctxt)
-                RETURN(-ENOMEM);
+                GOTO(out, rc = -ENOMEM);
 
-        obd->obd_llog_ctxt[index] = ctxt;
+        rc = llog_group_set_ctxt(olg, ctxt, index);
+        if (rc) {
+                llog_ctxt_destroy(ctxt);
+                if (rc == -EEXIST)
+                        rc = 0;
+                GOTO(out, rc);
+        }
         ctxt->loc_obd = obd;
         ctxt->loc_exp = class_export_get(disk_obd->obd_self_export);
+        ctxt->loc_olg = olg;
         ctxt->loc_idx = index;
         ctxt->loc_logops = op;
         sema_init(&ctxt->loc_sem, 1);
 
         if (op->lop_setup)
-                rc = op->lop_setup(obd, index, disk_obd, count, logid);
-        if (ctxt && rc) 
-                OBD_FREE(ctxt, sizeof(*ctxt));
+                rc = op->lop_setup(obd, olg, index, disk_obd, count, logid);
 
+        if (rc) {
+                llog_ctxt_destroy(ctxt);
+        }
+out:
         RETURN(rc);
 }
 EXPORT_SYMBOL(llog_setup);
 
-int llog_cleanup(struct llog_ctxt *ctxt)
-{
-        int rc = 0;
-        ENTRY;
-
-        down(&ctxt->loc_sem);
-        LASSERT(ctxt);
-
-        if (CTXTP(ctxt, cleanup))
-                rc = CTXTP(ctxt, cleanup)(ctxt);
-
-        ctxt->loc_obd->obd_llog_ctxt[ctxt->loc_idx] = NULL;
-        class_export_put(ctxt->loc_exp);
-        ctxt->loc_exp = NULL;
-        up(&ctxt->loc_sem);
-        OBD_FREE(ctxt, sizeof(*ctxt));
-
-        RETURN(rc);
-}
-EXPORT_SYMBOL(llog_cleanup);
-
 int llog_sync(struct llog_ctxt *ctxt, struct obd_export *exp)
 {
         int rc = 0;
@@ -84,29 +186,32 @@ int llog_sync(struct llog_ctxt *ctxt, struct obd_export *exp)
 
         if (!ctxt)
                 RETURN(0);
-        down(&ctxt->loc_sem);
-        if (ctxt->loc_llcd && CTXTP(ctxt, sync))
+
+        if (CTXTP(ctxt, sync))
                 rc = CTXTP(ctxt, sync)(ctxt, exp);
-        else
-                up(&ctxt->loc_sem);
 
         RETURN(rc);
 }
 EXPORT_SYMBOL(llog_sync);
 
-int llog_add(struct llog_ctxt *ctxt,
-                 struct llog_rec_hdr *rec, struct lov_stripe_md *lsm,
-                 struct llog_cookie *logcookies, int numcookies)
+/*
+ * Add record @rec to a log through the context's "add" method.
+ *
+ * @rec, @lsm, @logcookies and @numcookies are passed to the method
+ * unchanged.  CAP_SYS_RESOURCE is raised in the current task's effective
+ * capability set for the duration of the call and the previous set is
+ * restored afterwards.
+ *
+ * Returns -ENODEV if @ctxt is NULL, otherwise the add method's return
+ * value.  CTXT_CHECK_OP is handed -EOPNOTSUPP for the case it checks
+ * (NOTE(review): presumably a context without an "add" method -- the macro
+ * is defined elsewhere, confirm).
+ */
+int llog_add(struct llog_ctxt *ctxt, struct llog_rec_hdr *rec,
+                struct lov_stripe_md *lsm, struct llog_cookie *logcookies,
+                int numcookies)
 {
+        __u32 cap;
         int rc;
         ENTRY;
 
-        LASSERT(ctxt);
-        down(&ctxt->loc_sem);
+        if (!ctxt) {
+                CERROR("No ctxt\n");
+                RETURN(-ENODEV);
+        }
+        
         CTXT_CHECK_OP(ctxt, add, -EOPNOTSUPP);
-
+        /* save the effective capabilities so they can be restored below */
+       cap = current->cap_effective;             
+        cap_raise(current->cap_effective, CAP_SYS_RESOURCE);
         rc = CTXTP(ctxt, add)(ctxt, rec, lsm, logcookies, numcookies);
-        up(&ctxt->loc_sem);
+        /* put back the capability set saved before the call */
+       current->cap_effective = cap; 
         RETURN(rc);
 }
 EXPORT_SYMBOL(llog_add);
@@ -117,7 +222,11 @@ int llog_cancel(struct llog_ctxt *ctxt, struct lov_stripe_md *lsm,
         int rc;
         ENTRY;
 
-        LASSERT(ctxt);
+        if (!ctxt) {
+                CERROR("No ctxt\n");
+                RETURN(-ENODEV);
+        }
+        
         CTXT_CHECK_OP(ctxt, cancel, -EOPNOTSUPP);
         rc = CTXTP(ctxt, cancel)(ctxt, lsm, count, cookies, flags);
         RETURN(rc);
@@ -125,7 +234,7 @@ int llog_cancel(struct llog_ctxt *ctxt, struct lov_stripe_md *lsm,
 EXPORT_SYMBOL(llog_cancel);
 
 /* callback func for llog_process in llog_obd_origin_setup */
-static int cat_cancel_cb(struct llog_handle *cathandle, 
+static int cat_cancel_cb(struct llog_handle *cathandle,
                           struct llog_rec_hdr *rec, void *data)
 {
         struct llog_logid_rec *lir = (struct llog_logid_rec *)rec;
@@ -134,39 +243,39 @@ static int cat_cancel_cb(struct llog_handle *cathandle,
         int rc, index;
         ENTRY;
 
-        if (le32_to_cpu(rec->lrh_type) != LLOG_LOGID_MAGIC) {
+        if (rec->lrh_type != LLOG_LOGID_MAGIC) {
                 CERROR("invalid record in catalog\n");
                 RETURN(-EINVAL);
         }
-        CWARN("processing log "LPX64":%x at index %u of catalog "LPX64"\n", 
-               lir->lid_id.lgl_oid, lir->lid_id.lgl_ogen,
-               le32_to_cpu(rec->lrh_index), cathandle->lgh_id.lgl_oid);
+        CDEBUG(D_HA, "processing log "LPX64":%x at index %u of catalog "
+               LPX64"\n", lir->lid_id.lgl_oid, lir->lid_id.lgl_ogen,
+               rec->lrh_index, cathandle->lgh_id.lgl_oid);
 
         rc = llog_cat_id2handle(cathandle, &loghandle, &lir->lid_id);
         if (rc) {
-                CERROR("Cannot find handle for log "LPX64"\n", lir->lid_id.lgl_oid);
+                CERROR("Cannot find handle for log "LPX64"\n",
+                       lir->lid_id.lgl_oid);
                 RETURN(rc);
-        }        
-        
+        }
+
         llh = loghandle->lgh_hdr;
-        if ((le32_to_cpu(llh->llh_flags) & LLOG_F_ZAP_WHEN_EMPTY) &&
-            (le32_to_cpu(llh->llh_count) == 1)) {
+        if ((llh->llh_flags & LLOG_F_ZAP_WHEN_EMPTY) &&
+            (llh->llh_count == 1)) {
                 rc = llog_destroy(loghandle);
                 if (rc)
-                        CERROR("failure destroying log during postsetup: %d\n", rc);
-                LASSERT(rc == 0);
+                        CERROR("failure destroying log in postsetup: %d\n", rc);
 
                 index = loghandle->u.phd.phd_cookie.lgc_index;
-                if (cathandle->u.chd.chd_current_log == loghandle)
-                        cathandle->u.chd.chd_current_log = NULL;
                 llog_free_handle(loghandle);
-                                                                                                                
+
                 LASSERT(index);
+                llog_cat_set_first_idx(cathandle, index);
                 rc = llog_cancel_rec(cathandle, index);
                 if (rc == 0)
-                        CWARN("cancel log "LPX64":%x at index %u of catalog "LPX64"\n", 
-                               lir->lid_id.lgl_oid, lir->lid_id.lgl_ogen,
-                               le32_to_cpu(rec->lrh_index), cathandle->lgh_id.lgl_oid);
+                        CDEBUG(D_HA, "cancel log "LPX64":%x at index %u of catalog "
+                              LPX64"\n", lir->lid_id.lgl_oid,
+                              lir->lid_id.lgl_ogen, rec->lrh_index,
+                              cathandle->lgh_id.lgl_oid);
         }
 
         RETURN(rc);
@@ -174,12 +283,13 @@ static int cat_cancel_cb(struct llog_handle *cathandle,
 
 /* lop_setup method for filter/osc */
 // XXX how to set exports
-int llog_obd_origin_setup(struct obd_device *obd, int index, struct obd_device *disk_obd,
-                          int count, struct llog_logid *logid)
+int llog_obd_origin_setup(struct obd_device *obd, struct obd_llog_group *olg,
+                          int index, struct obd_device *disk_obd, int count,
+                          struct llog_logid *logid)
 {
         struct llog_ctxt *ctxt;
         struct llog_handle *handle;
-        struct obd_run_ctxt saved;
+        struct lvfs_run_ctxt saved;
         int rc;
         ENTRY;
 
@@ -187,38 +297,35 @@ int llog_obd_origin_setup(struct obd_device *obd, int index, struct obd_device *
                 RETURN(0);
 
         LASSERT(count == 1);
-        
-        ctxt = llog_get_context(obd, index);
+
+        LASSERT(olg != NULL);
+        ctxt = llog_group_get_ctxt(olg, index);
+
         LASSERT(ctxt);
-        log_gen_init(ctxt);
+        llog_gen_init(ctxt);
 
-        down(&ctxt->loc_sem);
         if (logid->lgl_oid)
                 rc = llog_create(ctxt, &handle, logid, NULL);
         else {
                 rc = llog_create(ctxt, &handle, NULL, NULL);
-                if (!rc) 
+                if (!rc)
                         *logid = handle->lgh_id;
         }
-        if (rc) 
+        if (rc)
                 GOTO(out, rc);
 
         ctxt->loc_handle = handle;
-        push_ctxt(&saved, &disk_obd->obd_ctxt, NULL);
+        push_ctxt(&saved, &disk_obd->obd_lvfs_ctxt, NULL);
         rc = llog_init_handle(handle, LLOG_F_IS_CAT, NULL);
-        pop_ctxt(&saved, &disk_obd->obd_ctxt, NULL);
+        pop_ctxt(&saved, &disk_obd->obd_lvfs_ctxt, NULL);
         if (rc)
                 GOTO(out, rc);
 
-        rc = llog_process(handle, (llog_cb_t)cat_cancel_cb, NULL);
-        if (rc) 
+        rc = llog_process(handle, (llog_cb_t)cat_cancel_cb, NULL, NULL);
+        if (rc)
                 CERROR("llog_process with cat_cancel_cb failed: %d\n", rc);
- out:
-        up(&ctxt->loc_sem);
-        if (ctxt && rc) {
-                obd->obd_llog_ctxt[index] = NULL;
-                OBD_FREE(ctxt, sizeof(*ctxt));
-        }
+out:
+        llog_ctxt_put(ctxt);
         RETURN(rc);
 }
 EXPORT_SYMBOL(llog_obd_origin_setup);
@@ -229,42 +336,42 @@ int llog_obd_origin_cleanup(struct llog_ctxt *ctxt)
         struct llog_log_hdr *llh;
         int rc, index;
         ENTRY;
-        
+
         if (!ctxt)
-                return 0;
+                RETURN(0);
 
         cathandle = ctxt->loc_handle;
         if (cathandle) {
-                list_for_each_entry_safe(loghandle, n, &cathandle->u.chd.chd_head, 
-                                 u.phd.phd_entry) {
+                list_for_each_entry_safe(loghandle, n,
+                                         &cathandle->u.chd.chd_head,
+                                         u.phd.phd_entry) {
                         llh = loghandle->lgh_hdr;
-                        if ((le32_to_cpu(llh->llh_flags) & LLOG_F_ZAP_WHEN_EMPTY) &&
-                            (le32_to_cpu(llh->llh_count) == 1)) {
+                        if ((llh->llh_flags &
+                                LLOG_F_ZAP_WHEN_EMPTY) &&
+                            (llh->llh_count == 1)) {
                                 rc = llog_destroy(loghandle);
                                 if (rc)
-                                        CERROR("failure destroying log during cleanup: %d\n",
-                                               rc);
-                                LASSERT(rc == 0);
+                                        CERROR("failure destroying log during "
+                                               "cleanup: %d\n", rc);
 
                                 index = loghandle->u.phd.phd_cookie.lgc_index;
-                                if (cathandle->u.chd.chd_current_log == loghandle)
-                                        cathandle->u.chd.chd_current_log = NULL;
                                 llog_free_handle(loghandle);
-                                                                                                                             
+
                                 LASSERT(index);
+                                llog_cat_set_first_idx(cathandle, index);
                                 rc = llog_cancel_rec(cathandle, index);
                                 if (rc == 0)
-                                        CWARN("cancel plain log at index %u of catalog "LPX64"\n", 
-                                              index, cathandle->lgh_id.lgl_oid);
+                                        CDEBUG(D_RPCTRACE, "cancel plain log at"
+                                               "index %u of catalog "LPX64"\n",
+                                               index,cathandle->lgh_id.lgl_oid);
                         }
                 }
                 llog_cat_put(ctxt->loc_handle);
         }
-        return 0;
+        RETURN(0);
 }
 EXPORT_SYMBOL(llog_obd_origin_cleanup);
 
-
 /* add for obdfilter/sz and mds/unlink */
 int llog_obd_origin_add(struct llog_ctxt *ctxt,
                         struct llog_rec_hdr *rec, struct lov_stripe_md *lsm,
@@ -283,19 +390,20 @@ int llog_obd_origin_add(struct llog_ctxt *ctxt,
 }
 EXPORT_SYMBOL(llog_obd_origin_add);
 
-int llog_cat_initialize(struct obd_device *obd, int count)
+int llog_cat_initialize(struct obd_device *obd, struct obd_llog_group *olg,
+                        int count, struct obd_uuid *uuid)
 {
-        struct llog_logid *idarray;
+        char name[32] = CATLIST;
+        struct llog_catid *idarray = NULL;
         int size = sizeof(*idarray) * count;
-        char name[32] = "CATLIST";
         int rc;
         ENTRY;
 
-        OBD_ALLOC(idarray, size);
-        if (!idarray)
-                RETURN(-ENOMEM);
-
-        memset(idarray, 0, size);
+        if (count) {
+                OBD_VMALLOC(idarray, size);
+                if (!idarray)
+                        RETURN(-ENOMEM);
+        }
 
         rc = llog_get_cat_list(obd, obd, name, count, idarray);
         if (rc) {
@@ -303,7 +411,7 @@ int llog_cat_initialize(struct obd_device *obd, int count)
                 GOTO(out, rc);
         }
 
-        rc = obd_llog_init(obd, obd, count, idarray);
+        rc = obd_llog_init(obd, olg, obd, count, idarray, uuid);
         if (rc) {
                 CERROR("rc: %d\n", rc);
                 GOTO(out, rc);
@@ -314,22 +422,24 @@ int llog_cat_initialize(struct obd_device *obd, int count)
                 CERROR("rc: %d\n", rc);
                 GOTO(out, rc);
         }
-                        
+
  out:
-        OBD_FREE(idarray, size);
+        if (idarray)
+                OBD_VFREE(idarray, size);
         RETURN(rc);
 }
 EXPORT_SYMBOL(llog_cat_initialize);
 
-int obd_llog_init(struct obd_device *obd, struct obd_device *disk_obd,
-                  int count, struct llog_logid *logid)
+/*
+ * Dispatch to the llog_init method of @obd.
+ *
+ * @olg, @disk_obd, @count, @logid and @uuid are passed to the method
+ * unchanged (with @obd as its first argument) and the method's return
+ * value is returned.  The llog_init counter of @obd is incremented before
+ * the call.  OBD_CHECK_DT_OP is handed 0 for the case it checks
+ * (NOTE(review): presumably an obd without an llog_init method -- the macro
+ * is defined elsewhere, confirm).
+ */
+int obd_llog_init(struct obd_device *obd, struct obd_llog_group *olg,
+                  struct obd_device *disk_obd, int count,
+                  struct llog_catid *logid, struct obd_uuid *uuid)
 {
         int rc;
         ENTRY;
-        OBD_CHECK_OP(obd, llog_init, 0);
+        OBD_CHECK_DT_OP(obd, llog_init, 0);
         OBD_COUNTER_INCREMENT(obd, llog_init);
 
-        rc = OBP(obd, llog_init)(obd, disk_obd, count, logid);
+        rc = OBP(obd, llog_init)(obd, olg, disk_obd, count, logid, uuid);
         RETURN(rc);
 }
 EXPORT_SYMBOL(obd_llog_init);
@@ -338,10 +448,11 @@ int obd_llog_finish(struct obd_device *obd, int count)
 {
         int rc;
         ENTRY;
-        OBD_CHECK_OP(obd, llog_finish, 0);
+        OBD_CHECK_DT_OP(obd, llog_finish, 0);
         OBD_COUNTER_INCREMENT(obd, llog_finish);
 
         rc = OBP(obd, llog_finish)(obd, count);
         RETURN(rc);
 }
 EXPORT_SYMBOL(obd_llog_finish);
+