/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*- * vim:expandtab:shiftwidth=8:tabstop=8: * * Copyright (C) 2001-2003 Cluster File Systems, Inc. * Author: Andreas Dilger * * This file is part of Lustre, http://www.lustre.org. * * Lustre is free software; you can redistribute it and/or * modify it under the terms of version 2 of the GNU General Public * License as published by the Free Software Foundation. * * Lustre is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Lustre; if not, write to the Free Software * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. * * OST<->MDS recovery logging infrastructure. * * Invariants in implementation: * - we do not share logs among different OST<->MDS connections, so that * if an OST or MDS fails it need only look at log(s) relevant to itself */ #define DEBUG_SUBSYSTEM S_LOG #ifndef EXPORT_SYMTAB #define EXPORT_SYMTAB #endif #ifdef __KERNEL__ #include #else #include #endif #include #include /* Create a new log handle and add it to the open list. * This log handle will be closed when all of the records in it are removed. * * Assumes caller has already pushed us into the kernel context and is locking. */ static struct llog_handle *llog_cat_new_log(struct llog_handle *cathandle) { struct llog_handle *loghandle; struct llog_log_hdr *llh; struct llog_logid_rec rec; int rc, index, bitmap_size; ENTRY; llh = cathandle->lgh_hdr; bitmap_size = sizeof(llh->llh_bitmap) * 8; index = (cathandle->lgh_last_idx + 1) % bitmap_size; /* maximum number of available slots in catalog is bitmap_size - 2 */ if (llh->llh_cat_idx == cpu_to_le32(index)) { CERROR("no free catalog slots for log...\n"); RETURN(ERR_PTR(-ENOSPC)); } else { if (index == 0) index = 1; if (ext2_set_bit(index, llh->llh_bitmap)) { CERROR("argh, index %u already set in log bitmap?\n", index); LBUG(); /* should never happen */ } cathandle->lgh_last_idx = index; llh->llh_count = cpu_to_le32(le32_to_cpu(llh->llh_count) + 1); llh->llh_tail.lrt_index = cpu_to_le32(index); } rc = llog_create(cathandle->lgh_ctxt, &loghandle, NULL, NULL); if (rc) { CERROR("cannot create new log, error = %d\n", rc); RETURN(ERR_PTR(rc)); } rc = llog_init_handle(loghandle, LLOG_F_IS_PLAIN | LLOG_F_ZAP_WHEN_EMPTY, &cathandle->lgh_hdr->llh_tgtuuid); if (rc) GOTO(out_destroy, rc); CDEBUG(D_HA, "new recovery log "LPX64":%x for index %u of catalog " LPX64"\n", loghandle->lgh_id.lgl_oid, loghandle->lgh_id.lgl_ogen, index, cathandle->lgh_id.lgl_oid); /* build the record for this log in the catalog */ rec.lid_hdr.lrh_len = cpu_to_le32(sizeof(rec)); rec.lid_hdr.lrh_index = cpu_to_le32(index); rec.lid_hdr.lrh_type = cpu_to_le32(LLOG_LOGID_MAGIC); rec.lid_id = loghandle->lgh_id; rec.lid_tail.lrt_len = cpu_to_le32(sizeof(rec)); rec.lid_tail.lrt_index = cpu_to_le32(index); /* update the catalog: header and record */ rc = llog_write_rec(cathandle, &rec.lid_hdr, &loghandle->u.phd.phd_cookie, 1, NULL, index); if (rc < 0) GOTO(out_destroy, rc); loghandle->lgh_hdr->llh_cat_idx = cpu_to_le32(index); cathandle->u.chd.chd_current_log = loghandle; LASSERT(list_empty(&loghandle->u.phd.phd_entry)); list_add_tail(&loghandle->u.phd.phd_entry, &cathandle->u.chd.chd_head); out_destroy: if (rc < 0) llog_destroy(loghandle); RETURN(loghandle); } /* Open an existent log handle and add it to the open list. * This log handle will be closed when all of the records in it are removed. * * Assumes caller has already pushed us into the kernel context and is locking. * We return a lock on the handle to ensure nobody yanks it from us. */ int llog_cat_id2handle(struct llog_handle *cathandle, struct llog_handle **res, struct llog_logid *logid) { struct llog_handle *loghandle; int rc = 0; ENTRY; if (cathandle == NULL) RETURN(-EBADF); list_for_each_entry(loghandle, &cathandle->u.chd.chd_head, u.phd.phd_entry) { struct llog_logid *cgl = &loghandle->lgh_id; if (cgl->lgl_oid == logid->lgl_oid) { if (cgl->lgl_ogen != logid->lgl_ogen) { CERROR("log "LPX64" generation %x != %x\n", logid->lgl_oid, cgl->lgl_ogen, logid->lgl_ogen); continue; } loghandle->u.phd.phd_cat_handle = cathandle; GOTO(out, rc = 0); } } rc = llog_create(cathandle->lgh_ctxt, &loghandle, logid, NULL); if (rc) { CERROR("error opening log id "LPX64":%x: rc %d\n", logid->lgl_oid, logid->lgl_ogen, rc); } else { rc = llog_init_handle(loghandle, LLOG_F_IS_PLAIN, NULL); if (!rc) { list_add(&loghandle->u.phd.phd_entry, &cathandle->u.chd.chd_head); } } if (!rc) { loghandle->u.phd.phd_cat_handle = cathandle; loghandle->u.phd.phd_cookie.lgc_lgl = cathandle->lgh_id; loghandle->u.phd.phd_cookie.lgc_index = le32_to_cpu(loghandle->lgh_hdr->llh_cat_idx); } out: *res = loghandle; RETURN(rc); } EXPORT_SYMBOL(llog_cat_id2handle); int llog_cat_put(struct llog_handle *cathandle) { struct llog_handle *loghandle, *n; int rc; ENTRY; list_for_each_entry_safe(loghandle, n, &cathandle->u.chd.chd_head, u.phd.phd_entry) { int err = llog_close(loghandle); if (err) CERROR("error closing loghandle\n"); } rc = llog_close(cathandle); RETURN(rc); } EXPORT_SYMBOL(llog_cat_put); /* Return the currently active log handle. If the current log handle doesn't * have enough space left for the current record, start a new one. * * If reclen is 0, we only want to know what the currently active log is, * otherwise we get a lock on this log so nobody can steal our space. * * Assumes caller has already pushed us into the kernel context and is locking. * * NOTE: loghandle is write-locked upon successful return */ static struct llog_handle *llog_cat_current_log(struct llog_handle *cathandle, int create) { struct llog_handle *loghandle = NULL; ENTRY; down_read(&cathandle->lgh_lock); loghandle = cathandle->u.chd.chd_current_log; if (loghandle) { struct llog_log_hdr *llh = loghandle->lgh_hdr; if (loghandle->lgh_last_idx < (sizeof(llh->llh_bitmap)*8) - 1) { down_write(&loghandle->lgh_lock); up_read(&cathandle->lgh_lock); RETURN(loghandle); } } if (!create) { if (loghandle) down_write(&loghandle->lgh_lock); up_read(&cathandle->lgh_lock); RETURN(loghandle); } up_read(&cathandle->lgh_lock); /* time to create new log */ /* first, we have to make sure the state hasn't changed */ down_write(&cathandle->lgh_lock); loghandle = cathandle->u.chd.chd_current_log; if (loghandle) { struct llog_log_hdr *llh = loghandle->lgh_hdr; if (loghandle->lgh_last_idx < (sizeof(llh->llh_bitmap)*8) - 1) { down_write(&loghandle->lgh_lock); up_write(&cathandle->lgh_lock); RETURN(loghandle); } } CDEBUG(D_INODE, "creating new log\n"); loghandle = llog_cat_new_log(cathandle); if (!IS_ERR(loghandle)) down_write(&loghandle->lgh_lock); up_write(&cathandle->lgh_lock); RETURN(loghandle); } /* Add a single record to the recovery log(s) using a catalog * Returns as llog_write_record * * Assumes caller has already pushed us into the kernel context. */ int llog_cat_add_rec(struct llog_handle *cathandle, struct llog_rec_hdr *rec, struct llog_cookie *reccookie, void *buf) { struct llog_handle *loghandle; int rc; ENTRY; LASSERT(le32_to_cpu(rec->lrh_len) <= LLOG_CHUNK_SIZE); loghandle = llog_cat_current_log(cathandle, 1); if (IS_ERR(loghandle)) RETURN(PTR_ERR(loghandle)); /* loghandle is already locked by llog_cat_current_log() for us */ rc = llog_write_rec(loghandle, rec, reccookie, 1, buf, -1); up_write(&loghandle->lgh_lock); RETURN(rc); } EXPORT_SYMBOL(llog_cat_add_rec); /* For each cookie in the cookie array, we clear the log in-use bit and either: * - the log is empty, so mark it free in the catalog header and delete it * - the log is not empty, just write out the log header * * The cookies may be in different log files, so we need to get new logs * each time. * * Assumes caller has already pushed us into the kernel context. */ int llog_cat_cancel_records(struct llog_handle *cathandle, int count, struct llog_cookie *cookies) { int i, index, rc = 0; ENTRY; down_write(&cathandle->lgh_lock); for (i = 0; i < count; i++, cookies++) { struct llog_handle *loghandle; struct llog_logid *lgl = &cookies->lgc_lgl; rc = llog_cat_id2handle(cathandle, &loghandle, lgl); if (rc) { CERROR("Cannot find log "LPX64"\n", lgl->lgl_oid); break; } down_write(&loghandle->lgh_lock); rc = llog_cancel_rec(loghandle, cookies->lgc_index); up_write(&loghandle->lgh_lock); if (rc == 1) { /* log has been destroyed */ index = loghandle->u.phd.phd_cookie.lgc_index; if (cathandle->u.chd.chd_current_log == loghandle) cathandle->u.chd.chd_current_log = NULL; llog_free_handle(loghandle); LASSERT(index); llog_cat_set_first_idx(cathandle, index); rc = llog_cancel_rec(cathandle, index); if (rc == 0) CDEBUG(D_HA, "cancel plain log at index %u " "of catalog "LPX64"\n", index, cathandle->lgh_id.lgl_oid); } } up_write(&cathandle->lgh_lock); RETURN(rc); } EXPORT_SYMBOL(llog_cat_cancel_records); static int llog_cat_process_cb(struct llog_handle *cat_llh, struct llog_rec_hdr *rec, void *data) { struct llog_process_data *d = data; struct llog_logid_rec *lir = (struct llog_logid_rec *)rec; struct llog_handle *llh; int rc; if (le32_to_cpu(rec->lrh_type) != LLOG_LOGID_MAGIC) { CERROR("invalid record in catalog\n"); RETURN(-EINVAL); } CWARN("processing log "LPX64":%x at index %u of catalog "LPX64"\n", lir->lid_id.lgl_oid, lir->lid_id.lgl_ogen, le32_to_cpu(rec->lrh_index), cat_llh->lgh_id.lgl_oid); rc = llog_cat_id2handle(cat_llh, &llh, &lir->lid_id); if (rc) { CERROR("Cannot find handle for log "LPX64"\n", lir->lid_id.lgl_oid); RETURN(rc); } rc = llog_process(llh, d->lpd_cb, d->lpd_data, NULL); RETURN(rc); } int llog_cat_process(struct llog_handle *cat_llh, llog_cb_t cb, void *data) { struct llog_process_data d; struct llog_process_cat_data cd; struct llog_log_hdr *llh = cat_llh->lgh_hdr; int rc; ENTRY; LASSERT(llh->llh_flags &cpu_to_le32(LLOG_F_IS_CAT)); d.lpd_data = data; d.lpd_cb = cb; if (llh->llh_cat_idx > cat_llh->lgh_last_idx) { CWARN("catalog "LPX64" crosses index zero\n", cat_llh->lgh_id.lgl_oid); cd.first_idx = le32_to_cpu(llh->llh_cat_idx); cd.last_idx = 0; rc = llog_process(cat_llh, llog_cat_process_cb, &d, &cd); if (rc != 0) RETURN(rc); cd.first_idx = 0; cd.last_idx = cat_llh->lgh_last_idx; rc = llog_process(cat_llh, llog_cat_process_cb, &d, &cd); } else { rc = llog_process(cat_llh, llog_cat_process_cb, &d, NULL); } RETURN(rc); } EXPORT_SYMBOL(llog_cat_process); static int llog_cat_reverse_process_cb(struct llog_handle *cat_llh, struct llog_rec_hdr *rec, void *data) { struct llog_process_data *d = data; struct llog_logid_rec *lir = (struct llog_logid_rec *)rec; struct llog_handle *llh; int rc; if (le32_to_cpu(rec->lrh_type) != LLOG_LOGID_MAGIC) { CERROR("invalid record in catalog\n"); RETURN(-EINVAL); } CWARN("processing log "LPX64":%x at index %u of catalog "LPX64"\n", lir->lid_id.lgl_oid, lir->lid_id.lgl_ogen, le32_to_cpu(rec->lrh_index), cat_llh->lgh_id.lgl_oid); rc = llog_cat_id2handle(cat_llh, &llh, &lir->lid_id); if (rc) { CERROR("Cannot find handle for log "LPX64"\n", lir->lid_id.lgl_oid); RETURN(rc); } rc = llog_reverse_process(llh, d->lpd_cb, d->lpd_data, NULL); RETURN(rc); } int llog_cat_reverse_process(struct llog_handle *cat_llh, llog_cb_t cb, void *data) { struct llog_process_data d; struct llog_process_cat_data cd; struct llog_log_hdr *llh = cat_llh->lgh_hdr; int rc; ENTRY; LASSERT(llh->llh_flags &cpu_to_le32(LLOG_F_IS_CAT)); d.lpd_data = data; d.lpd_cb = cb; if (llh->llh_cat_idx > cat_llh->lgh_last_idx) { CWARN("catalog "LPX64" crosses index zero\n", cat_llh->lgh_id.lgl_oid); cd.first_idx = 0; cd.last_idx = cat_llh->lgh_last_idx; rc = llog_reverse_process(cat_llh, llog_cat_reverse_process_cb, &d, &cd); if (rc != 0) RETURN(rc); cd.first_idx = le32_to_cpu(llh->llh_cat_idx); cd.last_idx = 0; rc = llog_reverse_process(cat_llh, llog_cat_reverse_process_cb, &d, &cd); } else { rc = llog_reverse_process(cat_llh, llog_cat_reverse_process_cb, &d, NULL); } RETURN(rc); } EXPORT_SYMBOL(llog_cat_reverse_process); int llog_cat_set_first_idx(struct llog_handle *cathandle, int index) { struct llog_log_hdr *llh = cathandle->lgh_hdr; int i, bitmap_size, idx; ENTRY; bitmap_size = sizeof(llh->llh_bitmap) * 8; if (llh->llh_cat_idx == cpu_to_le32(index - 1)) { idx = le32_to_cpu(llh->llh_cat_idx) + 1; llh->llh_cat_idx = cpu_to_le32(idx); if (idx == cathandle->lgh_last_idx) goto out; for (i = (index + 1) % bitmap_size; i != cathandle->lgh_last_idx; i = (i + 1) % bitmap_size) { if (!ext2_test_bit(i, llh->llh_bitmap)) { idx = le32_to_cpu(llh->llh_cat_idx) + 1; llh->llh_cat_idx = cpu_to_le32(idx); } else if (i == 0) { llh->llh_cat_idx = 0; } else { break; } } out: CDEBUG(D_HA, "set catalog "LPX64" first idx %u\n", cathandle->lgh_id.lgl_oid,le32_to_cpu(llh->llh_cat_idx)); } RETURN(0); } EXPORT_SYMBOL(llog_cat_set_first_idx); int llog_catalog_add(struct llog_ctxt *ctxt, struct llog_rec_hdr *rec, void *buf, struct llog_cookie *logcookies, int numcookies, void *data) { struct llog_handle *cathandle; int rc; ENTRY; cathandle = ctxt->loc_handle; LASSERT(cathandle != NULL); rc = llog_cat_add_rec(cathandle, rec, logcookies, buf); if (rc != 1) CERROR("write one catalog record failed: %d\n", rc); RETURN(rc); } EXPORT_SYMBOL(llog_catalog_add); int llog_catalog_cancel(struct llog_ctxt *ctxt, int count, struct llog_cookie *cookies, int flags, void *data) { struct llog_handle *cathandle; int rc; ENTRY; if (cookies == NULL || count == 0) RETURN(-EINVAL); cathandle = ctxt->loc_handle; LASSERT(cathandle != NULL); rc = llog_cat_cancel_records(cathandle, count, cookies); RETURN(rc); } EXPORT_SYMBOL(llog_catalog_cancel); int llog_catalog_setup(struct llog_ctxt **res, char *name, struct obd_export *exp, struct lvfs_run_ctxt *lvfs_ctxt, struct fsfilt_operations *fsops, struct dentry *logs_de, struct dentry *objects_de) { struct llog_ctxt *ctxt; struct llog_catid catid; struct llog_handle *handle; int rc; ENTRY; OBD_ALLOC(ctxt, sizeof(*ctxt)); if (!ctxt) RETURN(-ENOMEM); *res = ctxt; /* marking this ctxt alone. */ ctxt->loc_alone = 1; ctxt->loc_fsops = fsops; ctxt->loc_lvfs_ctxt = lvfs_ctxt; ctxt->loc_exp = exp; ctxt->loc_logs_dir = logs_de; ctxt->loc_objects_dir = objects_de; ctxt->loc_logops = &llog_lvfs_ops; ctxt->loc_logops->lop_add = llog_catalog_add; ctxt->loc_logops->lop_cancel = llog_catalog_cancel; memset(&catid, 0, sizeof(struct llog_catid)); rc = llog_get_cat_list(lvfs_ctxt, fsops, name, 1, &catid); if (rc) { CERROR("error llog_get_cat_list rc: %d\n", rc); RETURN(rc); } if (catid.lci_logid.lgl_oid) rc = llog_create(ctxt, &handle, &catid.lci_logid, 0); else { rc = llog_create(ctxt, &handle, NULL, NULL); if (!rc) catid.lci_logid = handle->lgh_id; } if (rc) GOTO(out, rc); ctxt->loc_handle = handle; rc = llog_init_handle(handle, LLOG_F_IS_CAT, NULL); if (rc) GOTO(out, rc); rc = llog_put_cat_list(lvfs_ctxt, fsops, name, 1, &catid); if (rc) CERROR("error llog_get_cat_list rc: %d\n", rc); out: if (ctxt && rc) OBD_FREE(ctxt, sizeof(*ctxt)); RETURN(rc); } EXPORT_SYMBOL(llog_catalog_setup); int llog_catalog_cleanup(struct llog_ctxt *ctxt) { struct llog_handle *cathandle, *n, *loghandle; struct llog_log_hdr *llh; int rc, index; ENTRY; if (!ctxt) return 0; cathandle = ctxt->loc_handle; if (cathandle) { list_for_each_entry_safe(loghandle, n, &cathandle->u.chd.chd_head, u.phd.phd_entry) { llh = loghandle->lgh_hdr; if ((le32_to_cpu(llh->llh_flags) & LLOG_F_ZAP_WHEN_EMPTY) && (le32_to_cpu(llh->llh_count) == 1)) { rc = llog_destroy(loghandle); if (rc) CERROR("failure destroying log during " "cleanup: %d\n", rc); LASSERT(rc == 0); index = loghandle->u.phd.phd_cookie.lgc_index; llog_free_handle(loghandle); LASSERT(index); llog_cat_set_first_idx(cathandle, index); rc = llog_cancel_rec(cathandle, index); if (rc == 0) CDEBUG(D_HA, "cancel plain log at index" " %u of catalog "LPX64"\n", index,cathandle->lgh_id.lgl_oid); } } llog_cat_put(ctxt->loc_handle); } return 0; } EXPORT_SYMBOL(llog_catalog_cleanup); int llog_cat_half_bottom(struct llog_cookie *cookie, struct llog_handle *handle) { struct llog_handle *loghandle; struct llog_logid *lgl = &cookie->lgc_lgl; int rc; down_read(&handle->lgh_lock); rc = llog_cat_id2handle(handle, &loghandle, lgl); if (rc) GOTO(out, rc); if (2 * loghandle->lgh_hdr->llh_cat_idx <= handle->lgh_last_idx + handle->lgh_hdr->llh_cat_idx + 1) rc = 1; else rc = 0; out: up_read(&handle->lgh_lock); RETURN(rc); } EXPORT_SYMBOL(llog_cat_half_bottom);