1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
6 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License version 2 only,
10 * as published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License version 2 for more details (a copy is included
16 * in the LICENSE file that accompanied this code).
18 * You should have received a copy of the GNU General Public License
19 * version 2 along with this program; If not, see
20 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
22 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
23 * CA 95054 USA or visit www.sun.com if you need additional information or
29 * Copyright 2008 Sun Microsystems, Inc. All rights reserved
30 * Use is subject to license terms.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
36 * lustre/lov/lov_log.c
38 * Author: Phil Schwan <phil@clusterfs.com>
39 * Author: Peter Braam <braam@clusterfs.com>
40 * Author: Mike Shaver <shaver@clusterfs.com>
44 # define EXPORT_SYMTAB
46 #define DEBUG_SUBSYSTEM S_LOV
48 #include <libcfs/libcfs.h>
50 #include <liblustre.h>
53 #include <obd_support.h>
54 #include <lustre_lib.h>
55 #include <lustre_net.h>
56 #include <lustre/lustre_idl.h>
57 #include <lustre_dlm.h>
58 #include <lustre_mds.h>
59 #include <obd_class.h>
62 #include <lprocfs_status.h>
64 #include "lov_internal.h"
66 /* Add log records for each OSC that this object is striped over, and return
67 * cookies for each one. We _would_ have nice abstraction here, except that
68 * we need to keep cookies in stripe order, even if some are NULL, so that
69 * the right cookies are passed back to the right OSTs at the client side.
70 * Unset cookies should be all-zero (which will never occur naturally). */
/*
 * lov_llog_origin_add() - add the llog record @rec once per stripe of @lsm.
 *
 * For every stripe the object id/group fields of @rec are overwritten with
 * that stripe's loi_id/loi_gr, and llog_add() is then called on the llog
 * context (index ctxt->loc_idx) of the obd behind that stripe's OST target.
 *
 * @ctxt:       LOV-level llog context; supplies loc_obd and loc_idx.
 * @rec:        record header; modified in place on every iteration.
 * @lsm:        stripe metadata; lsm_stripe_count bounds the loop.
 * @logcookies: output cookie array; asserted to be non-NULL.
 * @numcookies: capacity of @logcookies; asserted >= lsm->lsm_stripe_count.
 *
 * NOTE(review): several lines of this function are not visible in this
 * listing (braces, the test guarding the CERROR path, the update of
 * "cookies" and the return statement).  Comments below that depend on them
 * are marked as assumptions to confirm.
 */
71 static int lov_llog_origin_add(struct llog_ctxt *ctxt, struct llog_rec_hdr *rec,
72 struct lov_stripe_md *lsm,
73 struct llog_cookie *logcookies, int numcookies)
75 struct obd_device *obd = ctxt->loc_obd;
76 struct lov_obd *lov = &obd->u.lov;
77 int i, rc = 0, cookies = 0;
/* the caller must supply at least one cookie slot per stripe */
80 LASSERTF(logcookies && numcookies >= lsm->lsm_stripe_count,
81 "logcookies %p, numcookies %d lsm->lsm_stripe_count %d \n",
82 logcookies, numcookies, lsm->lsm_stripe_count);
84 for (i = 0; i < lsm->lsm_stripe_count; i++) {
85 struct lov_oinfo *loi = lsm->lsm_oinfo[i];
/* NOTE(review): lov_tgts[loi_ost_idx] and its ltd_exp are dereferenced
 * without a NULL check here, while other functions in this file test
 * lov_tgts[i] before use -- confirm callers guarantee both are set. */
86 struct obd_device *child =
87 lov->lov_tgts[loi->loi_ost_idx]->ltd_exp->exp_obd;
/* use the child's context at the same index as the LOV-level context */
88 struct llog_ctxt *cctxt = llog_get_context(child, ctxt->loc_idx);
90 /* fill mds unlink/setattr log record */
/* rec is reinterpreted according to lrh_type; only the per-stripe object
 * id and group fields are rewritten */
91 switch (rec->lrh_type) {
92 case MDS_UNLINK_REC: {
93 struct llog_unlink_rec *lur = (struct llog_unlink_rec *)rec;
94 lur->lur_oid = loi->loi_id;
95 lur->lur_ogr = loi->loi_gr;
98 case MDS_SETATTR_REC: {
99 struct llog_setattr_rec *lsr = (struct llog_setattr_rec *)rec;
100 lsr->lsr_oid = loi->loi_id;
101 lsr->lsr_ogr = loi->loi_gr;
104 case MDS_SETATTR64_REC: {
105 struct llog_setattr64_rec *lsr = (struct llog_setattr64_rec *)rec;
106 lsr->lsr_oid = loi->loi_id;
107 lsr->lsr_ogr = loi->loi_gr;
/* every stripe is expected to carry the same group as the striped object */
113 LASSERT(lsm->lsm_object_gr == loi->loi_gr);
114 /* inject error in llog_add() below */
/* NOTE(review): the context reference is dropped here and again after
 * llog_add() below; a line between the two (not visible in this listing)
 * presumably resets cctxt so that llog_add() fails -- confirm. */
115 if (OBD_FAIL_CHECK(OBD_FAIL_MDS_FAIL_LOV_LOG_ADD)) {
116 llog_ctxt_put(cctxt);
/* pass the next unused cookie slot and the remaining capacity */
119 rc = llog_add(cctxt, rec, NULL, logcookies + cookies,
120 numcookies - cookies);
121 llog_ctxt_put(cctxt);
/* failure path (its guarding test is not visible here): report the error,
 * zero the slot so the unset cookie is all-zero, and still consume it */
123 CERROR("Can't add llog (rc = %d) for stripe %i\n",
125 memset(logcookies + cookies, 0,
126 sizeof(struct llog_cookie));
127 rc = 1; /* skip this cookie */
129 /* Note that rc is always 1 if llog_add was successful */
/*
 * lov_llog_origin_connect() - forward an llog connect to the LOV targets.
 *
 * Walks lov->lov_tgts[0 .. ld_tgt_count) and calls llog_connect() on each
 * selected target's llog context (index ctxt->loc_idx), passing @logid,
 * @gen and @uuid through unchanged.
 *
 * @ctxt:  LOV-level llog context; supplies loc_obd and loc_idx.
 * @logid: passed through to llog_connect().
 * @gen:   passed through to llog_connect().
 * @uuid:  optional; when non-NULL it is compared against each target's
 *         ltd_uuid.
 *
 * NOTE(review): the statements controlled by the two "if" tests, the test
 * guarding the CERROR call, any use of "err" and the return statement are
 * not visible in this listing.
 */
135 static int lov_llog_origin_connect(struct llog_ctxt *ctxt,
136 struct llog_logid *logid,
137 struct llog_gen *gen,
138 struct obd_uuid *uuid)
140 struct obd_device *obd = ctxt->loc_obd;
141 struct lov_obd *lov = &obd->u.lov;
142 int i, rc = 0, err = 0;
146 for (i = 0; i < lov->desc.ld_tgt_count; i++) {
147 struct obd_device *child;
148 struct llog_ctxt *cctxt;
/* target slot is empty or marked inactive (presumably skipped -- the
 * controlled statement is not visible; confirm) */
150 if (!lov->lov_tgts[i] || !lov->lov_tgts[i]->ltd_active)
/* a uuid was given and this target's uuid differs from it (presumably
 * skipped as well; confirm) */
152 if (uuid && !obd_uuid_equals(uuid, &lov->lov_tgts[i]->ltd_uuid))
154 CDEBUG(D_CONFIG, "connect %d/%d\n", i, lov->desc.ld_tgt_count);
/* connect through the target's export obd, using the context at the same
 * index as the LOV-level one, then drop the context reference */
155 child = lov->lov_tgts[i]->ltd_exp->exp_obd;
156 cctxt = llog_get_context(child, ctxt->loc_idx);
157 rc = llog_connect(cctxt, logid, gen, uuid);
158 llog_ctxt_put(cctxt);
161 CERROR("error osc_llog_connect tgt %d (%d)\n", i, rc);
171 /* the replicators commit callback */
/*
 * lov_llog_repl_cancel() - cancel one llog cookie per stripe of @lsm.
 *
 * Stripe i is paired with cookie i: for each stripe, llog_cancel() is
 * called with exactly one cookie on the llog context (index ctxt->loc_idx)
 * of the obd behind that stripe's OST target.
 *
 * @ctxt:    LOV-level llog context; supplies loc_obd and loc_idx.
 * @lsm:     stripe metadata; asserted non-NULL.
 * @count:   number of cookies; asserted equal to lsm->lsm_stripe_count.
 * @cookies: cookie array, advanced by one entry per stripe.
 * @flags:   passed through to llog_cancel().
 *
 * NOTE(review): the declarations of "lov", "i" and "err", and the return
 * statement, are not visible in this listing.
 */
172 static int lov_llog_repl_cancel(struct llog_ctxt *ctxt, struct lov_stripe_md *lsm,
173 int count, struct llog_cookie *cookies, int flags)
176 struct obd_device *obd = ctxt->loc_obd;
180 LASSERT(lsm != NULL);
181 LASSERT(count == lsm->lsm_stripe_count);
/* i and cookies advance together, so cookies always points at stripe i's
 * cookie */
185 for (i = 0; i < count; i++, cookies++) {
186 struct lov_oinfo *loi = lsm->lsm_oinfo[i];
187 struct obd_device *child =
188 lov->lov_tgts[loi->loi_ost_idx]->ltd_exp->exp_obd;
189 struct llog_ctxt *cctxt =
190 llog_get_context(child, ctxt->loc_idx);
/* cancel a single cookie on the child context, then drop the reference */
193 err = llog_cancel(cctxt, NULL, 1, cookies, flags);
194 llog_ctxt_put(cctxt);
/* an error is only reported when the target is marked active */
195 if (err && lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
196 CERROR("error: objid "LPX64" subobj "LPX64
197 " on OST idx %d: rc = %d\n", lsm->lsm_object_id,
198 loi->loi_id, loi->loi_ost_idx, err);
/*
 * llog operations registered by lov_llog_init() for LLOG_MDS_OST_ORIG_CTXT:
 * only the add and connect hooks are set.  The "field:" initializer form is
 * the older GNU spelling of a designated initializer.
 */
207 static struct llog_operations lov_mds_ost_orig_logops = {
208 lop_add: lov_llog_origin_add,
209 lop_connect: lov_llog_origin_connect
/*
 * llog operations registered by lov_llog_init() for LLOG_SIZE_REPL_CTXT:
 * only the cancel hook is set.
 */
212 static struct llog_operations lov_size_repl_logops = {
213 lop_cancel: lov_llog_repl_cancel
/*
 * lov_llog_init() - set up the LOV llog contexts and initialise the targets.
 *
 * Registers two llog contexts on @obd (LLOG_MDS_OST_ORIG_CTXT and
 * LLOG_SIZE_REPL_CTXT), then calls obd_llog_init() on the obd of each
 * selected LOV target.
 *
 * @obd:      the LOV obd device.
 * @olg:      llog group; asserted to be &obd->obd_olg.
 * @disk_obd: passed through to llog_setup() and obd_llog_init().
 * @index:    optional; when non-NULL only the target whose slot number
 *            equals *index passes the filter in the loop.
 *
 * NOTE(review): the declarations of "rc" and "i", the tests guarding the
 * GOTO and CERROR statements, the statements controlled by the two "if"
 * tests in the loop, the err_cleanup label and whatever is done with the
 * contexts fetched at the end are not visible in this listing.
 */
216 int lov_llog_init(struct obd_device *obd, struct obd_llog_group *olg,
217 struct obd_device *disk_obd, int *index)
219 struct lov_obd *lov = &obd->u.lov;
220 struct obd_device *child;
224 LASSERT(olg == &obd->obd_olg);
/* originator context: add/connect hooks */
225 rc = llog_setup(obd, olg, LLOG_MDS_OST_ORIG_CTXT, disk_obd, 0, NULL,
226 &lov_mds_ost_orig_logops);
/* replicator context: cancel hook */
230 rc = llog_setup(obd, olg, LLOG_SIZE_REPL_CTXT, disk_obd, 0, NULL,
231 &lov_size_repl_logops);
233 GOTO(err_cleanup, rc);
236 /* count may not match lov->desc.ld_tgt_count during dynamic ost add */
237 for (i = 0; i < lov->desc.ld_tgt_count; i++) {
/* empty target slot (presumably skipped; controlled statement not visible) */
238 if (!lov->lov_tgts[i])
/* caller asked for one specific target and this is not it */
241 if (index && i != *index)
/* initialise the target's own llog group, passing the slot number as its
 * index */
244 child = lov->lov_tgts[i]->ltd_obd;
245 rc = obd_llog_init(child, &child->obd_olg, disk_obd, &i);
247 CERROR("error osc_llog_init idx %d osc '%s' tgt '%s' "
248 "(rc=%d)\n", i, child->obd_name,
249 disk_obd->obd_name, rc);
253 GOTO(err_cleanup, rc);
/* NOTE(review): presumably the err_cleanup path -- both contexts set up
 * above are looked up again here, likely to be torn down; confirm against
 * the lines missing from this listing. */
256 struct llog_ctxt *ctxt =
257 llog_get_context(obd, LLOG_SIZE_REPL_CTXT);
260 ctxt = llog_get_context(obd, LLOG_MDS_OST_ORIG_CTXT);
/*
 * lov_llog_finish() - tear down the two LOV-level llog contexts of @obd.
 *
 * Looks up LLOG_MDS_OST_ORIG_CTXT and LLOG_SIZE_REPL_CTXT on @obd and calls
 * llog_cleanup() on each, keeping the results in rc and rc2 respectively.
 *
 * @obd:   the LOV obd device.
 * @count: not referenced by any line visible in this listing.
 *
 * NOTE(review): the declarations of "rc" and "rc2", any test guarding the
 * llog_cleanup() calls, the way rc and rc2 are combined and the return
 * statement are not visible in this listing.
 */
267 int lov_llog_finish(struct obd_device *obd, int count)
269 struct llog_ctxt *ctxt;
273 /* cleanup our llogs only if the ctxts have been setup
274 * (client lov doesn't setup, mds lov does). */
275 ctxt = llog_get_context(obd, LLOG_MDS_OST_ORIG_CTXT);
277 rc = llog_cleanup(ctxt);
/* same again for the replicator context; its result goes to rc2 so the
 * first result is not overwritten */
279 ctxt = llog_get_context(obd, LLOG_SIZE_REPL_CTXT);
281 rc2 = llog_cleanup(ctxt);
285 /* lov->tgt llogs are cleaned during osc_cleanup. */