1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
6 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License version 2 only,
10 * as published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License version 2 for more details (a copy is included
16 * in the LICENSE file that accompanied this code).
18 * You should have received a copy of the GNU General Public License
19 * version 2 along with this program; If not, see
20 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
22 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
23 * CA 95054 USA or visit www.sun.com if you need additional information or
29 * Copyright 2008 Sun Microsystems, Inc. All rights reserved
30 * Use is subject to license terms.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
36 * lustre/include/lustre_log.h
38 * Generic infrastructure for managing a collection of logs.
39 * These logs are used for:
41 * - orphan recovery: OST adds record on create
42 * - mtime/size consistency: the OST adds a record on first write
43 * - open/unlinked objects: OST adds a record on destroy
45 * - mds unlink log: the MDS adds an entry upon delete
47 * - raid1 replication log between OST's
48 * - MDS replication logs
54 #if defined(__linux__)
55 #include <linux/lustre_log.h>
56 #elif defined(__APPLE__)
57 #include <darwin/lustre_log.h>
58 #elif defined(__WINNT__)
59 #include <winnt/lustre_log.h>
61 #error Unsupported operating system.
66 #include <lustre/lustre_idl.h>
/*
 * Format the path of the log called "name" as "LOGS/<name>" into "logname",
 * truncating the result to fit.
 *
 * "logname" must be a character ARRAY visible at the call site: the bound is
 * taken with sizeof(), so passing a pointer would limit the write to the
 * size of a pointer rather than the size of the buffer.
 *
 * Evaluates to whatever snprintf() returns.
 */
#define LOG_NAME_LIMIT(logname, name)                                   \
        snprintf((logname), sizeof(logname), "LOGS/%s", (name))
70 #define LLOG_EEMPTY 4711
72 struct plain_handle_data {
73 struct list_head phd_entry;
74 struct llog_handle *phd_cat_handle;
75 struct llog_cookie phd_cookie; /* cookie of this log in its cat */
79 struct cat_handle_data {
80 struct list_head chd_head;
81 struct llog_handle *chd_current_log; /* currently open log */
84 /* In-memory descriptor for a log object or log catalog */
86 struct rw_semaphore lgh_lock;
87 struct llog_logid lgh_id; /* id of this log */
88 struct llog_log_hdr *lgh_hdr;
89 struct file *lgh_file;
91 int lgh_cur_idx; /* used during llog_process */
92 __u64 lgh_cur_offset; /* used during llog_process */
93 struct llog_ctxt *lgh_ctxt;
95 struct plain_handle_data phd;
96 struct cat_handle_data chd;
100 /* llog.c - general API */
101 typedef int (*llog_cb_t)(struct llog_handle *, struct llog_rec_hdr *, void *);
102 typedef int (*llog_fill_rec_cb_t)(struct llog_rec_hdr *rec, void *data);
103 extern struct llog_handle *llog_alloc_handle(void);
104 int llog_init_handle(struct llog_handle *handle, int flags,
105 struct obd_uuid *uuid);
106 extern void llog_free_handle(struct llog_handle *handle);
107 int llog_process(struct llog_handle *loghandle, llog_cb_t cb,
108 void *data, void *catdata);
109 int llog_reverse_process(struct llog_handle *loghandle, llog_cb_t cb,
110 void *data, void *catdata);
111 extern int llog_cancel_rec(struct llog_handle *loghandle, int index);
112 extern int llog_close(struct llog_handle *cathandle);
113 extern int llog_get_size(struct llog_handle *loghandle);
115 /* llog_cat.c - catalog api */
116 struct llog_process_data {
118 * Any useful data needed while processing catalog. This is
119 * passed later to process callback.
123 * Catalog process callback function, called for each record
129 struct llog_process_cat_data {
131 * Temporary stored first_idx while scanning log.
135 * Temporary stored last_idx while scanning log.
140 struct llog_process_cat_args {
142 * Llog context used in recovery thread on OST (recov_thread.c)
144 struct llog_ctxt *lpca_ctxt;
146 * Llog callback used in recovery thread on OST (recov_thread.c)
150 * Data pointer for llog callback.
155 int llog_cat_put(struct llog_handle *cathandle);
156 int llog_cat_add_rec(struct llog_handle *cathandle, struct llog_rec_hdr *rec,
157 struct llog_cookie *reccookie, void *buf);
158 int llog_cat_cancel_records(struct llog_handle *cathandle, int count,
159 struct llog_cookie *cookies);
160 int llog_cat_process(struct llog_handle *cat_llh, llog_cb_t cb, void *data);
161 int llog_cat_process_thread(void *data);
162 int llog_cat_reverse_process(struct llog_handle *cat_llh, llog_cb_t cb, void *data);
163 int llog_cat_set_first_idx(struct llog_handle *cathandle, int index);
166 int llog_setup(struct obd_device *obd, int index, struct obd_device *disk_obd,
167 int count, struct llog_logid *logid,struct llog_operations *op);
168 int __llog_ctxt_put(struct llog_ctxt *ctxt);
169 int llog_cleanup(struct llog_ctxt *);
170 int llog_sync(struct llog_ctxt *ctxt, struct obd_export *exp);
171 int llog_add(struct llog_ctxt *ctxt, struct llog_rec_hdr *rec,
172 struct lov_stripe_md *lsm, struct llog_cookie *logcookies,
174 int llog_cancel(struct llog_ctxt *, struct lov_stripe_md *lsm,
175 int count, struct llog_cookie *cookies, int flags);
177 int llog_obd_origin_setup(struct obd_device *obd, int index,
178 struct obd_device *disk_obd, int count,
179 struct llog_logid *logid);
180 int llog_obd_origin_cleanup(struct llog_ctxt *ctxt);
181 int llog_obd_origin_add(struct llog_ctxt *ctxt,
182 struct llog_rec_hdr *rec, struct lov_stripe_md *lsm,
183 struct llog_cookie *logcookies, int numcookies);
185 int obd_llog_init(struct obd_device *obd, struct obd_device *disk_obd,
188 int obd_llog_finish(struct obd_device *obd, int count);
191 int llog_ioctl(struct llog_ctxt *ctxt, int cmd, struct obd_ioctl_data *data);
192 int llog_catalog_list(struct obd_device *obd, int count,
193 struct obd_ioctl_data *data);
196 int llog_initiator_connect(struct llog_ctxt *ctxt);
197 int llog_receptor_accept(struct llog_ctxt *ctxt, struct obd_import *imp);
198 int llog_origin_connect(struct llog_ctxt *ctxt,
199 struct llog_logid *logid, struct llog_gen *gen,
200 struct obd_uuid *uuid);
201 int llog_handle_connect(struct ptlrpc_request *req);
204 int llog_obd_repl_cancel(struct llog_ctxt *ctxt,
205 struct lov_stripe_md *lsm, int count,
206 struct llog_cookie *cookies, int flags);
207 int llog_obd_repl_sync(struct llog_ctxt *ctxt, struct obd_export *exp);
208 int llog_obd_repl_connect(struct llog_ctxt *ctxt,
209 struct llog_logid *logid, struct llog_gen *gen,
210 struct obd_uuid *uuid);
212 struct llog_operations {
213 int (*lop_write_rec)(struct llog_handle *loghandle,
214 struct llog_rec_hdr *rec,
215 struct llog_cookie *logcookies, int numcookies,
217 int (*lop_destroy)(struct llog_handle *handle);
218 int (*lop_next_block)(struct llog_handle *h, int *curr_idx,
219 int next_idx, __u64 *offset, void *buf, int len);
220 int (*lop_prev_block)(struct llog_handle *h,
221 int prev_idx, void *buf, int len);
222 int (*lop_create)(struct llog_ctxt *ctxt, struct llog_handle **,
223 struct llog_logid *logid, char *name);
224 int (*lop_close)(struct llog_handle *handle);
225 int (*lop_read_header)(struct llog_handle *handle);
227 int (*lop_setup)(struct obd_device *obd, int ctxt_idx,
228 struct obd_device *disk_obd, int count,
229 struct llog_logid *logid);
230 int (*lop_sync)(struct llog_ctxt *ctxt, struct obd_export *exp);
231 int (*lop_cleanup)(struct llog_ctxt *ctxt);
232 int (*lop_add)(struct llog_ctxt *ctxt, struct llog_rec_hdr *rec,
233 struct lov_stripe_md *lsm,
234 struct llog_cookie *logcookies, int numcookies);
235 int (*lop_cancel)(struct llog_ctxt *ctxt, struct lov_stripe_md *lsm,
236 int count, struct llog_cookie *cookies, int flags);
237 int (*lop_connect)(struct llog_ctxt *ctxt,
238 struct llog_logid *logid, struct llog_gen *gen,
239 struct obd_uuid *uuid);
240 /* XXX add 2 more: commit callbacks and llog recovery functions */
244 extern struct llog_operations llog_lvfs_ops;
245 int llog_get_cat_list(struct obd_device *obd, struct obd_device *disk_obd,
246 char *name, int idx, int count,
247 struct llog_catid *idarray);
249 int llog_put_cat_list(struct obd_device *obd, struct obd_device *disk_obd,
250 char *name, int idx, int count, struct llog_catid *idarray);
252 #define LLOG_CTXT_FLAG_UNINITIALIZED 0x00000001
255 int loc_idx; /* my index the obd array of ctxt's */
256 struct llog_gen loc_gen;
257 struct obd_device *loc_obd; /* points back to the containing obd*/
258 struct obd_export *loc_exp; /* parent "disk" export (e.g. MDS) */
259 struct obd_import *loc_imp; /* to use in RPC's: can be backward
261 struct llog_operations *loc_logops;
262 struct llog_handle *loc_handle;
263 struct llog_canceld_ctxt *loc_llcd;
264 struct semaphore loc_sem; /* protects loc_llcd and loc_imp */
265 atomic_t loc_refcount;
266 struct llog_commit_master *loc_lcm;
268 long loc_flags; /* flags, see above defines */
271 #define LCM_NAME_SIZE 64
273 struct llog_commit_master {
275 * Thread control flags (start, stop, etc.)
279 * Number of llcds on this lcm.
283 * Thread control structure. Used for control commit thread.
285 struct ptlrpcd_ctl lcm_pc;
287 * Lock protecting list of llcds.
291 * Llcds in flight for debugging purposes.
293 struct list_head lcm_llcds;
295 * Commit thread name buffer. Only used for thread start.
297 char lcm_name[LCM_NAME_SIZE];
300 struct llog_canceld_ctxt {
302 * Llog context this llcd is attached to. Used for accessing
303 * ->loc_import and others in process of canceling cookies
304 * gathered in this llcd.
306 struct llog_ctxt *llcd_ctxt;
308 * Cancel thread control structure pointer. Used for accessing
309 * it to see if processing should stop, and for other needs.
311 struct llog_commit_master *llcd_lcm;
313 * Maximum llcd size. Used to calculate how much room is
314 * left in the llcd for incoming cookies.
318 * Link to lcm llcds list.
320 struct list_head llcd_list;
322 * Current llcd size while gathering cookies. This should not be
323 * more than ->llcd_size. Used for determining if we need to
324 * send this llcd (if full) and allocate new one. This is also
325 * used for copying new cookie at the end of buffer.
327 int llcd_cookiebytes;
329 * Pointer to the start of cookies buffer.
331 struct llog_cookie llcd_cookies[0];
334 /* ptlrpc/recov_thread.c */
335 extern struct llog_commit_master *llog_recov_thread_init(char *name);
336 extern void llog_recov_thread_fini(struct llog_commit_master *lcm,
338 extern int llog_recov_thread_start(struct llog_commit_master *lcm);
339 extern void llog_recov_thread_stop(struct llog_commit_master *lcm,
342 static inline void llog_gen_init(struct llog_ctxt *ctxt)
344 struct obd_device *obd = ctxt->loc_exp->exp_obd;
346 if (!strcmp(obd->obd_type->typ_name, LUSTRE_MDS_NAME))
347 ctxt->loc_gen.mnt_cnt = obd->u.mds.mds_mount_count;
348 else if (!strstr(obd->obd_type->typ_name, LUSTRE_OST_NAME))
349 ctxt->loc_gen.mnt_cnt = obd->u.filter.fo_mount_count;
351 ctxt->loc_gen.mnt_cnt = 0;
354 static inline int llog_gen_lt(struct llog_gen a, struct llog_gen b)
356 if (a.mnt_cnt < b.mnt_cnt)
358 if (a.mnt_cnt > b.mnt_cnt)
360 return(a.conn_cnt < b.conn_cnt ? 1 : 0);
363 #define LLOG_GEN_INC(gen) ((gen).conn_cnt ++)
364 #define LLOG_PROC_BREAK 0x0001
365 #define LLOG_DEL_RECORD 0x0002
367 static inline int llog_obd2ops(struct llog_ctxt *ctxt,
368 struct llog_operations **lop)
373 *lop = ctxt->loc_logops;
380 static inline int llog_handle2ops(struct llog_handle *loghandle,
381 struct llog_operations **lop)
383 if (loghandle == NULL)
386 return llog_obd2ops(loghandle->lgh_ctxt, lop);
/* Length occupied by "len" bytes of log data after size_round() is applied. */
static inline int llog_data_len(int len)
{
        int rounded = size_round(len);

        return rounded;
}
/*
 * Take an extra reference on an llog context and evaluate to that context.
 *
 * The argument is evaluated exactly once.  The context must already hold at
 * least one reference; this is asserted before the count is incremented.
 */
#define llog_ctxt_get(ctxt)                                                  \
({                                                                           \
        struct llog_ctxt *got_ctxt_ = (ctxt);                                \
                                                                             \
        LASSERT(atomic_read(&got_ctxt_->loc_refcount) > 0);                  \
        atomic_inc(&got_ctxt_->loc_refcount);                                \
        CDEBUG(D_INFO, "GETting ctxt %p : new refcount %d\n", got_ctxt_,     \
               atomic_read(&got_ctxt_->loc_refcount));                       \
        got_ctxt_;                                                           \
})
/*
 * Drop one reference on an llog context; a NULL context is silently ignored.
 *
 * The argument is captured in a local first, so it is evaluated exactly
 * once even if the caller passes an expression with side effects.
 *
 * The refcount is sanity-checked before the put: it must be positive and
 * below 0x5a5a5a.  The actual release is delegated to __llog_ctxt_put().
 */
#define llog_ctxt_put(ctxt)                                                  \
do {                                                                         \
        struct llog_ctxt *put_ctxt_ = (ctxt);                                \
                                                                             \
        if (put_ctxt_ == NULL)                                               \
                break;                                                       \
        LASSERT(atomic_read(&put_ctxt_->loc_refcount) > 0);                  \
        LASSERT(atomic_read(&put_ctxt_->loc_refcount) < 0x5a5a5a);           \
        CDEBUG(D_INFO, "PUTting ctxt %p : new refcount %d\n", put_ctxt_,     \
               atomic_read(&put_ctxt_->loc_refcount) - 1);                   \
        __llog_ctxt_put(put_ctxt_);                                          \
} while (0)
415 static inline struct llog_ctxt *llog_get_context(struct obd_device *obd,
418 struct llog_ctxt *ctxt;
420 if (index < 0 || index >= LLOG_MAX_CTXTS) {
421 CDEBUG(D_INFO, "obd %p bad index %d\n", obd, index);
425 spin_lock(&obd->obd_dev_lock);
426 if (obd->obd_llog_ctxt[index] == NULL) {
427 spin_unlock(&obd->obd_dev_lock);
428 CDEBUG(D_INFO,"obd %p and ctxt index %d is NULL \n",obd,index);
431 ctxt = llog_ctxt_get(obd->obd_llog_ctxt[index]);
432 spin_unlock(&obd->obd_dev_lock);
436 static inline int llog_ctxt_null(struct obd_device *obd, int index)
438 return (obd->obd_llog_ctxt[index] == NULL);
441 static inline int llog_write_rec(struct llog_handle *handle,
442 struct llog_rec_hdr *rec,
443 struct llog_cookie *logcookies,
444 int numcookies, void *buf, int idx)
446 struct llog_operations *lop;
447 int raised, rc, buflen;
450 rc = llog_handle2ops(handle, &lop);
453 if (lop->lop_write_rec == NULL)
457 buflen = rec->lrh_len + sizeof(struct llog_rec_hdr)
458 + sizeof(struct llog_rec_tail);
460 buflen = rec->lrh_len;
461 LASSERT(size_round(buflen) == buflen);
463 raised = cfs_cap_raised(CFS_CAP_SYS_RESOURCE);
465 cfs_cap_raise(CFS_CAP_SYS_RESOURCE);
466 rc = lop->lop_write_rec(handle, rec, logcookies, numcookies, buf, idx);
468 cfs_cap_lower(CFS_CAP_SYS_RESOURCE);
472 static inline int llog_read_header(struct llog_handle *handle)
474 struct llog_operations *lop;
478 rc = llog_handle2ops(handle, &lop);
481 if (lop->lop_read_header == NULL)
484 rc = lop->lop_read_header(handle);
488 static inline int llog_destroy(struct llog_handle *handle)
490 struct llog_operations *lop;
494 rc = llog_handle2ops(handle, &lop);
497 if (lop->lop_destroy == NULL)
500 rc = lop->lop_destroy(handle);
505 static inline int llog_cancel(struct obd_export *exp,
506 struct lov_stripe_md *lsm, int count,
507 struct llog_cookie *cookies, int flags)
509 struct llog_operations *lop;
513 rc = llog_handle2ops(loghandle, &lop);
516 if (lop->lop_cancel == NULL)
519 rc = lop->lop_cancel(exp, lsm, count, cookies, flags);
524 static inline int llog_next_block(struct llog_handle *loghandle, int *cur_idx,
525 int next_idx, __u64 *cur_offset, void *buf,
528 struct llog_operations *lop;
532 rc = llog_handle2ops(loghandle, &lop);
535 if (lop->lop_next_block == NULL)
538 rc = lop->lop_next_block(loghandle, cur_idx, next_idx, cur_offset, buf,
543 static inline int llog_prev_block(struct llog_handle *loghandle,
544 int prev_idx, void *buf, int len)
546 struct llog_operations *lop;
550 rc = llog_handle2ops(loghandle, &lop);
553 if (lop->lop_prev_block == NULL)
556 rc = lop->lop_prev_block(loghandle, prev_idx, buf, len);
560 static inline int llog_create(struct llog_ctxt *ctxt, struct llog_handle **res,
561 struct llog_logid *logid, char *name)
563 struct llog_operations *lop;
567 rc = llog_obd2ops(ctxt, &lop);
570 if (lop->lop_create == NULL)
573 raised = cfs_cap_raised(CFS_CAP_SYS_RESOURCE);
575 cfs_cap_raise(CFS_CAP_SYS_RESOURCE);
576 rc = lop->lop_create(ctxt, res, logid, name);
578 cfs_cap_lower(CFS_CAP_SYS_RESOURCE);
582 static inline int llog_connect(struct llog_ctxt *ctxt,
583 struct llog_logid *logid, struct llog_gen *gen,
584 struct obd_uuid *uuid)
586 struct llog_operations *lop;
590 rc = llog_obd2ops(ctxt, &lop);
593 if (lop->lop_connect == NULL)
596 rc = lop->lop_connect(ctxt, logid, gen, uuid);