1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
5 * Lustre filesystem abstraction routines
7 * Copyright (C) 2004 Cluster File Systems, Inc.
9 * This file is part of Lustre, http://www.lustre.org.
11 * Lustre is free software; you can redistribute it and/or
12 * modify it under the terms of version 2 of the GNU General Public
13 * License as published by the Free Software Foundation.
15 * Lustre is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
20 * You should have received a copy of the GNU General Public License
21 * along with Lustre; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
25 # define EXPORT_SYMTAB
28 #define DEBUG_SUBSYSTEM S_SM
30 #include <linux/kmod.h>
31 #include <linux/init.h>
33 #include <linux/slab.h>
34 #include <linux/obd_class.h>
35 #include <linux/obd_support.h>
36 #include <linux/lustre_lib.h>
37 #include <linux/lustre_idl.h>
38 #include <linux/lustre_fsfilt.h>
39 #include <linux/lustre_smfs.h>
40 #include "smfs_internal.h"
/*
 * KML_BUF_REC_INIT: point pbuf just past an int-sized slot at the start of
 * buffer.
 * NOTE(review): the rest of this macro is not visible in this excerpt;
 * presumably it also initialises len -- confirm against the full file.
 */
42 #define KML_BUF_REC_INIT(buffer, pbuf, len) \
44 pbuf = buffer + sizeof(int); \
/*
 * KML_BUF_REC_END: copy `len` into the start of buffer, grow length by
 * sizeof(int) and move pbuf to buffer + length.
 * NOTE(review): `len` is not one of the macro parameters; it is presumably
 * declared in a part of the macro that is not visible here -- confirm.
 */
48 #define KML_BUF_REC_END(buffer, length, pbuf) \
51 memcpy(buffer, &len, sizeof(len)); \
52 length += sizeof(int); \
53 pbuf = buffer + length; \
/*
 * Return the record-pack callback selected for this superblock: the index is
 * derived from smsi_flags via GET_REC_PACK_TYPE_INDEX() and used to pick an
 * entry of smsi_pack_rec[].
 */
56 static smfs_pack_rec_func smfs_get_rec_pack_type(struct super_block *sb)
59 struct smfs_super_info *smsi = S2SMI(sb);
61 idx = GET_REC_PACK_TYPE_INDEX(smsi->smsi_flags);
62 return smsi->smsi_pack_rec[idx];
/* Forward declaration: smfs_rec_post_hook() calls this before its definition. */
65 static int smfs_post_kml_rec(struct inode *dir, void *de, void *data1,
/*
 * Hook callback handed to smfs_alloc_hook_ops() by smfs_rec_init().
 * When smfs_do_rec(inode) is true, the operation is forwarded to
 * smfs_post_kml_rec() with the same dentry, data pointers and opcode.
 * `handle` is not used in the lines visible here.
 */
68 static int smfs_rec_post_hook(struct inode *inode, void *dentry,
69 void *data1, void *data2, int op, void *handle)
74 if (smfs_do_rec(inode))
75 rc = smfs_post_kml_rec(inode, dentry, data1, data2, op);
/* Name under which the KML hook ops are allocated and later unregistered. */
80 #define KML_HOOK "kml_hook"
/*
 * Enable record logging for a superblock: set the REC flag, initialise the
 * OST and MDS record packers, then allocate the KML hook ops and register
 * them.
 * NOTE(review): the error checks between these steps are not visible in this
 * excerpt.
 */
82 int smfs_rec_init(struct super_block *sb)
85 struct smfs_super_info *smfs_info = S2SMI(sb);
86 struct smfs_hook_ops *rec_hops = NULL;
89 SMFS_SET_REC(smfs_info);
91 rc = ost_rec_pack_init(smfs_info);
95 rc = mds_rec_pack_init(smfs_info);
/* No pre-hook is supplied (NULL); smfs_rec_post_hook is the only callback. */
99 rec_hops = smfs_alloc_hook_ops(KML_HOOK, NULL, smfs_rec_post_hook);
103 rc = smfs_register_hook_ops(smfs_info, rec_hops);
/*
 * NOTE(review): when registration fails this still calls
 * smfs_unregister_hook_ops() before freeing -- confirm that is intended.
 */
104 if (rc && rec_hops) {
105 smfs_unregister_hook_ops(smfs_info, rec_hops->smh_name);
106 smfs_free_hook_ops(rec_hops);
/*
 * Undo smfs_rec_init(): unregister the KML_HOOK ops, free them and clear the
 * REC flag on smfs_info.
 */
111 int smfs_rec_cleanup(struct smfs_super_info *smfs_info)
113 struct smfs_hook_ops *rec_hops;
117 rec_hops = smfs_unregister_hook_ops(smfs_info, KML_HOOK);
118 smfs_free_hook_ops(rec_hops);
119 SMFS_CLEAN_REC(smfs_info);
/*
 * Copy mode, uid, gid, the three timestamps and the size from an inode into
 * an iattr.  ia_valid is not touched by the lines visible here.
 */
125 copy_inode_attr(struct iattr *iattr, struct inode *inode)
127 iattr->ia_mode = inode->i_mode;
128 iattr->ia_uid = inode->i_uid;
129 iattr->ia_gid = inode->i_gid;
130 iattr->ia_atime = inode->i_atime;
131 iattr->ia_ctime = inode->i_ctime;
132 iattr->ia_mtime = inode->i_mtime;
133 iattr->ia_size = inode->i_size;
/*
 * Unpack one length-prefixed field from in_data and prepend args_data to it.
 *
 * in_data starts with an int length followed by that many bytes.  A buffer of
 * (*size + strlen(args_data) + 1) bytes is allocated into *p_buffer, filled
 * with args_data and then the field bytes.  rc is set to the number of bytes
 * the field occupies in in_data (length prefix included).
 * NOTE(review): the allocation-failure check and the return statement are not
 * visible in this excerpt.
 */
136 static inline int unpack_rec_data(char **p_buffer, int *size,
137 char *in_data, char *args_data)
144 args_len = strlen(args_data);
/* The length prefix is read in host byte order straight from the record. */
146 *size = *((int*)(in_data));
147 rc = *size + sizeof(int);
/* One extra byte beyond the two copied parts is allocated. */
149 OBD_ALLOC(*p_buffer, *size + args_len + 1);
153 /* first copy reint dir. */
155 memcpy(*p_buffer, args_data, args_len);
157 /* then copy the node name. */
158 memcpy(*p_buffer + args_len,
159 (in_data + sizeof(int)), *size);
/*
 * Locate the opcode and payload inside a packed record.
 *
 * The record begins with an int `offset`; the opcode is the int found
 * `offset` bytes after that leading int, and *pbuf is set to the byte right
 * after the opcode.  `args` is not used in the lines visible here.
 */
166 int smfs_rec_unpack(struct smfs_proc_args *args, char *record,
167 char **pbuf, int *opcode)
169 int offset = *(int *)(record);
170 char *tmp = record + offset + sizeof(int);
172 *opcode = *(int *)tmp;
173 *pbuf = tmp + sizeof(*opcode);
176 EXPORT_SYMBOL(smfs_rec_unpack);
/*
 * Start record logging on a superblock: set up the llog, call simple_mkdir()
 * for a "DELETE" directory while running under smsi_ctxt, remember the
 * resulting dentry in smsi_delete_dir and set the INIT_REC flag.
 * NOTE(review): early returns and labels are not visible in this excerpt; the
 * comments below describe only the statements that are.
 */
178 int smfs_start_rec(struct super_block *sb, struct vfsmount *mnt)
180 struct dentry *dentry;
181 struct lvfs_run_ctxt saved;
/* Guard: already initialised, or neither DO_REC nor CACHE_HOOK is set. */
185 if (SMFS_INIT_REC(S2SMI(sb)) ||
186 (!SMFS_DO_REC(S2SMI(sb)) && !SMFS_CACHE_HOOK(S2SMI(sb))))
189 rc = smfs_llog_setup(sb, mnt);
192 push_ctxt(&saved, S2SMI(sb)->smsi_ctxt, NULL);
193 dentry = simple_mkdir(current->fs->pwd, "DELETE", 0777, 1);
194 if (IS_ERR(dentry)) {
195 rc = PTR_ERR(dentry);
196 CERROR("cannot create DELETE directory: rc = %d\n", rc);
/* NOTE(review): the logged error code is replaced by -EINVAL here. */
197 GOTO(err_exit, rc = -EINVAL);
199 S2SMI(sb)->smsi_delete_dir = dentry;
202 SMFS_SET_INIT_REC(S2SMI(sb));
204 pop_ctxt(&saved, S2SMI(sb)->smsi_ctxt, NULL);
/*
 * NOTE(review): smsi_ctxt is freed here without a visible reset of the
 * pointer, and smfs_post_cleanup() frees the same field -- confirm there is
 * no double free.
 */
207 if (S2SMI(sb)->smsi_ctxt)
208 OBD_FREE(S2SMI(sb)->smsi_ctxt, sizeof(struct lvfs_run_ctxt));
211 EXPORT_SYMBOL(smfs_start_rec);
/*
 * Allocate a run context for the superblock, point it at the mount (pwdmnt),
 * the mount's root dentry (pwd) and get_ds() (fs), and store it in
 * smsi_ctxt.
 * NOTE(review): the allocation-failure check is not visible in this excerpt.
 */
213 int smfs_post_setup(struct super_block *sb, struct vfsmount *mnt)
215 struct lvfs_run_ctxt *current_ctxt = NULL;
216 struct smfs_super_info *smb = S2SMI(sb);
219 OBD_ALLOC(current_ctxt, sizeof(*current_ctxt));
222 OBD_SET_CTXT_MAGIC(current_ctxt);
224 current_ctxt->pwdmnt = mnt;
225 current_ctxt->pwd = mnt->mnt_root;
226 current_ctxt->fs = get_ds();
227 smb->smsi_ctxt = current_ctxt;
231 EXPORT_SYMBOL(smfs_post_setup);
/*
 * Release the run context stored in smsi_ctxt by smfs_post_setup().
 * NOTE(review): any guard around the free is not visible in this excerpt.
 */
233 int smfs_post_cleanup(struct super_block *sb)
235 struct smfs_super_info *smb = S2SMI(sb);
239 OBD_FREE(S2SMI(sb)->smsi_ctxt, sizeof(struct lvfs_run_ctxt));
242 EXPORT_SYMBOL(smfs_post_cleanup);
/*
 * Stop record logging on a superblock: clean up the llog, clear the INIT_REC
 * flag and drop the reference to the DELETE directory dentry, if any.
 */
244 int smfs_stop_rec(struct super_block *sb)
/* Guard: not initialised, or neither DO_REC nor CACHE_HOOK is set. */
249 if (!SMFS_INIT_REC(S2SMI(sb)) ||
250 (!SMFS_DO_REC(S2SMI(sb)) && !SMFS_CACHE_HOOK(S2SMI(sb))))
253 rc = smfs_llog_cleanup(sb);
255 SMFS_CLEAN_INIT_REC(S2SMI(sb));
257 if (S2SMI(sb)->smsi_delete_dir) {
258 l_dput(S2SMI(sb)->smsi_delete_dir);
259 S2SMI(sb)->smsi_delete_dir = NULL;
263 EXPORT_SYMBOL(smfs_stop_rec);
265 int smfs_write_extents(struct inode *dir, struct dentry *dentry,
266 unsigned long from, unsigned long num)
268 return smfs_post_rec_write(dir, dentry, &from, &num);
270 EXPORT_SYMBOL(smfs_write_extents);
/*
 * Exported wrapper: log a setattr record by calling smfs_post_rec_setattr()
 * with `attr` as data1 and NULL as data2.
 */
272 int smfs_rec_setattr(struct inode *dir, struct dentry *dentry,
275 return smfs_post_rec_setattr(dir, dentry, attr, NULL);
277 EXPORT_SYMBOL(smfs_rec_setattr);
/*
 * Log a metadata blob for an inode as a setattr record.
 *
 * The blob is wrapped as [lmm_size][lmm bytes] in a temporary buffer and
 * passed to smfs_post_rec_setattr() as data2, with a NULL dentry and NULL
 * attributes.  The temporary buffer is freed afterwards.
 * NOTE(review): early returns and the allocation-failure check are not
 * visible in this excerpt.
 */
279 int smfs_rec_md(struct inode *inode, void *lmm, int lmm_size)
281 char *set_lmm = NULL;
/* Guard on whether recording is enabled for this superblock. */
285 if (!SMFS_DO_REC(S2SMI(inode->i_sb)))
289 OBD_ALLOC(set_lmm, lmm_size + sizeof(lmm_size));
292 memcpy(set_lmm, &lmm_size, sizeof(lmm_size));
293 memcpy(set_lmm + sizeof(lmm_size), lmm, lmm_size);
294 rc = smfs_post_rec_setattr(inode, NULL, NULL, set_lmm);
296 CERROR("Error: Record md for inode %lu rc=%d\n",
301 OBD_FREE(set_lmm, lmm_size + sizeof(lmm_size));
304 EXPORT_SYMBOL(smfs_rec_md);
306 int smfs_rec_precreate(struct dentry *dentry, int *num, struct obdo *oa)
308 return smfs_post_rec_create(dentry->d_inode, dentry, num, oa);
310 EXPORT_SYMBOL(smfs_rec_precreate);
/*
 * Process the logged records of a superblock through its llog catalog.
 *
 * For reint processing a generation record is appended first and the catalog
 * is walked with llog_cat_process(); otherwise it is walked with
 * llog_cat_reverse_process().
 * NOTE(review): several lines (error checks, callback arguments, the final
 * return) are not visible in this excerpt.
 */
312 int smfs_process_rec(struct super_block *sb,
313 int count, char *dir, int flags)
315 struct llog_ctxt *ctxt;
316 struct llog_handle *loghandle;
317 struct smfs_proc_args args;
/* Recording must have been started (INIT_REC set) before processing. */
321 if (!SMFS_INIT_REC(S2SMI(sb))) {
322 CWARN("Did not start up rec server \n");
326 memset(&args, 0, sizeof(struct smfs_proc_args));
328 args.sr_count = count;
330 args.sr_flags = flags ;
331 ctxt = S2SMI(sb)->smsi_rec_log;
332 loghandle = ctxt->loc_handle;
335 if (SMFS_DO_REINT_REC(flags)) {
336 struct llog_gen_rec *lgr;
338 /* for reint rec, we need insert a gen rec to identify
339 * the end of the rec.*/
340 OBD_ALLOC(lgr, sizeof(*lgr));
343 lgr->lgr_hdr.lrh_len = lgr->lgr_tail.lrt_len = sizeof(*lgr);
344 lgr->lgr_hdr.lrh_type = LLOG_GEN_REC;
345 lgr->lgr_gen = ctxt->loc_gen;
346 rc = llog_add(ctxt, &lgr->lgr_hdr, NULL, NULL, 1,
/* The generation record is only needed for the llog_add() call above. */
348 OBD_FREE(lgr, sizeof(*lgr));
353 SET_REC_COUNT_FLAGS(args.sr_flags, SMFS_REC_ALL);
356 if (SMFS_DO_REINT_REC(flags))
357 rc = llog_cat_process(loghandle, ctxt->llog_proc_cb,
360 rc = llog_cat_reverse_process(loghandle,
/* LLOG_PROC_BREAK from the walk is given special handling (not visible). */
363 if (rc == LLOG_PROC_BREAK)
369 /* smfs_path() was taken from InterMezzo. */
/*
 * Build the path of `dentry` into `buffer` by walking d_parent links and
 * copying each component name.
 * NOTE(review): the loop structure, separator handling, the use of `root`
 * and the return value are not visible in this excerpt.
 */
370 static char* smfs_path(struct dentry *dentry, struct dentry *root, char *buffer,
373 char * end = buffer + buflen;
374 char * name = buffer;
375 char * buf_end = buffer + buflen;
385 struct dentry * parent;
390 parent = dentry->d_parent;
/* A dentry that is its own parent ends the walk. */
391 if (dentry == parent)
393 namelen = dentry->d_name.len;
/* Account for the component plus one extra byte. */
394 buflen -= namelen + 1;
398 memcpy(end, dentry->d_name.name, namelen);
/* Final pass over the bytes between `end` and the end of the buffer. */
404 while (end != buf_end)
/*
 * Write the path of `dentry` into `buffer` as a length-prefixed string: an
 * int length at the start of buffer, followed by the path produced by
 * smfs_path().
 * NOTE(review): the remaining parameters, any NULL-dentry handling and the
 * return statement are not visible in this excerpt.
 */
410 static int smfs_log_path(struct super_block *sb,
411 struct dentry *dentry,
415 struct dentry *root=sb->s_root;
416 char *p_name = buffer + sizeof(int);
422 name = smfs_path(dentry, root, p_name, buffer_len - sizeof(int));
/*
 * NOTE(review): namelen holds a little-endian value after cpu_to_le32(), yet
 * sizeof(int) is added to it below as if it were a host-order number --
 * confirm behaviour on big-endian hosts.
 */
423 namelen = cpu_to_le32(strlen(p_name));
424 memcpy(buffer, &namelen, sizeof(int));
426 namelen += sizeof(int);
/*
 * Append one length-prefixed record to @buffer: an int holding the payload
 * length, followed by the payload bytes.
 *
 * @buffer: destination; must have room for sizeof(int) + @length bytes
 * @data:   payload to copy; may be NULL when there is nothing to copy
 * @length: payload size in bytes
 *
 * A negative @length or a NULL @data is stored as an empty record (length 0,
 * no payload).  Without the guard a negative @length was converted to a huge
 * size_t inside memcpy(), and a NULL @data was handed to memcpy().
 *
 * Returns the number of bytes written to @buffer.
 */
static inline int log_it(char *buffer, void *data, int length)
{
        if (length < 0 || data == NULL)
                length = 0;

        memcpy(buffer, &length, sizeof(int));
        if (length > 0)
                memcpy(buffer + sizeof(int), data, length);

        return (int)sizeof(int) + length;
}
/*
 * Pack the operation-specific part of a record by delegating to the pack
 * callback that smfs_get_rec_pack_type() selects for dir's superblock.
 * NOTE(review): the trailing parameters and any check on pack_func are not
 * visible in this excerpt.
 */
437 static int smfs_pack_rec (char *buffer, struct dentry *dentry,
438 struct inode *dir, void *data1,
441 smfs_pack_rec_func pack_func;
443 pack_func = smfs_get_rec_pack_type(dir->i_sb);
446 return pack_func(buffer, dentry, dir, data1, data2, op);
/*
 * Log a REINT_CREATE record for `dentry`.
 *
 * A PAGE_SIZE scratch buffer is filled with the dentry's path
 * (smfs_log_path), then the packed create data (smfs_pack_rec), and the
 * result is added to the llog with smfs_llog_add_rec().  The buffer is freed
 * before returning.
 * NOTE(review): the error checks between steps and the updates of `length`
 * are not visible in this excerpt.
 */
449 int smfs_post_rec_create(struct inode *dir, struct dentry *dentry,
450 void *data1, void *data2)
452 struct smfs_super_info *sinfo;
453 char *buffer = NULL, *pbuf;
454 int rc = 0, length = 0, buf_len = 0;
/* The superblock info is taken from the new inode rather than from dir. */
457 sinfo = S2SMI(dentry->d_inode->i_sb);
461 OBD_ALLOC(buffer, PAGE_SIZE);
463 GOTO(exit, rc = -ENOMEM);
466 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
467 rc = smfs_log_path(dir->i_sb, dentry, pbuf, buf_len);
471 KML_BUF_REC_END(buffer, length, pbuf);
473 rc = smfs_pack_rec(pbuf, dentry, dir,
474 data1, data2, REINT_CREATE);
479 rc = smfs_llog_add_rec(sinfo, (void*)buffer, length);
482 OBD_FREE(buffer, PAGE_SIZE);
/*
 * Log a REINT_LINK record.
 *
 * data1 is interpreted as the new dentry.  The path of `dentry` is logged
 * first; the pack step then receives `dentry` as data1 and the new dentry as
 * data2.  data2 of this function is not used in the lines visible here.
 * NOTE(review): the error checks between steps and the updates of `length`
 * are not visible in this excerpt.
 */
487 static int smfs_post_rec_link(struct inode *dir, struct dentry *dentry,
488 void *data1, void *data2)
490 struct dentry *new_dentry = (struct dentry *)data1;
491 int rc = 0, length = 0, buf_len = 0;
492 char *buffer = NULL, *pbuf = NULL;
493 struct smfs_super_info *sinfo;
496 sinfo = S2SMI(dir->i_sb);
499 OBD_ALLOC(buffer, PAGE_SIZE);
501 GOTO(exit, rc = -ENOMEM);
504 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
506 rc = smfs_log_path(dir->i_sb, dentry, pbuf, buf_len);
511 KML_BUF_REC_END(buffer, length, pbuf);
513 rc = smfs_pack_rec(pbuf, dentry, dir, dentry,
514 new_dentry, REINT_LINK);
519 rc = smfs_llog_add_rec(sinfo, (void *)buffer, length);
522 OBD_FREE(buffer, PAGE_SIZE);
/*
 * Log a REINT_UNLINK record.
 *
 * data1 must point to an int holding the mode; it is dereferenced
 * unconditionally.  The dentry's path is logged, then the mode is packed, and
 * the record is added to the llog.
 * NOTE(review): the error checks between steps and the updates of `length`
 * are not visible in this excerpt.
 */
527 static int smfs_post_rec_unlink(struct inode *dir, struct dentry *dentry,
528 void *data1, void *data2)
530 struct smfs_super_info *sinfo;
531 int mode = *((int*)data1);
532 char *buffer = NULL, *pbuf = NULL;
533 int length = 0, rc = 0, buf_len = 0;
536 sinfo = S2SMI(dentry->d_inode->i_sb);
540 OBD_ALLOC(buffer, PAGE_SIZE);
542 GOTO(exit, rc = -ENOMEM);
545 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
546 rc = smfs_log_path(dir->i_sb, dentry, pbuf, buf_len);
551 KML_BUF_REC_END(buffer, length, pbuf);
552 rc = smfs_pack_rec(pbuf, dentry, dir,
553 &mode, NULL, REINT_UNLINK);
559 rc = smfs_llog_add_rec(sinfo, (void*)buffer, length);
562 OBD_FREE(buffer, PAGE_SIZE);
/*
 * Log a REINT_RENAME record.
 *
 * data1 is interpreted as the new parent inode and data2 as the new dentry.
 * The paths of both the old and the new dentry are logged before the rename
 * data is packed and the record is added to the llog.
 * NOTE(review): the error checks and the pointer/length bookkeeping between
 * the two smfs_log_path() calls are not visible in this excerpt.
 */
567 static int smfs_post_rec_rename(struct inode *dir, struct dentry *dentry,
568 void *data1, void *data2)
570 struct smfs_super_info *sinfo;
571 struct inode *new_dir = (struct inode *)data1;
572 struct dentry *new_dentry = (struct dentry *)data2;
573 char *buffer = NULL, *pbuf = NULL;
574 int rc = 0, length = 0, buf_len = 0;
577 sinfo = S2SMI(dir->i_sb);
581 OBD_ALLOC(buffer, PAGE_SIZE);
583 GOTO(exit, rc = -ENOMEM);
586 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
587 rc = smfs_log_path(dir->i_sb, dentry, pbuf, buf_len);
595 /* record new_dentry path. */
596 rc = smfs_log_path(dir->i_sb, new_dentry, pbuf, buf_len);
601 KML_BUF_REC_END(buffer, length, pbuf);
603 rc = smfs_pack_rec(pbuf, dentry, dir,
604 new_dir, new_dentry, REINT_RENAME);
609 rc = smfs_llog_add_rec(sinfo, (void*)buffer, length);
612 OBD_FREE(buffer, PAGE_SIZE);
/*
 * Record an extent in the inode's extents EA through the backing fsfilt,
 * after converting `from` and `num` with OFF2BLKS() / SIZE2BLKS().
 * Inodes already flagged OVER_WRITE are special-cased first (that branch's
 * body is not visible in this excerpt).
 */
616 static int smfs_insert_extents_ea(struct inode *inode, size_t from, loff_t num)
618 struct fsfilt_operations *fsfilt = S2SMI(inode->i_sb)->sm_fsfilt;
622 if (SMFS_INODE_OVER_WRITE(inode))
625 rc = fsfilt->fs_insert_extents_ea(inode, OFF2BLKS(from, inode),
626 SIZE2BLKS(num, inode));
/*
 * Remove an extent from the inode's extents EA through the backing fsfilt,
 * after converting `from` and `num` with OFF2BLKS() / SIZE2BLKS().
 */
630 static int smfs_remove_extents_ea(struct inode *inode, size_t from, loff_t num)
632 struct fsfilt_operations *fsfilt = S2SMI(inode->i_sb)->sm_fsfilt;
636 rc = fsfilt->fs_remove_extents_ea(inode, OFF2BLKS(from, inode),
637 SIZE2BLKS(num, inode));
/*
 * Remove every extent from the inode's extents EA by asking the fsfilt to
 * remove the range starting at 0 with length 0xffffffff.
 * NOTE(review): 0xffffffff is presumably meant as "everything" -- confirm the
 * unit and that it covers the largest possible file.
 */
642 static int smfs_remove_all_extents_ea(struct inode *inode)
644 struct fsfilt_operations *fsfilt = S2SMI(inode->i_sb)->sm_fsfilt;
648 rc = fsfilt->fs_remove_extents_ea(inode, 0, 0xffffffff);
/* Initialise the inode's extents EA through the backing fsfilt. */
651 static int smfs_init_extents_ea(struct inode *inode)
653 struct fsfilt_operations *fsfilt = S2SMI(inode->i_sb)->sm_fsfilt;
657 rc = fsfilt->fs_init_extents_ea(inode);
/*
 * Set a write-state flag (SMFS_OVER_WRITE or, otherwise, DIRTY_WRITE) on an
 * inode, both in the REINT_EXTENTS_FLAGS xattr and in the in-memory inode
 * flags, inside an FSFILT_OP_SETATTR transaction.
 * NOTE(review): early returns and error handling are not visible in this
 * excerpt.
 */
661 static int smfs_set_dirty_flags(struct inode *inode, int flags)
663 struct fsfilt_operations *fsfilt = S2SMI(inode->i_sb)->sm_fsfilt;
/* Inodes already flagged OVER_WRITE are special-cased (body not visible). */
668 if (SMFS_INODE_OVER_WRITE(inode))
670 /*FIXME later, the blocks needed in journal here will be recalculated*/
671 handle = smfs_trans_start(inode, FSFILT_OP_SETATTR, NULL);
672 if (IS_ERR(handle)) {
673 CERROR("smfs_set_dirty_flag:no space for transaction\n");
/*
 * Write the xattr when the inode carries no flag yet, or when a DIRTY_WRITE
 * inode is being upgraded to OVER_WRITE.
 */
676 if ((!SMFS_INODE_DIRTY_WRITE(inode) && (!SMFS_INODE_OVER_WRITE(inode))) ||
677 ((flags == SMFS_OVER_WRITE) && (SMFS_INODE_DIRTY_WRITE(inode)))) {
678 rc = fsfilt->fs_set_xattr(inode, handle, REINT_EXTENTS_FLAGS,
679 &flags, sizeof(int));
/* Mirror the flag in the in-memory inode state. */
683 if (flags == SMFS_OVER_WRITE)
684 SMFS_SET_INODE_OVER_WRITE(inode);
686 SMFS_SET_INODE_DIRTY_WRITE(inode);
688 smfs_trans_commit(inode, handle, 0);
/*
 * Log a REINT_SETATTR record for an inode.
 *
 * data1 is interpreted as a struct iattr (may be NULL); data2 is passed
 * through to the pack step.  After the record is added to the llog, a size
 * change (ATTR_SIZE) also trims the extents EA and updates the inode's
 * write-state flag: OVER_WRITE when the new size is 0, DIRTY_WRITE otherwise.
 * NOTE(review): smfs_rec_md() calls this with a NULL dentry; whether
 * smfs_log_path() copes with that is not visible in this excerpt.  Error
 * checks between steps are not visible either.
 */
692 int smfs_post_rec_setattr(struct inode *inode, struct dentry *dentry,
693 void *data1, void *data2)
695 struct smfs_super_info *sinfo;
696 struct iattr *attr = (struct iattr *)data1;
697 char *buffer = NULL, *pbuf;
698 int rc = 0, length = 0, buf_len = 0;
701 sinfo = S2SMI(inode->i_sb);
705 OBD_ALLOC(buffer, PAGE_SIZE);
707 GOTO(exit, rc = -ENOMEM);
710 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
711 rc = smfs_log_path(inode->i_sb, dentry, pbuf, buf_len);
716 KML_BUF_REC_END(buffer, length, pbuf);
718 rc = smfs_pack_rec(pbuf, dentry, inode,
719 data1, data2, REINT_SETATTR);
725 rc = smfs_llog_add_rec(sinfo, (void*)buffer, length);
/* Only a size change affects the extents bookkeeping. */
727 if (attr && attr->ia_valid & ATTR_SIZE) {
728 smfs_remove_extents_ea(inode, attr->ia_size,
730 if (attr->ia_size == 0)
731 smfs_set_dirty_flags(inode, SMFS_OVER_WRITE);
733 smfs_set_dirty_flags(inode, SMFS_DIRTY_WRITE);
738 OBD_FREE(buffer, PAGE_SIZE);
/*
 * Predicate used by smfs_post_rec_write() to decide between OVER_WRITE and
 * DIRTY_WRITE.
 * NOTE(review): the body is not visible in this excerpt; presumably it
 * reports whether the extents EA covers the whole file -- confirm.
 */
742 static int all_blocks_present_ea(struct inode *inode)
/*
 * Log a write on `dentry` and update its extents bookkeeping.
 *
 * A REINT_WRITE record is only logged when the inode carries neither the
 * OVER_WRITE nor the DIRTY_WRITE flag yet; in that case the extents EA is
 * also initialised.  The write-state flag and extents EA are then updated.
 *
 * data1 and data2 are dereferenced as loff_t and size_t respectively, so
 * callers must pass pointers to objects of exactly those types.
 * NOTE(review): else-branches, error checks and the return statement are not
 * visible in this excerpt.
 */
749 int smfs_post_rec_write(struct inode *dir, struct dentry *dentry, void *data1,
752 struct smfs_super_info *sinfo;
753 char *buffer = NULL, *pbuf;
754 int rc = 0, length = 0, buf_len = 0;
757 if (!SMFS_INODE_OVER_WRITE(dentry->d_inode) &&
758 !SMFS_INODE_DIRTY_WRITE(dentry->d_inode)) {
759 sinfo = S2SMI(dentry->d_inode->i_sb);
763 OBD_ALLOC(buffer, PAGE_SIZE);
765 GOTO(exit, rc = -ENOMEM);
768 KML_BUF_REC_INIT(buffer, pbuf, buf_len);
769 rc = smfs_log_path(dir->i_sb, dentry, pbuf, buf_len);
/*
 * The path length is stored and `length` computed by hand here; the other
 * record writers in this file use KML_BUF_REC_END at this point.
 */
774 memcpy(buffer, &rc, sizeof(int));
775 length = rc + sizeof(int);
777 rc = smfs_pack_rec(pbuf, dentry, dir,
778 data1, data2, REINT_WRITE);
784 rc = smfs_llog_add_rec(sinfo, (void*)buffer, length);
787 rc = smfs_init_extents_ea(dentry->d_inode);
/* An empty file is flagged OVER_WRITE. */
791 if (dentry->d_inode->i_size == 0) {
792 smfs_set_dirty_flags(dentry->d_inode, SMFS_OVER_WRITE);
795 loff_t off = *((loff_t*)data1);
796 size_t count = *((size_t*)data2);
798 rc = smfs_insert_extents_ea(dentry->d_inode, off, count);
/* Once every block is covered, the per-extent EA entries are dropped. */
801 if (all_blocks_present_ea(dentry->d_inode)){
802 smfs_set_dirty_flags(dentry->d_inode, SMFS_OVER_WRITE);
803 smfs_remove_all_extents_ea(dentry->d_inode);
805 smfs_set_dirty_flags(dentry->d_inode, SMFS_DIRTY_WRITE);
810 OBD_FREE(buffer, PAGE_SIZE);
/* Signature shared by the per-operation record writers in smfs_kml_post[]. */
814 typedef int (*post_kml_rec)(struct inode *dir, struct dentry *dentry,
815 void *data1, void *data2);
/*
 * Dispatch table from hook opcode to record writer.  Create-like operations
 * (create, symlink, mkdir, mknod) share smfs_post_rec_create; unlink and
 * rmdir share smfs_post_rec_unlink.
 * NOTE(review): `[index] value` without '=' is the obsolete GNU form of a
 * designated initializer; `[index] = value` is the standard C99 spelling.
 */
817 static post_kml_rec smfs_kml_post[HOOK_MAX + 1] = {
818 [HOOK_CREATE] smfs_post_rec_create,
820 [HOOK_LINK] smfs_post_rec_link,
821 [HOOK_UNLINK] smfs_post_rec_unlink,
822 [HOOK_SYMLINK] smfs_post_rec_create,
823 [HOOK_MKDIR] smfs_post_rec_create,
824 [HOOK_RMDIR] smfs_post_rec_unlink,
825 [HOOK_MKNOD] smfs_post_rec_create,
826 [HOOK_RENAME] smfs_post_rec_rename,
827 [HOOK_SETATTR] smfs_post_rec_setattr,
828 [HOOK_WRITE] smfs_post_rec_write,
831 static int smfs_post_kml_rec(struct inode *dir, void *de, void *data1,
834 if (smfs_kml_post[op]) {
835 struct dentry *dentry = (struct dentry *)de;
836 return smfs_kml_post[op](dir, dentry, data1, data2);