Whamcloud - gitweb
- KML fixes and updates due to SMFS plugin API.
[fs/lustre-release.git] / lustre / smfs / fsfilt.c
1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2  * vim:expandtab:shiftwidth=8:tabstop=8:
3  *
4  *  lustre/lib/fsfilt_smfs.c
5  *  Lustre filesystem abstraction routines
6  *
7  *  Copyright (C) 2004 Cluster File Systems, Inc.
8  *   Author: Wang Di <wangdi@clusterfs.com>
9  *
10  *   This file is part of Lustre, http://www.lustre.org.
11  *
12  *   Lustre is free software; you can redistribute it and/or
13  *   modify it under the terms of version 2 of the GNU General Public
14  *   License as published by the Free Software Foundation.
15  *
16  *   Lustre is distributed in the hope that it will be useful,
17  *   but WITHOUT ANY WARRANTY; without even the implied warranty of
18  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
19  *   GNU General Public License for more details.
20  *
21  *   You should have received a copy of the GNU General Public License
22  *   along with Lustre; if not, write to the Free Software
23  *   Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
24  */
25
26 #define DEBUG_SUBSYSTEM S_SM
27
28 #include <linux/fs.h>
29 #include <linux/jbd.h>
30 #include <linux/slab.h>
31 #include <linux/pagemap.h>
32 #include <linux/quotaops.h>
33 #include <linux/version.h>
34 #include <libcfs/kp30.h>
35 #include <linux/obd.h>
36 #include <linux/obd_class.h>
37
38 #include <linux/lustre_fsfilt.h>
39 #include <linux/lustre_smfs.h>
40 #include <linux/lustre_snap.h>
41
42 #include "smfs_internal.h"
43
44 static void *fsfilt_smfs_start(struct inode *inode, int op,
45                                void *desc_private, int logs)
46 {
47         void *handle;
48         struct inode *cache_inode = I2CI(inode);
49         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
50         int extra = 0;
51         int opcode = op;
52         
53         if (cache_fsfilt == NULL)
54                 return NULL;
55
56         if (!cache_fsfilt->fs_start)
57                 return ERR_PTR(-ENOSYS);
58         
59         //opcode can be changed here. 
60         //For example, unlink is rename in nature for undo plugin 
61         extra = SMFS_PLG_HELP(inode->i_sb, PLG_TRANS_SIZE, &opcode);
62
63         handle = cache_fsfilt->fs_start(cache_inode, op, desc_private,
64                                         logs + extra);
65
66         return handle;
67 }
68
69 static void *fsfilt_smfs_brw_start(int objcount, struct fsfilt_objinfo *fso,
70                                    int niocount, struct niobuf_local *nb,
71                                    void *desc_private, int logs)
72 {
73         struct fsfilt_operations *cache_fsfilt;
74         struct dentry *cache_dentry = NULL;
75         struct inode *cache_inode = NULL;
76         struct fsfilt_objinfo cache_fso;
77         void   *rc = NULL;
78
79         ENTRY;
80         
81         cache_fsfilt = I2FOPS(fso->fso_dentry->d_inode);
82         if (cache_fsfilt == NULL)
83                 RETURN(NULL);
84
85         cache_inode = I2CI(fso->fso_dentry->d_inode);
86         cache_dentry = pre_smfs_dentry(NULL, cache_inode, fso->fso_dentry);
87         if (!cache_dentry)
88                 RETURN(ERR_PTR(-ENOMEM));
89         
90         cache_fso.fso_dentry = cache_dentry;
91         cache_fso.fso_bufcnt = fso->fso_bufcnt;
92
93         if (!cache_fsfilt->fs_brw_start) {
94                 rc =  ERR_PTR(-ENOSYS);
95                 goto exit;
96         }
97         
98         rc = cache_fsfilt->fs_brw_start(objcount, &cache_fso, niocount, nb,
99                                         desc_private, logs);
100 exit:
101         post_smfs_dentry(cache_dentry);
102         RETURN(rc);
103 }
104
105 /* FIXME-WANGDI: here we can easily have inode == NULL due to
106    mds_open() behavior. It passes NULL inode to mds_finish_transno()
107    sometimes. Probably we should have spare way to get cache fsfilt
108    operations. */
109 static int fsfilt_smfs_commit(struct super_block *sb, struct inode *inode, 
110                               void *h, int force_sync)
111 {
112         struct fsfilt_operations *cache_fsfilt = S2SMI(sb)->sm_cache_fsfilt;
113         struct super_block *csb = S2CSB(sb); 
114         struct inode *cache_inode = NULL;
115         int    rc = -EIO;
116         
117         ENTRY;
118         
119         if (inode)
120                 cache_inode = I2CI(inode);
121
122         if (cache_fsfilt == NULL)
123                 RETURN(rc);
124
125         if (!cache_fsfilt->fs_commit)
126                 RETURN(-ENOSYS);
127
128         rc = cache_fsfilt->fs_commit(csb, cache_inode, h, force_sync);
129
130         RETURN(rc);
131 }
132
133 static int fsfilt_smfs_commit_async(struct inode *inode, void *h,
134                                     void **wait_handle)
135 {
136         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
137         struct inode *cache_inode = NULL;
138         int    rc = -EIO;
139
140         cache_inode = I2CI(inode);
141         if (cache_fsfilt == NULL)
142                 RETURN(-EINVAL);
143
144         if (!cache_fsfilt->fs_commit_async)
145                 RETURN(-ENOSYS);
146
147         rc = cache_fsfilt->fs_commit_async(cache_inode, h, wait_handle);
148
149         RETURN(rc);
150 }
151
152 static int fsfilt_smfs_commit_wait(struct inode *inode, void *h)
153 {
154         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
155         struct inode *cache_inode = NULL;
156         int    rc = -EIO;
157
158         cache_inode = I2CI(inode);
159         if (cache_fsfilt == NULL)
160                 RETURN(-EINVAL);
161
162         if (!cache_fsfilt->fs_commit_wait)
163                 RETURN(-ENOSYS);
164
165         rc = cache_fsfilt->fs_commit_wait(cache_inode, h);
166
167         RETURN(rc);
168 }
169
170 static int fsfilt_smfs_iocontrol(struct inode *inode, struct file *file,
171                                  unsigned int cmd, unsigned long arg)
172 {
173         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
174         struct inode *cache_inode = I2CI(inode);
175         struct smfs_file_info *sfi = NULL;
176         struct file * cache_file = NULL;
177         int    rc = -EIO;
178         ENTRY;
179
180         if (!cache_fsfilt || !cache_inode)
181                 RETURN(rc);
182
183         if (!cache_fsfilt->fs_iocontrol)
184                 RETURN(-ENOSYS);
185
186
187         if (file != NULL) {
188                 sfi = F2SMFI(file);
189                 if (sfi->magic != SMFS_FILE_MAGIC)
190                         BUG();
191                 cache_file = sfi->c_file;
192         }
193         
194         pre_smfs_inode(inode, cache_inode);
195         
196         rc = cache_fsfilt->fs_iocontrol(cache_inode, cache_file, cmd, arg);
197
198         post_smfs_inode(inode, cache_inode);
199
200         RETURN(rc);
201 }
202
203 static int fsfilt_smfs_send_bio(int rw, struct inode *inode, void *bio)
204 {
205         struct inode *cache_inode;
206         struct fsfilt_operations *cache_fsfilt;
207         
208         ENTRY;
209         
210         cache_fsfilt = I2FOPS(inode);
211         if (!cache_fsfilt)
212                 RETURN(-EINVAL);
213
214         cache_inode = I2CI(inode);
215         if (!cache_inode)
216                 RETURN(-EINVAL);
217
218         if (!cache_fsfilt->fs_send_bio)
219                 RETURN(-ENOSYS);
220
221         return cache_fsfilt->fs_send_bio(rw, cache_inode, bio);
222 }
223
224 static struct page * fsfilt_smfs_getpage(struct inode *inode, long int index)
225 {
226         struct  fsfilt_operations *cache_fsfilt;
227         struct  inode *cache_inode;
228         ENTRY;
229         cache_fsfilt = I2FOPS(inode);
230         if (!cache_fsfilt)
231                 RETURN(ERR_PTR(-EINVAL));
232
233         cache_inode = I2CI(inode);
234         if (!cache_inode)
235                 RETURN(ERR_PTR(-EINVAL));
236
237         if (!cache_fsfilt->fs_getpage)
238                 RETURN(ERR_PTR(-ENOSYS));
239 #if CONFIG_SNAPFS
240         if (SMFS_DO_COW(S2SMI(inode->i_sb))) {
241                 struct address_space_operations *aops = 
242                                 cache_inode->i_mapping->a_ops;
243                 if (aops->bmap(cache_inode->i_mapping, index)) {
244                         struct inode *ind_inode = NULL;
245                         struct inode *cache_ind = NULL;
246                         struct page  *page = NULL;
247                         
248                         ind_inode = smfs_cow_get_ind(inode, index);
249                         if (!ind_inode) {
250                                 RETURN(ERR_PTR(-EIO));
251                         }
252                         cache_ind = I2CI(ind_inode);
253                         /*FIXME cow inode should be bottom fs inode */         
254                         page = cache_fsfilt->fs_getpage(cache_ind, index);
255                         iput(ind_inode); 
256                         RETURN(page);
257                 } 
258         }
259 #endif
260         return cache_fsfilt->fs_getpage(cache_inode, index);
261 }
262
263 static ssize_t fsfilt_smfs_readpage(struct file *file, char *buf,
264                                     size_t count, loff_t *off)
265 {
266         struct fsfilt_operations *cache_fsfilt;
267         struct smfs_file_info *sfi;
268         struct inode *cache_inode;
269         loff_t tmp_ppos;
270         loff_t *cache_ppos;
271         ssize_t rc = -EIO;
272
273         ENTRY;
274
275         cache_fsfilt = I2FOPS(file->f_dentry->d_inode);
276         if (!cache_fsfilt)
277                 RETURN(rc);
278
279         cache_inode = I2CI(file->f_dentry->d_inode);
280         if (!cache_inode)
281                 RETURN(rc);
282
283         sfi = F2SMFI(file);
284         if (sfi->magic != SMFS_FILE_MAGIC)
285                 BUG();
286
287         if (off != &(file->f_pos))
288                 cache_ppos = &tmp_ppos;
289         else
290                 cache_ppos = &sfi->c_file->f_pos;
291         *cache_ppos = *off;
292
293         pre_smfs_inode(file->f_dentry->d_inode, cache_inode);
294 #if CONFIG_SNAPFS
295         /*readdir page*/
296         if (smfs_dotsnap_inode(file->f_dentry->d_inode)) {
297                 struct fsfilt_operations *snapops = 
298                                         I2SNAPOPS(file->f_dentry->d_inode);
299                 
300                 LASSERT(S_ISDIR(file->f_dentry->d_inode->i_mode));
301                 
302                 rc = snapops->fs_read_dotsnap_dir_page(sfi->c_file, buf, count, 
303                                                        cache_ppos); 
304         } else {
305                 if (cache_fsfilt->fs_readpage)
306                         rc = cache_fsfilt->fs_readpage(sfi->c_file, buf, count,
307                                                        cache_ppos);
308         }
309 #else
310         if (cache_fsfilt->fs_readpage)
311                 rc = cache_fsfilt->fs_readpage(sfi->c_file, buf, count,
312                                                cache_ppos);
313
314 #endif
315         *off = *cache_ppos;
316         post_smfs_inode(file->f_dentry->d_inode, cache_inode);
317         duplicate_file(file, sfi->c_file);
318
319         RETURN(rc);
320 }
321
322
323 static int fsfilt_smfs_add_journal_cb(struct obd_device *obd,
324                                       struct super_block *sb, __u64 last_rcvd,
325                                       void *handle, fsfilt_cb_t cb_func,
326                                       void *cb_data)
327 {
328         struct fsfilt_operations *cache_fsfilt = S2SMI(sb)->sm_cache_fsfilt;
329         struct super_block *csb = S2CSB(sb);
330         int rc = -EIO;
331         
332         ENTRY;
333         
334         if (!cache_fsfilt)
335                  RETURN(rc);
336         if (cache_fsfilt->fs_add_journal_cb)
337                 rc = cache_fsfilt->fs_add_journal_cb(obd, csb, last_rcvd,
338                                                      handle, cb_func, cb_data);
339         RETURN(rc);
340 }
341
342 static int fsfilt_smfs_statfs(struct super_block *sb, struct obd_statfs *osfs)
343 {
344         struct fsfilt_operations *cache_fsfilt = S2SMI(sb)->sm_cache_fsfilt;
345         struct super_block *csb = S2CSB(sb);
346         int rc = -EIO;
347
348         ENTRY;
349         
350         if (!cache_fsfilt)
351                 RETURN(rc);
352
353         if (!cache_fsfilt->fs_statfs)
354                 RETURN(-ENOSYS);
355
356         rc = cache_fsfilt->fs_statfs(csb, osfs);
357         duplicate_sb(csb, sb);
358
359         RETURN(rc);
360 }
361
362 static int fsfilt_smfs_sync(struct super_block *sb)
363 {
364         struct fsfilt_operations *cache_fsfilt = S2SMI(sb)->sm_cache_fsfilt;
365         struct super_block *csb = S2CSB(sb);
366         int    rc = -ENOSYS;
367
368         if (!cache_fsfilt)
369                 RETURN(-EINVAL);
370
371         if (cache_fsfilt->fs_sync)
372                 rc = cache_fsfilt->fs_sync(csb);
373
374         RETURN(rc);
375 }
376
377 int fsfilt_smfs_map_inode_pages(struct inode *inode, struct page **page,
378                                 int pages, unsigned long *blocks, int *created,
379                                 int create, struct semaphore *sem)
380 {
381         struct  fsfilt_operations *cache_fsfilt = I2FOPS(inode);
382         struct  inode *cache_inode = NULL;
383         int     rc = -EIO;
384         
385         ENTRY;
386         
387         if (!cache_fsfilt)
388                 RETURN(-EINVAL);
389
390         cache_inode = I2CI(inode);
391
392         if (!cache_inode)
393                 RETURN(rc);
394
395         if (!cache_fsfilt->fs_map_inode_pages)
396                 RETURN(-ENOSYS);
397
398         down(&cache_inode->i_sem);
399
400         rc = cache_fsfilt->fs_map_inode_pages(cache_inode, page, pages, blocks,
401                                               created, create, sem);
402         up(&cache_inode->i_sem);
403
404         RETURN(rc);
405 }
406
407 static int fsfilt_smfs_prep_san_write(struct inode *inode, long *blocks,
408                                       int nblocks, loff_t newsize)
409 {
410         struct  fsfilt_operations *cache_fsfilt = I2FOPS(inode);
411         struct  inode *cache_inode = NULL;
412         int     rc = -EIO;
413
414         if (!cache_fsfilt)
415                 RETURN(-EINVAL);
416
417         cache_inode = I2CI(inode);
418
419         if (!cache_inode)
420                 RETURN(-EINVAL);
421
422         if (!cache_fsfilt->fs_prep_san_write)
423                 RETURN(-ENOSYS);
424
425         down(&cache_inode->i_sem);
426         rc = cache_fsfilt->fs_prep_san_write(cache_inode, blocks, nblocks,
427                                              newsize);
428         up(&cache_inode->i_sem);
429
430         RETURN(rc);
431 }
432
433 static int fsfilt_smfs_read_record(struct file * file, void *buf,
434                                    int size, loff_t *offs)
435 {
436         struct  fsfilt_operations *cache_fsfilt;
437         struct  inode *cache_inode;
438         struct  smfs_file_info *sfi;
439         loff_t  tmp_ppos;
440         loff_t  *cache_ppos;
441         ssize_t rc;
442
443         ENTRY;
444         cache_fsfilt = I2FOPS(file->f_dentry->d_inode);
445         if (!cache_fsfilt)
446                 RETURN(-EINVAL);
447
448         cache_inode = I2CI(file->f_dentry->d_inode);
449
450         if (!cache_inode)
451                 RETURN(-EINVAL);
452
453         sfi = F2SMFI(file);
454         if (sfi->magic != SMFS_FILE_MAGIC) BUG();
455
456         if (offs != &(file->f_pos))
457                 cache_ppos = &tmp_ppos;
458         else
459                 cache_ppos = &sfi->c_file->f_pos;
460         *cache_ppos = *offs;
461
462         pre_smfs_inode(file->f_dentry->d_inode, cache_inode);
463
464         if (!cache_fsfilt->fs_read_record)
465                 RETURN(-ENOSYS);
466
467         rc = cache_fsfilt->fs_read_record(sfi->c_file, buf, size, cache_ppos);
468
469         *offs = *cache_ppos;
470         post_smfs_inode(file->f_dentry->d_inode, cache_inode);
471         duplicate_file(file, sfi->c_file);
472
473         RETURN(rc);
474 }
475
476 static int fsfilt_smfs_write_record(struct file *file, void *buf, int bufsize,
477                                     loff_t *offs, int force_sync)
478 {
479         struct  fsfilt_operations *cache_fsfilt;
480         struct  inode *cache_inode;
481         struct  smfs_file_info *sfi;
482         loff_t  tmp_ppos;
483         loff_t  *cache_ppos;
484         ssize_t rc = -EIO;
485
486         ENTRY;
487
488         cache_fsfilt = I2FOPS(file->f_dentry->d_inode);
489         if (!cache_fsfilt)
490                 RETURN(-EINVAL);
491
492         cache_inode = I2CI(file->f_dentry->d_inode);
493
494         if (!cache_inode)
495                 RETURN(-EINVAL);
496
497         sfi = F2SMFI(file);
498         if (sfi->magic != SMFS_FILE_MAGIC)
499                 BUG();
500
501         if (offs != &(file->f_pos))
502                 cache_ppos = &tmp_ppos;
503         else
504                 cache_ppos = &sfi->c_file->f_pos;
505         *cache_ppos = *offs;
506
507         pre_smfs_inode(file->f_dentry->d_inode, cache_inode);
508
509         if (!cache_fsfilt->fs_write_record)
510                 RETURN(-ENOSYS);
511
512         rc = cache_fsfilt->fs_write_record(sfi->c_file, buf,
513                                            bufsize, cache_ppos, force_sync);
514         *offs = *cache_ppos;
515         post_smfs_inode(file->f_dentry->d_inode, cache_inode);
516         duplicate_file(file, sfi->c_file);
517
518         RETURN(rc);
519 }
520
521 static int fsfilt_smfs_post_setup(struct obd_device *obd, struct vfsmount *mnt,
522                                   struct dentry *root_dentry)
523 {
524         struct super_block *sb = NULL;
525         int rc = 0;
526
527         ENTRY;
528         
529         if (mnt) {
530                 sb = mnt->mnt_sb;
531                 
532                 if (obd)
533                         S2SMI(sb)->smsi_exp = obd->obd_self_export;
534                
535                 rc = smfs_post_setup(obd, mnt, root_dentry);
536                 if (rc) {
537                         CERROR("post_setup fails in obd %p rc=%d", obd, rc);
538                 }
539
540               
541         }
542         
543         RETURN(rc);
544 }
545
546 static int fsfilt_smfs_post_cleanup(struct obd_device *obd,
547                                     struct vfsmount *mnt)
548 {
549         struct super_block *sb = NULL;
550         int rc = 0;
551         ENTRY;
552         
553         if (mnt) {
554                 sb = mnt->mnt_sb;
555                 smfs_post_cleanup(sb);
556         }
557         
558         RETURN(rc);
559 }
560
561 static int fsfilt_smfs_set_fs_flags(struct inode *inode, int flags)
562 {
563         int rc = 0;
564         ENTRY;
565
566         if (flags & SM_ALL_PLG) /* enable all plugins */
567                 SMFS_SET(I2SMI(inode)->smi_flags, SMFS_PLG_ALL);
568         if (flags & SM_PRECREATE) /* disable logs for precreated objs */
569                 SMFS_CLEAR(I2SMI(inode)->smi_flags, SMFS_PLG_ALL);
570
571
572 #if 0
573         if (SMFS_DO_COW(S2SMI(inode->i_sb)) && (flags & SM_DO_COW))
574                 SMFS_SET_INODE_COW(inode);
575 #endif
576         RETURN(rc);
577 }
578
579 static int fsfilt_smfs_clear_fs_flags(struct inode *inode, int flags)
580 {
581         int rc = 0;
582         ENTRY;
583         /*
584         if (SMFS_DO_REC(S2SMI(inode->i_sb)) && (flags & SM_DO_REC))
585                 SMFS_CLEAN_INODE_REC(inode);
586         if (SMFS_DO_COW(S2SMI(inode->i_sb)) && (flags & SM_DO_COW))
587                 SMFS_CLEAN_INODE_COW(inode);
588         */
589         if(flags & SM_ALL_PLG) /* disable all plugins */
590                 SMFS_CLEAR(I2SMI(inode)->smi_flags, SMFS_PLG_ALL);
591         if (flags & SM_PRECREATE) /* enable log again */
592                 SMFS_SET(I2SMI(inode)->smi_flags, SMFS_PLG_ALL);
593
594         RETURN(rc);
595 }
596
597 static int fsfilt_smfs_get_fs_flags(struct dentry *de)
598 {
599         struct inode *inode = de->d_inode;
600         int flags = 0;
601         ENTRY;
602
603         LASSERT(inode);
604         
605         flags = I2SMI(inode)->smi_flags & S2SMI(inode->i_sb)->plg_flags;
606        
607         RETURN(flags); 
608 }
609
/*
 * Stub: nothing is done with @sb.  Always returns 0.
 */
static int fsfilt_smfs_set_ost_flags(struct super_block *sb)
{
        int rc = 0;

        return rc;
}
614
/*
 * Stub: nothing is done with @sb.  Always returns 0.
 */
static int fsfilt_smfs_set_mds_flags(struct super_block *sb)
{
        int rc = 0;

        return rc;
}
619
#if 0
/*
 * Compiled out.  Hands the smsi_kml_log context of the smfs super block
 * info of @sb back through @ctxt and returns 0.
 */
static int fsfilt_smfs_get_reint_log_ctxt(struct super_block *sb,
                                          struct llog_ctxt **ctxt)
{
        *ctxt = S2SMI(sb)->smsi_kml_log;
        RETURN(0);
}
#endif
631
632 static int fsfilt_smfs_setup(struct obd_device *obd, struct super_block *sb)
633 {
634         struct smfs_super_info *smfs_info = S2SMI(sb);
635         struct fsfilt_operations *cache_fsfilt;
636         struct super_block *csb;
637         int rc = 0;
638
639         ENTRY;
640         
641         /* It should be initialized olready by smfs_read_super(). */
642         if (!(cache_fsfilt = smfs_info->sm_cache_fsfilt))
643                     cache_fsfilt = fsfilt_get_ops(smfs_info->smsi_cache_ftype);
644
645         if (!cache_fsfilt)
646                 RETURN(-ENOENT);
647
648         csb = S2CSB(sb);
649         if (cache_fsfilt->fs_setup) 
650                 rc = cache_fsfilt->fs_setup(obd, csb);
651         
652         duplicate_sb(sb, csb);
653         
654         RETURN(rc);
655 }
656
657 static int fsfilt_smfs_setattr(struct dentry *dentry, void *handle,
658                                struct iattr *iattr, int do_trunc)
659 {
660         struct fsfilt_operations *cache_fsfilt = I2FOPS(dentry->d_inode);
661         struct dentry *cache_dentry = NULL;
662         struct inode *cache_inode = I2CI(dentry->d_inode);
663         struct hook_setattr_msg msg = {
664                 .dentry = dentry,
665                 .attr = iattr
666         };
667         int    rc = -EIO;
668
669         if (!cache_fsfilt)
670                 RETURN(rc);
671
672         if (!cache_fsfilt->fs_setattr)
673                 RETURN(-ENOSYS);
674
675         cache_dentry = pre_smfs_dentry(NULL, cache_inode, dentry);
676         if (!cache_dentry)
677                 RETURN(-ENOMEM);
678
679         pre_smfs_inode(dentry->d_inode, cache_inode);
680
681         SMFS_PRE_HOOK(dentry->d_inode, HOOK_F_SETATTR, &msg);
682         
683         rc = cache_fsfilt->fs_setattr(cache_dentry, handle, iattr, do_trunc);
684
685         SMFS_POST_HOOK(dentry->d_inode, HOOK_F_SETATTR, &msg, rc);
686         post_smfs_inode(dentry->d_inode, cache_inode);
687
688         post_smfs_dentry(cache_dentry);
689         RETURN(rc);
690 }
691
692 static int fsfilt_smfs_set_xattr(struct inode *inode, void *handle, char *name,
693                                  void *buffer, int buffer_size)
694 {
695         struct  fsfilt_operations *cache_fsfilt = I2FOPS(inode);
696         struct  inode *cache_inode = NULL;
697         int     rc = -EIO;
698
699         ENTRY;
700         
701         if (!cache_fsfilt)
702                 RETURN(rc);
703
704         cache_inode = I2CI(inode);
705         if (!cache_inode)
706                 RETURN(rc);
707
708         pre_smfs_inode(inode, cache_inode);
709
710         if (cache_fsfilt->fs_set_xattr)
711                 rc = cache_fsfilt->fs_set_xattr(cache_inode, handle, name,
712                                                 buffer, buffer_size);
713         post_smfs_inode(inode, cache_inode);
714
715         RETURN(rc);
716 }
717
718 static int fsfilt_smfs_get_xattr(struct inode *inode, char *name,
719                                  void *buffer, int buffer_size)
720 {
721         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
722         struct inode *cache_inode = NULL;
723         int    rc = -EIO;
724
725         if (!cache_fsfilt)
726                 RETURN(rc);
727
728         cache_inode = I2CI(inode);
729         if (!cache_inode)
730                 RETURN(rc);
731
732         pre_smfs_inode(inode, cache_inode);
733
734         if (cache_fsfilt->fs_get_xattr)
735                 rc = cache_fsfilt->fs_get_xattr(cache_inode, name,
736                                                 buffer, buffer_size);
737         post_smfs_inode(inode, cache_inode);
738
739         RETURN(rc);
740 }
741
742 #define XATTR_LUSTRE_MDS_LOV_EA         "lov"
743 #define XATTR_LUSTRE_MDS_MEA_EA         "mea"
744 #define XATTR_LUSTRE_MDS_MID_EA         "mid"
745 #define XATTR_LUSTRE_MDS_SID_EA         "sid"
746
747 static int fsfilt_smfs_set_md(struct inode *inode, void *handle,
748                               void *lmm, int lmm_size, enum ea_type type)
749 {
750         int rc;
751         
752         switch(type) {
753         case EA_LOV:
754                 rc = fsfilt_smfs_set_xattr(inode, handle,
755                                            XATTR_LUSTRE_MDS_LOV_EA,
756                                            lmm, lmm_size);
757                 break;
758         case EA_MEA:
759                 rc = fsfilt_smfs_set_xattr(inode, handle,
760                                            XATTR_LUSTRE_MDS_MEA_EA,
761                                            lmm, lmm_size);
762                 break;
763         case EA_SID:
764                 rc = fsfilt_smfs_set_xattr(inode, handle,
765                                            XATTR_LUSTRE_MDS_SID_EA,
766                                            lmm, lmm_size);
767                 break;
768         case EA_MID:
769                 rc = fsfilt_smfs_set_xattr(inode, handle,
770                                            XATTR_LUSTRE_MDS_MID_EA,
771                                            lmm, lmm_size);
772                 break;
773         default:
774                 rc = -EINVAL;
775         }
776
777         return rc;
778 }
779
780 static int fsfilt_smfs_get_md(struct inode *inode, void *lmm,
781                               int lmm_size, enum ea_type type)
782 {
783         int rc;
784         
785         switch (type) {
786         case EA_LOV:
787                 rc = fsfilt_smfs_get_xattr(inode,
788                                            XATTR_LUSTRE_MDS_LOV_EA,
789                                            lmm, lmm_size);
790                 break;
791         case EA_MEA:
792                 rc = fsfilt_smfs_get_xattr(inode,
793                                            XATTR_LUSTRE_MDS_MEA_EA,
794                                            lmm, lmm_size);
795                 break;
796         case EA_SID:
797                 rc = fsfilt_smfs_get_xattr(inode,
798                                            XATTR_LUSTRE_MDS_SID_EA,
799                                            lmm, lmm_size);
800                 break;
801         case EA_MID:
802                 rc = fsfilt_smfs_get_xattr(inode,
803                                            XATTR_LUSTRE_MDS_MID_EA,
804                                            lmm, lmm_size);
805                 break;
806         default:
807                 rc = -EINVAL;
808         }
809         
810         return rc;
811 }
812
813 static int fsfilt_smfs_insert_extents_ea(struct inode *inode,
814                                          unsigned long from, unsigned long num)
815 {
816         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
817         struct inode *cache_inode = NULL;
818         int    rc = -EIO;
819
820         if (!cache_fsfilt)
821                 RETURN(rc);
822
823         cache_inode = I2CI(inode);
824         if (!cache_inode)
825                 RETURN(rc);
826
827         pre_smfs_inode(inode, cache_inode);
828
829         if (cache_fsfilt->fs_insert_extents_ea)
830                 rc = cache_fsfilt->fs_insert_extents_ea(cache_inode, from, num);
831
832         post_smfs_inode(inode, cache_inode);
833         return rc;
834 }
835
836 static int fsfilt_smfs_remove_extents_ea(struct inode *inode,
837                                          unsigned long from, unsigned long num)
838 {
839         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
840         struct inode *cache_inode = NULL;
841         int    rc = -EIO;
842
843         if (!cache_fsfilt)
844                 RETURN(rc);
845
846         cache_inode = I2CI(inode);
847         if (!cache_inode)
848                 RETURN(rc);
849
850         pre_smfs_inode(inode, cache_inode);
851
852         if (cache_fsfilt->fs_remove_extents_ea)
853                 rc = cache_fsfilt->fs_remove_extents_ea(cache_inode, from, num);
854
855         post_smfs_inode(inode, cache_inode);
856         return rc;
857 }
858
859 static int fsfilt_smfs_init_extents_ea(struct inode *inode)
860 {
861         struct fsfilt_operations *cache_fsfilt = I2FOPS(inode);
862         struct inode *cache_inode = NULL;
863         int    rc = -EIO;
864         ENTRY;
865
866         if (!cache_fsfilt)
867                 RETURN(rc);
868
869         cache_inode = I2CI(inode);
870         if (!cache_inode)
871                 RETURN(rc);
872
873         pre_smfs_inode(inode, cache_inode);
874
875         if (cache_fsfilt->fs_init_extents_ea)
876                 rc = cache_fsfilt->fs_init_extents_ea(cache_inode);
877
878         post_smfs_inode(inode, cache_inode);
879         return rc;
880 }
881
882 static int fsfilt_smfs_free_extents(struct super_block *sb, ino_t ino,
883                                     char *pbuf, int size)
884 {
885         OBD_FREE(pbuf, size * (sizeof(struct ldlm_extent)));
886         return 0;
887 }
888
889 static int fsfilt_smfs_write_extents(struct dentry *dentry,
890                                      unsigned long from, unsigned long num)
891 {
892         int rc = 0;
893         struct inode * cache_inode = I2CI(dentry->d_inode);
894         struct hook_write_msg msg = {
895                 .dentry = dentry,
896                 .count = num,
897                 .pos = from
898         };
899
900         ENTRY;
901         
902         /*TODO: fix this later
903         pre_smfs_inode(dentry->d_inode, cache_inode);
904  
905         SMFS_PRE_HOOK(dentry->d_inode, HOOK_WRITE, &msg);
906         
907         rc = smfs_write_extents(dentry->d_inode, dentry, from, num);
908         SMFS_POST_HOOK(dentry->d_inode, HOOK_WRITE, &msg, rc);
909         post_smfs_inode(dentry->d_inode, cache_inode);
910         */
911         
912         RETURN(rc);
913 }
914
/*
 * Stub: precreate is not logged, so none of the arguments are touched.
 *
 * Always returns 0.
 */
static int fsfilt_smfs_precreate_rec(struct dentry *dentry, int *count,
                                     struct obdo *oa)
{
        /* Why to log precreate?? MDS will do this in any case
        if (SMFS_DO_REC(S2SMI(dentry->d_inode->i_sb)))
                rc = smfs_rec_precreate(dentry, count, oa);
        */
        return 0;
}
925
926 static int fsfilt_smfs_get_ino_write_extents(struct super_block *sb, ino_t ino,
927                                              char **pbuf, int *size)
928 {
929         struct fs_extent *fs_extents;
930         struct ldlm_extent *extents = NULL;
931         struct inode *inode;
932         struct inode *cache_inode;
933         struct fsfilt_operations *cache_fsfilt = NULL;
934         struct lvfs_run_ctxt saved;
935         int    rc = 0, fs_ex_size, ex_num, flags;
936         char   *buf = NULL, *ex_buf = NULL;
937         ENTRY;
938
939         push_ctxt(&saved, S2SMI(sb)->smsi_ctxt, NULL);
940
941         inode = iget(sb, ino);
942
943         if (!inode || is_bad_inode(inode)) {
944                 CWARN("Can not get inode %lu ino\n", ino);
945                 GOTO(out, rc = 0);
946         }
947         cache_inode = I2CI(inode);
948         cache_fsfilt = I2FOPS(inode);
949
950         rc = cache_fsfilt->fs_get_xattr(cache_inode, REINT_EXTENTS_FLAGS,
951                                         &flags, sizeof(int));
952         if (!(flags & SMFS_OVER_WRITE) && !(flags & SMFS_DIRTY_WRITE)) {
953                 GOTO(out, rc = 0);
954         } else if (flags & SMFS_OVER_WRITE) {
955                 *size = 1;
956                 OBD_ALLOC(ex_buf, sizeof(struct ldlm_extent));
957                 if (!ex_buf)
958                         GOTO(out, rc=-ENOMEM);
959                 extents = (struct ldlm_extent*)(ex_buf);
960                 extents->start = 0;
961                 extents->end = 0xffffffff;
962         }
963         if (rc < 0)
964                 GOTO(out, rc);
965         rc = cache_fsfilt->fs_get_write_extents_num(cache_inode, &fs_ex_size);
966         if (rc)
967                 GOTO(out, rc);
968         OBD_ALLOC(buf, fs_ex_size);
969         if (!buf)
970                 GOTO(out, rc=-ENOMEM);
971
972         rc = cache_fsfilt->fs_get_inode_write_extents(cache_inode, &buf,
973                                                       &fs_ex_size);
974         if (rc < 0)
975                 GOTO(out, rc);
976         rc = 0;
977         ex_num = fs_ex_size / sizeof(struct fs_extent);
978         *size =  ex_num;
979         OBD_ALLOC(ex_buf, ex_num* sizeof(struct ldlm_extent));
980         if (!ex_buf)
981                 GOTO(out, rc=-ENOMEM);
982
983         fs_extents = (struct fs_extent*)(buf);
984         extents = (struct ldlm_extent*)(ex_buf);
985         while (ex_num > 0) {
986                 int blk_size = I2CI(inode)->i_blksize;
987
988                 extents->start = fs_extents->e_block * blk_size;
989                 extents->end = extents->start + fs_extents->e_num * blk_size;
990                 fs_extents++;
991                 extents++;
992                 ex_num--;
993         }
994         *pbuf = ex_buf;
995 out:
996         iput(inode);
997         if (buf)
998                 OBD_FREE(buf, fs_ex_size);
999         if (rc && extents)
1000                 OBD_FREE(ex_buf, (*size) * (sizeof(struct ldlm_extent)));
1001         pop_ctxt(&saved, S2SMI(sb)->smsi_ctxt, NULL);
1002         return rc;
1003 }
1004
1005 static int fsfilt_smfs_set_snap_item(struct super_block *sb, char *name)
1006 {
1007         int rc = 0;
1008
1009         ENTRY;
1010 #if CONFIG_SNAPFS
1011 #warning "still not implement for add snap item -wangdi"         
1012 #endif
1013         RETURN(rc);        
1014 }
1015 static int fsfilt_smfs_do_write_cow(struct dentry *de, void *extents,
1016                                     int num_extents)
1017 {
1018         int rc = 0;
1019 #if CONFIG_SNAPFS
1020         struct write_extents *w_ext = (struct write_extents *)extents;
1021         int i = 0;
1022         ENTRY;
1023         for (i = 0; i < num_extents; i++) {
1024                size_t count = w_ext->w_count;
1025                loff_t off = w_ext->w_pos;
1026                rc = smfs_cow_write_pre(de->d_inode, de, &count, &off);
1027                if (rc)
1028                         RETURN(rc);  
1029                w_ext ++;
1030         }
1031 #endif
1032         RETURN(rc);
1033 }
1034
1035 static int fsfilt_smfs_add_dir_entry(struct obd_device * obd,
1036                                      struct dentry * parent, char* name,
1037                                      int namelen, unsigned long ino,
1038                                      unsigned long generation,
1039                                      unsigned long mds,
1040                                      unsigned long fid) 
1041 {
1042         struct fsfilt_operations *cache_fsfilt = I2FOPS(parent->d_inode);
1043         struct dentry *cache_dentry = NULL, *dentry = NULL;
1044         struct inode *cache_parent = I2CI(parent->d_inode);
1045         int    rc = -EIO;
1046
1047         ENTRY;
1048         
1049         if (!cache_fsfilt)
1050                 RETURN(rc);
1051
1052         if (!cache_fsfilt->fs_add_dir_entry)
1053                 RETURN(-ENOSYS);
1054
1055         dentry = ll_lookup_one_len(name, parent, namelen);
1056         if (IS_ERR(dentry)) {
1057                 CERROR("can't lookup %*s in %lu/%lu: %d\n", namelen,
1058                        name, parent->d_inode->i_ino,
1059                        (unsigned long) parent->d_inode->i_generation,
1060                        (int) PTR_ERR(dentry));
1061                 RETURN(PTR_ERR(dentry));
1062         }
1063         if (dentry->d_inode != NULL || dentry->d_flags & DCACHE_CROSS_REF) {
1064                 CERROR("dentry %*s(0x%p) found\n", dentry->d_name.len,
1065                        dentry->d_name.name, dentry);
1066                 l_dput(dentry);
1067                 RETURN(-EEXIST);
1068         }
1069         /* mds_reint_rename() may use this method to add dir entry 
1070          * that points onto local inode. and we don't want to find
1071          * it cross-ref by subsequent lookups */
1072         d_drop(dentry);
1073
1074         dentry->d_flags |= DCACHE_CROSS_REF;
1075         dentry->d_inum = ino;
1076         dentry->d_mdsnum = mds;
1077         dentry->d_generation = generation;
1078         dentry->d_fid = fid;
1079         l_dput(dentry);
1080
1081         cache_dentry = pre_smfs_dentry(NULL, cache_parent, parent);
1082         if (!cache_dentry) {
1083                 RETURN(-ENOMEM);
1084         }
1085
1086         pre_smfs_inode(parent->d_inode, cache_parent);
1087         
1088         rc = cache_fsfilt->fs_add_dir_entry(obd, cache_dentry, name, namelen,
1089                                             ino, generation, mds, fid);
1090
1091         post_smfs_inode(parent->d_inode, cache_parent);
1092         
1093         post_smfs_dentry(cache_dentry);
1094         
1095         RETURN(rc);
1096         
1097 }
1098
1099 static int fsfilt_smfs_del_dir_entry(struct obd_device * obd,
1100                                      struct dentry * dentry) 
1101 {
1102         struct fsfilt_operations *cache_fsfilt = I2FOPS(dentry->d_parent->d_inode);
1103         struct dentry *cache_dentry = NULL, *cache_parent = NULL;
1104         struct inode * cache_dir = I2CI(dentry->d_parent->d_inode);
1105         struct inode * cache_inode = NULL;
1106         int    rc = -EIO;
1107
1108         ENTRY;
1109         
1110         if (!cache_fsfilt)
1111                 RETURN(rc);
1112
1113         if (!cache_fsfilt->fs_del_dir_entry)
1114                 RETURN(-ENOSYS);
1115
1116         if (dentry->d_inode)
1117                 cache_inode = I2CI(dentry->d_inode);
1118         
1119         cache_parent = pre_smfs_dentry(NULL, cache_dir, dentry->d_parent);
1120         cache_dentry = pre_smfs_dentry(cache_parent, cache_inode, dentry);
1121         if (!cache_parent || !cache_dentry) {
1122                 rc = (-ENOMEM);
1123                 goto exit;
1124         }
1125
1126         pre_smfs_inode(dentry->d_parent->d_inode, cache_dir);
1127         pre_smfs_inode(dentry->d_inode, cache_inode);
1128         
1129         rc = cache_fsfilt->fs_del_dir_entry(obd, cache_dentry);
1130
1131         if (!rc)
1132                 d_drop(dentry);
1133
1134         post_smfs_inode(dentry->d_inode, cache_inode);
1135         post_smfs_inode(dentry->d_parent->d_inode, cache_dir);
1136 exit:
1137         post_smfs_dentry(cache_dentry);
1138         post_smfs_dentry(cache_parent);
1139         RETURN(rc);
1140         
1141 }
1142
1143
1144 static struct fsfilt_operations fsfilt_smfs_ops = {
1145         .fs_type                = "smfs",
1146         .fs_owner               = THIS_MODULE,
1147         .fs_start               = fsfilt_smfs_start,
1148         .fs_brw_start           = fsfilt_smfs_brw_start,
1149         .fs_commit              = fsfilt_smfs_commit,
1150         .fs_commit_async        = fsfilt_smfs_commit_async,
1151         .fs_commit_wait         = fsfilt_smfs_commit_wait,
1152         .fs_setattr             = fsfilt_smfs_setattr,
1153         .fs_iocontrol           = fsfilt_smfs_iocontrol,
1154         .fs_set_md              = fsfilt_smfs_set_md,
1155         .fs_get_md              = fsfilt_smfs_get_md,
1156         .fs_readpage            = fsfilt_smfs_readpage,
1157         .fs_getpage             = fsfilt_smfs_getpage,
1158         .fs_add_journal_cb      = fsfilt_smfs_add_journal_cb,
1159         .fs_statfs              = fsfilt_smfs_statfs,
1160         .fs_sync                = fsfilt_smfs_sync,
1161         .fs_map_inode_pages     = fsfilt_smfs_map_inode_pages,
1162         .fs_prep_san_write      = fsfilt_smfs_prep_san_write,
1163         .fs_write_record        = fsfilt_smfs_write_record,
1164         .fs_read_record         = fsfilt_smfs_read_record,
1165         .fs_setup               = fsfilt_smfs_setup,
1166         .fs_send_bio            = fsfilt_smfs_send_bio,
1167         .fs_set_xattr           = fsfilt_smfs_set_xattr,
1168         .fs_get_xattr           = fsfilt_smfs_get_xattr,
1169         .fs_get_op_len          = NULL,
1170         .fs_del_dir_entry       = fsfilt_smfs_del_dir_entry,
1171         .fs_add_dir_entry       = fsfilt_smfs_add_dir_entry,
1172         .fs_insert_extents_ea   = fsfilt_smfs_insert_extents_ea,
1173         .fs_remove_extents_ea   = fsfilt_smfs_remove_extents_ea,
1174         .fs_init_extents_ea     = fsfilt_smfs_init_extents_ea,
1175         .fs_get_ino_write_extents = fsfilt_smfs_get_ino_write_extents,
1176         .fs_get_write_extents_num = NULL,
1177
1178         .fs_free_write_extents  = fsfilt_smfs_free_extents,
1179         .fs_write_extents       = fsfilt_smfs_write_extents,
1180         .fs_post_setup          = fsfilt_smfs_post_setup,
1181         .fs_post_cleanup        = fsfilt_smfs_post_cleanup,
1182         .fs_set_fs_flags        = fsfilt_smfs_set_fs_flags,
1183         .fs_clear_fs_flags      = fsfilt_smfs_clear_fs_flags,
1184         .fs_get_fs_flags        = fsfilt_smfs_get_fs_flags,
1185         .fs_set_ost_flags       = fsfilt_smfs_set_ost_flags,
1186         .fs_set_mds_flags       = fsfilt_smfs_set_mds_flags,
1187         .fs_precreate_rec       = fsfilt_smfs_precreate_rec,
1188         .fs_get_reint_log_ctxt  = NULL, /*fsfilt_smfs_get_reint_log_ctxt,*/
1189         .fs_set_snap_item       = fsfilt_smfs_set_snap_item,
1190         .fs_do_write_cow        = fsfilt_smfs_do_write_cow,
1191  };
1192
1193 struct fsfilt_operations *get_smfs_fs_ops(void)
1194 {
1195         return (&fsfilt_smfs_ops);
1196 }
1197 EXPORT_SYMBOL(get_smfs_fs_ops);
1198
1199