Whamcloud - gitweb
Updated snapshot files for new obdo methods. No testing yet.
[fs/lustre-release.git] / lustre / obdfs / namei.c
1 /*
2  *  linux/fs/obdfs/namei.c
3  *
4  * Copyright (C) 1992, 1993, 1994, 1995
5  * Remy Card (card@masi.ibp.fr)
6  * Laboratoire MASI - Institut Blaise Pascal
7  * Universite Pierre et Marie Curie (Paris VI)
8  *
9  *  from
10  *
11  *  linux/fs/ext2/namei.c
12  *
13  *  Copyright (C) 1991, 1992  Linus Torvalds
14  *
15  *  Big-endian to little-endian byte-swapping/bitmaps by
16  *        David S. Miller (davem@caip.rutgers.edu), 1995
17  *  Directory entry file type support and forward compatibility hooks
18  *      for B-tree directories by Theodore Ts'o (tytso@mit.edu), 1998
19  * 
20  *  Changes for use in OBDFS
21  *  Copyright (c) 1999, Seagate Technology Inc.
22  * 
23  */
24
25 #include <asm/uaccess.h>
26
27 #include <linux/errno.h>
28 #include <linux/fs.h>
29 #include <linux/ext2_fs.h>
30 #include <linux/fcntl.h>
31 #include <linux/sched.h>
32 #include <linux/stat.h>
33 #include <linux/string.h>
34 #include <linux/locks.h>
35 #include <linux/quotaops.h>
36 #include <linux/iobuf.h>
37
38 #include <linux/obd_support.h>
39 #include <linux/obdfs.h>
40
/*
 * Define how far ahead to read directories while searching them.
 * NOTE(review): none of these macros is referenced in the visible part of
 * this file - confirm whether they are still needed.
 */
#define NAMEI_RA_CHUNKS  2
#define NAMEI_RA_BLOCKS  4
/* Product of the two values above. */
#define NAMEI_RA_SIZE        (NAMEI_RA_CHUNKS * NAMEI_RA_BLOCKS)
/* Flat index for position b inside group c: c * NAMEI_RA_BLOCKS + b. */
#define NAMEI_RA_INDEX(c,b)  (((c) * NAMEI_RA_BLOCKS) + (b))
48
49 /*
50  * NOTE! unlike strncmp, ext2_match returns 1 for success, 0 for failure.
51  *
52  * `len <= EXT2_NAME_LEN' is guaranteed by caller.
53  * `de != NULL' is guaranteed by caller.
54  */
55 static inline int ext2_match (int len, const char * const name,
56                        struct ext2_dir_entry_2 * de)
57 {
58         if (len != de->name_len)
59                 return 0;
60         if (!de->inode)
61                 return 0;
62         return !memcmp(name, de->name, len);
63 }
64
65 /*
66  *      obdfs_find_entry()
67  *
68  * finds an entry in the specified directory with the wanted name. It
69  * returns the cache buffer in which the entry was found, and the entry
70  * itself (as a parameter - res_dir).  It does NOT read the inode of the
71  * entry - you'll have to do that yourself if you want to.
72  */
73 static struct page * obdfs_find_entry (struct inode * dir,
74                                        const char * const name, int namelen,
75                                        struct ext2_dir_entry_2 ** res_dir,
76                                        int lock)
77 {
78         struct super_block * sb;
79         unsigned long offset;
80         struct page * page;
81         ENTRY;
82         CDEBUG(D_INODE, "find entry for %*s\n", namelen, name);
83
84         *res_dir = NULL;
85         sb = dir->i_sb;
86
87         if (namelen > EXT2_NAME_LEN)
88                 return NULL;
89
90         CDEBUG(D_INODE, "dirsize is %Ld\n", dir->i_size);
91
92         page = 0;
93         offset = 0;
94         while ( offset < dir->i_size ) {
95                 struct ext2_dir_entry_2 * de;
96                 char * dlimit;
97
98                 page = obdfs_getpage(dir, offset, 0, lock);
99
100                 if ( !page ) {
101                         CDEBUG(D_INODE, "No page, offset %lx\n", offset);
102                         return NULL;
103                 }
104
105                 de = (struct ext2_dir_entry_2 *) page_address(page);
106                 dlimit = (char *)page_address(page) + PAGE_SIZE; 
107                 while ((char *) de < dlimit) {
108                         /* this code is executed quadratically often */
109                         /* do minimal checking `by hand' */
110                         int de_len;
111                         /* CDEBUG(D_INODE, "Entry %p len %d, page at %#lx - %#lx , offset %lx\n",
112                                de, le16_to_cpu(de->rec_len), page_address(page),
113                                page_address(page) + PAGE_SIZE, offset); */
114
115                         if ((char *) de + namelen <= dlimit &&
116                             ext2_match (namelen, name, de)) {
117                                 /* found a match -
118                                    just to be sure, do a full check */
119                                 if (!obdfs_check_dir_entry("ext2_find_entry",
120                                                           dir, de, page, offset))
121                                         goto failure;
122                                 *res_dir = de;
123                                 EXIT;
124                                 return page;
125                         }
126                         /* prevent looping on a bad block */
127                         de_len = le16_to_cpu(de->rec_len);
128                         if (de_len <= 0) {
129                                 printk("Bad entry at %p len %d\n", de, de_len);
130                                 goto failure;
131                         }
132                         offset += de_len;
133                         de = (struct ext2_dir_entry_2 *)
134                                 ((char *) de + de_len);
135                         /* CDEBUG(D_INODE, "Next while %lx\n", offset); */
136                 }
137                 if ( lock ) 
138                         UnlockPage(page);
139                 page_cache_release(page);
140                 page = NULL;
141                 CDEBUG(D_INODE, "Next for %lx\n", offset);
142         }
143
144 failure:
145         CDEBUG(D_INODE, "Negative case, page %p, offset %ld\n", page, offset);
146         if (page) {
147                 if (lock) 
148                         UnlockPage(page);
149                 page_cache_release(page);
150         }
151         EXIT;
152         return NULL;
153 } /* obdfs_find_entry */
154
155 struct dentry *obdfs_lookup(struct inode * dir, struct dentry *dentry)
156 {
157         struct inode * inode;
158         struct ext2_dir_entry_2 * de;
159         struct page * page;
160         ENTRY;
161
162         if (dentry->d_name.len > EXT2_NAME_LEN)
163                 return ERR_PTR(-ENAMETOOLONG);
164
165         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
166         inode = NULL;
167         if ( !page ) 
168                 CDEBUG(D_INODE, "No page - negative entry.\n");
169         if ( page && !de ) {
170                 CDEBUG(D_INODE, "Danger: PAGE but de.\n");
171                 return ERR_PTR(-ENOENT);
172         }
173         if (page) {
174                 unsigned long ino = le32_to_cpu(de->inode);
175                 UnlockPage(page);
176                 page_cache_release(page);
177                 inode = iget(dir->i_sb, ino);
178
179                 if (!inode) { 
180                         CDEBUG(D_INODE, "No inode.\n");
181                         EXIT;
182                         return ERR_PTR(-EACCES);
183                 }
184         }
185         d_add(dentry, inode);
186         EXIT;
187         return NULL;
188 } /* obdfs_lookup */
189
190
191 /*
192  *      obdfs_add_entry()
193  *
194  * adds a file entry to the specified directory, using the same
195  * semantics as ext2_find_entry(). It returns NULL if it failed.
196  *
197  * NOTE!! The inode part of 'de' is left at 0 - which means you
198  * may not sleep between calling this and putting something into
199  * the entry, as someone else might have used it while you slept.
200
201  * returns a locked and held page upon success 
202  */
203
204 /* XXX I believe these pages should in fact NOT be locked */
205
206 static struct page *obdfs_add_entry (struct inode * dir,
207                                      const char * name, int namelen,
208                                      struct ext2_dir_entry_2 ** res_dir,
209                                      int *err)
210 {
211         unsigned long offset;
212         unsigned short rec_len;
213         struct page *page;
214         struct ext2_dir_entry_2 * de, * de1;
215         struct super_block * sb;
216
217         ENTRY;
218         *err = -EINVAL;
219         *res_dir = NULL;
220         if (!dir || !dir->i_nlink) {
221                 EXIT;
222                 return NULL;
223         }
224         sb = dir->i_sb;
225
226         if (!namelen) { 
227                 EXIT;
228                 return NULL;
229         }
230         /*
231          * Is this a busy deleted directory?  Can't create new files if so
232          */
233         if (dir->i_size == 0)
234         {
235                 EXIT;
236                 *err = -ENOENT;
237                 return NULL;
238         }
239         page = obdfs_getpage(dir, 0, 0, LOCKED);
240         if (!page) {
241                 EXIT;
242                 return NULL;
243         }
244         rec_len = EXT2_DIR_REC_LEN(namelen);
245         CDEBUG(D_INODE, "reclen: %d\n", rec_len);
246         PDEBUG(page, "starting search");
247         offset = 0;
248         de = (struct ext2_dir_entry_2 *) page_address(page);
249         *err = -ENOSPC;
250         while (1) {
251                 CDEBUG(D_INODE, "Considering entry at %p, (page at %#lx - %#lx), offset %ld\n",
252                        de, page_address(page), page_address(page) + PAGE_SIZE, offset);
253                 if ((char *)de >= PAGE_SIZE + (char *)page_address(page)) {
254                         UnlockPage(page);
255                         page_cache_release(page);
256                         page = obdfs_getpage(dir, offset, 1, LOCKED);
257                         if (!page) {
258                                 EXIT;
259                                 return NULL;
260                         }
261                         PDEBUG(page, "new directory page");
262                         if (dir->i_size <= offset) {
263                                 if (dir->i_size == 0) {
264                                         *err = -ENOENT;
265                                         EXIT;
266                                         return NULL;
267                                 }
268
269                                 CDEBUG(D_INODE, "creating next block\n");
270
271                                 de = (struct ext2_dir_entry_2 *) page_address(page);
272                                 de->inode = 0;
273                                 de->rec_len = le16_to_cpu(PAGE_SIZE);
274                                 dir->i_size = offset + PAGE_SIZE;
275                                 dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
276                                 mark_inode_dirty(dir);
277                         } else {
278
279                                 ext2_debug ("skipping to next block\n");
280
281                                 de = (struct ext2_dir_entry_2 *) page_address(page);
282                         }
283                 }
284                 CDEBUG(D_INODE, "\n");
285                 if (!obdfs_check_dir_entry ("ext2_add_entry", dir, de, page,
286                                            offset)) {
287                         *err = -ENOENT;
288                         UnlockPage(page);
289                         page_cache_release(page);
290                         EXIT;
291                         return NULL;
292                 }
293                 CDEBUG(D_INODE, "\n");
294                 if (ext2_match (namelen, name, de)) {
295                                 *err = -EEXIST;
296                                 UnlockPage(page);
297                                 page_cache_release(page);
298                                 EXIT;
299                                 return NULL;
300                 }
301                 CDEBUG(D_INODE, "Testing for enough space at de %p\n", de);
302                 if ( (le32_to_cpu(de->inode) == 0 && le16_to_cpu(de->rec_len) >= rec_len) ||
303                      (le16_to_cpu(de->rec_len) >= EXT2_DIR_REC_LEN(de->name_len) + rec_len)) {
304                         offset += le16_to_cpu(de->rec_len);
305                         CDEBUG(D_INODE, "Found enough space de %p, offset %#lx\n", de, offset);
306                         if (le32_to_cpu(de->inode)) {
307                                 CDEBUG(D_INODE, "Inserting new in %p\n", de);
308                                 de1 = (struct ext2_dir_entry_2 *) ((char *) de +
309                                         EXT2_DIR_REC_LEN(de->name_len));
310                                 CDEBUG(D_INODE, "-- de1 at %p\n", de1);
311                                 de1->rec_len = cpu_to_le16(le16_to_cpu(de->rec_len) -
312                                         EXT2_DIR_REC_LEN(de->name_len));
313                                 de->rec_len = cpu_to_le16(EXT2_DIR_REC_LEN(de->name_len));
314                                 de = de1;
315                         }
316                         CDEBUG(D_INODE, "Reclen adjusted; copy %d bytes to %p, page at %#lx EOP at %#lx\n", namelen, de->name, page_address(page), page_address(page) + PAGE_SIZE);
317                         de->inode = 0;
318                         de->name_len = namelen;
319                         de->file_type = 0;
320                         memcpy (de->name, name, namelen);
321                         CDEBUG(D_INODE, "Copy done\n");
322                         /*
323                          * XXX shouldn't update any times until successful
324                          * completion of syscall, but too many callers depend
325                          * on this.
326                          *
327                          * XXX similarly, too many callers depend on
328                          * ext2_new_inode() setting the times, but error
329                          * recovery deletes the inode, so the worst that can
330                          * happen is that the times are slightly out of date
331                          * and/or different from the directory change time.
332                          */
333                         dir->i_mtime = dir->i_ctime = CURRENT_TIME;
334                         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
335                         mark_inode_dirty(dir);
336                         dir->i_version = ++event;
337                         *res_dir = de;
338                         *err = 0;
339                         PDEBUG(page, "addentry");
340                         CDEBUG(D_INODE, "Regular exit from add_entry");
341                         EXIT;
342                         return page;
343                 }
344                 CDEBUG(D_INODE, "\n");
345                 offset += le16_to_cpu(de->rec_len);
346                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
347                 
348         }
349         CDEBUG(D_INODE, "\n");
350
351         UnlockPage(page);
352         page_cache_release(page);
353         PDEBUG(page, "addentry");
354         EXIT;
355         return NULL;
356 } /* obdfs_add_entry */
357
358 /*
359  * obdfs_delete_entry deletes a directory entry by merging it with the
360  * previous entry
361  */
362 static int obdfs_delete_entry (struct ext2_dir_entry_2 * dir,
363                               struct page * page)
364 {
365         struct ext2_dir_entry_2 * de, * pde;
366         int i;
367
368         i = 0;
369         pde = NULL;
370         de = (struct ext2_dir_entry_2 *) page_address(page);
371         while (i < PAGE_SIZE) {
372                 if (!obdfs_check_dir_entry ("ext2_delete_entry", NULL, 
373                                            de, page, i))
374                         return -EIO;
375                 if (de == dir)  {
376                         if (pde)
377                                 pde->rec_len =
378                                         cpu_to_le16(le16_to_cpu(pde->rec_len) +
379                                                     le16_to_cpu(dir->rec_len));
380                         else
381                                 dir->inode = 0;
382                         return 0;
383                 }
384                 i += le16_to_cpu(de->rec_len);
385                 pde = de;
386                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
387         }
388         return -ENOENT;
389 } /* obdfs_delete_entry */
390
391
392 static inline void ext2_set_de_type(struct super_block *sb,
393                                 struct ext2_dir_entry_2 *de,
394                                 umode_t mode) {
395         if (!EXT2_HAS_INCOMPAT_FEATURE(sb, EXT2_FEATURE_INCOMPAT_FILETYPE))
396                 return;
397         if (S_ISCHR(mode))
398                 de->file_type = EXT2_FT_CHRDEV;
399         else if (S_ISBLK(mode))
400                 de->file_type = EXT2_FT_BLKDEV;
401         else if (S_ISFIFO(mode))  
402                 de->file_type = EXT2_FT_FIFO;
403         else if (S_ISLNK(mode))
404                 de->file_type = EXT2_FT_SYMLINK;
405         else if (S_ISREG(mode))
406                 de->file_type = EXT2_FT_REG_FILE;
407         else if (S_ISDIR(mode))  
408                 de->file_type = EXT2_FT_DIR;
409 }
410
411
/*
 * Debugging aid, currently compiled out: print one line per dentry on the
 * circular list headed by `dlist'.  With `subdirs' non-zero the list is
 * taken to be linked through d_child, otherwise through d_alias.
 */
#if 0
static void show_dentry(struct list_head * dlist, int subdirs)
{
        struct list_head *pos;

        for (pos = dlist->next; pos != dlist; pos = pos->next) {
                struct dentry * dentry;
                const char * unhashed;

                dentry = subdirs ? list_entry(pos, struct dentry, d_child)
                                 : list_entry(pos, struct dentry, d_alias);
                unhashed = list_empty(&dentry->d_hash) ? "(unhashed)" : "";

                if ( !dentry->d_inode ) {
                        /* negative dentry: there is no inode to describe */
                        printk("show_dentry: %s/%s, d_count=%d%s \n",
                               dentry->d_parent->d_name.name,
                               dentry->d_name.name, dentry->d_count,
                               unhashed);
                        continue;
                }

                printk("show_dentry: %s/%s, d_count=%d%s (ino %ld, dev %d, ct %d)\n",
                       dentry->d_parent->d_name.name,
                       dentry->d_name.name, dentry->d_count,
                       unhashed, dentry->d_inode->i_ino,
                       dentry->d_inode->i_dev,
                       dentry->d_inode->i_count);
        }
} /* show_dentry */
#endif
447
448
449 struct inode *obdfs_new_inode(struct inode *dir)
450 {
451         struct obdo *oa;
452         struct inode *inode;
453         int err;
454
455         ENTRY;
456         oa = obdo_alloc();
457         if (!oa) {
458                 EXIT;
459                 return ERR_PTR(-ENOMEM);
460         }
461
462         err = IOPS(dir, create)(IID(dir), oa);
463
464         if ( err ) {
465                 obdo_free(oa);
466                 EXIT;
467                 return ERR_PTR(err);
468         }
469
470         inode = iget(dir->i_sb, (ino_t)oa->o_id);
471
472         if (!inode) {
473                 IOPS(dir, destroy)(IID(dir), oa);
474                 obdo_free(oa);
475                 EXIT;
476                 return ERR_PTR(-EIO);
477         }
478
479         if (!list_empty(&inode->i_dentry)) {
480                 CDEBUG(D_INODE, "New inode (%ld) has aliases!\n", inode->i_ino);
481                 IOPS(dir, destroy)(IID(dir), oa);
482                 obdo_free(oa);
483                 iput(inode);
484                 EXIT;
485                 return ERR_PTR(-EIO);
486         }
487
488         INIT_LIST_HEAD(&OBDFS_LIST(inode));
489         obdo_free(oa);
490
491         EXIT;
492         return inode;
493 } /* obdfs_new_inode */
494
495
496 /*
497  * By the time this is called, we already have created
498  * the directory cache entry for the new file, but it
499  * is so far negative - it has no inode.
500  *
501  * If the create succeeds, we fill in the inode information
502  * with d_instantiate(). 
503  */
504 int obdfs_create (struct inode * dir, struct dentry * dentry, int mode)
505 {
506         struct inode * inode;
507         struct page *page;
508         struct ext2_dir_entry_2 * de;
509         int err = -EIO;
510
511         ENTRY;
512         inode = obdfs_new_inode(dir);
513         if ( IS_ERR(inode) ) {
514                 EXIT;
515                 return PTR_ERR(inode);
516         }
517
518         inode->i_op = &obdfs_file_inode_operations;
519         inode->i_mode = mode;
520         mark_inode_dirty(inode);
521         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
522         if (!page) {
523                 inode->i_nlink--;
524                 mark_inode_dirty(inode);
525                 iput (inode);
526                 EXIT;
527                 return err;
528         }
529         de->inode = cpu_to_le32(inode->i_ino);
530         ext2_set_de_type(dir->i_sb, de, S_IFREG);
531         dir->i_version = ++event;
532
533         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
534         UnlockPage(page);
535
536         page_cache_release(page);
537         d_instantiate(dentry, inode);
538         EXIT;
539         return err;
540 } /* obdfs_create */
541
542 int obdfs_mknod (struct inode * dir, struct dentry *dentry, int mode, int rdev)
543 {
544         struct inode * inode;
545         struct page *page;
546         struct ext2_dir_entry_2 * de;
547         int err;
548
549         ENTRY;
550
551         inode = obdfs_new_inode(dir);
552         if ( IS_ERR(inode) ) {
553                 EXIT;
554                 return PTR_ERR(inode);
555         }
556
557         inode->i_uid = current->fsuid;
558         init_special_inode(inode, mode, rdev);
559         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
560         if (!page)
561                 goto out_no_entry;
562         de->inode = cpu_to_le32(inode->i_ino);
563         dir->i_version = ++event;
564         ext2_set_de_type(dir->i_sb, de, inode->i_mode);
565         mark_inode_dirty(inode);
566
567         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
568         UnlockPage(page);
569
570         d_instantiate(dentry, inode);
571         page_cache_release(page);
572         err = 0;
573 out:
574         return err;
575
576 out_no_entry:
577         inode->i_nlink--;
578         mark_inode_dirty(inode);
579         iput(inode);
580         goto out;
581 } /* obdfs_mknod */
582
583 int obdfs_mkdir(struct inode * dir, struct dentry * dentry, int mode)
584 {
585         struct inode * inode;
586         struct page *page, *inode_page;
587         struct ext2_dir_entry_2 * de;
588         int err;
589
590         ENTRY;
591
592         err = -EMLINK;
593         if (dir->i_nlink >= EXT2_LINK_MAX)
594                 goto out;
595
596         inode = obdfs_new_inode(dir);
597         if ( IS_ERR(inode) ) {
598                 EXIT;
599                 return PTR_ERR(inode);
600         }
601
602         inode->i_op = &obdfs_dir_inode_operations;
603         inode->i_blocks = 0;    
604         inode_page = obdfs_getpage(inode, 0, 1, LOCKED);
605         if (!inode_page) {
606                 inode->i_nlink--; /* is this nlink == 0? */
607                 mark_inode_dirty(inode);
608                 iput (inode);
609                 return err;
610         }
611
612         /* create . and .. */
613         de = (struct ext2_dir_entry_2 *) page_address(inode_page);
614         de->inode = cpu_to_le32(inode->i_ino);
615         de->name_len = 1;
616         de->rec_len = cpu_to_le16(EXT2_DIR_REC_LEN(de->name_len));
617         strcpy (de->name, ".");
618         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
619         
620         de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
621         de->inode = cpu_to_le32(dir->i_ino);
622         de->rec_len = cpu_to_le16(PAGE_SIZE - EXT2_DIR_REC_LEN(1));
623         de->name_len = 2;
624         strcpy (de->name, "..");
625         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
626         
627         /* XXX handle err */
628         err = obdfs_do_writepage(inode, inode_page, IS_SYNC(inode));
629         inode->i_blocks = PAGE_SIZE/inode->i_sb->s_blocksize;
630         inode->i_size = PAGE_SIZE;
631         UnlockPage(inode_page);
632         page_cache_release(inode_page);
633
634         inode->i_nlink = 2;
635         inode->i_mode = S_IFDIR | mode;
636         if (dir->i_mode & S_ISGID)
637                 inode->i_mode |= S_ISGID;
638         mark_inode_dirty(inode);
639
640         /* now deal with the parent */
641         page = obdfs_add_entry(dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
642         if (!page) {
643                 goto out_no_entry;
644         }
645
646         de->inode = cpu_to_le32(inode->i_ino);
647         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
648         dir->i_version = ++event;
649
650         dir->i_nlink++;
651         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
652         mark_inode_dirty(dir);
653         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
654         /* XXX handle err? */
655
656         UnlockPage(page);
657
658         page_cache_release(page);
659         d_instantiate(dentry, inode);
660 out:
661         EXIT;
662         return err;
663
664 out_no_entry:
665         inode->i_nlink = 0;
666         mark_inode_dirty(inode);
667         iput (inode);
668         EXIT;
669         goto out;
670 } /* obdfs_mkdir */
671
672
673 /*
674  * routine to check that the specified directory is empty (for rmdir)
675  */
676 static int empty_dir (struct inode * inode)
677 {
678         unsigned long offset;
679         struct page *page;
680         struct ext2_dir_entry_2 * de, * de1;
681         struct super_block * sb;
682
683         sb = inode->i_sb;
684         if (inode->i_size < EXT2_DIR_REC_LEN(1) + EXT2_DIR_REC_LEN(2) ||
685             !(page = obdfs_getpage (inode, 0, 0, LOCKED))) {
686                 ext2_warning (inode->i_sb, "empty_dir",
687                               "bad directory (dir #%lu) - no data block",
688                               inode->i_ino);
689                 return 1;
690         }
691         de = (struct ext2_dir_entry_2 *) page_address(page);
692         de1 = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
693         if (le32_to_cpu(de->inode) != inode->i_ino || !le32_to_cpu(de1->inode) || 
694             strcmp (".", de->name) || strcmp ("..", de1->name)) {
695                 ext2_warning (inode->i_sb, "empty_dir",
696                               "bad directory (dir #%lu) - no `.' or `..'",
697                               inode->i_ino);
698                 page_cache_release(page);
699                 return 1;
700         }
701         offset = le16_to_cpu(de->rec_len) + le16_to_cpu(de1->rec_len);
702         de = (struct ext2_dir_entry_2 *) ((char *) de1 + le16_to_cpu(de1->rec_len));
703         while (offset < inode->i_size ) {
704                 if (!page || (void *) de >= (void *) (page_address(page) + PAGE_SIZE)) {
705                         if (page) {
706                                 UnlockPage(page);
707                                 page_cache_release(page);
708                         }
709                         page = obdfs_getpage(inode, offset, 0, LOCKED);
710                         if (!page) {
711 #if 0
712                                 ext2_error (sb, "empty_dir",
713                                             "directory #%lu contains a hole at offset %lu",
714                                             inode->i_ino, offset);
715 #endif
716                                 offset += sb->s_blocksize;
717                                 continue;
718                         }
719                         de = (struct ext2_dir_entry_2 *) page_address(page);
720                 }
721                 if (!obdfs_check_dir_entry ("empty_dir", inode, de, page,
722                                            offset)) {
723                         UnlockPage(page);
724                         page_cache_release(page);
725                         return 1;
726                 }
727                 if (le32_to_cpu(de->inode)) {
728                         UnlockPage(page);
729                         page_cache_release(page);
730                         return 0;
731                 }
732                 offset += le16_to_cpu(de->rec_len);
733                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
734         }
735         UnlockPage(page);
736         page_cache_release(page);
737         return 1;
738 } /* empty_dir */
739
740 int obdfs_rmdir (struct inode * dir, struct dentry *dentry)
741 {
742         int retval;
743         struct inode * inode;
744         struct page *page;
745         struct ext2_dir_entry_2 * de;
746         int err;
747
748         ENTRY;
749
750         retval = -ENOENT;
751         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
752         if (!page)
753                 goto end_rmdir;
754
755         inode = dentry->d_inode;
756         DQUOT_INIT(inode);
757
758         retval = -EIO;
759         if (le32_to_cpu(de->inode) != inode->i_ino)
760                 goto end_rmdir;
761
762         retval = -ENOTEMPTY;
763         if (!empty_dir (inode))
764                 goto end_rmdir;
765
766         retval = obdfs_delete_entry (de, page);
767         dir->i_version = ++event;
768         if (retval)
769                 goto end_rmdir;
770         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
771         /* XXX handle err? */
772         UnlockPage(page);
773
774         if (inode->i_nlink != 2)
775                 ext2_warning (inode->i_sb, "ext2_rmdir",
776                               "empty directory has nlink!=2 (%d)",
777                               inode->i_nlink);
778         inode->i_version = ++event;
779         inode->i_nlink = 0;
780         inode->i_size = 0;
781         mark_inode_dirty(inode);
782         dir->i_nlink--;
783         inode->i_ctime = dir->i_ctime = dir->i_mtime = CURRENT_TIME;
784         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
785         mark_inode_dirty(dir);
786         d_delete(dentry);
787
788 end_rmdir:
789         if ( page )
790                 page_cache_release(page);
791         EXIT;
792         return retval;
793 } /* obdfs_rmdir */
794
795 int obdfs_unlink(struct inode * dir, struct dentry *dentry)
796 {
797         int retval;
798         struct inode * inode;
799         struct page *page;
800         struct ext2_dir_entry_2 * de;
801         int err;
802
803         ENTRY;
804
805         retval = -ENOENT;
806         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
807         if (!page)
808                 goto end_unlink;
809
810         inode = dentry->d_inode;
811         DQUOT_INIT(inode);
812
813         retval = -EIO;
814         if (le32_to_cpu(de->inode) != inode->i_ino)
815                 goto end_unlink;
816         
817         if (!inode->i_nlink) {
818                 ext2_warning (inode->i_sb, "ext2_unlink",
819                               "Deleting nonexistent file (%lu), %d",
820                               inode->i_ino, inode->i_nlink);
821                 inode->i_nlink = 1;
822         }
823         retval = obdfs_delete_entry (de, page);
824         if (retval)
825                 goto end_unlink;
826         dir->i_version = ++event;
827         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
828         /* XXX handle err? */
829         UnlockPage(page);
830
831         dir->i_ctime = dir->i_mtime = CURRENT_TIME;
832         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
833         mark_inode_dirty(dir);
834         inode->i_nlink--;
835         mark_inode_dirty(inode);
836         inode->i_ctime = dir->i_ctime;
837         retval = 0;
838         d_delete(dentry);       /* This also frees the inode */
839
840 end_unlink:
841         if (page)
842                 page_cache_release(page);
843         EXIT;
844         return retval;
845 } /* obdfs_unlink */
846
847 int obdfs_symlink (struct inode * dir, struct dentry *dentry,
848                    const char * symname)
849 {
850         struct ext2_dir_entry_2 * de;
851         struct inode * inode;
852         struct obdfs_inode_info *oinfo;
853         struct page* page = NULL, * name_page = NULL;
854         char * link;
855         int i, l, err = -EIO;
856         char c;
857
858         ENTRY;
859         inode = obdfs_new_inode(dir);
860         oinfo = OBDFS_INFO(inode);
861         if ( IS_ERR(inode) ) {
862                 EXIT;
863                 return PTR_ERR(inode);
864         }
865
866         inode->i_mode = S_IFLNK | S_IRWXUGO;
867         inode->i_op = &obdfs_symlink_inode_operations;
868         for (l = 0; l < inode->i_sb->s_blocksize - 1 && symname [l]; l++)
869                 ;
870
871         if (l >= sizeof(OBDFS_INFO(inode)->oi_inline)) {
872                 CDEBUG(D_INODE, "l=%d, normal symlink\n", l);
873
874                 name_page = obdfs_getpage(inode, 0, 1, LOCKED);
875                 if (!name_page) {
876                         inode->i_nlink--;
877                         mark_inode_dirty(inode);
878                         iput (inode);
879                         EXIT;
880                         return err;
881                 }
882                 link = (char *)page_address(name_page);
883         } else {
884                 link = oinfo->oi_inline;
885                 oinfo->oi_flags |= OBD_FL_INLINEDATA;
886
887                 CDEBUG(D_INODE, "l=%d, fast symlink\n", l);
888
889         }
890         i = 0;
891         while (i < inode->i_sb->s_blocksize - 1 && (c = *(symname++)))
892                 link[i++] = c;
893         link[i] = 0;
894         if (name_page) {
895                 err = obdfs_do_writepage(inode, name_page, IS_SYNC(inode));
896                 /* XXX handle err */
897                 PDEBUG(name_page, "symlink");
898                 UnlockPage(name_page);
899                 page_cache_release(name_page);
900         }
901         inode->i_size = i;
902         mark_inode_dirty(inode);
903
904         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
905         if (!page)
906                 goto out_no_entry;
907         de->inode = cpu_to_le32(inode->i_ino);
908         ext2_set_de_type(dir->i_sb, de, S_IFLNK);
909         dir->i_version = ++event;
910         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
911         UnlockPage(page);
912
913         d_instantiate(dentry, inode);
914 out:
915         EXIT;
916         return err;
917
918 out_no_entry:
919         inode->i_nlink--;
920         mark_inode_dirty(inode);
921         iput (inode);
922         goto out;
923 } /* obdfs_symlink */
924
925 int obdfs_link (struct dentry * old_dentry,
926                 struct inode * dir, struct dentry *dentry)
927 {
928         struct inode *inode = old_dentry->d_inode;
929         struct ext2_dir_entry_2 * de;
930         struct page *page;
931         int err;
932
933         ENTRY;
934
935         if (S_ISDIR(inode->i_mode))
936                 return -EPERM;
937
938         if (inode->i_nlink >= EXT2_LINK_MAX)
939                 return -EMLINK;
940
941         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
942         if (!page)
943                 return err;
944
945         de->inode = cpu_to_le32(inode->i_ino);
946         ext2_set_de_type(dir->i_sb, de, inode->i_mode);
947         dir->i_version = ++event;
948
949         err = obdfs_do_writepage(dir, page, IS_SYNC(dir));
950         UnlockPage(page);
951
952         page_cache_release(page);
953         inode->i_nlink++;
954         inode->i_ctime = CURRENT_TIME;
955         mark_inode_dirty(inode);
956         inode->i_count++;
957         d_instantiate(dentry, inode);
958         return err;
959 } /* obdfs_link */
960
/*
 * PARENT_INO(buffer): the (little-endian, on-disk) inode field of the
 * second directory entry in buffer, located by skipping rec_len bytes of
 * the first entry.  obdfs_rename() compares it against the parent
 * directory's inode number, so this is presumably the ".." entry.
 *
 * Expands to an lvalue.  buffer is evaluated twice, so it must not have
 * side effects.
 */
#define PARENT_INO(buffer) \
        ((struct ext2_dir_entry_2 *) ((char *) (buffer) + \
        le16_to_cpu(((struct ext2_dir_entry_2 *) (buffer))->rec_len)))->inode
964
965 /*
966  * Anybody can rename anything with this: the permission checks are left to the
967  * higher-level routines.
968  */
969 int obdfs_rename (struct inode * old_dir, struct dentry *old_dentry,
970                            struct inode * new_dir, struct dentry *new_dentry)
971 {
972         struct inode * old_inode, * new_inode;
973         struct page * old_page, * new_page, * dir_page;
974         struct ext2_dir_entry_2 * old_de, * new_de;
975         int err;
976
977         ENTRY;
978
979         new_page = dir_page = NULL;
980
981         /* does the old entry exist? - if not get out */
982         old_page = obdfs_find_entry (old_dir, old_dentry->d_name.name, old_dentry->d_name.len, &old_de, NOLOCK);
983         PDEBUG(old_page, "rename - old page");
984         /*
985          *  Check for inode number is _not_ due to possible IO errors.
986          *  We might rmdir the source, keep it as pwd of some process
987          *  and merrily kill the link to whatever was created under the
988          *  same name. Goodbye sticky bit ;-<
989          */
990         old_inode = old_dentry->d_inode;
991         err = -ENOENT;
992         if (!old_page || le32_to_cpu(old_de->inode) != old_inode->i_ino)
993                 goto end_rename;
994
995         /* find new inode */
996         new_inode = new_dentry->d_inode;
997         new_page = obdfs_find_entry (new_dir, new_dentry->d_name.name,
998                                 new_dentry->d_name.len, &new_de, NOLOCK);
999         PDEBUG(new_page, "rename - new page ");
1000         if (new_page) {
1001                 if (!new_inode) {
1002                         page_cache_release(new_page);
1003                         new_page = NULL;
1004                 } else {
1005                         DQUOT_INIT(new_inode);
1006                 }
1007         }
1008         /* in this case we to check more ... */
1009         if (S_ISDIR(old_inode->i_mode)) {
1010                 /* can only rename into empty new directory */
1011                 if (new_inode) {
1012                         err = -ENOTEMPTY;
1013                         if (!empty_dir (new_inode))
1014                                 goto end_rename;
1015                 }
1016                 err = -EIO;
1017                 dir_page= obdfs_getpage (old_inode, 0, 0, LOCKED);
1018                 PDEBUG(dir_page, "rename dir page");
1019
1020                 if (!dir_page)
1021                         goto end_rename;
1022                 if (le32_to_cpu(PARENT_INO(page_address(dir_page))) != old_dir->i_ino)
1023                         goto end_rename;
1024                 err = -EMLINK;
1025                 if (!new_inode && new_dir!=old_dir &&
1026                                 new_dir->i_nlink >= EXT2_LINK_MAX)
1027                         goto end_rename;
1028         }
1029         /* create the target dir entry */
1030         if (!new_page) {
1031                 new_page = obdfs_add_entry (new_dir, new_dentry->d_name.name,
1032                                         new_dentry->d_name.len, &new_de,
1033                                         &err);
1034                 PDEBUG(new_page, "rename new page");
1035                 if (!new_page)
1036                         goto end_rename;
1037         }
1038         new_dir->i_version = ++event;
1039
1040         /*
1041          * remove the old entry
1042          */
1043         new_de->inode = le32_to_cpu(old_inode->i_ino);
1044         if (EXT2_HAS_INCOMPAT_FEATURE(new_dir->i_sb,
1045                                       EXT2_FEATURE_INCOMPAT_FILETYPE))
1046                 new_de->file_type = old_de->file_type;
1047         
1048         obdfs_delete_entry (old_de, old_page);
1049
1050         old_dir->i_version = ++event;
1051         if (new_inode) {
1052                 new_inode->i_nlink--;
1053                 new_inode->i_ctime = CURRENT_TIME;
1054                 mark_inode_dirty(new_inode);
1055         }
1056         old_dir->i_ctime = old_dir->i_mtime = CURRENT_TIME;
1057         old_dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
1058         mark_inode_dirty(old_dir);
1059         if (dir_page) {
1060                 PARENT_INO(page_address(dir_page)) = le32_to_cpu(new_dir->i_ino);
1061                 /* XXX handle err */
1062                 err = obdfs_do_writepage(old_inode, dir_page, IS_SYNC(old_inode));
1063                 old_dir->i_nlink--;
1064                 mark_inode_dirty(old_dir);
1065                 if (new_inode) {
1066                         new_inode->i_nlink--;
1067                         mark_inode_dirty(new_inode);
1068                 } else {
1069                         new_dir->i_nlink++;
1070                         new_dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
1071                         mark_inode_dirty(new_dir);
1072                 }
1073         }
1074         if ( old_page != new_page ) {
1075                 unsigned long index = old_page->index;
1076                 /* lock the old_page and release unlocked copy */
1077                 CDEBUG(D_INODE, "old_page at %p\n", old_page);
1078                 page_cache_release(old_page);
1079                 old_page = obdfs_getpage(old_dir, index >> PAGE_SHIFT, 0, LOCKED);
1080                 CDEBUG(D_INODE, "old_page at %p\n", old_page);
1081                 /* XXX handle err */
1082                 err = obdfs_do_writepage(old_dir, old_page, IS_SYNC(old_dir));
1083         }
1084
1085         err = obdfs_do_writepage(new_dir, new_page, IS_SYNC(new_dir));
1086
1087 end_rename:
1088         if (old_page && PageLocked(old_page) )
1089                 UnlockPage(old_page);
1090         if (old_page)
1091                 page_cache_release(old_page);
1092         if (new_page && PageLocked(new_page) )
1093                 UnlockPage(new_page);
1094         if (new_page)
1095                 page_cache_release(new_page);
1096         if (dir_page && PageLocked(dir_page) )
1097                 UnlockPage(dir_page);
1098         if (dir_page)
1099                 page_cache_release(dir_page);
1100
1101
1102         return err;
1103 } /* obdfs_rename */