Whamcloud - gitweb
12d0bb660284fb5c47ebcf377250c341f0d79f3b
[fs/lustre-release.git] / lustre / obdfs / namei.c
1 /*
2  *  linux/fs/obdfs/namei.c
3  *
4  * Copyright (C) 1992, 1993, 1994, 1995
5  * Remy Card (card@masi.ibp.fr)
6  * Laboratoire MASI - Institut Blaise Pascal
7  * Universite Pierre et Marie Curie (Paris VI)
8  *
9  *  from
10  *
11  *  linux/fs/ext2/namei.c
12  *
13  *  Copyright (C) 1991, 1992  Linus Torvalds
14  *
15  *  Big-endian to little-endian byte-swapping/bitmaps by
16  *        David S. Miller (davem@caip.rutgers.edu), 1995
17  *  Directory entry file type support and forward compatibility hooks
18  *      for B-tree directories by Theodore Ts'o (tytso@mit.edu), 1998
19  * 
20  *  Changes for use in OBDFS
21  *  Copyright (c) 1999, Seagate Technology Inc.
22  * 
23  */
24
25 #include <asm/uaccess.h>
26
27 #include <linux/errno.h>
28 #include <linux/fs.h>
29 #include <linux/ext2_fs.h>
30 #include <linux/fcntl.h>
31 #include <linux/sched.h>
32 #include <linux/stat.h>
33 #include <linux/string.h>
34 #include <linux/locks.h>
35 #include <linux/quotaops.h>
36 #include <linux/iobuf.h>
37
38 #include <linux/obd_support.h>
39 #include <linux/obdfs.h>
40
/*
 * Directory read-ahead tuning: how far ahead to read a directory while
 * searching it, expressed as CHUNKS groups of BLOCKS blocks each.
 */
#define NAMEI_RA_CHUNKS         2
#define NAMEI_RA_BLOCKS         4

/* Total number of read-ahead slots (chunks times blocks per chunk). */
#define NAMEI_RA_SIZE           (NAMEI_RA_CHUNKS * NAMEI_RA_BLOCKS)

/* Flat slot index of block `b' inside chunk `c'. */
#define NAMEI_RA_INDEX(c,b)     (((c) * NAMEI_RA_BLOCKS) + (b))
48
49 /*
50  * NOTE! unlike strncmp, ext2_match returns 1 for success, 0 for failure.
51  *
52  * `len <= EXT2_NAME_LEN' is guaranteed by caller.
53  * `de != NULL' is guaranteed by caller.
54  */
55 static inline int ext2_match (int len, const char * const name,
56                        struct ext2_dir_entry_2 * de)
57 {
58         if (len != de->name_len)
59                 return 0;
60         if (!de->inode)
61                 return 0;
62         return !memcmp(name, de->name, len);
63 }
64
65 /*
66  *      ext2_find_entry()
67  *
68  * finds an entry in the specified directory with the wanted name. It
69  * returns the cache buffer in which the entry was found, and the entry
70  * itself (as a parameter - res_dir). It does NOT read the inode of the
71  * entry - you'll have to do that yourself if you want to.
72  */
73 static struct page * obdfs_find_entry (struct inode * dir,
74                                              const char * const name, int namelen,
75                                              struct ext2_dir_entry_2 ** res_dir, int lock)
76 {
77         struct super_block * sb;
78         unsigned long offset;
79         struct page * page;
80         ENTRY;
81         CDEBUG(D_INODE, "find entry for %*s\n", namelen, name);
82
83         *res_dir = NULL;
84         sb = dir->i_sb;
85
86         if (namelen > EXT2_NAME_LEN)
87                 return NULL;
88
89         CDEBUG(D_INODE, "dirsize is %Ld\n", dir->i_size);
90
91         page = 0;
92         offset = 0;
93         while ( offset < dir->i_size ) {
94                 struct ext2_dir_entry_2 * de;
95                 char * dlimit;
96
97                 page = obdfs_getpage(dir, offset, 0, lock);
98
99                 if ( !page ) {
100                         CDEBUG(D_INODE, "No page, offset %lx\n", offset);
101                         return NULL;
102                 }
103
104                 de = (struct ext2_dir_entry_2 *) page_address(page);
105                 dlimit = (char *)page_address(page) + PAGE_SIZE; 
106                 while ((char *) de < dlimit) {
107                         /* this code is executed quadratically often */
108                         /* do minimal checking `by hand' */
109                         int de_len;
110                         CDEBUG(D_INODE, "Entry %p len %d, page at %#lx - %#lx , offset %lx\n",
111                                de, le16_to_cpu(de->rec_len), page_address(page),
112                                page_address(page) + PAGE_SIZE, offset);
113
114                         if ((char *) de + namelen <= dlimit &&
115                             ext2_match (namelen, name, de)) {
116                                 /* found a match -
117                                    just to be sure, do a full check */
118                                 if (!obdfs_check_dir_entry("ext2_find_entry",
119                                                           dir, de, page, offset))
120                                         goto failure;
121                                 *res_dir = de;
122                                 EXIT;
123                                 return page;
124                         }
125                         /* prevent looping on a bad block */
126                         de_len = le16_to_cpu(de->rec_len);
127                         if (de_len <= 0) {
128                                 CDEBUG(D_INODE, "Bad entry: at %p len %d\n",
129                                        de, de_len);
130                                 goto failure;
131                         }
132                         offset += de_len;
133                         de = (struct ext2_dir_entry_2 *)
134                                 ((char *) de + de_len);
135                         CDEBUG(D_INODE, "Next while %lx\n", offset);
136                 }
137                 if ( lock ) 
138                         UnlockPage(page);
139                 page_cache_release(page);
140                 page = NULL;
141                 CDEBUG(D_INODE, "Next for %lx\n", offset);
142         }
143
144 failure:
145         CDEBUG(D_INODE, "Negative case, page %p, offset %ld\n", page, offset);
146         if (page) {
147                 if (lock) 
148                         UnlockPage(page);
149                 page_cache_release(page);
150         }
151         EXIT;
152         return NULL;
153 }
154
155 struct dentry *obdfs_lookup(struct inode * dir, struct dentry *dentry)
156 {
157         struct inode * inode;
158         struct ext2_dir_entry_2 * de;
159         struct page * page;
160         ENTRY;
161
162         if (dentry->d_name.len > EXT2_NAME_LEN)
163                 return ERR_PTR(-ENAMETOOLONG);
164
165         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
166         inode = NULL;
167         if ( !page ) 
168                 CDEBUG(D_INODE, "No page - negative entry.\n");
169         if ( page && !de ) {
170                 CDEBUG(D_INODE, "Danger: PAGE but de.\n");
171                 return ERR_PTR(-ENOENT);
172         }
173         if (page) {
174                 unsigned long ino = le32_to_cpu(de->inode);
175                 UnlockPage(page);
176                 page_cache_release(page);
177                 inode = iget(dir->i_sb, ino);
178
179                 if (!inode) { 
180                         CDEBUG(D_INODE, "No inode.\n");
181                         EXIT;
182                         return ERR_PTR(-EACCES);
183                 }
184         }
185         d_add(dentry, inode);
186         EXIT;
187         return NULL;
188 }
189
190
191 /*
192  *      ext2_add_entry()
193  *
194  * adds a file entry to the specified directory, using the same
195  * semantics as ext2_find_entry(). It returns NULL if it failed.
196  *
197  * NOTE!! The inode part of 'de' is left at 0 - which means you
198  * may not sleep between calling this and putting something into
199  * the entry, as someone else might have used it while you slept.
200
201  * returns a locked and held page upon success 
202  */
203 static struct page *obdfs_add_entry (struct inode * dir,
204                                      const char * name, int namelen,
205                                      struct ext2_dir_entry_2 ** res_dir,
206                                      int *err)
207 {
208         unsigned long offset;
209         unsigned short rec_len;
210         struct page *page;
211         struct ext2_dir_entry_2 * de, * de1;
212         struct super_block * sb;
213
214         ENTRY;
215         *err = -EINVAL;
216         *res_dir = NULL;
217         if (!dir || !dir->i_nlink) {
218                 EXIT;
219                 return NULL;
220         }
221         sb = dir->i_sb;
222
223         if (!namelen) { 
224                 EXIT;
225                 return NULL;
226         }
227         /*
228          * Is this a busy deleted directory?  Can't create new files if so
229          */
230         if (dir->i_size == 0)
231         {
232                 EXIT;
233                 *err = -ENOENT;
234                 return NULL;
235         }
236         page = obdfs_getpage(dir, 0, 0, LOCKED);
237         if (!page) {
238                 EXIT;
239                 return NULL;
240         }
241         rec_len = EXT2_DIR_REC_LEN(namelen);
242         CDEBUG(D_INODE, "reclen: %d\n", rec_len);
243         offset = 0;
244         de = (struct ext2_dir_entry_2 *) page_address(page);
245         *err = -ENOSPC;
246         while (1) {
247                 CDEBUG(D_INODE, "Considering entry at %p, (page at %#lx - %#lx), offset %ld\n",
248                        de, page_address(page), page_address(page) + PAGE_SIZE, offset);
249                 if ((char *)de >= PAGE_SIZE + (char *)page_address(page)) {
250                         UnlockPage(page);
251                         page_cache_release(page);
252                         page = obdfs_getpage(dir, offset, 1, LOCKED);
253                         if (!page) {
254                                 EXIT;
255                                 return NULL;
256                         }
257                         if (dir->i_size <= offset) {
258                                 if (dir->i_size == 0) {
259                                         *err = -ENOENT;
260                                         EXIT;
261                                         return NULL;
262                                 }
263
264                                 CDEBUG(D_INODE, "creating next block\n");
265
266                                 de = (struct ext2_dir_entry_2 *) page_address(page);
267                                 de->inode = 0;
268                                 de->rec_len = le16_to_cpu(PAGE_SIZE);
269                                 dir->i_size = offset + PAGE_SIZE;
270                                 dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
271                                 mark_inode_dirty(dir);
272                         } else {
273
274                                 ext2_debug ("skipping to next block\n");
275
276                                 de = (struct ext2_dir_entry_2 *) page_address(page);
277                         }
278                 }
279                 CDEBUG(D_INODE, "\n");
280                 if (!obdfs_check_dir_entry ("ext2_add_entry", dir, de, page,
281                                            offset)) {
282                         *err = -ENOENT;
283                         UnlockPage(page);
284                         page_cache_release(page);
285                         EXIT;
286                         return NULL;
287                 }
288                 CDEBUG(D_INODE, "\n");
289                 if (ext2_match (namelen, name, de)) {
290                                 *err = -EEXIST;
291                                 UnlockPage(page);
292                                 page_cache_release(page);
293                                 EXIT;
294                                 return NULL;
295                 }
296                 CDEBUG(D_INODE, "Testing for enough space at de %p\n", de);
297                 if ( (le32_to_cpu(de->inode) == 0 && le16_to_cpu(de->rec_len) >= rec_len) ||
298                      (le16_to_cpu(de->rec_len) >= EXT2_DIR_REC_LEN(de->name_len) + rec_len)) {
299                         offset += le16_to_cpu(de->rec_len);
300                         CDEBUG(D_INODE, "Found enough space de %p, offset %#lx\n", de, offset);
301                         if (le32_to_cpu(de->inode)) {
302                                 CDEBUG(D_INODE, "Inserting new in %p\n", de);
303                                 de1 = (struct ext2_dir_entry_2 *) ((char *) de +
304                                         EXT2_DIR_REC_LEN(de->name_len));
305                                 CDEBUG(D_INODE, "-- de1 at %p\n", de1);
306                                 de1->rec_len = cpu_to_le16(le16_to_cpu(de->rec_len) -
307                                         EXT2_DIR_REC_LEN(de->name_len));
308                                 de->rec_len = cpu_to_le16(EXT2_DIR_REC_LEN(de->name_len));
309                                 de = de1;
310                         }
311                         CDEBUG(D_INODE, "Reclen adjusted; copy %d bytes to %p, page at %#lx EOP at %#lx\n", namelen, de->name, page_address(page), page_address(page) + PAGE_SIZE);
312                         de->inode = 0;
313                         de->name_len = namelen;
314                         de->file_type = 0;
315                         memcpy (de->name, name, namelen);
316                         CDEBUG(D_INODE, "Copy done\n");
317                         /*
318                          * XXX shouldn't update any times until successful
319                          * completion of syscall, but too many callers depend
320                          * on this.
321                          *
322                          * XXX similarly, too many callers depend on
323                          * ext2_new_inode() setting the times, but error
324                          * recovery deletes the inode, so the worst that can
325                          * happen is that the times are slightly out of date
326                          * and/or different from the directory change time.
327                          */
328                         dir->i_mtime = dir->i_ctime = CURRENT_TIME;
329                         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
330                         mark_inode_dirty(dir);
331                         dir->i_version = ++event;
332                         *res_dir = de;
333                         *err = 0;
334                         PDEBUG(page, "addentry");
335                         CDEBUG(D_INODE, "Regular exit from add_entry");
336                         EXIT;
337                         return page;
338                 }
339                 CDEBUG(D_INODE, "\n");
340                 offset += le16_to_cpu(de->rec_len);
341                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
342                 
343         }
344         CDEBUG(D_INODE, "\n");
345
346         UnlockPage(page);
347         page_cache_release(page);
348         PDEBUG(page, "addentry");
349         EXIT;
350         return NULL;
351 }
352
353 /*
354  * ext2_delete_entry deletes a directory entry by merging it with the
355  * previous entry
356  */
357 static int obdfs_delete_entry (struct ext2_dir_entry_2 * dir,
358                               struct page * page)
359 {
360         struct ext2_dir_entry_2 * de, * pde;
361         int i;
362
363         i = 0;
364         pde = NULL;
365         de = (struct ext2_dir_entry_2 *) page_address(page);
366         while (i < PAGE_SIZE) {
367                 if (!obdfs_check_dir_entry ("ext2_delete_entry", NULL, 
368                                            de, page, i))
369                         return -EIO;
370                 if (de == dir)  {
371                         if (pde)
372                                 pde->rec_len =
373                                         cpu_to_le16(le16_to_cpu(pde->rec_len) +
374                                                     le16_to_cpu(dir->rec_len));
375                         else
376                                 dir->inode = 0;
377                         return 0;
378                 }
379                 i += le16_to_cpu(de->rec_len);
380                 pde = de;
381                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
382         }
383         return -ENOENT;
384 }
385
386
387 static inline void ext2_set_de_type(struct super_block *sb,
388                                 struct ext2_dir_entry_2 *de,
389                                 umode_t mode) {
390         if (!EXT2_HAS_INCOMPAT_FEATURE(sb, EXT2_FEATURE_INCOMPAT_FILETYPE))
391                 return;
392         if (S_ISCHR(mode))
393                 de->file_type = EXT2_FT_CHRDEV;
394         else if (S_ISBLK(mode))
395                 de->file_type = EXT2_FT_BLKDEV;
396         else if (S_ISFIFO(mode))  
397                 de->file_type = EXT2_FT_FIFO;
398         else if (S_ISLNK(mode))
399                 de->file_type = EXT2_FT_SYMLINK;
400         else if (S_ISREG(mode))
401                 de->file_type = EXT2_FT_REG_FILE;
402         else if (S_ISDIR(mode))  
403                 de->file_type = EXT2_FT_DIR;
404 }
405
406
/*
 * Debugging aid (compiled out): print every dentry on the list `dlist'.
 * With `subdirs' set the list is linked through d_child, otherwise
 * through d_alias.
 */
#if 0
static void show_dentry(struct list_head * dlist, int subdirs)
{
        struct list_head *pos;

        for (pos = dlist->next; pos != dlist; pos = pos->next) {
                struct dentry * dentry;
                const char * unhashed;

                dentry = subdirs ? list_entry(pos, struct dentry, d_child)
                                 : list_entry(pos, struct dentry, d_alias);

                unhashed = list_empty(&dentry->d_hash) ? "(unhashed)" : "";

                if ( !dentry->d_inode ) {
                        printk("show_dentry: %s/%s, d_count=%d%s \n",
                               dentry->d_parent->d_name.name,
                               dentry->d_name.name, dentry->d_count,
                               unhashed);
                        continue;
                }

                printk("show_dentry: %s/%s, d_count=%d%s (ino %ld, dev %d, ct %d)\n",
                       dentry->d_parent->d_name.name,
                       dentry->d_name.name, dentry->d_count,
                       unhashed, dentry->d_inode->i_ino,
                       dentry->d_inode->i_dev,
                       dentry->d_inode->i_count);
        }
}
#endif
442
443
444 /*
445  * By the time this is called, we already have created
446  * the directory cache entry for the new file, but it
447  * is so far negative - it has no inode.
448  *
449  * If the create succeeds, we fill in the inode information
450  * with d_instantiate(). 
451  */
452 int obdfs_create (struct inode * dir, struct dentry * dentry, int mode)
453 {
454         struct inode * inode;
455         struct page *page;
456         struct ext2_dir_entry_2 * de;
457         int err = -EIO;
458         ino_t ino;
459
460         ENTRY;
461
462         /*
463          * N.B. Several error exits in ext2_new_inode don't set err.
464          */
465         ino = iops(dir)->o_create(iid(dir), 0, &err);
466         if ( err ) 
467                 return err;
468         err = -EIO;
469         inode =  iget(dir->i_sb, ino);
470         if (!inode || !list_empty(&inode->i_dentry)) {
471                 CDEBUG(D_INODE, "No inode, ino %ld\n", ino);
472                 EXIT;
473                 return err;
474         }
475
476         inode->i_op = &obdfs_file_inode_operations;
477         inode->i_mode = mode;
478         mark_inode_dirty(inode);
479         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
480         if (!page) {
481                 inode->i_nlink--;
482                 mark_inode_dirty(inode);
483                 iput (inode);
484                 EXIT;
485                 return err;
486         }
487         de->inode = cpu_to_le32(inode->i_ino);
488         ext2_set_de_type(dir->i_sb, de, S_IFREG);
489         dir->i_version = ++event;
490         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 0);
491         UnlockPage(page);
492 #if 0
493         if (IS_SYNC(dir)) {
494                 ll_rw_block (WRITE, 1, &bh);
495                 wait_on_buffer (bh);
496         }
497 #endif
498         page_cache_release(page);
499         d_instantiate(dentry, inode);
500         EXIT;
501         return 0;
502 }
503
504 int obdfs_mknod (struct inode * dir, struct dentry *dentry, int mode, int rdev)
505 {
506         struct inode * inode;
507         struct page *page;
508         struct ext2_dir_entry_2 * de;
509         int err = -EIO;
510
511         ino_t ino;
512
513         ENTRY;
514
515         /*
516          * N.B. Several error exits in ext2_new_inode don't set err.
517          */
518         ino = iops(dir)->o_create(iid(dir), 0, &err);
519         if ( ino == -1 ) 
520                 return -1;
521         inode =  iget(dir->i_sb, ino);
522         if (!inode)
523                 return err;
524
525         inode->i_uid = current->fsuid;
526         init_special_inode(inode, mode, rdev);
527         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
528         if (!page)
529                 goto out_no_entry;
530         de->inode = cpu_to_le32(inode->i_ino);
531         dir->i_version = ++event;
532         ext2_set_de_type(dir->i_sb, de, inode->i_mode);
533         mark_inode_dirty(inode);
534         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 0);
535         UnlockPage(page);
536
537 #if 0
538         if (IS_SYNC(dir)) {
539                 ll_rw_block (WRITE, 1, &bh);
540                 wait_on_buffer (bh);
541         }
542 #endif
543         d_instantiate(dentry, inode);
544         page_cache_release(page);
545         err = 0;
546 out:
547         return err;
548
549 out_no_entry:
550         inode->i_nlink--;
551         mark_inode_dirty(inode);
552         iput(inode);
553         goto out;
554 }
555
556 int obdfs_mkdir(struct inode * dir, struct dentry * dentry, int mode)
557 {
558         struct inode * inode;
559         struct page *page, *inode_page;
560         struct ext2_dir_entry_2 * de;
561         int err;
562         ino_t ino;
563
564         ENTRY;
565
566         err = -EMLINK;
567         if (dir->i_nlink >= EXT2_LINK_MAX)
568                 goto out;
569
570         err = -EIO;
571         ino = iops(dir)->o_create(iid(dir), 0, &err);
572         if ( ino == -1 ) 
573                 return -1;
574         inode =  iget(dir->i_sb, ino);
575         if (!inode)
576                 return err;
577
578
579         inode->i_op = &obdfs_dir_inode_operations;
580         inode->i_blocks = 0;    
581         inode_page = obdfs_getpage(inode, 0, 1, LOCKED);
582         if (!inode_page) {
583                 inode->i_nlink--; /* is this nlink == 0? */
584                 mark_inode_dirty(inode);
585                 iput (inode);
586                 return err;
587         }
588
589         /* create . and .. */
590         de = (struct ext2_dir_entry_2 *) page_address(inode_page);
591         de->inode = cpu_to_le32(inode->i_ino);
592         de->name_len = 1;
593         de->rec_len = cpu_to_le16(EXT2_DIR_REC_LEN(de->name_len));
594         strcpy (de->name, ".");
595         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
596         
597         de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
598         de->inode = cpu_to_le32(dir->i_ino);
599         de->rec_len = cpu_to_le16(PAGE_SIZE - EXT2_DIR_REC_LEN(1));
600         de->name_len = 2;
601         strcpy (de->name, "..");
602         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
603         
604         iops(dir)->o_brw(WRITE, iid(dir), inode, inode_page, 1);
605         inode->i_blocks = PAGE_SIZE/inode->i_sb->s_blocksize;
606         inode->i_size = PAGE_SIZE;
607         UnlockPage(inode_page);
608         page_cache_release(inode_page);
609
610         inode->i_nlink = 2;
611         inode->i_mode = S_IFDIR | mode;
612         if (dir->i_mode & S_ISGID)
613                 inode->i_mode |= S_ISGID;
614         mark_inode_dirty(inode);
615
616         /* now deal with the parent */
617         page = obdfs_add_entry(dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
618         if (!page) {
619                 goto out_no_entry;
620         }
621
622         de->inode = cpu_to_le32(inode->i_ino);
623         ext2_set_de_type(dir->i_sb, de, S_IFDIR);
624         dir->i_version = ++event;
625
626 #if 0
627         if (IS_SYNC(dir)) {
628                 ll_rw_block (WRITE, 1, &bh);
629                 wait_on_buffer (bh);
630         }
631 #endif
632         dir->i_nlink++;
633         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
634         mark_inode_dirty(dir);
635         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 1);
636         UnlockPage(page);
637         page_cache_release(page);
638         d_instantiate(dentry, inode);
639         err = 0;
640 out:
641         EXIT;
642         return err;
643
644 out_no_entry:
645         inode->i_nlink = 0;
646         mark_inode_dirty(inode);
647         iput (inode);
648         EXIT;
649         goto out;
650 }
651
652
653 /*
654  * routine to check that the specified directory is empty (for rmdir)
655  */
656 static int empty_dir (struct inode * inode)
657 {
658         unsigned long offset;
659         struct page *page;
660         struct ext2_dir_entry_2 * de, * de1;
661         struct super_block * sb;
662
663         sb = inode->i_sb;
664         if (inode->i_size < EXT2_DIR_REC_LEN(1) + EXT2_DIR_REC_LEN(2) ||
665             !(page = obdfs_getpage (inode, 0, 0, LOCKED))) {
666                 ext2_warning (inode->i_sb, "empty_dir",
667                               "bad directory (dir #%lu) - no data block",
668                               inode->i_ino);
669                 return 1;
670         }
671         de = (struct ext2_dir_entry_2 *) page_address(page);
672         de1 = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
673         if (le32_to_cpu(de->inode) != inode->i_ino || !le32_to_cpu(de1->inode) || 
674             strcmp (".", de->name) || strcmp ("..", de1->name)) {
675                 ext2_warning (inode->i_sb, "empty_dir",
676                               "bad directory (dir #%lu) - no `.' or `..'",
677                               inode->i_ino);
678                 page_cache_release(page);
679                 return 1;
680         }
681         offset = le16_to_cpu(de->rec_len) + le16_to_cpu(de1->rec_len);
682         de = (struct ext2_dir_entry_2 *) ((char *) de1 + le16_to_cpu(de1->rec_len));
683         while (offset < inode->i_size ) {
684                 if (!page || (void *) de >= (void *) (page_address(page) + PAGE_SIZE)) {
685                         if (page) {
686                                 UnlockPage(page);
687                                 page_cache_release(page);
688                         }
689                         page = obdfs_getpage(inode, offset, 0, LOCKED);
690                         if (!page) {
691 #if 0
692                                 ext2_error (sb, "empty_dir",
693                                             "directory #%lu contains a hole at offset %lu",
694                                             inode->i_ino, offset);
695 #endif
696                                 offset += sb->s_blocksize;
697                                 continue;
698                         }
699                         de = (struct ext2_dir_entry_2 *) page_address(page);
700                 }
701                 if (!obdfs_check_dir_entry ("empty_dir", inode, de, page,
702                                            offset)) {
703                         UnlockPage(page);
704                         page_cache_release(page);
705                         return 1;
706                 }
707                 if (le32_to_cpu(de->inode)) {
708                         UnlockPage(page);
709                         page_cache_release(page);
710                         return 0;
711                 }
712                 offset += le16_to_cpu(de->rec_len);
713                 de = (struct ext2_dir_entry_2 *) ((char *) de + le16_to_cpu(de->rec_len));
714         }
715         UnlockPage(page);
716         page_cache_release(page);
717         return 1;
718 }
719
720 int obdfs_rmdir (struct inode * dir, struct dentry *dentry)
721 {
722         int retval;
723         struct inode * inode;
724         struct page *page;
725         struct ext2_dir_entry_2 * de;
726
727         ENTRY;
728
729         retval = -ENOENT;
730         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
731         if (!page)
732                 goto end_rmdir;
733
734         inode = dentry->d_inode;
735         DQUOT_INIT(inode);
736
737         retval = -EIO;
738         if (le32_to_cpu(de->inode) != inode->i_ino)
739                 goto end_rmdir;
740
741         retval = -ENOTEMPTY;
742         if (!empty_dir (inode))
743                 goto end_rmdir;
744
745         retval = obdfs_delete_entry (de, page);
746         dir->i_version = ++event;
747         if (retval)
748                 goto end_rmdir;
749         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 0);
750         UnlockPage(page);
751 #if 0
752         if (IS_SYNC(dir)) {
753                 ll_rw_block (WRITE, 1, &bh);
754                 wait_on_buffer (bh);
755         }
756 #endif
757         if (inode->i_nlink != 2)
758                 ext2_warning (inode->i_sb, "ext2_rmdir",
759                               "empty directory has nlink!=2 (%d)",
760                               inode->i_nlink);
761         inode->i_version = ++event;
762         inode->i_nlink = 0;
763         inode->i_size = 0;
764         mark_inode_dirty(inode);
765         dir->i_nlink--;
766         inode->i_ctime = dir->i_ctime = dir->i_mtime = CURRENT_TIME;
767         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
768         mark_inode_dirty(dir);
769         d_delete(dentry);
770
771 end_rmdir:
772         if ( page )
773                 page_cache_release(page);
774         EXIT;
775         return retval;
776 }
777
778 int obdfs_unlink(struct inode * dir, struct dentry *dentry)
779 {
780         int retval;
781         struct inode * inode;
782         struct page *page;
783         struct ext2_dir_entry_2 * de;
784
785         ENTRY;
786
787         retval = -ENOENT;
788         page = obdfs_find_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, LOCKED);
789         if (!page)
790                 goto end_unlink;
791
792         inode = dentry->d_inode;
793         DQUOT_INIT(inode);
794
795         retval = -EIO;
796         if (le32_to_cpu(de->inode) != inode->i_ino)
797                 goto end_unlink;
798         
799         if (!inode->i_nlink) {
800                 ext2_warning (inode->i_sb, "ext2_unlink",
801                               "Deleting nonexistent file (%lu), %d",
802                               inode->i_ino, inode->i_nlink);
803                 inode->i_nlink = 1;
804         }
805         retval = obdfs_delete_entry (de, page);
806         if (retval)
807                 goto end_unlink;
808         dir->i_version = ++event;
809         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 0);
810         UnlockPage(page);
811 #if 0
812         if (IS_SYNC(dir)) {
813                 ll_rw_block (WRITE, 1, &bh);
814                 wait_on_buffer (bh);
815         }
816 #endif
817         dir->i_ctime = dir->i_mtime = CURRENT_TIME;
818         dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
819         mark_inode_dirty(dir);
820         inode->i_nlink--;
821         mark_inode_dirty(inode);
822         inode->i_ctime = dir->i_ctime;
823         retval = 0;
824         d_delete(dentry);       /* This also frees the inode */
825
826 end_unlink:
827         if (page)
828                 page_cache_release(page);
829         EXIT;
830         return retval;
831 }
832
833 int obdfs_symlink (struct inode * dir, struct dentry *dentry, const char * symname)
834 {
835         struct ext2_dir_entry_2 * de;
836         struct inode * inode;
837         struct page* page = NULL, * name_page = NULL;
838         char * link;
839         int i, l, err = -EIO;
840         char c;
841         ino_t ino;
842
843         ENTRY;
844         /*
845          * N.B. Several error exits in ext2_new_inode don't set err.
846          */
847         ino = iops(dir)->o_create(iid(dir), 0, &err);
848         if ( ino == -1 )  {
849                 EXIT;
850                 return -1;
851         }
852         inode =  iget(dir->i_sb, ino);
853         if (!inode) {
854                 EXIT;
855                 return err;
856         }
857         inode->i_mode = S_IFLNK | S_IRWXUGO;
858         inode->i_op = &obdfs_symlink_inode_operations;
859         for (l = 0; l < inode->i_sb->s_blocksize - 1 &&
860              symname [l]; l++)
861                 ;
862
863         /* For obdfs we always use normal (not fast) symlinks
864         if (l >= sizeof (inode->u.ext2_i.i_data)) { */
865                 CDEBUG(D_INODE, "l=%d, normal symlink\n", l);
866
867                 name_page = obdfs_getpage(inode, 0, 1, LOCKED);
868                 if (!name_page) {
869                         inode->i_nlink--;
870                         mark_inode_dirty(inode);
871                         iput (inode);
872                         EXIT;
873                         return err;
874                 }
875                 link = (char *)page_address(name_page);
876         /* } else {
877                 link = (char *) inode->u.ext2_i.i_data;
878
879                 CDEBUG(D_INODE, "l=%d, fast symlink\n", l);
880
881         } */
882         i = 0;
883         while (i < inode->i_sb->s_blocksize - 1 && (c = *(symname++)))
884                 link[i++] = c;
885         link[i] = 0;
886         if (name_page) {
887                 iops(inode)->o_brw(WRITE, iid(inode), inode, name_page, 1);
888                 PDEBUG(name_page, "symlink");
889                 UnlockPage(name_page);
890                 page_cache_release(name_page);
891         }
892         inode->i_size = i;
893         mark_inode_dirty(inode);
894
895         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
896         if (!page)
897                 goto out_no_entry;
898         de->inode = cpu_to_le32(inode->i_ino);
899         ext2_set_de_type(dir->i_sb, de, S_IFLNK);
900         dir->i_version = ++event;
901         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 1);
902         UnlockPage(page);
903 #if 0
904         if (IS_SYNC(dir)) {
905                 ll_rw_block (WRITE, 1, &bh);
906                 wait_on_buffer (bh);
907         }
908 #endif
909         d_instantiate(dentry, inode);
910         err = 0;
911 out:
912         EXIT;
913         return err;
914
915 out_no_entry:
916         inode->i_nlink--;
917         mark_inode_dirty(inode);
918         iput (inode);
919         goto out;
920 }
921
922 int obdfs_link (struct dentry * old_dentry,
923                 struct inode * dir, struct dentry *dentry)
924 {
925         struct inode *inode = old_dentry->d_inode;
926         struct ext2_dir_entry_2 * de;
927         struct page *page;
928         int err;
929
930         ENTRY;
931
932         if (S_ISDIR(inode->i_mode))
933                 return -EPERM;
934
935         if (inode->i_nlink >= EXT2_LINK_MAX)
936                 return -EMLINK;
937
938         page = obdfs_add_entry (dir, dentry->d_name.name, dentry->d_name.len, &de, &err);
939         if (!page)
940                 return err;
941
942         de->inode = cpu_to_le32(inode->i_ino);
943         ext2_set_de_type(dir->i_sb, de, inode->i_mode);
944         dir->i_version = ++event;
945         iops(dir)->o_brw(WRITE, iid(dir), dir, page, 0);
946         UnlockPage(page);
947
948 #if 0
949         if (IS_SYNC(dir)) {
950                 ll_rw_block (WRITE, 1, &bh);
951                 wait_on_buffer (bh);
952         }
953 #endif
954         page_cache_release(page);
955         inode->i_nlink++;
956         inode->i_ctime = CURRENT_TIME;
957         mark_inode_dirty(inode);
958         inode->i_count++;
959         d_instantiate(dentry, inode);
960         return 0;
961 }
962
/*
 * PARENT_INO(buffer) - the inode field of the second directory entry in
 * @buffer, i.e. the entry found rec_len bytes after the first one.  The
 * result is an lvalue holding the raw on-disk value.
 *
 * @buffer is evaluated twice, so it must not have side effects.
 */
#define PARENT_INO(buffer) \
        ((struct ext2_dir_entry_2 *) ((char *) (buffer) + \
        le16_to_cpu(((struct ext2_dir_entry_2 *) (buffer))->rec_len)))->inode
966
967 /*
968  * Anybody can rename anything with this: the permission checks are left to the
969  * higher-level routines.
970  */
971 int obdfs_rename (struct inode * old_dir, struct dentry *old_dentry,
972                            struct inode * new_dir, struct dentry *new_dentry)
973 {
974         struct inode * old_inode, * new_inode;
975         struct page * old_page, * new_page, * dir_page;
976         struct ext2_dir_entry_2 * old_de, * new_de;
977         int retval;
978
979         ENTRY;
980
981         new_page = dir_page = NULL;
982
983         /* does the old entry exist? - if not get out */
984         old_page = obdfs_find_entry (old_dir, old_dentry->d_name.name, old_dentry->d_name.len, &old_de, NOLOCK);
985         PDEBUG(old_page, "rename - old page");
986         /*
987          *  Check for inode number is _not_ due to possible IO errors.
988          *  We might rmdir the source, keep it as pwd of some process
989          *  and merrily kill the link to whatever was created under the
990          *  same name. Goodbye sticky bit ;-<
991          */
992         old_inode = old_dentry->d_inode;
993         retval = -ENOENT;
994         if (!old_page || le32_to_cpu(old_de->inode) != old_inode->i_ino)
995                 goto end_rename;
996
997         /* find new inode */
998         new_inode = new_dentry->d_inode;
999         new_page = obdfs_find_entry (new_dir, new_dentry->d_name.name,
1000                                 new_dentry->d_name.len, &new_de, NOLOCK);
1001         PDEBUG(new_page, "rename - new page ");
1002         if (new_page) {
1003                 if (!new_inode) {
1004                         page_cache_release(new_page);
1005                         new_page = NULL;
1006                 } else {
1007                         DQUOT_INIT(new_inode);
1008                 }
1009         }
1010         /* in this case we to check more ... */
1011         if (S_ISDIR(old_inode->i_mode)) {
1012                 /* can only rename into empty new directory */
1013                 if (new_inode) {
1014                         retval = -ENOTEMPTY;
1015                         if (!empty_dir (new_inode))
1016                                 goto end_rename;
1017                 }
1018                 retval = -EIO;
1019                 dir_page= obdfs_getpage (old_inode, 0, 0, LOCKED);
1020                 PDEBUG(dir_page, "rename dir page");
1021
1022                 if (!dir_page)
1023                         goto end_rename;
1024                 if (le32_to_cpu(PARENT_INO(page_address(dir_page))) != old_dir->i_ino)
1025                         goto end_rename;
1026                 retval = -EMLINK;
1027                 if (!new_inode && new_dir!=old_dir &&
1028                                 new_dir->i_nlink >= EXT2_LINK_MAX)
1029                         goto end_rename;
1030         }
1031         /* create the target dir entry */
1032         if (!new_page) {
1033                 new_page = obdfs_add_entry (new_dir, new_dentry->d_name.name,
1034                                         new_dentry->d_name.len, &new_de,
1035                                         &retval);
1036                 PDEBUG(new_page, "rename new page");
1037                 if (!new_page)
1038                         goto end_rename;
1039         }
1040         new_dir->i_version = ++event;
1041
1042         /*
1043          * remove the old entry
1044          */
1045         new_de->inode = le32_to_cpu(old_inode->i_ino);
1046         if (EXT2_HAS_INCOMPAT_FEATURE(new_dir->i_sb,
1047                                       EXT2_FEATURE_INCOMPAT_FILETYPE))
1048                 new_de->file_type = old_de->file_type;
1049         
1050         obdfs_delete_entry (old_de, old_page);
1051
1052         old_dir->i_version = ++event;
1053         if (new_inode) {
1054                 new_inode->i_nlink--;
1055                 new_inode->i_ctime = CURRENT_TIME;
1056                 mark_inode_dirty(new_inode);
1057         }
1058         old_dir->i_ctime = old_dir->i_mtime = CURRENT_TIME;
1059         old_dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
1060         mark_inode_dirty(old_dir);
1061         if (dir_page) {
1062                 PARENT_INO(page_address(dir_page)) = le32_to_cpu(new_dir->i_ino);
1063                 iops(old_inode)->o_brw(WRITE, iid(old_inode), old_inode, dir_page, 0);
1064                 old_dir->i_nlink--;
1065                 mark_inode_dirty(old_dir);
1066                 if (new_inode) {
1067                         new_inode->i_nlink--;
1068                         mark_inode_dirty(new_inode);
1069                 } else {
1070                         new_dir->i_nlink++;
1071                         new_dir->u.ext2_i.i_flags &= ~EXT2_BTREE_FL;
1072                         mark_inode_dirty(new_dir);
1073                 }
1074         }
1075         if ( old_page != new_page ) {
1076                 unsigned long index = old_page->index;
1077                 /* lock the old_page and release unlocked copy */
1078                 CDEBUG(D_INODE, "old_page at %p\n", old_page);
1079                 page_cache_release(old_page);
1080                 old_page = obdfs_getpage(old_dir, index >> PAGE_SHIFT, 0, LOCKED);
1081                 CDEBUG(D_INODE, "old_page at %p\n", old_page);
1082                 iops(old_dir)->o_brw(WRITE, iid(old_dir), old_dir, old_page,0);
1083         }
1084 #if 0
1085         if (IS_SYNC(old_dir)) {
1086                 ll_rw_block (WRITE, 1, &old_bh);
1087                 wait_on_buffer (old_bh);
1088         }
1089 #endif
1090         iops(new_dir)->o_brw(WRITE, iid(new_dir), new_dir, new_page, 0);
1091 #if 0
1092         if (IS_SYNC(new_dir)) {
1093                 ll_rw_block (WRITE, 1, &new_bh);
1094                 wait_on_buffer (new_bh);
1095         }
1096 #endif
1097
1098         retval = 0;
1099
1100 end_rename:
1101         if (old_page && PageLocked(old_page) )
1102                 UnlockPage(old_page);
1103         if (old_page)
1104                 page_cache_release(old_page);
1105         if (new_page && PageLocked(new_page) )
1106                 UnlockPage(new_page);
1107         if (new_page)
1108                 page_cache_release(new_page);
1109         if (dir_page && PageLocked(dir_page) )
1110                 UnlockPage(dir_page);
1111         if (dir_page)
1112                 page_cache_release(dir_page);
1113
1114
1115         return retval;
1116 }