Whamcloud - gitweb
- Fixed serious LDLM bugs, including mistaking the lock _type_ for the lock
[fs/lustre-release.git] / lustre / llite / namei.c
1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2  * vim:expandtab:shiftwidth=8:tabstop=8:
3  *
4  * This code is issued under the GNU General Public License.
5  * See the file COPYING in this distribution
6  *
7  * Copyright (C) 1992, 1993, 1994, 1995
8  * Remy Card (card@masi.ibp.fr)
9  * Laboratoire MASI - Institut Blaise Pascal
10  * Universite Pierre et Marie Curie (Paris VI)
11  *
12  *  from
13  *
14  *  linux/fs/ext2/namei.c
15  *
16  *  Copyright (C) 1991, 1992  Linus Torvalds
17  *
18  *  Big-endian to little-endian byte-swapping/bitmaps by
19  *        David S. Miller (davem@caip.rutgers.edu), 1995
20  *  Directory entry file type support and forward compatibility hooks
21  *      for B-tree directories by Theodore Ts'o (tytso@mit.edu), 1998
22  *
23  *  Changes for use in OBDFS
24  *  Copyright (c) 1999, Seagate Technology Inc.
25  *  Copyright (C) 2001, Cluster File Systems, Inc.
26  *                       Rewritten based on recent ext2 page cache use.
27  *
28  */
29
30 #include <linux/fs.h>
31 #include <linux/locks.h>
32 #include <linux/quotaops.h>
33
34 #define DEBUG_SUBSYSTEM S_LLITE
35
36 #include <linux/obd_support.h>
37 #include <linux/lustre_lite.h>
38 #include <linux/lustre_dlm.h>
39 extern struct address_space_operations ll_aops;
40
41 /* from super.c */
42 extern void ll_change_inode(struct inode *inode);
43 extern int ll_setattr(struct dentry *de, struct iattr *attr);
44
45 /* from dir.c */
46 extern int ll_add_link (struct dentry *dentry, struct inode *inode);
47 ino_t ll_inode_by_name(struct inode * dir, struct dentry *dentry, int *typ);
48 int ext2_make_empty(struct inode *inode, struct inode *parent);
49 struct ext2_dir_entry_2 * ext2_find_entry (struct inode * dir,
50                    struct dentry *dentry, struct page ** res_page);
51 int ext2_delete_entry (struct ext2_dir_entry_2 * dir, struct page * page );
52 int ext2_empty_dir (struct inode * inode);
53 struct ext2_dir_entry_2 * ext2_dotdot (struct inode *dir, struct page **p);
54 void ext2_set_link(struct inode *dir, struct ext2_dir_entry_2 *de,
55                    struct page *page, struct inode *inode);
56
57 /*
58  * Couple of helper functions - make the code slightly cleaner.
59  */
60 static inline void ext2_inc_count(struct inode *inode)
61 {
62         inode->i_nlink++;
63 }
64
65 /* postpone the disk update until the inode really goes away */
66 static inline void ext2_dec_count(struct inode *inode)
67 {
68         inode->i_nlink--;
69 }
70
/*
 * Link @inode into the directory under @dentry's name and bind it to the
 * dentry.
 *
 * Returns 0 on success.  On failure the error from ll_add_link() is
 * returned after one link count and one reference on @inode have been
 * dropped, so callers must not repeat that cleanup.
 */
static inline int ext2_add_nondir(struct dentry *dentry, struct inode *inode)
{
        int rc = ll_add_link(dentry, inode);

        if (rc) {
                /* could not add the directory entry: back out */
                ext2_dec_count(inode);
                iput(inode);
                return rc;
        }

        d_instantiate(dentry, inode);
        return 0;
}
83
84 /* methods */
85 static int ll_find_inode(struct inode *inode, unsigned long ino, void *opaque)
86 {
87         struct mds_body *body = (struct mds_body *)opaque;
88
89         if (inode->i_generation != body->generation)
90                 return 0;
91
92         return 1;
93 }
94
95 extern struct dentry_operations ll_d_ops;
96
97 int ll_lock(struct inode *dir, struct dentry *dentry,
98             struct lookup_intent *it, struct lustre_handle *lockh)
99 {
100         struct ll_sb_info *sbi = ll_i2sbi(dir);
101         int err;
102
103         if ((it->it_op & (IT_CREAT | IT_MKDIR | IT_SYMLINK | IT_SETATTR |
104                           IT_MKNOD)) )
105                 err = mdc_enqueue(&sbi->ll_mdc_conn, LDLM_MDSINTENT,
106                                   it, LCK_PW, dir, dentry, lockh, 0, NULL, 0,
107                                   dir, sizeof(*dir));
108         else if (it->it_op & (IT_READDIR | IT_GETATTR | IT_OPEN))
109                 err = mdc_enqueue(&sbi->ll_mdc_conn, LDLM_MDSINTENT,
110                                   it, LCK_PR, dir, dentry, lockh, 0, NULL, 0,
111                                   dir, sizeof(*dir));
112         else
113                 LBUG();
114
115         RETURN(err);
116 }
117
118 int ll_unlock(__u32 mode, struct lustre_handle *lockh)
119 {
120         struct ldlm_lock *lock;
121         ENTRY;
122
123         lock = lustre_handle2object(lockh);
124         ldlm_lock_decref(lock, mode);
125
126         RETURN(0);
127 }
128
129 static struct dentry *ll_lookup2(struct inode * dir, struct dentry *dentry,
130                                  struct lookup_intent *it)
131 {
132         struct ptlrpc_request *request = NULL;
133         struct inode * inode = NULL;
134         struct ll_sb_info *sbi = ll_i2sbi(dir);
135         struct ll_inode_md md;
136         struct lustre_handle lockh;
137         int err, type, offset;
138         ino_t ino;
139
140         ENTRY;
141
142         CDEBUG(D_INFO, "name: %*s, intent op: %d\n", dentry->d_name.len,
143                dentry->d_name.name, it->it_op);
144
145         if (dentry->d_name.len > EXT2_NAME_LEN)
146                 RETURN(ERR_PTR(-ENAMETOOLONG));
147
148         err = ll_lock(dir, dentry, it, &lockh);
149         memcpy(it->it_lock_handle, &lockh, sizeof(lockh));
150
151         if ( (it->it_op & (IT_CREAT | IT_MKDIR | IT_SYMLINK | IT_MKNOD)) &&
152              it->it_disposition && !it->it_status)
153                 GOTO(negative, NULL);
154
155         if ( (it->it_op & (IT_GETATTR)) &&
156              it->it_disposition && it->it_status)
157                 GOTO(negative, NULL);
158
159         if (!it->it_disposition) {
160                 struct ll_inode_info *lli = ll_i2info(dir);
161                 memcpy(&lli->lli_intent_lock_handle, &lockh, sizeof(lockh));
162
163                 ino = ll_inode_by_name(dir, dentry, &type);
164
165                 err = mdc_getattr(&sbi->ll_mdc_conn, ino, type,
166                                   OBD_MD_FLNOTOBD|OBD_MD_FLBLOCKS, 0, &request);
167                 if (err) {
168                         CERROR("failure %d inode %ld\n", err, (long)ino);
169                         ptlrpc_free_req(request);
170                         RETURN(ERR_PTR(-abs(err)));
171                 }
172                 offset = 0;
173         } else {
174                 struct mds_body *body;
175
176                 offset = 1;
177                 request = (struct ptlrpc_request *)it->it_data;
178                 body = lustre_msg_buf(request->rq_repmsg, 1);
179                 type = body->mode;
180         }
181
182         if (S_ISREG(type)) {
183                 if (request->rq_repmsg->bufcount < offset + 2 ||
184                     request->rq_repmsg->buflens[offset + 1] !=
185                     sizeof(struct obdo))
186                         LBUG();
187
188                 md.obdo = lustre_msg_buf(request->rq_repmsg, offset + 1);
189         } else
190                 md.obdo = NULL;
191
192         md.body = lustre_msg_buf(request->rq_repmsg, offset);
193
194         inode = iget4(dir->i_sb, ino, ll_find_inode, &md);
195
196         if (it->it_op & IT_RENAME)
197                 it->it_data = dentry;
198
199         ptlrpc_free_req(request);
200         if (!inode)
201                 RETURN(ERR_PTR(-ENOMEM));
202
203         EXIT;
204  negative:
205         dentry->d_op = &ll_d_ops;
206         d_add(dentry, inode);
207         return NULL;
208 }
209
210 static struct inode *ll_create_node(struct inode *dir, const char *name,
211                                     int namelen, const char *tgt, int tgtlen,
212                                     int mode, __u64 extra,
213                                     struct lookup_intent *it, struct obdo *obdo)
214 {
215         struct inode *inode;
216         struct ptlrpc_request *request = NULL;
217         struct mds_body *body;
218         int rc;
219         time_t time = CURRENT_TIME;
220         struct ll_sb_info *sbi = ll_i2sbi(dir);
221         struct ll_inode_md md;
222
223         ENTRY;
224
225         if (!it->it_disposition) {
226                 rc = mdc_create(&sbi->ll_mdc_conn, dir, name, namelen, tgt,
227                                  tgtlen, mode, current->fsuid,
228                                  current->fsgid, time, extra, obdo, &request);
229                 if (rc) {
230                         inode = ERR_PTR(rc);
231                         GOTO(out, rc);
232                 }
233                 body = lustre_msg_buf(request->rq_repmsg, 0);
234                 md.obdo = obdo;
235         } else {
236                 request = it->it_data;
237                 body = lustre_msg_buf(request->rq_repmsg, 1);
238                 md.obdo = NULL;
239         }
240
241         body->valid = (__u32)OBD_MD_FLNOTOBD;
242
243         body->nlink = 1;
244         body->atime = body->ctime = body->mtime = time;
245         body->uid = current->fsuid;
246         body->gid = current->fsgid;
247         body->mode = mode;
248
249         md.body = body;
250
251         inode = iget4(dir->i_sb, body->ino, ll_find_inode, &md);
252         if (IS_ERR(inode)) {
253                 CERROR("new_inode -fatal:  %ld\n", PTR_ERR(inode));
254                 inode = ERR_PTR(-EIO);
255                 LBUG();
256                 GOTO(out, -EIO);
257         }
258
259         if (!list_empty(&inode->i_dentry)) {
260                 CERROR("new_inode -fatal: inode %d, ct %d lnk %d\n",
261                        body->ino, atomic_read(&inode->i_count),
262                        inode->i_nlink);
263                 iput(inode);
264                 LBUG();
265                 inode = ERR_PTR(-EIO);
266                 GOTO(out, -EIO);
267         }
268
269         EXIT;
270  out:
271         ptlrpc_free_req(request);
272         return inode;
273 }
274
275 int ll_mdc_unlink(struct inode *dir, struct inode *child,
276                   const char *name, int len)
277 {
278         struct ptlrpc_request *request = NULL;
279         int err;
280         struct ll_sb_info *sbi = ll_i2sbi(dir);
281
282         ENTRY;
283
284         err = mdc_unlink(&sbi->ll_mdc_conn, dir, child,
285                          name, len, &request);
286         ptlrpc_free_req(request);
287
288         RETURN(err);
289 }
290
291 int ll_mdc_link(struct dentry *src, struct inode *dir,
292                 const char *name, int len)
293 {
294         struct ptlrpc_request *request = NULL;
295         int err;
296         struct ll_sb_info *sbi = ll_i2sbi(dir);
297
298         ENTRY;
299
300         err = mdc_link(&sbi->ll_mdc_conn, src, dir, name,
301                        len, &request);
302         ptlrpc_free_req(request);
303
304         RETURN(err);
305 }
306
307 int ll_mdc_rename(struct inode *src, struct inode *tgt,
308                   struct dentry *old, struct dentry *new)
309 {
310         struct ptlrpc_request *request = NULL;
311         struct ll_sb_info *sbi = ll_i2sbi(src);
312         int err;
313
314         ENTRY;
315
316         err = mdc_rename(&sbi->ll_mdc_conn, src, tgt,
317                          old->d_name.name, old->d_name.len,
318                          new->d_name.name, new->d_name.len, &request);
319         ptlrpc_free_req(request);
320
321         RETURN(err);
322 }
323
324 /*
325  * By the time this is called, we already have created
326  * the directory cache entry for the new file, but it
327  * is so far negative - it has no inode.
328  *
329  * If the create succeeds, we fill in the inode information
330  * with d_instantiate().
331  */
332
333 static int ll_create(struct inode * dir, struct dentry * dentry, int mode)
334 {
335         int rc = 0;
336         struct obdo oa;
337         struct inode *inode;
338
339         if (dentry->d_it->it_disposition == 0) {
340                 memset(&oa, 0, sizeof(oa));
341                 oa.o_valid = OBD_MD_FLMODE;
342                 oa.o_mode = S_IFREG | 0600;
343                 rc = obd_create(ll_i2obdconn(dir), &oa);
344                 if (rc)
345                         RETURN(rc);
346         }
347
348         mode = mode | S_IFREG;
349         CDEBUG(D_DENTRY, "name %s mode %o o_id %lld\n",
350                dentry->d_name.name, mode, (unsigned long long)oa.o_id);
351         inode = ll_create_node(dir, dentry->d_name.name, dentry->d_name.len,
352                                NULL, 0, mode, 0, dentry->d_it, &oa);
353
354         if (IS_ERR(inode)) {
355                 rc = PTR_ERR(inode);
356                 CERROR("error creating MDS object for id %Ld: rc = %d\n",
357                        (unsigned long long)oa.o_id, rc);
358                 GOTO(out_destroy, rc);
359         }
360
361         // XXX clean up the object
362         inode->i_op = &ll_file_inode_operations;
363         inode->i_fop = &ll_file_operations;
364         inode->i_mapping->a_ops = &ll_aops;
365
366         if (dentry->d_it->it_disposition) {
367                 struct ll_inode_info *ii = ll_i2info(inode);
368                 ii->lli_flags |= OBD_FL_CREATEONOPEN;
369                 memcpy(&ii->lli_intent_lock_handle,
370                        dentry->d_it->it_lock_handle,
371                        sizeof(struct lustre_handle));
372         }
373
374         /* no directory data updates when intents rule */
375         if (dentry->d_it->it_disposition == 0)
376                 rc = ext2_add_nondir(dentry, inode);
377         else
378                 d_instantiate(dentry, inode);
379         RETURN(rc);
380
381 out_destroy:
382         rc = obd_destroy(ll_i2obdconn(dir), &oa);
383         if (rc)
384                 CERROR("error destroying object %Ld in error path: err = %d\n",
385                        (unsigned long long)oa.o_id, rc);
386         return rc;
387 }
388
389 static int ll_mknod(struct inode *dir, struct dentry *dentry, int mode,
390                     int rdev)
391 {
392         struct inode * inode = ll_create_node(dir, dentry->d_name.name,
393                                               dentry->d_name.len, NULL, 0,
394                                               mode, rdev, NULL, NULL);
395         int err = PTR_ERR(inode);
396         if (!IS_ERR(inode)) {
397                 init_special_inode(inode, mode, rdev);
398                 err = ext2_add_nondir(dentry, inode);
399         }
400         return err;
401 }
402
403 static int ll_symlink(struct inode *dir, struct dentry *dentry,
404                       const char *symname)
405 {
406         int err = -ENAMETOOLONG;
407         unsigned l = strlen(symname);
408         struct inode * inode;
409         struct ll_inode_info *oinfo;
410
411         if (l > LL_INLINESZ)
412                 return err;
413
414         inode = ll_create_node(dir, dentry->d_name.name,
415                                dentry->d_name.len, symname, l,
416                                S_IFLNK | S_IRWXUGO, 0, dentry->d_it, NULL);
417         err = PTR_ERR(inode);
418         if (IS_ERR(inode))
419                 return err;
420
421         oinfo = ll_i2info(inode);
422
423         inode->i_op = &ll_fast_symlink_inode_operations;
424         memcpy(oinfo->lli_inline, symname, l);
425         inode->i_size = l-1;
426
427         err = ext2_add_nondir(dentry, inode);
428
429         if (err) {
430                 ext2_dec_count(inode);
431                 iput (inode);
432         }
433         return err;
434 }
435
436 static int ll_link(struct dentry * old_dentry, struct inode * dir,
437                    struct dentry *dentry)
438 {
439         int err;
440         struct inode *inode = old_dentry->d_inode;
441
442         if (S_ISDIR(inode->i_mode))
443                 return -EPERM;
444
445         if (inode->i_nlink >= EXT2_LINK_MAX)
446                 return -EMLINK;
447
448         err = ll_mdc_link(old_dentry, dir,
449                           dentry->d_name.name, dentry->d_name.len);
450         if (err) {
451                 EXIT;
452                 return err;
453         }
454
455         inode->i_ctime = CURRENT_TIME;
456         ext2_inc_count(inode);
457         atomic_inc(&inode->i_count);
458
459         return ext2_add_nondir(dentry, inode);
460 }
461
462 static int ll_mkdir(struct inode * dir, struct dentry * dentry, int mode)
463 {
464         struct inode * inode;
465         int err = -EMLINK;
466         ENTRY;
467
468         if (dir->i_nlink >= EXT2_LINK_MAX)
469                 goto out;
470
471         ext2_inc_count(dir);
472
473         inode = ll_create_node (dir, dentry->d_name.name,
474                                 dentry->d_name.len, NULL, 0,
475                                 S_IFDIR | mode, 0, dentry->d_it, NULL);
476         err = PTR_ERR(inode);
477         if (IS_ERR(inode))
478                 goto out_dir;
479
480         inode->i_op = &ll_dir_inode_operations;
481         inode->i_fop = &ll_dir_operations;
482         inode->i_mapping->a_ops = &ll_aops;
483         inode->i_nlink = 1;
484         ext2_inc_count(inode);
485
486         err = ext2_make_empty(inode, dir);
487         if (err)
488                 goto out_fail;
489
490         /* no directory data updates when intents rule */
491         if (dentry->d_it->it_disposition == 0) {
492                 err = ll_add_link(dentry, inode);
493                 if (err)
494                         goto out_fail;
495         }
496
497         d_instantiate(dentry, inode);
498 out:
499         EXIT;
500         return err;
501
502 out_fail:
503         ext2_dec_count(inode);
504         ext2_dec_count(inode);
505         iput(inode);
506         EXIT;
507 out_dir:
508         ext2_dec_count(dir);
509         EXIT;
510         goto out;
511 }
512
513 static int ll_unlink(struct inode * dir, struct dentry *dentry)
514 {
515         struct inode * inode = dentry->d_inode;
516         struct ext2_dir_entry_2 * de;
517         struct page * page;
518         int err = -ENOENT;
519
520         de = ext2_find_entry (dir, dentry, &page);
521         if (!de)
522                 goto out;
523
524         err = ll_mdc_unlink(dir, dentry->d_inode,
525                             dentry->d_name.name, dentry->d_name.len);
526         if (err)
527                 goto out;
528
529         err = ext2_delete_entry (de, page);
530         if (err)
531                 goto out;
532
533         inode->i_ctime = dir->i_ctime;
534         ext2_dec_count(inode);
535         err = 0;
536 out:
537         return err;
538 }
539
540 static int ll_rmdir(struct inode * dir, struct dentry *dentry)
541 {
542         struct inode * inode = dentry->d_inode;
543         int err = -ENOTEMPTY;
544
545         if (ext2_empty_dir(inode)) {
546                 err = ll_unlink(dir, dentry);
547                 if (!err) {
548                         inode->i_size = 0;
549                         ext2_dec_count(inode);
550                         ext2_dec_count(dir);
551                 }
552         }
553         return err;
554 }
555
/*
 * Rename @old_dentry in @old_dir to @new_dentry in @new_dir.
 *
 * If @new_dentry carries a lookup intent, the status of the request
 * attached to that intent is returned and nothing is done locally.
 * Otherwise the MDS is asked to perform the rename and, on success, the
 * local directory data and link counts are updated to match.
 *
 * Returns 0 on success or an error code.
 */
static int ll_rename (struct inode * old_dir, struct dentry * old_dentry,
                      struct inode * new_dir, struct dentry * new_dentry )
{
        struct inode * old_inode = old_dentry->d_inode;
        struct inode * new_inode = new_dentry->d_inode;
        struct page * dir_page = NULL;
        struct ext2_dir_entry_2 * dir_de = NULL;
        struct page * old_page;
        struct ext2_dir_entry_2 * old_de;
        int err = -ENOENT;

        /* an intent is attached: report the status of its request */
        if (new_dentry->d_it) {
                struct ptlrpc_request *req = new_dentry->d_it->it_data;
                err = req->rq_status;
                goto out;
        }

        err = ll_mdc_rename(old_dir, new_dir, old_dentry, new_dentry);
        if (err)
                goto out;

        /* NOTE(review): err is 0 at this point, so a missing local entry
         * makes the function return 0 rather than -ENOENT - confirm that
         * this is intended */
        old_de = ext2_find_entry (old_dir, old_dentry, &old_page);
        if (!old_de)
                goto out;

        /* moving a directory: its ".." entry has to be re-pointed later */
        if (S_ISDIR(old_inode->i_mode)) {
                err = -EIO;
                dir_de = ext2_dotdot(old_inode, &dir_page);
                if (!dir_de)
                        goto out_old;
        }

        if (new_inode) {
                /* the target name exists: replace its entry */
                struct page *new_page;
                struct ext2_dir_entry_2 *new_de;

                err = -ENOTEMPTY;
                if (dir_de && !ext2_empty_dir (new_inode))
                        goto out_dir;

                err = -ENOENT;
                new_de = ext2_find_entry (new_dir, new_dentry, &new_page);
                if (!new_de)
                        goto out_dir;
                ext2_inc_count(old_inode);
                ext2_set_link(new_dir, new_de, new_page, old_inode);
                new_inode->i_ctime = CURRENT_TIME;
                /* a replaced directory loses one extra link */
                if (dir_de)
                        new_inode->i_nlink--;
                ext2_dec_count(new_inode);
        } else {
                /* the target name is free: add a new entry */
                if (dir_de) {
                        err = -EMLINK;
                        if (new_dir->i_nlink >= EXT2_LINK_MAX)
                                goto out_dir;
                }
                ext2_inc_count(old_inode);
                err = ll_add_link(new_dentry, old_inode);
                if (err) {
                        ext2_dec_count(old_inode);
                        goto out_dir;
                }
                /* the moved directory adds a link to its new parent */
                if (dir_de)
                        ext2_inc_count(new_dir);
        }

        /* remove the old name and drop the temporary link taken above */
        ext2_delete_entry (old_de, old_page);
        ext2_dec_count(old_inode);

        if (dir_de) {
                /* point ".." at the new parent; the old parent loses a link */
                ext2_set_link(old_inode, dir_de, dir_page, new_dir);
                ext2_dec_count(old_dir);
        }
        return 0;

        /* error paths: release the pages still held, innermost first */
out_dir:
        if (dir_de) {
                kunmap(dir_page);
                page_cache_release(dir_page);
        }
out_old:
        kunmap(old_page);
        page_cache_release(old_page);
out:
        return err;
}
642
643 struct inode_operations ll_dir_inode_operations = {
644         create:         ll_create,
645         lookup2:        ll_lookup2,
646         link:           ll_link,
647         unlink:         ll_unlink,
648         symlink:        ll_symlink,
649         mkdir:          ll_mkdir,
650         rmdir:          ll_rmdir,
651         mknod:          ll_mknod,
652         rename:         ll_rename,
653         setattr:        ll_setattr
654 };