Whamcloud - gitweb
9dc7a15b0fb139b63db15c86e2656f9115bfb1c3
[fs/lustre-release.git] / libsysio / src / namei.c
1 /*
2  *    This Cplant(TM) source code is the property of Sandia National
3  *    Laboratories.
4  *
5  *    This Cplant(TM) source code is copyrighted by Sandia National
6  *    Laboratories.
7  *
8  *    The redistribution of this Cplant(TM) source code is subject to the
9  *    terms of the GNU Lesser General Public License
10  *    (see cit/LGPL or http://www.gnu.org/licenses/lgpl.html)
11  *
12  *    Cplant(TM) Copyright 1998-2003 Sandia Corporation. 
13  *    Under the terms of Contract DE-AC04-94AL85000, there is a non-exclusive
14  *    license for use of this work by or on behalf of the US Government.
15  *    Export of this program may require a license from the United States
16  *    Government.
17  */
18
19 /*
20  * This library is free software; you can redistribute it and/or
21  * modify it under the terms of the GNU Lesser General Public
22  * License as published by the Free Software Foundation; either
23  * version 2.1 of the License, or (at your option) any later version.
24  * 
25  * This library is distributed in the hope that it will be useful,
26  * but WITHOUT ANY WARRANTY; without even the implied warranty of
27  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
28  * Lesser General Public License for more details.
29  * 
30  * You should have received a copy of the GNU Lesser General Public
31  * License along with this library; if not, write to the Free Software
32  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
33  *
34  * Questions or comments about this library should be sent to:
35  *
36  * Lee Ward
37  * Sandia National Laboratories, New Mexico
38  * P.O. Box 5800
39  * Albuquerque, NM 87185-1110
40  *
41  * lee@sandia.gov
42  */
43
44 #if defined(AUTOMOUNT_FILE_NAME) && defined(__linux__)
45 #define _BSD_SOURCE
46 #endif
47
48 #include <stdlib.h>
49 #include <string.h>
50 #include <errno.h>
51 #include <assert.h>
52 #include <unistd.h>
53 #include <sys/param.h>
54 #include <sys/types.h>
55 #include <sys/stat.h>
56 #include <sys/queue.h>
57
58 #include "sysio.h"
59 #include "mount.h"
60 #include "inode.h"
61
62 /*
63  * Parse next component in path.
64  */
65 #ifndef AUTOMOUNT_FILE_NAME
66 static
67 #endif
68 void
69 _sysio_next_component(const char *path, struct qstr *name)
70 {
71         while (*path == PATH_SEPARATOR)
72                 path++;
73         name->name = path;
74         name->len = 0;
75         name->hashval = 0;
76         while (*path && *path != PATH_SEPARATOR) {
77                 name->hashval =
78                     37 * name->hashval + *path++;
79                 name->len++;
80         }
81 }
82
83 /*
84  * Given parent, look up component.
85  */
86 static int
87 lookup(struct pnode *parent,
88        struct qstr *name,
89        struct pnode **pnop,
90        struct intent *intnt,
91        const char *path)
92 {
93         int     err;
94         struct pnode *pno;
95
96         if (!parent->p_base->pb_ino)
97                 return -ENOTDIR;
98
99         err = _sysio_permitted(parent->p_base->pb_ino, X_OK);
100         if (err)
101                 return err;
102
103         /*
104          * Short-circuit `.' and `..'; We don't cache those.
105          */
106         pno = NULL;
107         if (name->len == 1 && name->name[0] == '.')
108                 pno = parent;
109         else if (name->len == 2 && name->name[0] == '.' && name->name[1] == '.')
110                 pno = parent->p_parent;
111         if (pno)
112                 P_REF(pno);
113         else {
114                 /*
115                  * Get cache entry then.
116                  */
117                 err = _sysio_p_find_alias(parent, name, &pno);
118                 if (err)
119                         return err;
120         }
121
122         /*
123          * While covered, move to the covering node.
124          */
125         while (pno->p_cover && pno->p_cover != pno) {
126                 struct pnode *cover;
127
128                 cover = pno->p_cover;
129                 P_REF(cover);
130                 P_RELE(pno);
131                 pno = cover;
132         }
133
134         *pnop = pno;
135
136         /*
137          * (Re)validate the pnode.
138          */
139         err = _sysio_p_validate(pno, intnt, path);
140         if (err)
141                 return err;
142
143         return 0;
144 }
145
146 /*
147  * The meat. Walk an absolute or relative path, looking up each
148  * component. Various flags in the nameidata argument govern actions
149  * and return values/state. They are:
150  *
151  * ND_NOFOLLOW          symbolic links are not followed
152  * ND_NEGOK             if terminal/leaf does not exist, return
153  *                       path node (alias) anyway.
154  */
155 int
156 _sysio_path_walk(struct pnode *parent, struct nameidata *nd)
157 {
158         int     err;
159         const char *path;
160         struct qstr this, next;
161         struct inode *ino;
162
163         /*
164          * NULL path?
165          */
166         if (!nd->nd_path)
167                 return -EFAULT;
168
169         /*
170          * Empty path?
171          */
172         if (!*nd->nd_path)
173                 return -ENOENT;
174
175         /*
176          * Leading slash?
177          */
178         if (*nd->nd_path == PATH_SEPARATOR) {
179                 /*
180                  * Make parent the root of the name space.
181                  */
182                 parent = nd->nd_root;
183         }
184
185 #if DEFER_INIT_CWD
186         if (!parent) {
187                 const char *icwd;
188
189                 if (!_sysio_init_cwd)
190                         abort();
191
192                 /*
193                  * Finally have to set the curretn working directory. We can
194                  * not tolerate errors here or else risk leaving the process
195                  * in a very unexpected location. We abort then unless all goes
196                  * well.
197                  */
198                 icwd = _sysio_init_cwd;
199                 _sysio_init_cwd = NULL;
200                 if (_sysio_namei(NULL, icwd, 0, NULL, &parent) != 0 ||
201                     _sysio_p_chdir(parent) != 0)
202                         abort();
203         }
204 #endif
205
206         /*
207          * (Re)Validate the parent.
208          */
209         err = _sysio_p_validate(parent, NULL, NULL);
210         if (err)
211                 return err;
212
213         /*
214          * Prime everything for the loop. Will need another reference to the
215          * initial directory. It'll be dropped later.
216          */
217         nd->nd_pno = parent;
218         P_REF(nd->nd_pno);
219         _sysio_next_component(nd->nd_path, &next);
220         path = next.name;
221         parent = NULL;
222         err = 0;
223
224         /*
225          * Derecurse the path tree-walk.
226          */
227         for (;;) {
228                 ino = nd->nd_pno->p_base->pb_ino;
229                 if (S_ISLNK(ino->i_stbuf.st_mode) &&
230                     (next.len || !(nd->nd_flags & ND_NOFOLLOW))) {
231                         char    *lpath;
232                         ssize_t cc;
233                         struct nameidata nameidata;
234
235                         if (nd->nd_slicnt >= MAX_SYMLINK) {
236                                 err = -ELOOP;
237                                 break;
238                         }
239
240                         /*
241                          * Follow symbolic link.
242                          */
243                         lpath = malloc(MAXPATHLEN + 1);
244                         if (!lpath) {
245                                 err = -ENOMEM;
246                                 break;
247                         }
248                         cc =
249                             ino->i_ops.inop_readlink(nd->nd_pno,
250                                                      lpath,
251                                                      MAXPATHLEN);
252                         if (cc < 0) {
253                                 free(lpath);
254                                 err = (int )cc;
255                                 break;
256                         }
257                         lpath[cc] = '\0';                       /* NUL term */
258                         /*
259                          * Handle symbolic links with recursion. Yuck!
260                          * Pass the NULL intent for recursive symlink
261                          * except the last component.
262                          */
263                         ND_INIT(&nameidata,
264                                 (nd->nd_flags | ND_NEGOK),
265                                 lpath,
266                                 nd->nd_root,
267                                 !next.len ? nd->nd_intent : NULL);
268                         nameidata.nd_slicnt = nd->nd_slicnt + 1;
269                         err =
270                             _sysio_path_walk(nd->nd_pno->p_parent, &nameidata);
271                         free(lpath);
272                         if (err)
273                                 break;
274                         P_RELE(nd->nd_pno);
275                         nd->nd_pno = nameidata.nd_pno;
276                         ino = nd->nd_pno->p_base->pb_ino;
277                 }
278 #ifdef AUTOMOUNT_FILE_NAME
279                 else if (ino &&
280                          S_ISDIR(ino->i_stbuf.st_mode) &&
281                          (nd->nd_pno->p_mount->mnt_flags & MOUNT_F_AUTO) &&
282                          nd->nd_amcnt < MAX_MOUNT_DEPTH &&
283                          ino->i_stbuf.st_mode & S_ISUID) {
284                         struct pnode *pno;
285
286                         /*
287                          * We're committed to a lookup. It's time to see if
288                          * we're going to do it in an automount-point and
289                          * arrange the mount if so.
290                          */
291                         assert(!nd->nd_pno->p_cover);
292                         err =
293                             lookup(nd->nd_pno,
294                                    &_sysio_mount_file_name,
295                                    &pno,
296                                    NULL,
297                                    NULL);
298                         if (pno)
299                                 P_RELE(pno);
300                         if (!err && _sysio_automount(pno) == 0) {
301                                 struct pnode *root;
302
303                                 /*
304                                  * All went well. Need to switch
305                                  * parent pno and ino to the
306                                  * root of the newly mounted sub-tree.
307                                  *
308                                  * NB:
309                                  * We don't recurseively retry these
310                                  * things. It's OK to have the new root
311                                  * be an automount-point but it's going
312                                  * to take another lookup to accomplish it.
313                                  * The alternative could get us into an
314                                  * infinite loop.
315                                  */
316                                 root = nd->nd_pno->p_cover;
317                                 assert(root);
318                                 P_RELE(nd->nd_pno);
319                                 nd->nd_pno = root;
320 #if 0
321                                 P_REF(nd->nd_pno);
322 #endif
323                                 ino = nd->nd_pno->p_base->pb_ino;
324                                 assert(ino);
325
326                                 /*
327                                  * Must send the intent-path again.
328                                  */
329                                 path = nd->nd_path;
330                                 nd->nd_amcnt++;
331
332                                 /*
333                                  * Must go back top and retry with this
334                                  * new pnode as parent.
335                                  */
336                                 continue;
337                         }
338                         err = 0;                        /* it never happened */
339                 }
340 #endif
341
342                 /*
343                  * Set up for next component.
344                  */
345                 this = next;
346                 if (path)
347                         path = this.name;
348                 if (!this.len)
349                         break;
350                 if (!ino) {
351                         /*
352                          * Should only be here if final component was
353                          * target of a symlink.
354                          */
355                         nd->nd_path = this.name + this.len;
356                         err = -ENOENT;
357                         break;
358                 }
359                 nd->nd_path = this.name + this.len;
360                 _sysio_next_component(nd->nd_path, &next);
361                 parent = nd->nd_pno;
362                 nd->nd_pno = NULL;
363
364                 /*
365                  * Parent must be a directory.
366                  */
367                 if (ino && !S_ISDIR(ino->i_stbuf.st_mode)) {
368                         err = -ENOTDIR;
369                         break;
370                 }
371
372                 /*
373                  * The extra path arg is passed only on the first lookup in the
374                  * walk as we cross into each file system, anew. The intent is
375                  * passed both on the first lookup and when trying to look up
376                  * the final component -- Of the original path, not on the
377                  * file system.
378                  *
379                  * Confused? Me too and I came up with this weirdness. It's
380                  * hints to the file system drivers. Read on.
381                  *
382                  * The first lookup will give everything one needs to ready
383                  * everything for the entire operation before the path is
384                  * walked. The file system driver knows it's the first lookup
385                  * in the walk because it has both the path and the intent.
386                  *
387                  * Alternatively, one could split the duties; The first lookup
388                  * can be used to prime the file system inode cache with the
389                  * interior nodes we'll want in the path-walk. Then, when
390                  * looking up the last component, ready everything for the
391                  * operations(s) to come. The file system driver knows it's
392                  * the last lookup in the walk because it has the intent,
393                  * again, but without the path.
394                  *
395                  * One special case; If we were asked to look up a single
396                  * component, we treat it as the last component. The file
397                  * system driver never sees the extra path argument. It should
398                  * be noted that the driver always has the fully qualified
399                  * path, on the target file system, available to it for any
400                  * node it is looking up, including the last, via the base
401                  * path node and it's ancestor chain.
402                  */
403                 err =
404                     lookup(parent,
405                            &this,
406                            &nd->nd_pno,
407                            (path || !next.len)
408                              ? nd->nd_intent
409                              : NULL,
410                            (path && next.len) ? path : NULL);
411                 if (err) {
412                         if (err == -ENOENT &&
413                             !next.len &&
414                             (nd->nd_flags & ND_NEGOK))
415                                 err = 0;
416                         break;
417                 }
418                 path = NULL;                            /* Stop that! */
419                 if ((parent->p_mount->mnt_fs !=
420                      nd->nd_pno->p_mount->mnt_fs)) {
421                         /*
422                          * Crossed into a new fs. We'll want the next lookup
423                          * to include the path again.
424                          */
425                         path = nd->nd_path;
426                 }
427
428                 /*
429                  * Release the parent.
430                  */
431                 P_RELE(parent);
432                 parent = NULL;
433         }
434
435         /*
436          * Trailing separators cause us to break from the loop with
437          * a parent set but no pnode. Check for that.
438          */
439         if (!nd->nd_pno) {
440                 nd->nd_pno = parent;
441                 parent = NULL;
442                 /*
443                  * Make sure the last processed component was a directory. The
444                  * trailing slashes are illegal behind anything else.
445                  */
446                 if (!(err ||
447                       S_ISDIR(nd->nd_pno->p_base->pb_ino->i_stbuf.st_mode)))
448                         err = -ENOTDIR;
449         }
450
451         /*
452          * Drop reference to parent if set. Either we have a dup of the original
453          * parent or an intermediate reference.
454          */
455         if (parent)
456                 P_RELE(parent);
457
458         /*
459          * On error, we will want to drop our reference to the current
460          * path node if at end.
461          */
462         if (err && nd->nd_pno) {
463                 P_RELE(nd->nd_pno);
464                 nd->nd_pno = NULL;
465         }
466
467         return err;
468 }
469
#ifdef CPLANT_YOD
/*
 * for backward compatibility w/protocol switch
 * remove everything up to the first ':'
 * fortran libs prepend cwd to path, so not much choice
 *
 * The expansion is fully parenthesized so that it stays one expression
 * wherever it is used. NB: the argument is evaluated more than once; do not
 * pass anything with side effects.
 */
#define STRIP_PREFIX(p) \
        (strchr((p), ':') ? strchr((p), ':') + 1 : (p))
#else
/*
 * No protocol prefix to strip; the path is used as given.
 */
#define STRIP_PREFIX(p) (p)
#endif
480
481 /*
482  * Expanded form of the path-walk routine, with the common arguments, builds
483  * the nameidata bundle and calls path-walk.
484  */
485 int
486 _sysio_namei(struct pnode *parent,
487              const char *path,
488              unsigned flags,
489              struct intent *intnt,
490              struct pnode **pnop)
491 {
492         struct nameidata nameidata;
493         int     err;
494
495         ND_INIT(&nameidata, flags, STRIP_PREFIX(path), _sysio_root, intnt);
496         err = _sysio_path_walk(parent, &nameidata);
497         if (!err)
498                 *pnop = nameidata.nd_pno;
499         return err;
500 }