/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
 * vim:expandtab:shiftwidth=8:tabstop=8:
 *
 * Copyright (c) 2003 Cluster File Systems, Inc.
 *
 * This file is part of the Lustre file system, http://www.lustre.org
 * Lustre is a trademark of Cluster File Systems, Inc.
 *
 * You may have signed or agreed to another license before downloading
 * this software. If so, you are bound by the terms and conditions
 * of that agreement, and the following does not apply to you. See the
 * LICENSE file included with this distribution for more information.
 *
 * If you did not agree to a different license, then this copy of Lustre
 * is open source software; you can redistribute it and/or modify it
 * under the terms of version 2 of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * In either case, Lustre is distributed in the hope that it will be
 * useful, but WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * license text for more details.
 */
25 #define DEBUG_SUBSYSTEM S_MDS
27 #ifndef AUTOCONF_INCLUDED
28 #include <linux/config.h>
30 #include <linux/module.h>
31 #include <linux/kernel.h>
33 #include <linux/string.h>
34 #include <linux/stat.h>
35 #include <linux/errno.h>
36 #include <linux/version.h>
37 #include <linux/buffer_head.h> // for wait_on_buffer
38 #include <linux/unistd.h>
40 #include <asm/system.h>
41 #include <asm/uaccess.h>
44 #include <linux/stat.h>
45 #include <asm/uaccess.h>
46 #include <linux/slab.h>
48 # include <asm/segment.h>
51 #include <obd_support.h>
52 #include <lustre_lib.h>
53 #include "mds_internal.h"
55 void mds_pack_inode2fid(struct ll_fid *fid, struct inode *inode)
57 fid->id = inode->i_ino;
58 fid->generation = inode->i_generation;
59 fid->f_type = (S_IFMT & inode->i_mode);
62 /* Note that we can copy all of the fields, just some will not be "valid" */
63 void mds_pack_inode2body(struct mds_body *b, struct inode *inode)
65 b->valid |= OBD_MD_FLID | OBD_MD_FLCTIME | OBD_MD_FLUID |
66 OBD_MD_FLGID | OBD_MD_FLFLAGS | OBD_MD_FLTYPE |
67 OBD_MD_FLMODE | OBD_MD_FLNLINK | OBD_MD_FLGENER |
68 OBD_MD_FLATIME | OBD_MD_FLMTIME; /* bug 2020 */
70 if (!S_ISREG(inode->i_mode))
71 b->valid |= OBD_MD_FLSIZE | OBD_MD_FLBLOCKS | OBD_MD_FLATIME |
72 OBD_MD_FLMTIME | OBD_MD_FLRDEV;
74 b->ino = inode->i_ino;
75 b->atime = LTIME_S(inode->i_atime);
76 b->mtime = LTIME_S(inode->i_mtime);
77 b->ctime = LTIME_S(inode->i_ctime);
78 b->mode = inode->i_mode;
79 b->size = i_size_read(inode);
80 b->blocks = inode->i_blocks;
81 b->uid = inode->i_uid;
82 b->gid = inode->i_gid;
83 b->flags = ll_inode_to_ext_flags(b->flags, inode->i_flags);
84 b->rdev = inode->i_rdev;
85 /* Return the correct link count for orphan inodes */
86 b->nlink = mds_inode_is_orphan(inode) ? 0 : inode->i_nlink;
87 b->generation = inode->i_generation;
91 static inline unsigned int attr_unpack(__u64 sa_valid) {
92 unsigned int ia_valid = 0;
94 if (sa_valid & MDS_ATTR_MODE)
95 ia_valid |= ATTR_MODE;
96 if (sa_valid & MDS_ATTR_UID)
98 if (sa_valid & MDS_ATTR_GID)
100 if (sa_valid & MDS_ATTR_SIZE)
101 ia_valid |= ATTR_SIZE;
102 if (sa_valid & MDS_ATTR_ATIME)
103 ia_valid |= ATTR_ATIME;
104 if (sa_valid & MDS_ATTR_MTIME)
105 ia_valid |= ATTR_MTIME;
106 if (sa_valid & MDS_ATTR_CTIME)
107 ia_valid |= ATTR_CTIME;
108 if (sa_valid & MDS_ATTR_ATIME_SET)
109 ia_valid |= ATTR_ATIME_SET;
110 if (sa_valid & MDS_ATTR_MTIME_SET)
111 ia_valid |= ATTR_MTIME_SET;
112 if (sa_valid & MDS_ATTR_FORCE)
113 ia_valid |= ATTR_FORCE;
114 if (sa_valid & MDS_ATTR_ATTR_FLAG)
115 ia_valid |= ATTR_ATTR_FLAG;
116 if (sa_valid & MDS_ATTR_KILL_SUID)
117 ia_valid |= ATTR_KILL_SUID;
118 if (sa_valid & MDS_ATTR_KILL_SGID)
119 ia_valid |= ATTR_KILL_SGID;
120 if (sa_valid & MDS_ATTR_CTIME_SET)
121 ia_valid |= ATTR_CTIME_SET;
122 if (sa_valid & MDS_ATTR_FROM_OPEN)
123 ia_valid |= ATTR_FROM_OPEN;
124 if (sa_valid & MDS_ATTR_BLOCKS)
125 ia_valid |= ATTR_BLOCKS;
126 if (sa_valid & MDS_OPEN_OWNEROVERRIDE)
127 ia_valid |= MDS_OPEN_OWNEROVERRIDE;
132 static int mds_setattr_unpack(struct ptlrpc_request *req, int offset,
133 struct mds_update_record *r)
135 struct iattr *attr = &r->ur_iattr;
136 struct mds_rec_setattr *rec;
139 rec = lustre_swab_reqbuf(req, offset, sizeof(*rec),
140 lustre_swab_mds_rec_setattr);
144 r->ur_uc.luc_fsuid = rec->sa_fsuid;
145 r->ur_uc.luc_fsgid = rec->sa_fsgid;
146 r->ur_uc.luc_cap = rec->sa_cap;
148 r->ur_uc.luc_suppgid1 = rec->sa_suppgid;
149 r->ur_uc.luc_suppgid2 = -1;
151 r->ur_fid1 = &rec->sa_fid;
152 attr->ia_valid = attr_unpack(rec->sa_valid);
153 attr->ia_mode = rec->sa_mode;
154 attr->ia_uid = rec->sa_uid;
155 attr->ia_gid = rec->sa_gid;
156 attr->ia_size = rec->sa_size;
157 LTIME_S(attr->ia_atime) = rec->sa_atime;
158 LTIME_S(attr->ia_mtime) = rec->sa_mtime;
159 LTIME_S(attr->ia_ctime) = rec->sa_ctime;
160 r->ur_flags = rec->sa_attr_flags;
162 lustre_set_req_swabbed(req, offset + 1);
163 r->ur_eadatalen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
164 if (r->ur_eadatalen) {
165 r->ur_eadata = lustre_msg_buf(req->rq_reqmsg, offset + 1, 0);
166 if (r->ur_eadata == NULL)
169 r->ur_cookielen = lustre_msg_buflen(req->rq_reqmsg, offset + 2);
170 if (r->ur_cookielen) {
171 r->ur_logcookies = lustre_msg_buf(req->rq_reqmsg, offset + 2,0);
172 if (r->ur_eadata == NULL)
175 if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) {
176 r->ur_dlm = lustre_swab_reqbuf(req, offset + 3,
178 lustre_swab_ldlm_request);
179 if (r->ur_dlm == NULL)
185 static int mds_create_unpack(struct ptlrpc_request *req, int offset,
186 struct mds_update_record *r)
188 struct mds_rec_create *rec;
191 rec = lustre_swab_reqbuf(req, offset, sizeof (*rec),
192 lustre_swab_mds_rec_create);
196 r->ur_uc.luc_fsuid = rec->cr_fsuid;
197 r->ur_uc.luc_fsgid = rec->cr_fsgid;
198 r->ur_uc.luc_cap = rec->cr_cap;
200 r->ur_uc.luc_suppgid1 = rec->cr_suppgid;
201 r->ur_uc.luc_suppgid2 = -1;
203 r->ur_fid1 = &rec->cr_fid;
204 r->ur_fid2 = &rec->cr_replayfid;
205 r->ur_mode = rec->cr_mode;
206 r->ur_rdev = rec->cr_rdev;
207 r->ur_time = rec->cr_time;
208 r->ur_flags = rec->cr_flags;
210 lustre_set_req_swabbed(req, offset + 1);
211 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
212 if (r->ur_name == NULL)
214 r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
216 lustre_set_req_swabbed(req, offset + 2);
217 r->ur_tgtlen = lustre_msg_buflen(req->rq_reqmsg, offset + 2);
219 /* NB for now, we only seem to pass NULL terminated symlink
220 * target strings here. If this ever changes, we'll have
221 * to stop checking for a buffer filled completely with a
222 * NULL terminated string here, and make the callers check
223 * depending on what they expect. We should probably stash
224 * it in r->ur_eadata in that case, so it's obvious... -eeb
226 r->ur_tgt = lustre_msg_string(req->rq_reqmsg, offset + 2, 0);
227 if (r->ur_tgt == NULL)
230 if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) {
231 r->ur_dlm = lustre_swab_reqbuf(req, offset + 3,
233 lustre_swab_ldlm_request);
234 if (r->ur_dlm == NULL)
240 static int mds_link_unpack(struct ptlrpc_request *req, int offset,
241 struct mds_update_record *r)
243 struct mds_rec_link *rec;
246 rec = lustre_swab_reqbuf(req, offset, sizeof (*rec),
247 lustre_swab_mds_rec_link);
251 r->ur_uc.luc_fsuid = rec->lk_fsuid;
252 r->ur_uc.luc_fsgid = rec->lk_fsgid;
253 r->ur_uc.luc_cap = rec->lk_cap;
255 r->ur_uc.luc_suppgid1 = rec->lk_suppgid1;
256 r->ur_uc.luc_suppgid2 = rec->lk_suppgid2;
258 r->ur_fid1 = &rec->lk_fid1;
259 r->ur_fid2 = &rec->lk_fid2;
260 r->ur_time = rec->lk_time;
262 lustre_set_req_swabbed(req, offset + 1);
263 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
264 if (r->ur_name == NULL)
266 r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
267 if (lustre_msg_buflen(req->rq_reqmsg, offset + 2)) {
268 r->ur_dlm = lustre_swab_reqbuf(req, offset + 2,
270 lustre_swab_ldlm_request);
271 if (r->ur_dlm == NULL)
277 static int mds_unlink_unpack(struct ptlrpc_request *req, int offset,
278 struct mds_update_record *r)
280 struct mds_rec_unlink *rec;
283 rec = lustre_swab_reqbuf(req, offset, sizeof (*rec),
284 lustre_swab_mds_rec_unlink);
288 r->ur_uc.luc_fsuid = rec->ul_fsuid;
289 r->ur_uc.luc_fsgid = rec->ul_fsgid;
290 r->ur_uc.luc_cap = rec->ul_cap;
292 r->ur_uc.luc_suppgid1 = rec->ul_suppgid;
293 r->ur_uc.luc_suppgid2 = -1;
295 r->ur_mode = rec->ul_mode;
296 r->ur_fid1 = &rec->ul_fid1;
297 r->ur_fid2 = &rec->ul_fid2;
298 r->ur_time = rec->ul_time;
300 lustre_set_req_swabbed(req, offset + 1);
301 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
302 if (r->ur_name == NULL)
304 r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
306 if (lustre_msg_buflen(req->rq_reqmsg, offset + 2)) {
307 r->ur_dlm = lustre_swab_reqbuf(req, offset + 2,
309 lustre_swab_ldlm_request);
310 if (r->ur_dlm == NULL)
316 static int mds_rename_unpack(struct ptlrpc_request *req, int offset,
317 struct mds_update_record *r)
319 struct mds_rec_rename *rec;
322 rec = lustre_swab_reqbuf(req, offset, sizeof (*rec),
323 lustre_swab_mds_rec_rename);
327 r->ur_uc.luc_fsuid = rec->rn_fsuid;
328 r->ur_uc.luc_fsgid = rec->rn_fsgid;
329 r->ur_uc.luc_cap = rec->rn_cap;
331 r->ur_uc.luc_suppgid1 = rec->rn_suppgid1;
332 r->ur_uc.luc_suppgid2 = rec->rn_suppgid2;
334 r->ur_fid1 = &rec->rn_fid1;
335 r->ur_fid2 = &rec->rn_fid2;
336 r->ur_time = rec->rn_time;
338 lustre_set_req_swabbed(req, offset + 1);
339 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
340 if (r->ur_name == NULL)
342 r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
344 lustre_set_req_swabbed(req, offset + 2);
345 r->ur_tgt = lustre_msg_string(req->rq_reqmsg, offset + 2, 0);
346 if (r->ur_tgt == NULL)
348 r->ur_tgtlen = lustre_msg_buflen(req->rq_reqmsg, offset + 2);
349 if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) {
350 r->ur_dlm = lustre_swab_reqbuf(req, offset + 3,
352 lustre_swab_ldlm_request);
353 if (r->ur_dlm == NULL)
359 static int mds_open_unpack(struct ptlrpc_request *req, int offset,
360 struct mds_update_record *r)
362 struct mds_rec_create *rec;
365 rec = lustre_swab_reqbuf(req, offset, sizeof(*rec),
366 lustre_swab_mds_rec_create);
370 r->ur_uc.luc_fsuid = rec->cr_fsuid;
371 r->ur_uc.luc_fsgid = rec->cr_fsgid;
372 r->ur_uc.luc_cap = rec->cr_cap;
374 r->ur_uc.luc_suppgid1 = rec->cr_suppgid;
375 r->ur_uc.luc_suppgid2 = -1;
377 r->ur_fid1 = &rec->cr_fid;
378 r->ur_fid2 = &rec->cr_replayfid;
379 r->ur_mode = rec->cr_mode;
380 r->ur_rdev = rec->cr_rdev;
381 r->ur_time = rec->cr_time;
382 r->ur_flags = rec->cr_flags;
384 lustre_set_req_swabbed(req, offset + 1);
385 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
386 if (r->ur_name == NULL)
388 r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1);
390 lustre_set_req_swabbed(req, offset + 2);
391 r->ur_eadatalen = lustre_msg_buflen(req->rq_reqmsg, offset + 2);
392 if (r->ur_eadatalen) {
393 r->ur_eadata = lustre_msg_buf(req->rq_reqmsg, offset + 2, 0);
394 if (r->ur_eadata == NULL)
400 typedef int (*update_unpacker)(struct ptlrpc_request *req, int offset,
401 struct mds_update_record *r);
403 static update_unpacker mds_unpackers[REINT_MAX] = {
404 [REINT_SETATTR] mds_setattr_unpack,
405 [REINT_CREATE] mds_create_unpack,
406 [REINT_LINK] mds_link_unpack,
407 [REINT_UNLINK] mds_unlink_unpack,
408 [REINT_RENAME] mds_rename_unpack,
409 [REINT_OPEN] mds_open_unpack,
412 int mds_update_unpack(struct ptlrpc_request *req, int offset,
413 struct mds_update_record *rec)
415 mds_reint_t opcode, *opcodep;
419 /* NB don't lustre_swab_reqbuf() here. We're just taking a peek
420 * and we want to leave it to the specific unpacker once we've
421 * identified the message type */
422 opcodep = lustre_msg_buf(req->rq_reqmsg, offset, sizeof (*opcodep));
427 if (lustre_msg_swabbed(req->rq_reqmsg))
430 if (opcode >= REINT_MAX || mds_unpackers[opcode] == NULL) {
431 CERROR("Unexpected opcode %d\n", opcode);
435 rec->ur_opcode = opcode;
436 rc = mds_unpackers[opcode](req, offset, rec);
/*
 * Initialise *ucred for a request from the mds_body found in request buffer
 * `offset`.
 *
 * Visible behaviour:
 *  - the body pointer is asserted non-NULL (the caller has already verified
 *    and swabbed it);
 *  - when req->rq_uid is not LNET_UID_ANY it is asserted non-zero and used
 *    as luc_fsuid;
 *  - luc_fsuid, luc_fsgid and luc_cap are taken from the body;
 *  - an entry is looked up in mds->mds_group_hash via
 *    upcall_cache_get_entry(); on an error pointer the error is stored in
 *    rc and luc_uce is reset to NULL;
 *  - luc_fsgid is replaced by the cache entry's ue_primary.
 *
 * NOTE(review): this listing has lost lines -- the last parameter, the
 * remaining arguments of lustre_msg_buf() and upcall_cache_get_entry(), the
 * declaration of rc, the closing braces and every return statement are
 * absent, and preprocessor conditionals may be missing as well.  In
 * particular it cannot be told from here whether the body-derived
 * credentials are an else-branch of the rq_uid test, or whether luc_uce is
 * NULL-checked before ue_primary is read.  Restore the function from
 * version control before relying on this description.
 */
441 int mds_init_ucred(struct lvfs_ucred *ucred, struct ptlrpc_request *req,
444 struct mds_body *body = lustre_msg_buf(req->rq_reqmsg, offset,
447 struct mds_obd *mds = mds_req2mds(req);
451 LASSERT(body != NULL); /* previously verified & swabbed by caller */
454 if (req->rq_uid != LNET_UID_ANY) {
455 /* Non-root local cluster client */
456 LASSERT (req->rq_uid != 0);
457 ucred->luc_fsuid = req->rq_uid;
461 ucred->luc_fsuid = body->fsuid;
462 ucred->luc_fsgid = body->fsgid;
463 ucred->luc_cap = body->capability;
467 ucred->luc_uce = upcall_cache_get_entry(mds->mds_group_hash,
471 if (IS_ERR(ucred->luc_uce)) {
472 rc = PTR_ERR(ucred->luc_uce);
473 ucred->luc_uce = NULL;
479 ucred->luc_fsgid = ucred->luc_uce->ue_primary;
/*
 * Hand ucred->luc_uce back to mds->mds_group_hash with
 * upcall_cache_put_entry().
 *
 * NOTE(review): the body delimiters (and possibly further statements) are
 * missing from this listing; restore from version control.
 */
486 void mds_exit_ucred(struct lvfs_ucred *ucred, struct mds_obd *mds)
489 upcall_cache_put_entry(mds->mds_group_hash, ucred->luc_uce);