1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (c) 2003 Cluster File Systems, Inc.
6 * This file is part of Lustre, http://www.lustre.org.
8 * Lustre is free software; you can redistribute it and/or
9 * modify it under the terms of version 2 of the GNU General Public
10 * License as published by the Free Software Foundation.
12 * Lustre is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Lustre; if not, write to the Free Software
19 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
22 #define DEBUG_SUBSYSTEM S_MDS
24 #include <linux/config.h>
25 #include <linux/module.h>
26 #include <linux/kernel.h>
28 #include <linux/string.h>
29 #include <linux/stat.h>
30 #include <linux/errno.h>
31 #include <linux/version.h>
32 #if (LINUX_VERSION_CODE < KERNEL_VERSION(2,5,0))
33 # include <linux/locks.h> // for wait_on_buffer
35 # include <linux/buffer_head.h> // for wait_on_buffer
37 #include <linux/unistd.h>
39 #include <asm/system.h>
40 #include <asm/uaccess.h>
43 #include <linux/stat.h>
44 #include <asm/uaccess.h>
45 #include <linux/slab.h>
46 #include <asm/segment.h>
48 #include <linux/obd_support.h>
49 #include <linux/lustre_lib.h>
50 #include <linux/lustre_mds.h>
52 #include <linux/lustre_smfs.h>
53 #include <linux/lustre_snap.h>
55 void mds_pack_dentry2fid(struct ll_fid *fid, struct dentry *dentry)
57 fid->id = dentry->d_inum;
58 fid->generation = dentry->d_generation;
59 fid->mds = dentry->d_mdsnum;
62 void mds_pack_dentry2body(struct mds_body *b, struct dentry *dentry)
64 b->valid |= OBD_MD_FLID | OBD_MD_FLGENER;
65 b->ino = dentry->d_inum;
66 b->generation = dentry->d_generation;
67 b->mds = dentry->d_mdsnum;
70 void mds_pack_inode2fid(struct obd_device *obd, struct ll_fid *fid,
74 if (is_smfs_sb(inode->i_sb)) {
75 struct smfs_inode_info *sm_info = I2SMI(inode);
76 fid->snap_index = sm_info->sm_sninfo.sn_index;
79 fid->id = inode->i_ino;
80 fid->generation = inode->i_generation;
81 fid->f_type = (S_IFMT & inode->i_mode);
82 fid->mds = obd->u.mds.mds_num;
85 /* Note that we can copy all of the fields, just some will not be "valid" */
86 void mds_pack_inode2body(struct obd_device *obd, struct mds_body *b,
89 b->valid |= OBD_MD_FLID | OBD_MD_FLCTIME | OBD_MD_FLUID |
90 OBD_MD_FLGID | OBD_MD_FLFLAGS | OBD_MD_FLTYPE |
91 OBD_MD_FLMODE | OBD_MD_FLNLINK | OBD_MD_FLGENER |
92 OBD_MD_FLATIME | OBD_MD_FLMTIME; /* bug 2020 */
94 if (!S_ISREG(inode->i_mode))
95 b->valid |= OBD_MD_FLSIZE | OBD_MD_FLBLOCKS | OBD_MD_FLATIME |
96 OBD_MD_FLMTIME | OBD_MD_FLRDEV;
98 b->ino = inode->i_ino;
99 b->atime = LTIME_S(inode->i_atime);
100 b->mtime = LTIME_S(inode->i_mtime);
101 b->ctime = LTIME_S(inode->i_ctime);
102 b->mode = inode->i_mode;
103 b->size = inode->i_size;
104 b->blocks = inode->i_blocks;
105 b->uid = inode->i_uid;
106 b->gid = inode->i_gid;
107 b->flags = inode->i_flags;
108 b->rdev = inode->i_rdev;
109 /* Return the correct link count for orphan inodes */
110 if (mds_inode_is_orphan(inode)) {
112 } else if (S_ISDIR(inode->i_mode)) {
115 b->nlink = inode->i_nlink;
117 b->generation = inode->i_generation;
119 b->mds = obd->u.mds.mds_num;
123 static int mds_setattr_unpack(struct ptlrpc_request *req, int offset,
124 struct mds_update_record *r)
126 struct iattr *attr = &r->ur_iattr;
127 struct mds_rec_setattr *rec;
130 rec = lustre_swab_reqbuf(req, offset, sizeof(*rec),
131 lustre_swab_mds_rec_setattr);
135 r->_ur_fsuid = rec->sa_fsuid;
136 r->_ur_fsgid = rec->sa_fsgid;
137 r->_ur_cap = rec->sa_cap;
138 r->_ur_suppgid1 = rec->sa_suppgid;
139 r->_ur_suppgid2 = -1;
140 r->ur_fid1 = &rec->sa_fid;
141 attr->ia_valid = rec->sa_valid;
142 attr->ia_mode = rec->sa_mode;
143 attr->ia_uid = rec->sa_uid;
144 attr->ia_gid = rec->sa_gid;
145 attr->ia_size = rec->sa_size;
146 LTIME_S(attr->ia_atime) = rec->sa_atime;
147 LTIME_S(attr->ia_mtime) = rec->sa_mtime;
148 LTIME_S(attr->ia_ctime) = rec->sa_ctime;
149 attr->ia_attr_flags = rec->sa_attr_flags;
151 LASSERT_REQSWAB (req, offset + 1);
152 if (req->rq_reqmsg->bufcount > offset + 1) {
153 r->ur_eadata = lustre_msg_buf (req->rq_reqmsg,
155 if (r->ur_eadata == NULL)
157 r->ur_eadatalen = req->rq_reqmsg->buflens[offset + 1];
160 if (req->rq_reqmsg->bufcount > offset + 2) {
161 r->ur_logcookies = lustre_msg_buf(req->rq_reqmsg, offset + 2,0);
162 if (r->ur_eadata == NULL)
165 r->ur_cookielen = req->rq_reqmsg->buflens[offset + 2];
171 static int mds_create_unpack(struct ptlrpc_request *req, int offset,
172 struct mds_update_record *r)
174 struct mds_rec_create *rec;
177 rec = lustre_swab_reqbuf (req, offset, sizeof (*rec),
178 lustre_swab_mds_rec_create);
182 r->_ur_fsuid = rec->cr_fsuid;
183 r->_ur_fsgid = rec->cr_fsgid;
184 r->_ur_cap = rec->cr_cap;
185 r->ur_fid1 = &rec->cr_fid;
186 r->ur_fid2 = &rec->cr_replayfid;
187 r->ur_mode = rec->cr_mode;
188 r->ur_rdev = rec->cr_rdev;
189 r->ur_time = rec->cr_time;
190 r->ur_flags = rec->cr_flags;
191 r->_ur_suppgid1 = rec->cr_suppgid;
192 r->_ur_suppgid2 = -1;
194 LASSERT_REQSWAB (req, offset + 1);
195 r->ur_name = lustre_msg_string (req->rq_reqmsg, offset + 1, 0);
196 if (r->ur_name == NULL)
198 r->ur_namelen = req->rq_reqmsg->buflens[offset + 1];
200 LASSERT_REQSWAB (req, offset + 2);
201 if (req->rq_reqmsg->bufcount > offset + 2) {
202 if (S_ISLNK(r->ur_mode)) {
203 r->ur_tgt = lustre_msg_string(req->rq_reqmsg,
205 if (r->ur_tgt == NULL)
207 r->ur_tgtlen = req->rq_reqmsg->buflens[offset + 2];
208 } else if (S_ISDIR(r->ur_mode)) {
209 /* Stripe info for mkdir - just a 16bit integer */
210 if (req->rq_reqmsg->buflens[offset + 2] != 2) {
211 CERROR("mkdir stripe info does not match "
212 "expected size %d vs 2\n",
213 req->rq_reqmsg->buflens[offset + 2]);
216 r->ur_eadata = lustre_swab_buf (req->rq_reqmsg,
217 offset + 2, 2, __swab16s);
218 r->ur_eadatalen = req->rq_reqmsg->buflens[offset + 2];
220 /* Hm, no other users so far? */
227 static int mds_link_unpack(struct ptlrpc_request *req, int offset,
228 struct mds_update_record *r)
230 struct mds_rec_link *rec;
233 rec = lustre_swab_reqbuf (req, offset, sizeof (*rec),
234 lustre_swab_mds_rec_link);
238 r->_ur_fsuid = rec->lk_fsuid;
239 r->_ur_fsgid = rec->lk_fsgid;
240 r->_ur_cap = rec->lk_cap;
241 r->_ur_suppgid1 = rec->lk_suppgid1;
242 r->_ur_suppgid2 = rec->lk_suppgid2;
243 r->ur_fid1 = &rec->lk_fid1;
244 r->ur_fid2 = &rec->lk_fid2;
245 r->ur_time = rec->lk_time;
247 LASSERT_REQSWAB (req, offset + 1);
248 r->ur_name = lustre_msg_string (req->rq_reqmsg, offset + 1, 0);
249 if (r->ur_name == NULL)
251 r->ur_namelen = req->rq_reqmsg->buflens[offset + 1];
255 static int mds_unlink_unpack(struct ptlrpc_request *req, int offset,
256 struct mds_update_record *r)
258 struct mds_rec_unlink *rec;
261 rec = lustre_swab_reqbuf (req, offset, sizeof (*rec),
262 lustre_swab_mds_rec_unlink);
266 r->_ur_fsuid = rec->ul_fsuid;
267 r->_ur_fsgid = rec->ul_fsgid;
268 r->_ur_cap = rec->ul_cap;
269 r->ur_mode = rec->ul_mode;
270 r->_ur_suppgid1 = rec->ul_suppgid;
271 r->_ur_suppgid2 = -1;
272 r->ur_fid1 = &rec->ul_fid1;
273 r->ur_fid2 = &rec->ul_fid2;
274 r->ur_time = rec->ul_time;
276 LASSERT_REQSWAB (req, offset + 1);
277 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
278 if (r->ur_name == NULL)
280 r->ur_namelen = req->rq_reqmsg->buflens[offset + 1];
284 static int mds_rename_unpack(struct ptlrpc_request *req, int offset,
285 struct mds_update_record *r)
287 struct mds_rec_rename *rec;
290 rec = lustre_swab_reqbuf (req, offset, sizeof (*rec),
291 lustre_swab_mds_rec_unlink);
295 r->_ur_fsuid = rec->rn_fsuid;
296 r->_ur_fsgid = rec->rn_fsgid;
297 r->_ur_cap = rec->rn_cap;
298 r->_ur_suppgid1 = rec->rn_suppgid1;
299 r->_ur_suppgid2 = rec->rn_suppgid2;
300 r->ur_fid1 = &rec->rn_fid1;
301 r->ur_fid2 = &rec->rn_fid2;
302 r->ur_time = rec->rn_time;
304 LASSERT_REQSWAB (req, offset + 1);
305 r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0);
306 if (r->ur_name == NULL)
308 r->ur_namelen = req->rq_reqmsg->buflens[offset + 1];
310 LASSERT_REQSWAB (req, offset + 2);
311 r->ur_tgt = lustre_msg_string(req->rq_reqmsg, offset + 2, 0);
312 if (r->ur_tgt == NULL)
314 r->ur_tgtlen = req->rq_reqmsg->buflens[offset + 2];
318 static int mds_open_unpack(struct ptlrpc_request *req, int offset,
319 struct mds_update_record *r)
321 struct mds_rec_create *rec;
324 rec = lustre_swab_reqbuf (req, offset, sizeof (*rec),
325 lustre_swab_mds_rec_create);
329 r->_ur_fsuid = rec->cr_fsuid;
330 r->_ur_fsgid = rec->cr_fsgid;
331 r->_ur_cap = rec->cr_cap;
332 r->ur_fid1 = &rec->cr_fid;
333 r->ur_fid2 = &rec->cr_replayfid;
334 r->ur_mode = rec->cr_mode;
335 r->ur_rdev = rec->cr_rdev;
336 r->ur_time = rec->cr_time;
337 r->ur_flags = rec->cr_flags;
338 r->_ur_suppgid1 = rec->cr_suppgid;
339 r->_ur_suppgid2 = -1;
341 LASSERT_REQSWAB (req, offset + 1);
342 r->ur_name = lustre_msg_string (req->rq_reqmsg, offset + 1, 0);
343 if (r->ur_name == NULL)
345 r->ur_namelen = req->rq_reqmsg->buflens[offset + 1];
347 LASSERT_REQSWAB (req, offset + 2);
348 if (req->rq_reqmsg->bufcount > offset + 2) {
349 r->ur_eadata = lustre_msg_buf(req->rq_reqmsg, offset + 2, 0);
350 if (r->ur_eadata == NULL)
352 r->ur_eadatalen = req->rq_reqmsg->buflens[offset + 2];
357 typedef int (*update_unpacker)(struct ptlrpc_request *req, int offset,
358 struct mds_update_record *r);
360 static update_unpacker mds_unpackers[REINT_MAX + 1] = {
361 [REINT_SETATTR] mds_setattr_unpack,
362 [REINT_CREATE] mds_create_unpack,
363 [REINT_LINK] mds_link_unpack,
364 [REINT_UNLINK] mds_unlink_unpack,
365 [REINT_RENAME] mds_rename_unpack,
366 [REINT_OPEN] mds_open_unpack,
369 int mds_update_unpack(struct ptlrpc_request *req, int offset,
370 struct mds_update_record *rec)
377 /* NB don't lustre_swab_reqbuf() here. We're just taking a peek
378 * and we want to leave it to the specific unpacker once we've
379 * identified the message type */
380 opcodep = lustre_msg_buf (req->rq_reqmsg, offset, sizeof (*opcodep));
385 if (lustre_msg_swabbed (req->rq_reqmsg))
388 if (opcode > REINT_MAX ||
389 mds_unpackers[opcode] == NULL) {
390 CERROR ("Unexpected opcode %d\n", opcode);
394 rec->ur_opcode = opcode;
395 rc = mds_unpackers[opcode](req, offset, rec);