/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*- * vim:expandtab:shiftwidth=8:tabstop=8: * * Copyright (c) 2003 Cluster File Systems, Inc. * * This file is part of the Lustre file system, http://www.lustre.org * Lustre is a trademark of Cluster File Systems, Inc. * * You may have signed or agreed to another license before downloading * this software. If so, you are bound by the terms and conditions * of that agreement, and the following does not apply to you. See the * LICENSE file included with this distribution for more information. * * If you did not agree to a different license, then this copy of Lustre * is open source software; you can redistribute it and/or modify it * under the terms of version 2 of the GNU General Public License as * published by the Free Software Foundation. * * In either case, Lustre is distributed in the hope that it will be * useful, but WITHOUT ANY WARRANTY; without even the implied warranty * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * license text for more details. */ #define DEBUG_SUBSYSTEM S_MDS #ifndef AUTOCONF_INCLUDED #include #endif #include #include #include #include #include #include #include #include // for wait_on_buffer #include #include #include #include #include #include #include #include #include #include #include "mds_internal.h" void mds_pack_inode2fid(struct ll_fid *fid, struct inode *inode) { fid->id = inode->i_ino; fid->generation = inode->i_generation; fid->f_type = (S_IFMT & inode->i_mode); } /* Note that we can copy all of the fields, just some will not be "valid" */ void mds_pack_inode2body(struct mds_body *b, struct inode *inode) { b->valid |= OBD_MD_FLID | OBD_MD_FLCTIME | OBD_MD_FLUID | OBD_MD_FLGID | OBD_MD_FLFLAGS | OBD_MD_FLTYPE | OBD_MD_FLMODE | OBD_MD_FLNLINK | OBD_MD_FLGENER | OBD_MD_FLATIME | OBD_MD_FLMTIME; /* bug 2020 */ if (!S_ISREG(inode->i_mode)) b->valid |= OBD_MD_FLSIZE | OBD_MD_FLBLOCKS | OBD_MD_FLATIME | OBD_MD_FLMTIME | OBD_MD_FLRDEV; b->ino = inode->i_ino; b->atime = LTIME_S(inode->i_atime); b->mtime = LTIME_S(inode->i_mtime); b->ctime = LTIME_S(inode->i_ctime); b->mode = inode->i_mode; b->size = i_size_read(inode); b->blocks = inode->i_blocks; b->uid = inode->i_uid; b->gid = inode->i_gid; b->flags = ll_inode_to_ext_flags(b->flags, inode->i_flags); b->rdev = inode->i_rdev; /* Return the correct link count for orphan inodes */ b->nlink = mds_inode_is_orphan(inode) ? 0 : inode->i_nlink; b->generation = inode->i_generation; b->suppgid = -1; } static inline unsigned int attr_unpack(__u64 sa_valid) { unsigned int ia_valid = 0; if (sa_valid & MDS_ATTR_MODE) ia_valid |= ATTR_MODE; if (sa_valid & MDS_ATTR_UID) ia_valid |= ATTR_UID; if (sa_valid & MDS_ATTR_GID) ia_valid |= ATTR_GID; if (sa_valid & MDS_ATTR_SIZE) ia_valid |= ATTR_SIZE; if (sa_valid & MDS_ATTR_ATIME) ia_valid |= ATTR_ATIME; if (sa_valid & MDS_ATTR_MTIME) ia_valid |= ATTR_MTIME; if (sa_valid & MDS_ATTR_CTIME) ia_valid |= ATTR_CTIME; if (sa_valid & MDS_ATTR_ATIME_SET) ia_valid |= ATTR_ATIME_SET; if (sa_valid & MDS_ATTR_MTIME_SET) ia_valid |= ATTR_MTIME_SET; if (sa_valid & MDS_ATTR_FORCE) ia_valid |= ATTR_FORCE; if (sa_valid & MDS_ATTR_ATTR_FLAG) ia_valid |= ATTR_ATTR_FLAG; if (sa_valid & MDS_ATTR_KILL_SUID) ia_valid |= ATTR_KILL_SUID; if (sa_valid & MDS_ATTR_KILL_SGID) ia_valid |= ATTR_KILL_SGID; if (sa_valid & MDS_ATTR_CTIME_SET) ia_valid |= ATTR_CTIME_SET; if (sa_valid & MDS_ATTR_FROM_OPEN) ia_valid |= ATTR_FROM_OPEN; if (sa_valid & MDS_ATTR_BLOCKS) ia_valid |= ATTR_BLOCKS; return ia_valid; } /* unpacking */ static int mds_setattr_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct iattr *attr = &r->ur_iattr; struct mds_rec_setattr *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof(*rec), lustre_swab_mds_rec_setattr); if (rec == NULL) RETURN (-EFAULT); r->ur_uc.luc_fsuid = rec->sa_fsuid; r->ur_uc.luc_fsgid = rec->sa_fsgid; r->ur_uc.luc_cap = rec->sa_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->sa_suppgid; r->ur_uc.luc_suppgid2 = -1; #endif r->ur_fid1 = &rec->sa_fid; attr->ia_valid = attr_unpack(rec->sa_valid); attr->ia_mode = rec->sa_mode; attr->ia_uid = rec->sa_uid; attr->ia_gid = rec->sa_gid; attr->ia_size = rec->sa_size; LTIME_S(attr->ia_atime) = rec->sa_atime; LTIME_S(attr->ia_mtime) = rec->sa_mtime; LTIME_S(attr->ia_ctime) = rec->sa_ctime; r->ur_flags = rec->sa_attr_flags; lustre_set_req_swabbed(req, offset + 1); r->ur_eadatalen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); if (r->ur_eadatalen) { r->ur_eadata = lustre_msg_buf(req->rq_reqmsg, offset + 1, 0); if (r->ur_eadata == NULL) RETURN(-EFAULT); } r->ur_cookielen = lustre_msg_buflen(req->rq_reqmsg, offset + 2); if (r->ur_cookielen) { r->ur_logcookies = lustre_msg_buf(req->rq_reqmsg, offset + 2,0); if (r->ur_eadata == NULL) RETURN (-EFAULT); } if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) { r->ur_dlm = lustre_swab_reqbuf(req, offset + 3, sizeof(*r->ur_dlm), lustre_swab_ldlm_request); if (r->ur_dlm == NULL) RETURN (-EFAULT); } RETURN(0); } static int mds_create_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct mds_rec_create *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof (*rec), lustre_swab_mds_rec_create); if (rec == NULL) RETURN (-EFAULT); r->ur_uc.luc_fsuid = rec->cr_fsuid; r->ur_uc.luc_fsgid = rec->cr_fsgid; r->ur_uc.luc_cap = rec->cr_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->cr_suppgid; r->ur_uc.luc_suppgid2 = -1; #endif r->ur_fid1 = &rec->cr_fid; r->ur_fid2 = &rec->cr_replayfid; r->ur_mode = rec->cr_mode; r->ur_rdev = rec->cr_rdev; r->ur_time = rec->cr_time; r->ur_flags = rec->cr_flags; lustre_set_req_swabbed(req, offset + 1); r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0); if (r->ur_name == NULL) RETURN (-EFAULT); r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); lustre_set_req_swabbed(req, offset + 2); r->ur_tgtlen = lustre_msg_buflen(req->rq_reqmsg, offset + 2); if (r->ur_tgtlen) { /* NB for now, we only seem to pass NULL terminated symlink * target strings here. If this ever changes, we'll have * to stop checking for a buffer filled completely with a * NULL terminated string here, and make the callers check * depending on what they expect. We should probably stash * it in r->ur_eadata in that case, so it's obvious... -eeb */ r->ur_tgt = lustre_msg_string(req->rq_reqmsg, offset + 2, 0); if (r->ur_tgt == NULL) RETURN (-EFAULT); } if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) { r->ur_dlm = lustre_swab_reqbuf(req, offset + 3, sizeof(*r->ur_dlm), lustre_swab_ldlm_request); if (r->ur_dlm == NULL) RETURN (-EFAULT); } RETURN(0); } static int mds_link_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct mds_rec_link *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof (*rec), lustre_swab_mds_rec_link); if (rec == NULL) RETURN (-EFAULT); r->ur_uc.luc_fsuid = rec->lk_fsuid; r->ur_uc.luc_fsgid = rec->lk_fsgid; r->ur_uc.luc_cap = rec->lk_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->lk_suppgid1; r->ur_uc.luc_suppgid2 = rec->lk_suppgid2; #endif r->ur_fid1 = &rec->lk_fid1; r->ur_fid2 = &rec->lk_fid2; r->ur_time = rec->lk_time; lustre_set_req_swabbed(req, offset + 1); r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0); if (r->ur_name == NULL) RETURN (-EFAULT); r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); if (lustre_msg_buflen(req->rq_reqmsg, offset + 2)) { r->ur_dlm = lustre_swab_reqbuf(req, offset + 2, sizeof(*r->ur_dlm), lustre_swab_ldlm_request); if (r->ur_dlm == NULL) RETURN (-EFAULT); } RETURN(0); } static int mds_unlink_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct mds_rec_unlink *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof (*rec), lustre_swab_mds_rec_unlink); if (rec == NULL) RETURN(-EFAULT); r->ur_uc.luc_fsuid = rec->ul_fsuid; r->ur_uc.luc_fsgid = rec->ul_fsgid; r->ur_uc.luc_cap = rec->ul_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->ul_suppgid; r->ur_uc.luc_suppgid2 = -1; #endif r->ur_mode = rec->ul_mode; r->ur_fid1 = &rec->ul_fid1; r->ur_fid2 = &rec->ul_fid2; r->ur_time = rec->ul_time; lustre_set_req_swabbed(req, offset + 1); r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0); if (r->ur_name == NULL) RETURN(-EFAULT); r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); if (lustre_msg_buflen(req->rq_reqmsg, offset + 2)) { r->ur_dlm = lustre_swab_reqbuf(req, offset + 2, sizeof(*r->ur_dlm), lustre_swab_ldlm_request); if (r->ur_dlm == NULL) RETURN (-EFAULT); } RETURN(0); } static int mds_rename_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct mds_rec_rename *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof (*rec), lustre_swab_mds_rec_rename); if (rec == NULL) RETURN(-EFAULT); r->ur_uc.luc_fsuid = rec->rn_fsuid; r->ur_uc.luc_fsgid = rec->rn_fsgid; r->ur_uc.luc_cap = rec->rn_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->rn_suppgid1; r->ur_uc.luc_suppgid2 = rec->rn_suppgid2; #endif r->ur_fid1 = &rec->rn_fid1; r->ur_fid2 = &rec->rn_fid2; r->ur_time = rec->rn_time; lustre_set_req_swabbed(req, offset + 1); r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0); if (r->ur_name == NULL) RETURN(-EFAULT); r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); lustre_set_req_swabbed(req, offset + 2); r->ur_tgt = lustre_msg_string(req->rq_reqmsg, offset + 2, 0); if (r->ur_tgt == NULL) RETURN(-EFAULT); r->ur_tgtlen = lustre_msg_buflen(req->rq_reqmsg, offset + 2); if (lustre_msg_buflen(req->rq_reqmsg, offset + 3)) { r->ur_dlm = lustre_swab_reqbuf(req, offset + 3, sizeof(*r->ur_dlm), lustre_swab_ldlm_request); if (r->ur_dlm == NULL) RETURN (-EFAULT); } RETURN(0); } static int mds_open_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *r) { struct mds_rec_create *rec; ENTRY; rec = lustre_swab_reqbuf(req, offset, sizeof(*rec), lustre_swab_mds_rec_create); if (rec == NULL) RETURN(-EFAULT); r->ur_uc.luc_fsuid = rec->cr_fsuid; r->ur_uc.luc_fsgid = rec->cr_fsgid; r->ur_uc.luc_cap = rec->cr_cap; #if 0 r->ur_uc.luc_suppgid1 = rec->cr_suppgid; r->ur_uc.luc_suppgid2 = -1; #endif r->ur_fid1 = &rec->cr_fid; r->ur_fid2 = &rec->cr_replayfid; r->ur_mode = rec->cr_mode; r->ur_rdev = rec->cr_rdev; r->ur_time = rec->cr_time; r->ur_flags = rec->cr_flags; lustre_set_req_swabbed(req, offset + 1); r->ur_name = lustre_msg_string(req->rq_reqmsg, offset + 1, 0); if (r->ur_name == NULL) RETURN(-EFAULT); r->ur_namelen = lustre_msg_buflen(req->rq_reqmsg, offset + 1); lustre_set_req_swabbed(req, offset + 2); r->ur_eadatalen = lustre_msg_buflen(req->rq_reqmsg, offset + 2); if (r->ur_eadatalen) { r->ur_eadata = lustre_msg_buf(req->rq_reqmsg, offset + 2, 0); if (r->ur_eadata == NULL) RETURN (-EFAULT); } RETURN(0); } typedef int (*update_unpacker)(struct ptlrpc_request *req, int offset, struct mds_update_record *r); static update_unpacker mds_unpackers[REINT_MAX] = { [REINT_SETATTR] mds_setattr_unpack, [REINT_CREATE] mds_create_unpack, [REINT_LINK] mds_link_unpack, [REINT_UNLINK] mds_unlink_unpack, [REINT_RENAME] mds_rename_unpack, [REINT_OPEN] mds_open_unpack, }; int mds_update_unpack(struct ptlrpc_request *req, int offset, struct mds_update_record *rec) { mds_reint_t opcode, *opcodep; int rc; ENTRY; /* NB don't lustre_swab_reqbuf() here. We're just taking a peek * and we want to leave it to the specific unpacker once we've * identified the message type */ opcodep = lustre_msg_buf(req->rq_reqmsg, offset, sizeof (*opcodep)); if (opcodep == NULL) RETURN(-EFAULT); opcode = *opcodep; if (lustre_msg_swabbed(req->rq_reqmsg)) __swab32s(&opcode); if (opcode >= REINT_MAX || mds_unpackers[opcode] == NULL) { CERROR("Unexpected opcode %d\n", opcode); RETURN(-EFAULT); } rec->ur_opcode = opcode; rc = mds_unpackers[opcode](req, offset, rec); RETURN(rc); } int mds_init_ucred(struct lvfs_ucred *ucred, struct ptlrpc_request *req, int offset) { struct mds_body *body = lustre_msg_buf(req->rq_reqmsg, offset, sizeof(*body)); #if 0 struct mds_obd *mds = mds_req2mds(req); int rc; #endif LASSERT(body != NULL); /* previously verified & swabbed by caller */ #ifdef CRAY_XT3 if (req->rq_uid != LNET_UID_ANY) { /* Non-root local cluster client */ LASSERT (req->rq_uid != 0); ucred->luc_fsuid = req->rq_uid; } else #endif { ucred->luc_fsuid = body->fsuid; ucred->luc_fsgid = body->fsgid; ucred->luc_cap = body->capability; } #if 0 ucred->luc_uce = upcall_cache_get_entry(mds->mds_group_hash, ucred->luc_fsuid, ucred->luc_fsgid, 1, &body->suppgid); if (IS_ERR(ucred->luc_uce)) { rc = PTR_ERR(ucred->luc_uce); ucred->luc_uce = NULL; return rc; } #ifdef CRAY_XT3 if (ucred->luc_uce) ucred->luc_fsgid = ucred->luc_uce->ue_primary; #endif #endif return 0; } void mds_exit_ucred(struct lvfs_ucred *ucred, struct mds_obd *mds) { #if 0 upcall_cache_put_entry(mds->mds_group_hash, ucred->luc_uce); #endif }