1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (C) 2001-2003 Cluster File Systems, Inc. <info@clusterfs.com>
6 * This file is part of Lustre, http://www.lustre.org.
8 * Lustre is free software; you can redistribute it and/or
9 * modify it under the terms of version 2 of the GNU General Public
10 * License as published by the Free Software Foundation.
12 * Lustre is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Lustre; if not, write to the Free Software
19 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
21 * MDS data structures.
22 * See also lustre_idl.h for wire formats of requests.
30 # include <linux/fs.h>
31 # include <linux/dcache.h>
34 #include <linux/lustre_handles.h>
35 #include <linux/kp30.h>
36 #include <linux/lustre_idl.h>
37 #include <linux/lustre_lib.h>
38 #include <linux/lustre_dlm.h>
39 #include <linux/lustre_log.h>
40 #include <linux/lustre_export.h>
42 struct ldlm_lock_desc;
44 struct ptlrpc_connection;
47 struct ptlrpc_request;
/*
 * Name strings for the "mds", "mdt" and "mdc" components.
 * NOTE(review): presumably the type names these modules register under -
 * confirm against the users of these macros.
 */
51 #define LUSTRE_MDS_NAME "mds"
52 #define LUSTRE_MDT_NAME "mdt"
53 #define LUSTRE_MDC_NAME "mdc"
55 struct mds_update_record {
57 struct ll_fid *ur_fid1;
58 struct ll_fid *ur_fid2;
66 struct llog_cookie *ur_logcookies;
67 struct iattr ur_iattr;
68 struct lvfs_ucred ur_uc;
/*
 * Shorthand member names that reach into the ur_uc member (a struct
 * lvfs_ucred), so code can write rec->_ur_fsuid instead of
 * rec->ur_uc.luc_fsuid.  These are plain token substitutions: they are only
 * meaningful directly after `.' or `->' on an object that has a ur_uc member.
 */
75 #define _ur_fsuid ur_uc.luc_fsuid
76 #define _ur_fsgid ur_uc.luc_fsgid
77 #define _ur_cap ur_uc.luc_cap
78 #define _ur_suppgid1 ur_uc.luc_suppgid1
79 #define _ur_suppgid2 ur_uc.luc_suppgid2
81 /* i_attr_flags holds the open count in the inode in 2.4 */
82 //XXX Alex implement on 2.4 with i_attr_flags and find soln for 2.5 please
83 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(2,5,0))
84 # define mds_inode_oatomic(inode) ((atomic_t *)&(inode)->i_cindex)
86 # define mds_inode_oatomic(inode) ((atomic_t *)&(inode)->i_attr_flags)
/*
 * Accessors for the per-inode counter that mds_inode_oatomic() exposes as an
 * atomic_t (an inode field reinterpreted through a pointer cast):
 *   mds_open_orphan_count(inode)    - atomic_read() of the counter
 *   mds_open_orphan_inc(inode)      - atomic_inc() of the counter
 *   mds_open_orphan_dec_test(inode) - atomic_dec_and_test() of the counter
 * Each macro expands to a single call expression and evaluates 'inode' once.
 */
89 # define mds_open_orphan_count(inode) \
90 atomic_read(mds_inode_oatomic(inode))
91 # define mds_open_orphan_inc(inode) \
92 atomic_inc(mds_inode_oatomic(inode))
93 # define mds_open_orphan_dec_test(inode) \
94 atomic_dec_and_test(mds_inode_oatomic(inode))
/*
 * Orphan marker kept in (inode)->i_flags (bit 0x4000000).
 *
 *   mds_inode_is_orphan(inode)  - non-zero when the bit is set.  The result
 *                                 is the masked bit itself, not 0/1.
 *   mds_inode_set_orphan(inode) - sets the bit; as an expression it yields
 *                                 the updated i_flags value.
 *
 * Both expansions are fully parenthesized.  An unparenthesized `|=' would
 * absorb any operator that follows the macro at the call site into its
 * right-hand side (e.g. `mds_inode_set_orphan(i) & m' would become
 * `i_flags |= (0x4000000 & m)') and could silently skip setting the flag.
 */
#define mds_inode_is_orphan(inode)  ((inode)->i_flags & 0x4000000)
#define mds_inode_set_orphan(inode) ((inode)->i_flags |= 0x4000000)
/*
 * Size constants for the server and per-client data areas.
 * MDS_LR_SERVER_SIZE is the size that struct mds_server_data is padded out
 * to (see msd_padding) and MDS_LR_CLIENT_SIZE plays the same role for struct
 * mds_client_data (see mcd_padding).  The preprocessor check below rejects a
 * configuration in which MDS_LR_CLIENT_START is smaller than
 * MDS_LR_SERVER_SIZE.
 * NOTE(review): MDS_LR_CLIENT_START is presumably the byte offset of the
 * first client record in the last_rcvd file - confirm against the users.
 */
99 #define MDS_LR_SERVER_SIZE 512
101 #define MDS_LR_CLIENT_START 8192
102 #define MDS_LR_CLIENT_SIZE 128
103 #if MDS_LR_CLIENT_START < MDS_LR_SERVER_SIZE
104 #error "Can't have MDS_LR_CLIENT_START < MDS_LR_SERVER_SIZE"
/*
 * Miscellaneous MDS constants.
 * MDS_ROCOMPAT_SUPP is the OR of the MDS_ROCOMPAT_* bits defined here
 * (currently only MDS_ROCOMPAT_LOVOBJID); MDS_INCOMPAT_SUPP is an empty mask.
 * NOTE(review): these masks presumably pair with the msd_feature_rocompat and
 * msd_feature_incompat fields of struct mds_server_data - confirm.
 * NOTE(review): the meaning of MDS_CLIENT_SLOTS, REAL_MDS_NUMBER and
 * CACHE_MDS_NUMBER is not evident from this header - document at the users.
 */
107 #define MDS_CLIENT_SLOTS 17
109 #define MDS_ROCOMPAT_LOVOBJID 0x00000001
110 #define MDS_ROCOMPAT_SUPP (MDS_ROCOMPAT_LOVOBJID)
112 #define MDS_INCOMPAT_SUPP (0)
114 #define REAL_MDS_NUMBER 1
115 #define CACHE_MDS_NUMBER 0
117 /* Flags indicating whether the record comes from cmobd reint or
119 #define REC_REINT_CREATE 0x0001
121 /* Data stored per server at the head of the last_rcvd file. In le32 order.
122 * Try to keep this the same as fsd_server_data so we might one day merge. */
123 struct mds_server_data {
124 __u8 msd_uuid[40]; /* server UUID */
125 __u64 msd_last_transno; /* last completed transaction ID */
126 __u64 msd_mount_count; /* MDS incarnation number */
128 __u32 msd_feature_compat; /* compatible feature flags */
129 __u32 msd_feature_rocompat;/* read-only compatible feature flags */
130 __u32 msd_feature_incompat;/* incompatible feature flags */
131 __u32 msd_server_size; /* size of server data area */
132 __u32 msd_client_start; /* start of per-client data area */
133 __u16 msd_client_size; /* size of per-client data area */
134 __u16 msd_subdir_count; /* number of subdirectories for objects */
135 __u64 msd_catalog_oid; /* recovery catalog object id */
136 __u32 msd_catalog_ogen; /* recovery catalog inode generation */
137 __u8 msd_peeruuid[40]; /* UUID of LOV/OSC associated with MDS */
138 __u8 msd_padding[MDS_LR_SERVER_SIZE - 140];
141 /* Data stored per client in the last_rcvd file. In le32 order. */
/*
 * The named fields below occupy 64 bytes (40 + 8 + 8 + 4 + 4), each at a
 * naturally aligned offset; mcd_padding fills the rest of the record so that
 * the structure is MDS_LR_CLIENT_SIZE bytes long.  The literal 64 in the
 * padding expression must be updated whenever a field is added or resized.
 */
142 struct mds_client_data {
143 __u8 mcd_uuid[40]; /* client UUID */
144 __u64 mcd_last_transno; /* last completed transaction ID */
145 __u64 mcd_last_xid; /* xid for the last transaction */
146 __u32 mcd_last_result; /* result from last RPC */
147 __u32 mcd_last_data; /* per-op data (disposition for open &c.) */
148 __u8 mcd_padding[MDS_LR_CLIENT_SIZE - 64]; /* pad to MDS_LR_CLIENT_SIZE */
151 /* file data for open files on MDS */
152 struct mds_file_data {
153 struct portals_handle mfd_handle; /* must be first */
154 atomic_t mfd_refcount;
155 struct list_head mfd_list;
158 struct dentry *mfd_dentry;
161 /* mds/mds_reint.c */
/*
 * Takes the update record 'r', an integer 'offset', the request 'req' and a
 * lustre_handle pointer that is left unnamed in this prototype; returns int.
 * NOTE(review): presumably applies the record on behalf of 'req' and returns
 * 0 or a negative errno - confirm against the definition in mds_reint.c.
 */
162 int mds_reint_rec(struct mds_update_record *r, int offset,
163 struct ptlrpc_request *req, struct lustre_handle *);
/*
 * fid-to-dentry helpers and server-data update.
 *
 * mds_fid2locked_dentry() and mds_fid2dentry() both return a struct dentry
 * pointer for 'fid' and take a struct vfsmount ** argument; the locked
 * variant additionally takes a lock mode, a lock handle, an int *pmode, a
 * name with explicit length and a 64-bit 'lockpart'.  Note that the two take
 * different first arguments (struct obd_device * vs. struct mds_obd *).
 * NOTE(review): whether 'mnt' and 'pmode' are outputs, and how failure is
 * reported (NULL vs. ERR_PTR), is not visible here - confirm.
 *
 * mds_update_server_data() takes the device and a 'force_sync' flag.
 * NOTE(review): presumably writes struct mds_server_data back to last_rcvd,
 * synchronously when force_sync is non-zero - confirm.
 */
167 struct dentry *mds_fid2locked_dentry(struct obd_device *obd, struct ll_fid *fid,
168 struct vfsmount **mnt, int lock_mode,
169 struct lustre_handle *lockh, int *pmode,
170 char *name, int namelen, __u64 lockpart);
171 struct dentry *mds_fid2dentry(struct mds_obd *mds, struct ll_fid *fid,
172 struct vfsmount **mnt);
173 int mds_update_server_data(struct obd_device *, int force_sync);
/*
 * Paired setup/cleanup entry points operating on an obd_device.
 * mds_fs_setup() additionally receives the vfsmount; mds_fs_cleanup()
 * receives a 'failover' flag.  Both return int.
 * NOTE(review): presumably 0 on success and a negative errno on failure -
 * confirm against the definitions.
 */
176 int mds_fs_setup(struct obd_device *obddev, struct vfsmount *mnt);
177 int mds_fs_cleanup(struct obd_device *obddev, int failover);
182 /* mdc/mdc_locks.c */
/*
 * Intent and lock helpers.
 *
 * it_disposition() / it_set_disposition() query and set a 'flag' on a
 * lookup_intent; it_open_error() takes a 'phase' and the intent.
 * NOTE(review): the valid 'flag' and 'phase' values are defined elsewhere.
 *
 * mdc_set_lock_data() takes the lock handle as a raw __u64 *, unlike the
 * other prototypes in this header, which pass struct lustre_handle *.
 *
 * mdc_intent_lock() leaves three parameters unnamed (the struct ll_uctxt *,
 * the struct lookup_intent * and the int that follows it); see the
 * definition for their meaning.
 * NOTE(review): 'reqp' is presumably an output holding the request/reply -
 * confirm.
 */
183 int it_disposition(struct lookup_intent *it, int flag);
184 void it_set_disposition(struct lookup_intent *it, int flag);
185 int it_open_error(int phase, struct lookup_intent *it);
186 int mdc_set_lock_data(struct obd_export *exp, __u64 *lockh, void *data);
187 int mdc_change_cbdata(struct obd_export *exp, struct ll_fid *fid,
188 ldlm_iterator_t it, void *data);
189 int mdc_intent_lock(struct obd_export *exp, struct ll_uctxt *,
190 struct ll_fid *parent,
191 const char *name, int len, void *lmm, int lmmsize,
192 struct ll_fid *child,
193 struct lookup_intent *, int,
194 struct ptlrpc_request **reqp,
195 ldlm_blocking_callback cb_blocking);
196 int mdc_enqueue(struct obd_export *exp,
198 struct lookup_intent *it,
200 struct mdc_op_data *data,
201 struct lustre_handle *lockh,
204 ldlm_completion_callback cb_completion,
205 ldlm_blocking_callback cb_blocking,
208 /* mdc/mdc_request.c */
/*
 * Client-side metadata requests.  Every function here takes the export as
 * its first argument and returns int.
 *
 * mdc_req2lustre_md() takes two exports (exp_mdc and exp_osc), a request, an
 * 'offset' and a struct lustre_md to work on.
 * mdc_getattr() and mdc_getattr_name() take a 'valid' mask and an 'ea_size';
 * the _name variant also takes a file name with an explicit length.
 * mdc_setattr() accepts two opaque buffers (ea/ealen and ea2/ea2len).
 * mdc_open() identifies the file by inode number ('ino') rather than by fid.
 * NOTE(review): the struct ptlrpc_request ** arguments are presumably
 * outputs through which the caller receives the request - confirm, including
 * who is responsible for releasing it.
 */
209 int mdc_req2lustre_md(struct obd_export *exp_mdc, struct ptlrpc_request *req,
210 unsigned int offset, struct obd_export *exp_osc,
211 struct lustre_md *md);
212 int mdc_getstatus(struct obd_export *exp, struct ll_fid *rootfid);
213 int mdc_getattr(struct obd_export *exp, struct ll_fid *fid,
214 unsigned long valid, unsigned int ea_size,
215 struct ptlrpc_request **request);
216 int mdc_getattr_name(struct obd_export *exp, struct ll_fid *fid,
217 char *filename, int namelen, unsigned long valid,
218 unsigned int ea_size, struct ptlrpc_request **request);
219 int mdc_setattr(struct obd_export *exp, struct mdc_op_data *data,
220 struct iattr *iattr, void *ea, int ealen, void *ea2, int ea2len,
221 struct ptlrpc_request **request);
222 int mdc_open(struct obd_export *exp, obd_id ino, int type, int flags,
223 struct lov_mds_md *lmm, int lmm_size, struct lustre_handle *fh,
224 struct ptlrpc_request **);
/*
 * Open-handle related calls.  struct obd_client_handle is only forward
 * declared here because these prototypes use it by pointer.
 *
 * mdc_set_open_replay_data() associates a client handle with the open
 * request passed in; mdc_clear_open_replay_data() takes only the handle.
 * mdc_close() leaves all of its parameters unnamed.
 * NOTE(review): the set/clear pair is presumably used to keep an open
 * request available for replay until the handle is closed - confirm.
 */
225 struct obd_client_handle;
226 int mdc_set_open_replay_data(struct obd_export *exp,
227 struct obd_client_handle *och,
228 struct ptlrpc_request *open_req);
229 int mdc_clear_open_replay_data(struct obd_export *exp,
230 struct obd_client_handle *och);
231 int mdc_close(struct obd_export *, struct obdo *, struct obd_client_handle *,
232 struct ptlrpc_request **);
/*
 * Namespace operations (readpage, create, unlink, link, rename, sync).
 * The create/unlink/link/rename calls take their arguments bundled in a
 * struct mdc_op_data; mdc_rename() additionally takes the old and new names
 * with explicit lengths.  mdc_readpage() has an unnamed __u64 and an unnamed
 * struct page * parameter.
 * NOTE(review): the unnamed __u64 of mdc_readpage() is presumably the
 * directory offset to read - confirm against the definition.
 *
 * mdc_create_client() receives its struct obd_uuid argument by value, so the
 * whole structure is copied at each call.
 */
233 int mdc_readpage(struct obd_export *exp, struct ll_fid *mdc_fid,
234 __u64, struct page *, struct ptlrpc_request **);
235 int mdc_create(struct obd_export *exp, struct mdc_op_data *op_data,
236 const void *data, int datalen, int mode, __u32 uid, __u32 gid,
237 __u64 rdev, struct ptlrpc_request **request);
238 int mdc_unlink(struct obd_export *exp, struct mdc_op_data *data,
239 struct ptlrpc_request **request);
240 int mdc_link(struct obd_export *exp, struct mdc_op_data *data,
241 struct ptlrpc_request **);
242 int mdc_rename(struct obd_export *exp, struct mdc_op_data *data,
243 const char *old, int oldlen, const char *new, int newlen,
244 struct ptlrpc_request **request);
245 int mdc_sync(struct obd_export *exp, struct ll_fid *fid,
246 struct ptlrpc_request **);
247 int mdc_create_client(struct obd_uuid uuid, struct ptlrpc_client *cl);
249 /* Store the generation of a newly-created inode in |req| for replay. */
/*
 * 'reqoff' and 'repoff' are integer offsets.
 * NOTE(review): presumably buffer indices into the request and the reply
 * message respectively - confirm against the definition.
 */
250 int mdc_store_inode_generation(struct obd_export *exp, struct ptlrpc_request *req,
251 int reqoff, int repoff);
/*
 * mdc_llog_process() takes a log name, an llog_cb_t callback and an opaque
 * 'data' pointer.
 * NOTE(review): presumably 'data' is handed to the callback for each record
 * of the named log - confirm.
 */
252 int mdc_llog_process(struct obd_export *, char *logname, llog_cb_t, void *data);
/* mdc_done_writing() takes the export and a struct obdo; both return int. */
253 int mdc_done_writing(struct obd_export *exp, struct obdo *);
254 int mdc_reint(struct ptlrpc_request *request, struct mdc_rpc_lock *rpc_lock,
256 static inline void mdc_pack_fid(struct ll_fid *fid, obd_id ino, __u32 gen,
260 fid->generation = gen;
/*
 * ioctls for trying requests.
 *
 * All commands share the IOC_REQUEST_TYPE magic character and are numbered
 * consecutively from IOC_REQUEST_MIN_NR up to IOC_REQUEST_MAX_NR.  The
 * command definitions are derived from those two constants instead of
 * repeating the literals, so the range bounds and the commands cannot drift
 * apart.  The encoded command values are unchanged.
 *
 * When adding a command, give it the next offset and bump
 * IOC_REQUEST_MAX_NR accordingly.
 */
#define IOC_REQUEST_TYPE     'f'
#define IOC_REQUEST_MIN_NR   30

#define IOC_REQUEST_GETATTR  _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 0, long)
#define IOC_REQUEST_READPAGE _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 1, long)
#define IOC_REQUEST_SETATTR  _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 2, long)
#define IOC_REQUEST_CREATE   _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 3, long)
#define IOC_REQUEST_OPEN     _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 4, long)
#define IOC_REQUEST_CLOSE    _IOWR(IOC_REQUEST_TYPE, IOC_REQUEST_MIN_NR + 5, long)
#define IOC_REQUEST_MAX_NR   (IOC_REQUEST_MIN_NR + 5)
276 #define MDS_CHECK_RESENT(req, reconstruct) \
278 if (lustre_msg_get_flags(req->rq_reqmsg) & MSG_RESENT) { \
279 struct mds_client_data *mcd = \
280 req->rq_export->exp_mds_data.med_mcd; \
281 if (mcd->mcd_last_xid == req->rq_xid) { \
285 DEBUG_REQ(D_HA, req, "no reply for RESENT req (have "LPD64")", \
286 mcd->mcd_last_xid); \