/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
* vim:expandtab:shiftwidth=8:tabstop=8:
*
- * Copyright (C) 2001 Cluster File Systems, Inc. <braam@clusterfs.com>
+ * Copyright (C) 2001-2003 Cluster File Systems, Inc. <info@clusterfs.com>
*
* This file is part of Lustre, http://www.lustre.org.
*
* along with Lustre; if not, write to the Free Software
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*
- * MDS data structures.
+ * MDS data structures.
* See also lustre_idl.h for wire formats of requests.
*
*/
#ifndef _LUSTRE_MDS_H
#define _LUSTRE_MDS_H
+#ifdef __KERNEL__
+# include <linux/fs.h>
+# include <linux/dcache.h>
+#endif
-#include <linux/obd_support.h>
+#include <linux/lustre_handles.h>
+#include <linux/kp30.h>
#include <linux/lustre_idl.h>
-#include <linux/lustre_net.h>
+#include <linux/lustre_lib.h>
+#include <linux/lustre_dlm.h>
+#include <linux/lustre_log.h>
+#include <linux/lustre_export.h>
-static inline void l_dput(struct dentry *de)
-{
- if (!de || IS_ERR(de))
- return;
- dput(de);
-}
-
-struct mds_run_ctxt {
- struct vfsmount *pwdmnt;
- struct dentry *pwd;
- mm_segment_t fs;
-};
+struct ldlm_lock_desc;
+struct mds_obd;
+struct ptlrpc_connection;
+struct ptlrpc_client;
+struct obd_export;
+struct ptlrpc_request;
+struct obd_device;
+struct ll_file_data;
-#define MDS_UNMOUNT 1
#define LUSTRE_MDS_NAME "mds"
+#define LUSTRE_MDT_NAME "mdt"
+#define LUSTRE_MDC_NAME "mdc"
-struct mds_obd {
- char *mds_fstype;
- struct task_struct *mds_thread;
- __u32 mds_remote_nid;
- wait_queue_head_t mds_waitq;
- wait_queue_head_t mds_done_waitq;
- struct timer_list *mds_timer;
- int mds_interval;
- int mds_flags;
- struct list_head mds_reqs;
- struct super_block * mds_sb;
- struct vfsmount *mds_vfsmnt;
- struct mds_run_ctxt mds_ctxt;
- spinlock_t mds_lock;
- __u64 mds_lastino;
- struct file_operations *mds_fop;
- struct inode_operations *mds_iop;
- struct address_space_operations *mds_aops;
-
- struct ptlrpc_service *mds_service;
-};
-
-
-struct mds_update_record {
- __u32 ur_reclen;
+struct mds_update_record { /* update record; mds_reint_rec() takes a pointer to one */
__u32 ur_opcode;
struct ll_fid *ur_fid1;
struct ll_fid *ur_fid2;
char *ur_name;
int ur_tgtlen; /* presumably the length of ur_tgt -- confirm */
char *ur_tgt;
+ int ur_eadatalen; /* presumably the length of ur_eadata -- confirm */
+ void *ur_eadata;
+ int ur_cookielen; /* presumably the size of ur_logcookies -- confirm */
+ struct llog_cookie *ur_logcookies;
struct iattr ur_iattr;
- __u64 ur_id;
+ struct lvfs_ucred ur_uc; /* credentials; members are reachable via the _ur_* shorthands */
+ __u64 ur_rdev;
__u32 ur_mode;
- __u32 ur_uid;
- __u32 ur_gid;
__u64 ur_time;
-};
+ __u32 ur_flags;
+};
-/* mds/mds_pack.c */
-void *mds_req_tgt(struct mds_req *req);
-int mds_pack_req(char *name, int namelen, char *tgt, int tgtlen, struct ptlreq_hdr **hdr, struct mds_req **req, int *len, char **buf);
-int mds_unpack_req(char *buf, int len, struct ptlreq_hdr **hdr, struct mds_req **req);
-int mds_pack_rep(char *name, int namelen, char *tgt, int tgtlen, struct ptlrep_hdr **hdr, struct mds_rep **rep, int *len, char **buf);
-int mds_unpack_rep(char *buf, int len, struct ptlrep_hdr **hdr, struct mds_rep **rep);
+#define _ur_fsuid ur_uc.luc_fsuid /* _ur_*: member shorthands, e.g. rec->_ur_fsuid is rec->ur_uc.luc_fsuid */
+#define _ur_fsgid ur_uc.luc_fsgid
+#define _ur_cap ur_uc.luc_cap
+#define _ur_suppgid1 ur_uc.luc_suppgid1
+#define _ur_suppgid2 ur_uc.luc_suppgid2
-/* mds/mds_reint.c */
-int mds_reint_rec(struct mds_update_record *r, struct ptlrpc_request *req);
+/* i_attr_flags holds the open count in the inode in 2.4.
+ *
+ * mds_inode_oatomic() yields a pointer to that counter by casting the
+ * address of an existing inode field to atomic_t *: i_cindex when
+ * LINUX_VERSION_CODE >= 2.5.0, i_attr_flags otherwise.
+ *
+ * The mds_open_orphan_*() helpers below operate on that counter:
+ *   mds_open_orphan_count()    - atomic_read() of the counter
+ *   mds_open_orphan_inc()      - atomic_inc() of the counter
+ *   mds_open_orphan_dec_test() - atomic_dec_and_test() of the counter
+ */
+//XXX Alex: implement on 2.4 with i_attr_flags and find a solution for 2.5 please
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(2,5,0))
+# define mds_inode_oatomic(inode) ((atomic_t *)&(inode)->i_cindex)
+#else
+# define mds_inode_oatomic(inode) ((atomic_t *)&(inode)->i_attr_flags)
+#endif
+
+# define mds_open_orphan_count(inode) \
+ atomic_read(mds_inode_oatomic(inode))
+# define mds_open_orphan_inc(inode) \
+ atomic_inc(mds_inode_oatomic(inode))
+# define mds_open_orphan_dec_test(inode) \
+ atomic_dec_and_test(mds_inode_oatomic(inode))
+
+/* Orphan marker: bit 0x4000000 of inode->i_flags.
+ *   mds_inode_is_orphan(inode)  - non-zero when the bit is set
+ *   mds_inode_set_orphan(inode) - sets the bit; evaluates to the new i_flags
+ * Both expansions are fully parenthesized so that they keep their meaning
+ * when used inside a larger expression (e.g. next to ==, & or ?:). */
+#define mds_inode_is_orphan(inode) ((inode)->i_flags & 0x4000000)
+#define mds_inode_set_orphan(inode) ((inode)->i_flags |= 0x4000000)
+
+#define MDS_LR_SERVER_SIZE 512 /* struct mds_server_data is padded out to this many bytes */
+
+#define MDS_LR_CLIENT_START 8192 /* must not be smaller than MDS_LR_SERVER_SIZE (checked below) */
+#define MDS_LR_CLIENT_SIZE 128 /* struct mds_client_data is padded out to this many bytes */
+#if MDS_LR_CLIENT_START < MDS_LR_SERVER_SIZE
+#error "Can't have MDS_LR_CLIENT_START < MDS_LR_SERVER_SIZE"
+#endif /* MDS_LR_CLIENT_START < MDS_LR_SERVER_SIZE */
+
+#define MDS_CLIENT_SLOTS 17
+
+#define MDS_ROCOMPAT_LOVOBJID 0x00000001
+#define MDS_ROCOMPAT_SUPP (MDS_ROCOMPAT_LOVOBJID) /* mask of the MDS_ROCOMPAT_* flags listed above */
+
+#define MDS_INCOMPAT_SUPP (0) /* empty mask */
-/* lib/mds_updates.c */
-int mds_update_unpack(char *buf, int len, struct mds_update_record *r);
+#define REAL_MDS_NUMBER 1
+#define CACHE_MDS_NUMBER 0
-void mds_setattr_pack(struct mds_rec_setattr *rec, struct inode *inode, struct iattr *iattr);
-void mds_create_pack(struct mds_rec_create *rec, struct inode *inode, const char *name, int namelen, __u32 mode, __u64 id, __u32 uid, __u32 gid, __u64 time, const char *tgt, int tgtlen);
-void mds_unlink_pack(struct mds_rec_unlink *rec, struct inode *inode, const char *name, int namelen);
-void mds_link_pack(struct mds_rec_link *rec, struct inode *inode, struct inode *dir, const char *name, int namelen);
-void mds_rename_pack(struct mds_rec_rename *rec, struct inode *srcdir, struct inode *tgtdir, const char *name, int namelen, const char *tgt, int tgtlen);
+/* Flags indicating whether a record comes from a cmobd reint or from an
+ mdc create. */
+#define REC_REINT_CREATE 0x0001
+
+/* Data stored per server at the head of the last_rcvd file. In le32 order.
+ * Try to keep this the same as fsd_server_data so we might one day merge.
+ *
+ * The named fields below add up to 140 bytes; msd_padding fills the
+ * record out to MDS_LR_SERVER_SIZE bytes.  Adding a field means adjusting
+ * the constant in the msd_padding declaration accordingly. */
+struct mds_server_data {
+ __u8 msd_uuid[40]; /* server UUID */
+ __u64 msd_last_transno; /* last completed transaction ID */
+ __u64 msd_mount_count; /* MDS incarnation number */
+ __u64 msd_unused;
+ __u32 msd_feature_compat; /* compatible feature flags */
+ __u32 msd_feature_rocompat;/* read-only compatible feature flags */
+ __u32 msd_feature_incompat;/* incompatible feature flags */
+ __u32 msd_server_size; /* size of server data area */
+ __u32 msd_client_start; /* start of per-client data area */
+ __u16 msd_client_size; /* size of per-client data area */
+ __u16 msd_subdir_count; /* number of subdirectories for objects */
+ __u64 msd_catalog_oid; /* recovery catalog object id */
+ __u32 msd_catalog_ogen; /* recovery catalog inode generation */
+ __u8 msd_peeruuid[40]; /* UUID of LOV/OSC associated with MDS */
+ __u8 msd_padding[MDS_LR_SERVER_SIZE - 140]; /* 140 = bytes used by the fields above */
+};
+
+/* Data stored per client in the last_rcvd file. In le32 order.
+ *
+ * The named fields below add up to 64 bytes; mcd_padding fills the
+ * record out to MDS_LR_CLIENT_SIZE bytes. */
+struct mds_client_data {
+ __u8 mcd_uuid[40]; /* client UUID */
+ __u64 mcd_last_transno; /* last completed transaction ID */
+ __u64 mcd_last_xid; /* xid for the last transaction */
+ __u32 mcd_last_result; /* result from last RPC */
+ __u32 mcd_last_data; /* per-op data (disposition for open &c.) */
+ __u8 mcd_padding[MDS_LR_CLIENT_SIZE - 64]; /* 64 = bytes used by the fields above */
+};
+
+/* File data for open files on MDS.
+ * mfd_handle has to remain the first member of the structure. */
+struct mds_file_data {
+ struct portals_handle mfd_handle; /* must be first */
+ atomic_t mfd_refcount; /* presumably a reference count on this structure -- confirm */
+ struct list_head mfd_list; /* list linkage; the owning list is not visible in this header */
+ __u64 mfd_xid;
+ int mfd_mode;
+ struct dentry *mfd_dentry; /* presumably the dentry of the opened file -- confirm */
+};
+
+/* mds/mds_reint.c */
+int mds_reint_rec(struct mds_update_record *r, int offset,
+ struct ptlrpc_request *req, struct lustre_handle *);
/* mds/handler.c */
-struct dentry *mds_fid2dentry(struct mds_obd *mds, struct ll_fid *fid, struct vfsmount **mnt);
-
-/* llight/request.c */
-int mdc_getattr(struct lustre_peer *peer, ino_t ino, int type, int valid,
- struct mds_rep **mds_reply, struct ptlrep_hdr **hdr);
-int mdc_setattr(struct lustre_peer *peer, struct inode *inode,
- struct iattr *iattr, struct mds_rep **mds_reply,
- struct ptlrep_hdr **hdr);
-int mdc_readpage(struct lustre_peer *peer, ino_t ino, int type, __u64 offset,
- char *addr, struct mds_rep **rep, struct ptlrep_hdr **hdr);
-int mdc_create(struct lustre_peer *peer,
- struct inode *dir, const char *name, int namelen,
- const char *tgt, int tgtlen,
- int mode, __u64 id, __u32 uid, __u32 gid, __u64 time,
- struct mds_rep **rep, struct ptlrep_hdr **hdr);
-int mdc_unlink(struct lustre_peer *peer,
- struct inode *dir, const char *name, int namelen,
- struct mds_rep **rep, struct ptlrep_hdr **hdr);
-int mdc_link(struct lustre_peer *peer, struct dentry *src,
- struct inode *dir, const char *name, int namelen,
- struct mds_rep **rep, struct ptlrep_hdr **hdr);
-int mdc_rename(struct lustre_peer *peer, struct inode *src,
- struct inode *tgt, const char *old, int oldlen,
- const char *new, int newlen,
- struct mds_rep **rep, struct ptlrep_hdr **hdr);
+#ifdef __KERNEL__
+struct dentry *mds_fid2locked_dentry(struct obd_device *obd, struct ll_fid *fid,
+ struct vfsmount **mnt, int lock_mode,
+ struct lustre_handle *lockh, int *pmode,
+ char *name, int namelen, __u64 lockpart);
+struct dentry *mds_fid2dentry(struct mds_obd *mds, struct ll_fid *fid,
+ struct vfsmount **mnt);
+int mds_update_server_data(struct obd_device *, int force_sync);
+
+/* mds/mds_fs.c */
+int mds_fs_setup(struct obd_device *obddev, struct vfsmount *mnt);
+int mds_fs_cleanup(struct obd_device *obddev, int failover);
+#endif
+
+/* mds/mds_lov.c */
+
+/* mdc/mdc_locks.c */
+int it_disposition(struct lookup_intent *it, int flag);
+void it_set_disposition(struct lookup_intent *it, int flag);
+int it_open_error(int phase, struct lookup_intent *it);
+int mdc_set_lock_data(struct obd_export *exp, __u64 *lockh, void *data);
+int mdc_change_cbdata(struct obd_export *exp, struct ll_fid *fid,
+ ldlm_iterator_t it, void *data);
+int mdc_intent_lock(struct obd_export *exp, struct ll_uctxt *,
+ struct ll_fid *parent,
+ const char *name, int len, void *lmm, int lmmsize,
+ struct ll_fid *child,
+ struct lookup_intent *, int,
+ struct ptlrpc_request **reqp,
+ ldlm_blocking_callback cb_blocking);
+int mdc_enqueue(struct obd_export *exp,
+ int lock_type,
+ struct lookup_intent *it,
+ int lock_mode,
+ struct mdc_op_data *data,
+ struct lustre_handle *lockh,
+ void *lmm,
+ int lmmlen,
+ ldlm_completion_callback cb_completion,
+ ldlm_blocking_callback cb_blocking,
+ void *cb_data);
+
+/* mdc/mdc_request.c */
+int mdc_req2lustre_md(struct obd_export *exp_mdc, struct ptlrpc_request *req,
+ unsigned int offset, struct obd_export *exp_osc,
+ struct lustre_md *md);
+int mdc_getstatus(struct obd_export *exp, struct ll_fid *rootfid);
+int mdc_getattr(struct obd_export *exp, struct ll_fid *fid,
+ unsigned long valid, unsigned int ea_size,
+ struct ptlrpc_request **request);
+int mdc_getattr_name(struct obd_export *exp, struct ll_fid *fid,
+ char *filename, int namelen, unsigned long valid,
+ unsigned int ea_size, struct ptlrpc_request **request);
+int mdc_setattr(struct obd_export *exp, struct mdc_op_data *data,
+ struct iattr *iattr, void *ea, int ealen, void *ea2, int ea2len,
+ struct ptlrpc_request **request);
+int mdc_open(struct obd_export *exp, obd_id ino, int type, int flags,
+ struct lov_mds_md *lmm, int lmm_size, struct lustre_handle *fh,
+ struct ptlrpc_request **);
+struct obd_client_handle;
+int mdc_set_open_replay_data(struct obd_export *exp,
+ struct obd_client_handle *och,
+ struct ptlrpc_request *open_req);
+int mdc_clear_open_replay_data(struct obd_export *exp,
+ struct obd_client_handle *och);
+int mdc_close(struct obd_export *, struct obdo *, struct obd_client_handle *,
+ struct ptlrpc_request **);
+int mdc_readpage(struct obd_export *exp, struct ll_fid *mdc_fid,
+ __u64, struct page *, struct ptlrpc_request **);
+int mdc_create(struct obd_export *exp, struct mdc_op_data *op_data,
+ const void *data, int datalen, int mode, __u32 uid, __u32 gid,
+ __u64 rdev, struct ptlrpc_request **request);
+int mdc_unlink(struct obd_export *exp, struct mdc_op_data *data,
+ struct ptlrpc_request **request);
+int mdc_link(struct obd_export *exp, struct mdc_op_data *data,
+ struct ptlrpc_request **);
+int mdc_rename(struct obd_export *exp, struct mdc_op_data *data,
+ const char *old, int oldlen, const char *new, int newlen,
+ struct ptlrpc_request **request);
+int mdc_sync(struct obd_export *exp, struct ll_fid *fid,
+ struct ptlrpc_request **);
+int mdc_create_client(struct obd_uuid uuid, struct ptlrpc_client *cl);
+
+/* Store the generation of a newly-created inode in |req| for replay. */
+int mdc_store_inode_generation(struct obd_export *exp, struct ptlrpc_request *req,
+ int reqoff, int repoff);
+int mdc_llog_process(struct obd_export *, char *logname, llog_cb_t, void *data);
+int mdc_done_writing(struct obd_export *exp, struct obdo *);
+int mdc_reint(struct ptlrpc_request *request, struct mdc_rpc_lock *rpc_lock,
+ int level);
+/* Populate *fid with the given inode number, generation and type.
+ * Only the id, generation and f_type members are written. */
+static inline void
+mdc_pack_fid(struct ll_fid *fid, obd_id ino, __u32 gen, int type)
+{
+        fid->f_type = type;
+        fid->generation = gen;
+        fid->id = ino;
+}
/* ioctls for trying requests */
#define IOC_REQUEST_TYPE 'f'
#define IOC_REQUEST_MIN_NR 30
-#define IOC_REQUEST_GETATTR _IOWR('f', 30, long)
-#define IOC_REQUEST_READPAGE _IOWR('f', 31, long)
-#define IOC_REQUEST_SETATTR _IOWR('f', 32, long)
-#define IOC_REQUEST_CREATE _IOWR('f', 33, long)
-#define IOC_REQUEST_MAX_NR 33
+#define IOC_REQUEST_GETATTR _IOWR('f', 30, long) /* 'f' is the same value as IOC_REQUEST_TYPE */
+#define IOC_REQUEST_READPAGE _IOWR('f', 31, long)
+#define IOC_REQUEST_SETATTR _IOWR('f', 32, long)
+#define IOC_REQUEST_CREATE _IOWR('f', 33, long)
+#define IOC_REQUEST_OPEN _IOWR('f', 34, long)
+#define IOC_REQUEST_CLOSE _IOWR('f', 35, long)
+#define IOC_REQUEST_MAX_NR 35 /* highest request number in use (IOC_REQUEST_CLOSE) */
+
+#define MDS_CHECK_RESENT(req, reconstruct) \
+{ \
+ if (lustre_msg_get_flags(req->rq_reqmsg) & MSG_RESENT) { \
+ struct mds_client_data *mcd = \
+ req->rq_export->exp_mds_data.med_mcd; \
+ if (mcd->mcd_last_xid == req->rq_xid) { \
+ reconstruct; \
+ RETURN(0); \
+ } \
+ DEBUG_REQ(D_HA, req, "no reply for RESENT req (have "LPD64")", \
+ mcd->mcd_last_xid); \
+ } \
+}
#endif