#include <obd_class.h>
#include <lustre_disk.h>
#include <dt_object.h>
+#include <lquota.h>
#include "osd_oi.h"
#include "osd_iam.h"
+#include "osd_scrub.h"
+#include "osd_quota_fmt.h"
struct inode;
#define OSD_COUNTERS (0)
+/* Lustre special inode::i_state to indicate OI scrub skip this inode. */
+#define I_LUSTRE_NOSCRUB (1 << 31)
+
/** Enable thandle usage statistics */
#define OSD_THANDLE_STATS (0)
-#ifdef HAVE_QUOTA_SUPPORT
-struct osd_ctxt {
- __u32 oc_uid;
- __u32 oc_gid;
- cfs_kernel_cap_t oc_cap;
-};
-#endif
-
struct osd_directory {
struct iam_container od_container;
struct iam_descr od_descr;
#endif /* HAVE_LDISKFS_PDO */
+#define OSD_OTABLE_IT_CACHE_SIZE 128
+#define OSD_OTABLE_IT_CACHE_MASK (~(OSD_OTABLE_IT_CACHE_SIZE - 1))
+
+struct osd_inconsistent_item {
+ /* link into osd_scrub::os_inconsistent_items,
+ * protected by osd_scrub::os_lock. */
+ cfs_list_t oii_list;
+
+ /* The right FID <=> ino#/gen mapping. */
+ struct osd_idmap_cache oii_cache;
+
+ unsigned int oii_insert:1; /* insert or update mapping. */
+};
+
+struct osd_otable_cache {
+ struct osd_idmap_cache ooc_cache[OSD_OTABLE_IT_CACHE_SIZE];
+
+ /* Index for next cache slot to be filled. */
+ int ooc_producer_idx;
+
+ /* Index for next cache slot to be returned by it::next(). */
+ int ooc_consumer_idx;
+
+ /* How many items in ooc_cache. */
+ int ooc_cached_items;
+
+ /* Position for up layer LFSCK iteration pre-loading. */
+ __u32 ooc_pos_preload;
+};
+
+struct osd_otable_it {
+ struct osd_device *ooi_dev;
+ struct osd_otable_cache ooi_cache;
+
+ /* For osd_otable_it_key. */
+ __u8 ooi_key[16];
+
+ /* The following bits can be updated/checked w/o lock protection.
+ * If more bits will be introduced in the future and need lock to
+ * protect, please add comment. */
+ unsigned long ooi_used_outside:1, /* Some user out of OSD
+ * uses the iteration. */
+ ooi_all_cached:1, /* No more entries can be
+ * filled into cache. */
+ ooi_user_ready:1, /* The user out of OSD is
+ * ready to iterate. */
+ ooi_waiting:1; /* it::next is waiting. */
+};
+
extern const int osd_dto_credits_noquota[];
/*
/* super-class */
struct dt_device od_dt_dev;
/* information about underlying file system */
- struct lustre_mount_info *od_mount;
struct vfsmount *od_mnt;
/* object index */
struct osd_oi **od_oi_table;
/*
* Fid Capability
*/
- unsigned int od_fl_capa:1;
+ unsigned int od_fl_capa:1,
+ od_is_md:1; /* set in ->ldo_prepare */
unsigned long od_capa_timeout;
__u32 od_capa_alg;
struct lustre_capa_key *od_capa_keys;
struct obd_statfs od_statfs;
cfs_spinlock_t od_osfs_lock;
- /**
- * The following flag indicates, if it is interop mode or not.
- * It will be initialized, using mount param.
- */
- __u32 od_iop_mode;
+ unsigned int od_iop_mode:1,
+ od_noscrub:1;
struct fsfilt_operations *od_fsops;
+ int od_connects;
+ struct lu_site od_site;
/*
* mapping for legacy OST objids
struct brw_stats od_brw_stats;
cfs_atomic_t od_r_in_flight;
cfs_atomic_t od_w_in_flight;
+
+ cfs_mutex_t od_otable_mutex;
+ struct osd_otable_it *od_otable_it;
+ struct osd_scrub od_scrub;
+
+ /* service name associated with the osd device */
+ char od_svname[MAX_OBD_NAME];
+
+ /* quota slave instance */
+ struct qsd_instance *od_quota_slave;
};
#define OSD_TRACK_DECLARES
unsigned short ot_id_cnt;
unsigned short ot_id_type;
uid_t ot_id_array[OSD_MAX_UGID_CNT];
+ struct lquota_trans *ot_quota_trans;
#ifdef OSD_TRACK_DECLARES
unsigned char ot_declare_attr_set;
struct iam_iterator oi_it;
};
+struct osd_quota_leaf {
+ cfs_list_t oql_link;
+ uint oql_blk;
+};
+
+/**
+ * Iterator's in-memory data structure for quota file.
+ */
+struct osd_it_quota {
+ struct osd_object *oiq_obj;
+ /** tree blocks path to where the entry is stored */
+ uint oiq_blk[LUSTRE_DQTREEDEPTH + 1];
+ /** on-disk offset for current key where quota record can be found */
+ loff_t oiq_offset;
+ /** identifier for current quota record */
+ __u64 oiq_id;
+ /** the record index in the leaf/index block */
+ uint oiq_index[LUSTRE_DQTREEDEPTH + 1];
+ /** list of already processed leaf blocks */
+ cfs_list_t oiq_list;
+};
+
#define MAX_BLOCKS_PER_PAGE (CFS_PAGE_SIZE / 512)
struct osd_iobuf {
/** osd iterator context used for iterator session */
- union {
- struct osd_it_iam oti_it;
- /** ldiskfs iterator data structure, see osd_it_ea_{init, fini} */
- struct osd_it_ea oti_it_ea;
- };
+ union {
+ struct osd_it_iam oti_it;
+ /* ldiskfs iterator data structure,
+ * see osd_it_ea_{init, fini} */
+ struct osd_it_ea oti_it_ea;
+ struct osd_it_quota oti_it_quota;
+ };
/** pre-allocated buffer used by oti_it_ea, size OSD_IT_EA_BUFSIZE */
void *oti_it_ea_buf;
long long oti_alignment_lieutenant_colonel;
};
+ struct osd_idmap_cache oti_cache;
int oti_r_locks;
int oti_w_locks;
struct osd_iobuf oti_iobuf;
struct inode oti_inode;
int oti_created[PTLRPC_MAX_BRW_PAGES];
-#ifdef HAVE_QUOTA_SUPPORT
- struct osd_ctxt oti_ctxt;
-#endif
struct lu_env oti_obj_delete_tx_env;
#define OSD_FID_REC_SZ 32
char oti_ldp[OSD_FID_REC_SZ];
char oti_ldp2[OSD_FID_REC_SZ];
+
+ /* used by quota code */
+ union {
+ struct if_dqblk oti_dqblk;
+ struct if_dqinfo oti_dqinfo;
+ };
+ struct lquota_id_info oti_qi;
+ struct lquota_trans oti_quota_trans;
+ union lquota_rec oti_quota_rec;
+ __u64 oti_quota_id;
};
extern int ldiskfs_pdo;
struct obd_statfs *sfs);
int osd_object_auth(const struct lu_env *env, struct dt_object *dt,
struct lustre_capa *capa, __u64 opc);
-void osd_declare_qid(struct dt_object *dt, struct osd_thandle *oh,
- int type, uid_t id, struct inode *inode);
struct inode *osd_iget(struct osd_thread_info *info, struct osd_device *dev,
struct osd_inode_id *id);
struct inode *osd_iget_fid(struct osd_thread_info *info, struct osd_device *dev,
const struct lu_fid *fid,
const struct osd_inode_id *id, struct thandle *th);
+void osd_scrub_file_reset(struct osd_scrub *scrub, __u8 *uuid, __u64 flags);
+int osd_scrub_file_store(struct osd_scrub *scrub);
+int osd_scrub_start(struct osd_device *dev);
+int osd_scrub_setup(const struct lu_env *env, struct osd_device *dev);
+void osd_scrub_cleanup(const struct lu_env *env, struct osd_device *dev);
+int osd_oii_insert(struct osd_device *dev, struct osd_idmap_cache *oic,
+ int insert);
+int osd_oii_lookup(struct osd_device *dev, const struct lu_fid *fid,
+ struct osd_inode_id *id);
+int osd_scrub_dump(struct osd_device *dev, char *buf, int len);
+
+/* osd_quota_fmt.c */
+int walk_tree_dqentry(const struct lu_env *env, struct osd_object *obj,
+ int type, uint blk, int depth, uint index,
+ struct osd_it_quota *it);
+int walk_block_dqentry(const struct lu_env *env, struct osd_object *obj,
+ int type, uint blk, uint index,
+ struct osd_it_quota *it);
+loff_t find_tree_dqentry(const struct lu_env *env,
+ struct osd_object *obj, int type,
+ qid_t dqid, uint blk, int depth,
+ struct osd_it_quota *it);
+/* osd_quota.c */
+int osd_declare_qid(const struct lu_env *env, struct osd_thandle *oh,
+ struct lquota_id_info *qi, bool allocated, int *flags);
+int osd_declare_inode_qid(const struct lu_env *env, qid_t uid, qid_t gid,
+ long long space, struct osd_thandle *oh,
+ bool is_blk, bool allocated, int *flags, bool force);
+const struct dt_rec *osd_quota_pack(struct osd_object *obj,
+ const struct dt_rec *rec,
+ union lquota_rec *quota_rec);
+void osd_quota_unpack(struct osd_object *obj, const struct dt_rec *rec);
+int osd_quota_migration(const struct lu_env *env, struct dt_object *dt,
+ const struct dt_index_features *feat);
+
+static inline bool is_quota_glb_feat(const struct dt_index_features *feat)
+{
+ return (feat == &dt_quota_iusr_features ||
+ feat == &dt_quota_busr_features ||
+ feat == &dt_quota_igrp_features ||
+ feat == &dt_quota_bgrp_features) ? true : false;
+}
+
/*
* Invariants, assertions.
*/
#define osd_invariant(obj) (1)
#endif
+#define OSD_MAX_CACHE_SIZE OBD_OBJECT_EOF
+
extern const struct dt_index_operations osd_otable_ops;
static inline int osd_oi_fid2idx(struct osd_device *dev,
static inline struct osd_oi *osd_fid2oi(struct osd_device *osd,
const struct lu_fid *fid)
{
- LASSERT(!fid_is_idif(fid));
- LASSERT(!fid_is_igif(fid));
- LASSERT(osd->od_oi_table != NULL && osd->od_oi_count >= 1);
- /* It can work even od_oi_count equals to 1 although it's unexpected,
- * the only reason we set it to 1 is for performance measurement */
+ LASSERTF(!fid_is_idif(fid), DFID"\n", PFID(fid));
+ LASSERTF(!fid_is_igif(fid), DFID"\n", PFID(fid));
+ LASSERT(osd->od_oi_table != NULL && osd->od_oi_count >= 1);
+ /* It can work even od_oi_count equals to 1 although it's unexpected,
+ * the only reason we set it to 1 is for performance measurement */
return osd->od_oi_table[osd_oi_fid2idx(osd, fid)];
}
static inline struct super_block *osd_sb(const struct osd_device *dev)
{
- return dev->od_mount->lmi_mnt->mnt_sb;
+ return dev->od_mnt->mnt_sb;
}
static inline int osd_object_is_root(const struct osd_object *obj)
int osd_ldiskfs_read(struct inode *inode, void *buf, int size, loff_t *offs);
int osd_ldiskfs_write_record(struct inode *inode, void *buf, int bufsize,
- loff_t *offs, handle_t *handle);
+ int write_NUL, loff_t *offs, handle_t *handle);
static inline
struct dentry *osd_child_dentry_by_inode(const struct lu_env *env,
return result;
}
+/**
+ * Quota/Accounting handling
+ */
+extern const struct dt_index_operations osd_acct_index_ops;
+int osd_acct_obj_lookup(struct osd_thread_info *info, struct osd_device *osd,
+ const struct lu_fid *fid, struct osd_inode_id *id);
+
+/* copy from fs/ext4/dir.c */
+static inline int is_32bit_api(void)
+{
+#ifdef CONFIG_COMPAT
+ return is_compat_task();
+#else
+ return (BITS_PER_LONG == 32);
+#endif
+}
+
+static inline loff_t ldiskfs_get_htree_eof(struct file *filp)
+{
+ if ((filp->f_mode & FMODE_32BITHASH) ||
+ (!(filp->f_mode & FMODE_64BITHASH) && is_32bit_api()))
+ return LDISKFS_HTREE_EOF_32BIT;
+ else
+ return LDISKFS_HTREE_EOF_64BIT;
+}
+
#endif /* __KERNEL__ */
#endif /* _OSD_INTERNAL_H */