Whamcloud - gitweb
LU-5560 llite: basic support of SELinux in CLIO
[fs/lustre-release.git] / lustre / lfsck / lfsck_internal.h
index 5a801cf..4abe593 100644 (file)
@@ -20,7 +20,7 @@
  * GPL HEADER END
  */
 /*
- * Copyright (c) 2013, Intel Corporation.
+ * Copyright (c) 2013, 2014, Intel Corporation.
  */
 /*
  * lustre/lfsck/lfsck_internal.h
@@ -47,7 +47,7 @@
 #include <md_object.h>
 #include <lustre_linkea.h>
 
-#define HALF_SEC                       (HZ >> 1)
+#define HALF_SEC                       msecs_to_jiffies(MSEC_PER_SEC >> 1)
 #define LFSCK_CHECKPOINT_INTERVAL      60
 
 enum lfsck_flags {
@@ -108,6 +108,26 @@ struct lfsck_bookmark {
        __u64   lb_reserved[2];
 };
 
+enum lfsck_namespace_trace_flags {
+       LNTF_CHECK_LINKEA       = 0x01,
+       LNTF_CHECK_PARENT       = 0x02,
+       LNTF_SKIP_NLINK         = 0x04,
+       LNTF_CHECK_ORPHAN       = 0x08,
+       LNTF_UNCERTAIN_LMV      = 0x10,
+       LNTF_RECHECK_NAME_HASH  = 0x20,
+       LNTF_ALL                = 0xff
+};
+
+enum lfsck_namespace_inconsistency_type {
+       LNIT_NONE               = 0,
+       LNIT_BAD_LINKEA         = 1,
+       LNIT_UNMATCHED_PAIRS    = 2,
+       LNIT_DANGLING           = 3,
+       LNIT_MUL_REF            = 4,
+       LNIT_BAD_TYPE           = 5,
+       LNIT_BAD_DIRENT         = 6,
+};
+
 struct lfsck_namespace {
        /* Magic number to detect that this struct contains valid data. */
        __u32   ln_magic;
@@ -157,9 +177,6 @@ struct lfsck_namespace {
        /* How many directories have been traversed. */
        __u64   ln_dirs_checked;
 
-       /* How many multiple-linked objects have been checked. */
-       __u64   ln_mlinked_checked;
-
        /* How many objects have been double scanned. */
        __u64   ln_objs_checked_phase2;
 
@@ -172,9 +189,6 @@ struct lfsck_namespace {
        /* How many objects with nlink fixed. */
        __u64   ln_objs_nlink_repaired;
 
-       /* How many objects were lost before, but found back now. */
-       __u64   ln_objs_lost_found;
-
        /* The latest object has been processed (failed) during double scan. */
        struct lu_fid   ln_fid_latest_scanned_phase2;
 
@@ -183,6 +197,86 @@ struct lfsck_namespace {
 
        /* How many linkEA entries have been repaired. */
        __u64   ln_linkea_repaired;
+
+       /* How many multiple-linked objects have been checked. */
+       __u64   ln_mul_linked_checked;
+
+       /* How many multiple-linked objects have been repaired. */
+       __u64   ln_mul_linked_repaired;
+
+       /* How many undefined inconsistencies have been found in phase2. */
+       __u64   ln_unknown_inconsistency;
+
+       /* How many unmatched pairs have been repaired. */
+       __u64   ln_unmatched_pairs_repaired;
+
+       /* How many dangling name entries have been found/repaired. */
+       __u64   ln_dangling_repaired;
+
+       /* How many multiple referenced name entries have been
+        * found/repaired. */
+       __u64   ln_mul_ref_repaired;
+
+       /* How many name entries with bad file type have been repaired. */
+       __u64   ln_bad_type_repaired;
+
+       /* How many lost name entries have been re-inserted. */
+       __u64   ln_lost_dirent_repaired;
+
+       /* How many objects under /lost+found have been scanned. */
+       __u64   ln_local_lpf_scanned;
+
+       /* How many objects under /lost+found have been moved to
+        * namespace visible directory. */
+       __u64   ln_local_lpf_moved;
+
+       /* How many objects under /lost+found have been skipped. */
+       __u64   ln_local_lpf_skipped;
+
+       /* How many objects under /lost+found failed to be processed. */
+       __u64   ln_local_lpf_failed;
+
+       /* How many striped directories (master) have been scanned. */
+       __u64   ln_striped_dirs_scanned;
+
+       /* How many striped directories (master) have been repaired. */
+       __u64   ln_striped_dirs_repaired;
+
+       /* How many striped directories (master) failed verification. */
+       __u64   ln_striped_dirs_failed;
+
+       /* How many striped directories (master) have been disabled. */
+       __u64   ln_striped_dirs_disabled;
+
+       /* How many striped directories (master) have been skipped
+        * (for shards verification) because of lost master LMV EA. */
+       __u64   ln_striped_dirs_skipped;
+
+       /* How many striped directory's shards (slave) have been scanned. */
+       __u64   ln_striped_shards_scanned;
+
+       /* How many striped directory's shards (slave) have been repaired. */
+       __u64   ln_striped_shards_repaired;
+
+       /* How many striped directory's shards (slave) failed verification. */
+       __u64   ln_striped_shards_failed;
+
+       /* How many striped directory's shards (slave) have been skipped
+        * (for name hash verification) because it is unknown whether the
+        * slave LMV EA is valid or not. */
+       __u64   ln_striped_shards_skipped;
+
+       /* How many name entries under striped directory with bad name
+        * hash have been repaired. */
+       __u64   ln_name_hash_repaired;
+
+       /* The size of MDT targets bitmap with nbits. Such bitmap records
+        * the MDTs that contain non-verified MDT-objects. */
+       __u32   ln_bitmap_size;
+
+       __u32   ln_reserved_1;
+       /* Reserved for future use. 256-byte aligned now. */
+       __u64   ln_reserved[15];
 };
 
 enum lfsck_layout_inconsistency_type {
@@ -254,8 +348,25 @@ struct lfsck_layout {
         * MDT(s)/OST(s) do not participate in the LFSCK */
        __u64   ll_objs_skipped;
 
+       /* The size of ll_ost_bitmap with nbits. */
+       __u32   ll_bitmap_size;
+
        /* For further using. 256-bytes aligned now. */
-       __u64   ll_reserved[12];
+       __u32   ll_reserved_1;
+       __u64   ll_reserved_2[11];
+
+       /* The OST targets bitmap to record the OSTs that contain
+        * non-verified OST-objects. */
+       __u8    ll_ost_bitmap[0];
+};
+
+struct lfsck_assistant_object {
+       struct lu_fid           lso_fid;
+       __u64                   lso_oit_cookie;
+       struct lu_attr          lso_attr;
+       atomic_t                lso_ref;
+       unsigned int            lso_dead:1,
+                               lso_is_dir:1;
 };
 
 struct lfsck_component;
@@ -271,6 +382,12 @@ struct lfsck_operations {
                           struct lfsck_component *com,
                           bool new_checked);
 
+       void (*lfsck_close_dir)(const struct lu_env *env,
+                               struct lfsck_component *com);
+
+       int (*lfsck_open_dir)(const struct lu_env *env,
+                             struct lfsck_component *com);
+
        int (*lfsck_checkpoint)(const struct lu_env *env,
                                struct lfsck_component *com,
                                bool init);
@@ -285,6 +402,7 @@ struct lfsck_operations {
 
        int (*lfsck_exec_dir)(const struct lu_env *env,
                              struct lfsck_component *com,
+                             struct lfsck_assistant_object *lso,
                              struct lu_dirent *ent,
                              __u16 type);
 
@@ -308,7 +426,8 @@ struct lfsck_operations {
 
        int (*lfsck_in_notify)(const struct lu_env *env,
                               struct lfsck_component *com,
-                              struct lfsck_request *lr);
+                              struct lfsck_request *lr,
+                              struct thandle *th);
 
        int (*lfsck_query)(const struct lu_env *env,
                           struct lfsck_component *com);
@@ -336,7 +455,8 @@ struct lfsck_tgt_desc {
        __u32              ltd_namespace_gen;
        unsigned int       ltd_dead:1,
                           ltd_layout_done:1,
-                          ltd_namespace_done:1;
+                          ltd_namespace_done:1,
+                          ltd_synced_failures:1;
 };
 
 struct lfsck_tgt_desc_idx {
@@ -363,12 +483,39 @@ struct lfsck_tgt_descs {
        __u32                            ltd_tgtnr;
 };
 
-#define LTD_TGT(ltd, index)    \
-       ((ltd)->ltd_tgts_idx[(index) / TGT_PTRS_PER_BLOCK]->\
-        ldi_tgts[(index) % TGT_PTRS_PER_BLOCK])
+static inline struct lfsck_tgt_desc *
+lfsck_ltd2tgt(struct lfsck_tgt_descs *ltd, __u32 index)
+{
+       __u32 idx1 = index / TGT_PTRS_PER_BLOCK;
+       __u32 idx2 = index % TGT_PTRS_PER_BLOCK;
+       struct lfsck_tgt_desc *__tgt = NULL;
 
-#define OST_TGT(lfsck, index)   LTD_TGT(&lfsck->li_ost_descs, index)
-#define MDT_TGT(lfsck, index)   LTD_TGT(&lfsck->li_mdt_descs, index)
+       if (unlikely(idx1 >= TGT_PTRS))
+               CDEBUG(D_LFSCK, "The target idx %u is invalid.\n", index);
+       else if (likely(ltd->ltd_tgts_idx[idx1] != NULL))
+               __tgt = ltd->ltd_tgts_idx[idx1]->ldi_tgts[idx2];
+
+       return __tgt;
+}
+
+static inline void lfsck_assign_tgt(struct lfsck_tgt_descs *ltd,
+                                   struct lfsck_tgt_desc *tgt, __u32 index)
+{
+       __u32 idx1 = index / TGT_PTRS_PER_BLOCK;
+       __u32 idx2 = index % TGT_PTRS_PER_BLOCK;
+
+       if (likely(idx1 < TGT_PTRS && ltd->ltd_tgts_idx[idx1] != NULL))
+               ltd->ltd_tgts_idx[idx1]->ldi_tgts[idx2] = tgt;
+}
+
+#define LFSCK_STF_BITS 4
+/* To adjust LFSCK_STF_COUNT, change LFSCK_STF_BITS instead. */
+#define LFSCK_STF_COUNT        (1 << LFSCK_STF_BITS)
+
+struct lfsck_sub_trace_obj {
+       struct dt_object        *lsto_obj;
+       struct mutex             lsto_mutex;
+};
 
 struct lfsck_component {
        /* into lfsck_instance::li_list_(scan,double_scan,idle} */
@@ -383,6 +530,7 @@ struct lfsck_component {
        struct lfsck_position    lc_pos_start;
        struct lfsck_instance   *lc_lfsck;
        struct dt_object        *lc_obj;
+       struct lfsck_sub_trace_obj lc_sub_trace_objs[LFSCK_STF_COUNT];
        struct lfsck_operations *lc_ops;
        void                    *lc_file_ram;
        void                    *lc_file_disk;
@@ -403,10 +551,78 @@ struct lfsck_component {
        /* How many objects have been scanned since last sleep. */
        __u32                    lc_new_scanned;
 
-       unsigned int             lc_journal:1;
        __u16                    lc_type;
 };
 
+#define LFSCK_LMV_MAX_STRIPES  LMV_MAX_STRIPE_COUNT
+#define LFSCK_LMV_DEF_STRIPES  4
+
+/* Warning: do NOT change the order of the lfsck_slave_lmv_flags members,
+ *         otherwise lfsck_record_lmv() may be wrong. */
+enum lfsck_slave_lmv_flags {
+       LSLF_NONE       = 0,
+       LSLF_BAD_INDEX2 = 1,
+       LSLF_NO_LMVEA   = 2,
+       LSLF_DANGLING   = 3,
+       LSLF_BAD_INDEX1 = 4,
+};
+
+/* When the namespace LFSCK scans a striped directory, it will record all
+ * the known shards' information in the structure "lfsck_slave_lmv_rec",
+ * including the shard's FID, index, slave LMV EA, and so on. Each shard
+ * will take one lfsck_slave_lmv_rec slot. After the 1st cycle scanning
+ * the striped directory, the LFSCK will get all the information about
+ * whether there are any inconsistencies, and then it can repair them in
+ * the 2nd cycle scanning. */
+struct lfsck_slave_lmv_rec {
+       struct lu_fid   lslr_fid;
+       __u32           lslr_stripe_count;
+       __u32           lslr_index; /* the index in name or in slave lmv */
+       __u32           lslr_hash_type;
+       __u32           lslr_flags;
+};
+
+struct lfsck_lmv {
+       struct lmv_mds_md_v1             ll_lmv;
+       atomic_t                         ll_ref;
+       int                              ll_stripes_allocated;
+       int                              ll_stripes_filled;
+       int                              ll_exit_value;
+       __u32                            ll_max_stripe_count;
+       __u32                            ll_max_filled_off;
+       __u32                            ll_hash_type;
+       unsigned int                     ll_lmv_master:1,
+                                        ll_lmv_slave:1,
+                                        ll_lmv_verified:1,
+                                        ll_lmv_updated:1,
+                                        ll_inline:1,
+                                        ll_failed:1,
+                                        ll_ignore:1;
+       struct lfsck_slave_lmv_rec      *ll_lslr;
+};
+
+/* If the namespace LFSCK finds that the master MDT-object of a striped
+ * directory lost its master LMV EA, it will re-generate the master LMV
+ * EA and notify the LFSCK instance on the MDT on which the striped dir
+ * master MDT-object resides to rescan the striped directory. To do that,
+ * the notify handler will insert a "lfsck_lmv_unit" structure into the
+ * lfsck_instance::li_list_lmv. The LFSCK instance scans that list from time
+ * to time to check whether it needs to rescan some striped directories. */
+struct lfsck_lmv_unit {
+       struct list_head         llu_link;
+       struct lfsck_lmv         llu_lmv;
+       struct dt_object        *llu_obj;
+       struct lfsck_instance   *llu_lfsck;
+};
+
+struct lfsck_rec_lmv_save {
+       struct lu_fid           lrls_fid;
+       struct lmv_mds_md_v1    lrls_lmv;
+};
+
+/* Allow lfsck_record_lmv() to be called recursively at most three times. */
+#define LFSCK_REC_LMV_MAX_DEPTH 3
+
 struct lfsck_instance {
        struct mutex              li_mutex;
        spinlock_t                li_lock;
@@ -428,6 +644,9 @@ struct lfsck_instance {
        /* For the components those are not scanning now. */
        struct list_head          li_list_idle;
 
+       /* For the lfsck_lmv_unit to be handled. */
+       struct list_head          li_list_lmv;
+
        atomic_t                  li_ref;
        atomic_t                  li_double_scan_count;
        struct ptlrpc_thread      li_thread;
@@ -447,14 +666,18 @@ struct lfsck_instance {
        struct local_oid_storage *li_los;
        struct lu_fid             li_local_root_fid;  /* backend root "/" */
        struct lu_fid             li_global_root_fid; /* /ROOT */
+       struct dt_object         *li_lfsck_dir;
        struct dt_object         *li_bookmark_obj;
        struct dt_object         *li_lpf_obj;
+       struct dt_object         *li_lpf_root_obj;
        struct lu_client_seq     *li_seq;
        struct lfsck_bookmark     li_bookmark_ram;
        struct lfsck_bookmark     li_bookmark_disk;
        struct lfsck_position     li_pos_current;
        struct lfsck_position     li_pos_checkpoint;
 
+       struct lfsck_lmv         *li_lmv;
+
        /* Obj for otable-based iteration */
        struct dt_object         *li_obj_oit;
 
@@ -502,14 +725,7 @@ struct lfsck_instance {
                                  li_master:1, /* Master instance or not. */
                                  li_current_oit_processed:1,
                                  li_start_unplug:1;
-};
-
-enum lfsck_linkea_flags {
-       /* The linkea entries does not match the object nlinks. */
-       LLF_UNMATCH_NLINKS      = 0x01,
-
-       /* Fail to repair the multiple-linked objects during the double scan. */
-       LLF_REPAIR_FAILED       = 0x02,
+       struct lfsck_rec_lmv_save li_rec_lmv_save[LFSCK_REC_LMV_MAX_DEPTH];
 };
 
 struct lfsck_async_interpret_args {
@@ -517,6 +733,7 @@ struct lfsck_async_interpret_args {
        struct lfsck_tgt_descs          *laia_ltds;
        struct lfsck_tgt_desc           *laia_ltd;
        struct lfsck_request            *laia_lr;
+       atomic_t                        *laia_count;
        int                              laia_result;
        unsigned int                     laia_shared:1;
 };
@@ -529,7 +746,27 @@ struct lfsck_thread_args {
 };
 
 struct lfsck_assistant_req {
-       struct list_head        lar_list;
+       struct list_head                 lar_list;
+       struct lfsck_assistant_object   *lar_parent;
+};
+
+struct lfsck_namespace_req {
+       struct lfsck_assistant_req       lnr_lar;
+       struct lfsck_lmv                *lnr_lmv;
+       struct lu_fid                    lnr_fid;
+       __u64                            lnr_dir_cookie;
+       __u32                            lnr_attr;
+       __u32                            lnr_size;
+       __u16                            lnr_type;
+       __u16                            lnr_namelen;
+       char                             lnr_name[0];
+};
+
+struct lfsck_layout_req {
+       struct lfsck_assistant_req       llr_lar;
+       struct dt_object                *llr_child;
+       __u32                            llr_ost_idx;
+       __u32                            llr_lov_idx; /* offset in LOV EA */
 };
 
 struct lfsck_assistant_operations {
@@ -550,6 +787,10 @@ struct lfsck_assistant_operations {
 
        void (*la_req_fini)(const struct lu_env *env,
                            struct lfsck_assistant_req *lar);
+
+       void (*la_sync_failures)(const struct lu_env *env,
+                                struct lfsck_component *com,
+                                struct lfsck_request *lr);
 };
 
 struct lfsck_assistant_data {
@@ -579,6 +820,8 @@ struct lfsck_assistant_data {
 
        struct lfsck_assistant_operations       *lad_ops;
 
+       cfs_bitmap_t                            *lad_bitmap;
+
        __u32                                    lad_touch_gen;
        int                                      lad_prefetched;
        int                                      lad_assistant_status;
@@ -586,22 +829,33 @@ struct lfsck_assistant_data {
        unsigned int                             lad_to_post:1,
                                                 lad_to_double_scan:1,
                                                 lad_in_double_scan:1,
-                                                lad_exit:1;
+                                                lad_exit:1,
+                                                lad_incomplete:1;
+       bool                                     lad_advance_lock;
 };
 
 #define LFSCK_TMPBUF_LEN       64
 
+struct lfsck_lock_handle {
+       struct lustre_handle    llh_pdo_lh;
+       struct lustre_handle    llh_reg_lh;
+       ldlm_mode_t             llh_pdo_mode;
+       ldlm_mode_t             llh_reg_mode;
+};
+
 struct lfsck_thread_info {
+       struct lu_name          lti_name_const;
        struct lu_name          lti_name;
+       struct lu_name          lti_name2;
        struct lu_buf           lti_buf;
        struct lu_buf           lti_linkea_buf;
+       struct lu_buf           lti_linkea_buf2;
        struct lu_buf           lti_big_buf;
        struct lu_fid           lti_fid;
        struct lu_fid           lti_fid2;
        struct lu_fid           lti_fid3;
        struct lu_attr          lti_la;
        struct lu_attr          lti_la2;
-       struct lu_attr          lti_la3;
        struct ost_id           lti_oi;
        union {
                struct lustre_mdt_attrs lti_lma;
@@ -612,11 +866,14 @@ struct lfsck_thread_info {
        /* There will be '\0' at the end of the name. */
        char            lti_key[sizeof(struct lu_dirent) + NAME_MAX + 1];
        char                    lti_tmpbuf[LFSCK_TMPBUF_LEN];
+       char                    lti_tmpbuf2[LFSCK_TMPBUF_LEN];
        struct lfsck_request    lti_lr;
        struct lfsck_async_interpret_args lti_laia;
+       struct lfsck_async_interpret_args lti_laia2;
        struct lfsck_start      lti_start;
        struct lfsck_stop       lti_stop;
        ldlm_policy_data_t      lti_policy;
+       struct ldlm_enqueue_info lti_einfo;
        struct ldlm_res_id      lti_resid;
        union {
                struct filter_fid_old   lti_old_pfid;
@@ -627,6 +884,12 @@ struct lfsck_thread_info {
        struct lov_user_md      lti_lum;
        struct dt_insert_rec    lti_dt_rec;
        struct lu_object_conf   lti_conf;
+       struct lu_seq_range     lti_range;
+       struct lmv_mds_md_v1    lti_lmv;
+       struct lmv_mds_md_v1    lti_lmv2;
+       struct lmv_mds_md_v1    lti_lmv3;
+       struct lmv_mds_md_v1    lti_lmv4;
+       struct lfsck_lock_handle lti_llh;
 };
 
 /* lfsck_lib.c */
@@ -636,7 +899,13 @@ int lfsck_ibits_lock(const struct lu_env *env, struct lfsck_instance *lfsck,
                     struct dt_object *obj, struct lustre_handle *lh,
                     __u64 bits, ldlm_mode_t mode);
 void lfsck_ibits_unlock(struct lustre_handle *lh, ldlm_mode_t mode);
-int lfsck_create_lpf(const struct lu_env *env, struct lfsck_instance *lfsck);
+int lfsck_lock(const struct lu_env *env, struct lfsck_instance *lfsck,
+              struct dt_object *obj, const char *name,
+              struct lfsck_lock_handle *llh, __u64 bits, ldlm_mode_t mode);
+void lfsck_unlock(struct lfsck_lock_handle *llh);
+int lfsck_find_mdt_idx_by_fid(const struct lu_env *env,
+                             struct lfsck_instance *lfsck,
+                             const struct lu_fid *fid);
 int lfsck_verify_lpf(const struct lu_env *env, struct lfsck_instance *lfsck);
 struct lfsck_instance *lfsck_instance_find(struct dt_device *key, bool ref,
                                           bool unlink);
@@ -649,7 +918,7 @@ void lfsck_instance_cleanup(const struct lu_env *env,
                            struct lfsck_instance *lfsck);
 int lfsck_bits_dump(struct seq_file *m, int bits, const char *names[],
                    const char *prefix);
-int lfsck_time_dump(struct seq_file *m, __u64 time, const char *prefix);
+int lfsck_time_dump(struct seq_file *m, __u64 time, const char *name);
 int lfsck_pos_dump(struct seq_file *m, struct lfsck_position *pos,
                   const char *prefix);
 void lfsck_pos_fill(const struct lu_env *env, struct lfsck_instance *lfsck,
@@ -661,6 +930,14 @@ void lfsck_thread_args_fini(struct lfsck_thread_args *lta);
 struct lfsck_assistant_data *
 lfsck_assistant_data_init(struct lfsck_assistant_operations *lao,
                          const char *name);
+struct lfsck_assistant_object *
+lfsck_assistant_object_init(const struct lu_env *env, const struct lu_fid *fid,
+                           const struct lu_attr *attr, __u64 cookie,
+                           bool is_dir);
+struct dt_object *
+lfsck_assistant_object_load(const struct lu_env *env,
+                           struct lfsck_instance *lfsck,
+                           struct lfsck_assistant_object *lso);
 int lfsck_async_interpret_common(const struct lu_env *env,
                                 struct ptlrpc_request *req,
                                 void *args, int rc);
@@ -681,6 +958,11 @@ void lfsck_quit_generic(const struct lu_env *env,
                        struct lfsck_component *com);
 
 /* lfsck_engine.c */
+int lfsck_unpack_ent(struct lu_dirent *ent, __u64 *cookie, __u16 *type);
+void lfsck_close_dir(const struct lu_env *env,
+                    struct lfsck_instance *lfsck, int result);
+int lfsck_open_dir(const struct lu_env *env,
+                  struct lfsck_instance *lfsck, __u64 cookie);
 int lfsck_master_engine(void *args);
 int lfsck_assistant_engine(void *args);
 
@@ -695,30 +977,97 @@ int lfsck_set_param(const struct lu_env *env, struct lfsck_instance *lfsck,
                    struct lfsck_start *start, bool reset);
 
 /* lfsck_namespace.c */
-int lfsck_verify_linkea(const struct lu_env *env, struct dt_device *dev,
-                       struct dt_object *obj, const struct lu_name *cname,
-                       const struct lu_fid *pfid);
+int lfsck_namespace_trace_update(const struct lu_env *env,
+                                struct lfsck_component *com,
+                                const struct lu_fid *fid,
+                                const __u8 flags, bool add);
+int lfsck_namespace_check_exist(const struct lu_env *env,
+                               struct dt_object *dir,
+                               struct dt_object *obj, const char *name);
+int __lfsck_links_read(const struct lu_env *env, struct dt_object *obj,
+                      struct linkea_data *ldata);
+int lfsck_namespace_rebuild_linkea(const struct lu_env *env,
+                                  struct lfsck_component *com,
+                                  struct dt_object *obj,
+                                  struct linkea_data *ldata);
+int lfsck_namespace_repair_dangling(const struct lu_env *env,
+                                   struct lfsck_component *com,
+                                   struct dt_object *parent,
+                                   struct dt_object *child,
+                                   struct lfsck_namespace_req *lnr);
+int lfsck_namespace_repair_dirent(const struct lu_env *env,
+                                 struct lfsck_component *com,
+                                 struct dt_object *parent,
+                                 struct dt_object *child,
+                                 const char *name, const char *name2,
+                                 __u16 type, bool update, bool dec);
+int lfsck_verify_linkea(const struct lu_env *env, struct dt_object *obj,
+                       const struct lu_name *cname, const struct lu_fid *pfid);
 int lfsck_links_get_first(const struct lu_env *env, struct dt_object *obj,
                          char *name, struct lu_fid *pfid);
-int lfsck_remove_name_entry(const struct lu_env *env,
-                           struct lfsck_instance *lfsck,
-                           struct dt_object *parent,
-                           const char *name, __u32 type);
 int lfsck_update_name_entry(const struct lu_env *env,
                            struct lfsck_instance *lfsck,
-                           struct dt_object *parent, const char *name,
-                           const struct lu_fid *pfid, __u32 type);
+                           struct dt_object *dir, const char *name,
+                           const struct lu_fid *fid, __u32 type);
 int lfsck_namespace_setup(const struct lu_env *env,
                          struct lfsck_instance *lfsck);
 
+/* lfsck_striped_dir.c */
+void lfsck_lmv_put(const struct lu_env *env, struct lfsck_lmv *llmv);
+int lfsck_read_stripe_lmv(const struct lu_env *env, struct dt_object *obj,
+                         struct lmv_mds_md_v1 *lmv);
+int lfsck_shard_name_to_index(const struct lu_env *env, const char *name,
+                             int namelen, __u16 type,
+                             const struct lu_fid *fid);
+bool lfsck_is_valid_slave_name_entry(const struct lu_env *env,
+                                    struct lfsck_lmv *llmv,
+                                    const char *name, int namelen);
+int lfsck_namespace_check_name(const struct lu_env *env,
+                              struct dt_object *parent,
+                              struct dt_object *child,
+                              const struct lu_name *cname);
+int lfsck_namespace_update_lmv(const struct lu_env *env,
+                              struct lfsck_component *com,
+                              struct dt_object *obj,
+                              struct lmv_mds_md_v1 *lmv, bool locked);
+int lfsck_namespace_verify_stripe_slave(const struct lu_env *env,
+                                       struct lfsck_component *com,
+                                       struct dt_object *obj,
+                                       struct lfsck_lmv *llmv);
+int lfsck_namespace_scan_shard(const struct lu_env *env,
+                              struct lfsck_component *com,
+                              struct dt_object *child);
+int lfsck_namespace_notify_lmv_master_local(const struct lu_env *env,
+                                           struct lfsck_component *com,
+                                           struct dt_object *obj);
+int lfsck_namespace_repair_bad_name_hash(const struct lu_env *env,
+                                        struct lfsck_component *com,
+                                        struct dt_object *shard,
+                                        struct lfsck_lmv *llmv,
+                                        const char *name);
+int lfsck_namespace_striped_dir_rescan(const struct lu_env *env,
+                                      struct lfsck_component *com,
+                                      struct lfsck_namespace_req *lnr);
+int lfsck_namespace_handle_striped_master(const struct lu_env *env,
+                                         struct lfsck_component *com,
+                                         struct lfsck_namespace_req *lnr);
+
 /* lfsck_layout.c */
 int lfsck_layout_setup(const struct lu_env *env, struct lfsck_instance *lfsck);
 
+extern const char dot[];
+extern const char dotdot[];
 extern const char *lfsck_flags_names[];
 extern const char *lfsck_param_names[];
 extern struct lu_context_key lfsck_thread_key;
 
-static inline struct dt_device *lfsck_obj2dt_dev(struct dt_object *obj)
+static inline bool name_is_dot_or_dotdot(const char *name, int namelen)
+{
+       return name[0] == '.' &&
+              (namelen == 1 || (namelen == 2 && name[1] == '.'));
+}
+
+static inline struct dt_device *lfsck_obj2dev(struct dt_object *obj)
 {
        return container_of0(obj->do_lu.lo_dev, struct dt_device, dd_lu_dev);
 }
@@ -738,7 +1087,7 @@ lfsck_name_get_const(const struct lu_env *env, const void *area, ssize_t len)
 {
        struct lu_name *lname;
 
-       lname = &lfsck_env_info(env)->lti_name;
+       lname = &lfsck_env_info(env)->lti_name_const;
        lname->ln_name = area;
        lname->ln_namelen = len;
        return lname;
@@ -865,39 +1214,105 @@ static inline void lfsck_object_put(const struct lu_env *env,
        lu_object_put(env, &obj->do_lu);
 }
 
+static inline struct seq_server_site
+*lfsck_dev_site(struct lfsck_instance *lfsck)
+{
+       return lu_site2seq(lfsck->li_bottom->dd_lu_dev.ld_site);
+}
+
+static inline u32 lfsck_dev_idx(struct lfsck_instance *lfsck)
+{
+       return lfsck_dev_site(lfsck)->ss_node_id;
+}
+
 static inline struct dt_object *
 lfsck_object_find_by_dev_nowait(const struct lu_env *env, struct dt_device *dev,
                                const struct lu_fid *fid)
 {
        struct lu_object_conf   *conf = &lfsck_env_info(env)->lti_conf;
-       struct dt_object        *obj;
 
        conf->loc_flags = LOC_F_NOWAIT;
-       obj = lu2dt(lu_object_find_slice(env, dt2lu_dev(dev), fid, conf));
-       if (unlikely(obj == NULL))
-               return ERR_PTR(-ENOENT);
-
-       return obj;
+       return lu2dt(lu_object_find_slice(env, dt2lu_dev(dev), fid, conf));
 }
 
 static inline struct dt_object *
 lfsck_object_find_by_dev(const struct lu_env *env, struct dt_device *dev,
                         const struct lu_fid *fid)
 {
-       struct dt_object *obj;
+       return lu2dt(lu_object_find_slice(env, dt2lu_dev(dev), fid, NULL));
+}
 
-       obj = lu2dt(lu_object_find_slice(env, dt2lu_dev(dev), fid, NULL));
-       if (unlikely(obj == NULL))
-               return ERR_PTR(-ENOENT);
+static inline struct dt_device *
+lfsck_find_dev_by_fid(const struct lu_env *env, struct lfsck_instance *lfsck,
+                     const struct lu_fid *fid)
+{
+       struct dt_device *dev;
+       int               idx;
 
-       return obj;
+       if (!lfsck->li_master)
+               return lfsck->li_bottom;
+
+       idx = lfsck_find_mdt_idx_by_fid(env, lfsck, fid);
+       if (idx < 0)
+               return ERR_PTR(idx);
+
+       if (idx == lfsck_dev_idx(lfsck)) {
+               dev = lfsck->li_bottom;
+       } else {
+               struct lfsck_tgt_desc *ltd;
+
+               ltd = lfsck_ltd2tgt(&lfsck->li_mdt_descs, idx);
+               if (unlikely(ltd == NULL))
+                       return ERR_PTR(-ENODEV);
+
+               dev = ltd->ltd_tgt;
+       }
+
+       return dev;
 }
 
-static inline struct dt_object *lfsck_object_find(const struct lu_env *env,
-                                                 struct lfsck_instance *lfsck,
-                                                 const struct lu_fid *fid)
+static inline struct dt_object *
+lfsck_object_find_bottom(const struct lu_env *env, struct lfsck_instance *lfsck,
+                        const struct lu_fid *fid)
+{
+       struct dt_device *dev;
+
+       dev = lfsck_find_dev_by_fid(env, lfsck, fid);
+       if (IS_ERR(dev))
+               return (struct dt_object *)dev;
+
+       return lfsck_object_find_by_dev(env, dev, fid);
+}
+
+static inline struct dt_object *
+lfsck_object_find_bottom_nowait(const struct lu_env *env,
+                               struct lfsck_instance *lfsck,
+                               const struct lu_fid *fid)
 {
-       return lfsck_object_find_by_dev(env, lfsck->li_next, fid);
+       struct dt_device *dev;
+
+       dev = lfsck_find_dev_by_fid(env, lfsck, fid);
+       if (IS_ERR(dev))
+               return (struct dt_object *)dev;
+
+       return lfsck_object_find_by_dev_nowait(env, dev, fid);
+}
+
+static inline struct dt_object *
+lfsck_object_locate(struct dt_device *dev, struct dt_object *obj)
+{
+       if (lfsck_obj2dev(obj) == dev) {
+               return obj;
+       } else {
+               struct lu_object *lo;
+
+               lo = lu_object_locate(obj->do_lu.lo_header,
+                                     dev->dd_lu_dev.ld_type);
+               if (unlikely(lo == NULL))
+                       return ERR_PTR(-ENOENT);
+
+               return lu2dt(lo);
+       }
 }
 
 static inline struct lfsck_tgt_desc *lfsck_tgt_get(struct lfsck_tgt_descs *ltds,
@@ -905,7 +1320,7 @@ static inline struct lfsck_tgt_desc *lfsck_tgt_get(struct lfsck_tgt_descs *ltds,
 {
        struct lfsck_tgt_desc *ltd;
 
-       ltd = LTD_TGT(ltds, index);
+       ltd = lfsck_ltd2tgt(ltds, index);
        if (ltd != NULL)
                atomic_inc(&ltd->ltd_ref);
 
@@ -930,8 +1345,17 @@ static inline void lfsck_component_put(const struct lu_env *env,
                                       struct lfsck_component *com)
 {
        if (atomic_dec_and_test(&com->lc_ref)) {
+               struct lfsck_sub_trace_obj *lsto;
+               int                         i;
+
+               for (i = 0, lsto = &com->lc_sub_trace_objs[0];
+                    i < LFSCK_STF_COUNT; i++, lsto++) {
+                       if (lsto->lsto_obj != NULL)
+                               lfsck_object_put(env, lsto->lsto_obj);
+               }
+
                if (com->lc_obj != NULL)
-                       lu_object_put_nocache(env, &com->lc_obj->do_lu);
+                       lfsck_object_put(env, com->lc_obj);
                if (com->lc_file_ram != NULL)
                        OBD_FREE(com->lc_file_ram, com->lc_file_size);
                if (com->lc_file_disk != NULL)
@@ -961,11 +1385,6 @@ static inline void lfsck_instance_put(const struct lu_env *env,
                lfsck_instance_cleanup(env, lfsck);
 }
 
-static inline u32 lfsck_dev_idx(struct dt_device *dev)
-{
-       return dev->dd_lu_dev.ld_site->ld_seq_site->ss_node_id;
-}
-
 static inline bool lfsck_phase2_next_ready(struct lfsck_assistant_data *lad)
 {
        return list_empty(&lad->lad_mdt_phase1_list) &&
@@ -973,4 +1392,94 @@ static inline bool lfsck_phase2_next_ready(struct lfsck_assistant_data *lad)
                list_empty(&lad->lad_ost_phase1_list));
 }
 
+/*
+ * Record @index in the assistant data bitmap of @com.
+ *
+ * If @index fits inside the bitmap, the bit is set and lad_incomplete is
+ * raised.  If it does not fit and @com is a namespace component, the
+ * LF_INCOMPLETE flag is set in the lfsck_namespace that lc_file_ram points
+ * to.  For any other component type an out-of-range @index is ignored.
+ *
+ * Asserts that the owning LFSCK instance has li_master set and that the
+ * bitmap exists.  @env is not used by this helper.
+ */
+static inline void lfsck_lad_set_bitmap(const struct lu_env *env,
+                                       struct lfsck_component *com,
+                                       __u32 index)
+{
+       struct lfsck_assistant_data *assist = com->lc_data;
+       cfs_bitmap_t *bitmap = assist->lad_bitmap;
+       struct lfsck_namespace *ns;
+
+       LASSERT(com->lc_lfsck->li_master);
+       LASSERT(bitmap != NULL);
+
+       if (likely(bitmap->size > index)) {
+               cfs_bitmap_set(bitmap, index);
+               assist->lad_incomplete = 1;
+               return;
+       }
+
+       /* Out of bitmap range: only the namespace component records it. */
+       if (com->lc_type != LFSCK_TYPE_NAMESPACE)
+               return;
+
+       ns = com->lc_file_ram;
+       ns->ln_flags |= LF_INCOMPLETE;
+}
+
+/*
+ * Read the link EA of @obj into @ldata, using the lti_linkea_buf reached
+ * through lfsck_env_info(@env) as backing storage.
+ *
+ * The buffer is passed through lu_buf_check_and_alloc() with
+ * PAGE_CACHE_SIZE before @ldata->ld_buf is pointed at it.
+ * NOTE(review): the allocation result is not checked here; presumably
+ * __lfsck_links_read() validates ld_buf -- confirm.
+ *
+ * Returns the value of __lfsck_links_read().
+ */
+static inline int lfsck_links_read(const struct lu_env *env,
+                                  struct dt_object *obj,
+                                  struct linkea_data *ldata)
+{
+       struct lu_buf *scratch = &lfsck_env_info(env)->lti_linkea_buf;
+
+       ldata->ld_buf = lu_buf_check_and_alloc(scratch, PAGE_CACHE_SIZE);
+
+       return __lfsck_links_read(env, obj, ldata);
+}
+
+/*
+ * Read the link EA of @obj into @ldata, using the lti_linkea_buf2 reached
+ * through lfsck_env_info(@env) as backing storage.
+ *
+ * The buffer is passed through lu_buf_check_and_alloc() with
+ * PAGE_CACHE_SIZE before @ldata->ld_buf is pointed at it.
+ * NOTE(review): the allocation result is not checked here; presumably
+ * __lfsck_links_read() validates ld_buf -- confirm.
+ *
+ * Returns the value of __lfsck_links_read().
+ */
+static inline int lfsck_links_read2(const struct lu_env *env,
+                                   struct dt_object *obj,
+                                   struct linkea_data *ldata)
+{
+       struct lu_buf *scratch = &lfsck_env_info(env)->lti_linkea_buf2;
+
+       ldata->ld_buf = lu_buf_check_and_alloc(scratch, PAGE_CACHE_SIZE);
+
+       return __lfsck_links_read(env, obj, ldata);
+}
+
+/*
+ * Take one reference on @llmv by incrementing ll_ref.
+ *
+ * A NULL @llmv is accepted and simply handed back, so the result is always
+ * the pointer that was passed in.
+ */
+static inline struct lfsck_lmv *lfsck_lmv_get(struct lfsck_lmv *llmv)
+{
+       if (llmv == NULL)
+               return NULL;
+
+       atomic_inc(&llmv->ll_ref);
+
+       return llmv;
+}
+
+/*
+ * Map @fid to an index by masking its f_oid with (LFSCK_STF_COUNT - 1).
+ *
+ * NOTE(review): the mask only covers every value in [0, LFSCK_STF_COUNT)
+ * if LFSCK_STF_COUNT is a power of two -- confirm at its definition.
+ */
+static inline int lfsck_sub_trace_file_fid2idx(const struct lu_fid *fid)
+{
+       int idx = fid->f_oid & (LFSCK_STF_COUNT - 1);
+
+       return idx;
+}
+
+/*
+ * Convert the LMV header fields of @src from little-endian to CPU byte
+ * order and store them in @dst.
+ *
+ * Only lmv_magic, lmv_stripe_count, lmv_master_mdt_index, lmv_hash_type and
+ * lmv_layout_version are written; nothing else in @dst is assigned here.
+ */
+static inline void lfsck_lmv_header_le_to_cpu(struct lmv_mds_md_v1 *dst,
+                                             const struct lmv_mds_md_v1 *src)
+{
+       dst->lmv_magic = le32_to_cpu(src->lmv_magic);
+       dst->lmv_stripe_count = le32_to_cpu(src->lmv_stripe_count);
+       dst->lmv_master_mdt_index = le32_to_cpu(src->lmv_master_mdt_index);
+       dst->lmv_hash_type = le32_to_cpu(src->lmv_hash_type);
+       dst->lmv_layout_version = le32_to_cpu(src->lmv_layout_version);
+}
+
+/*
+ * Convert the LMV header fields of @src from CPU byte order to
+ * little-endian and store them in @dst.
+ *
+ * Only lmv_magic, lmv_stripe_count, lmv_master_mdt_index, lmv_hash_type and
+ * lmv_layout_version are written; nothing else in @dst is assigned here.
+ */
+static inline void lfsck_lmv_header_cpu_to_le(struct lmv_mds_md_v1 *dst,
+                                             const struct lmv_mds_md_v1 *src)
+{
+       dst->lmv_magic = cpu_to_le32(src->lmv_magic);
+       dst->lmv_stripe_count = cpu_to_le32(src->lmv_stripe_count);
+       dst->lmv_master_mdt_index = cpu_to_le32(src->lmv_master_mdt_index);
+       dst->lmv_hash_type = cpu_to_le32(src->lmv_hash_type);
+       dst->lmv_layout_version = cpu_to_le32(src->lmv_layout_version);
+}
+
+/*
+ * Take one reference on @lso by incrementing lso_ref and return @lso.
+ *
+ * @lso is dereferenced unconditionally, so it must not be NULL.
+ */
+static inline struct lfsck_assistant_object *
+lfsck_assistant_object_get(struct lfsck_assistant_object *lso)
+{
+       atomic_t *refs = &lso->lso_ref;
+
+       atomic_inc(refs);
+
+       return lso;
+}
+
+/*
+ * Drop one reference on @lso; when lso_ref reaches zero the object is
+ * released with OBD_FREE_PTR().
+ *
+ * @env is not used by this helper.
+ */
+static inline void
+lfsck_assistant_object_put(const struct lu_env *env,
+                          struct lfsck_assistant_object *lso)
+{
+       if (!atomic_dec_and_test(&lso->lso_ref))
+               return;
+
+       /* That was the last reference: free the object itself. */
+       OBD_FREE_PTR(lso);
+}
 #endif /* _LFSCK_INTERNAL_H */