Whamcloud - gitweb
LU-5506 lfsck: skip orphan MDT-object handling for failed MDTs
[fs/lustre-release.git] / lustre / lfsck / lfsck_internal.h
index eb0af97..b32b147 100644 (file)
 #define HALF_SEC                       (HZ >> 1)
 #define LFSCK_CHECKPOINT_INTERVAL      60
 
-#define LFSCK_NAMEENTRY_DEAD           1 /* The object has been unlinked. */
-#define LFSCK_NAMEENTRY_REMOVED        2 /* The entry has been removed. */
-#define LFSCK_NAMEENTRY_RECREATED      3 /* The entry has been recreated. */
-
 enum lfsck_flags {
        /* Finish the first cycle scanning. */
        LF_SCANNED_ONCE         = 0x00000001ULL,
@@ -112,6 +108,22 @@ struct lfsck_bookmark {
        __u64   lb_reserved[2];
 };
 
+enum lfsck_namespace_trace_flags {
+       LNTF_CHECK_LINKEA       = 0x01,
+       LNTF_CHECK_PARENT       = 0x02,
+       LNTF_ALL                = 0xff
+};
+
+enum lfsck_namespace_inconsistency_type {
+       LNIT_NONE               = 0,
+       LNIT_BAD_LINKEA         = 1,
+       LNIT_UNMATCHED_PAIRS    = 2,
+       LNIT_DANGLING           = 3,
+       LNIT_MUL_REF            = 4,
+       LNIT_BAD_TYPE           = 5,
+       LNIT_BAD_DIRENT         = 6,
+};
+
 struct lfsck_namespace {
        /* Magic number to detect that this struct contains valid data. */
        __u32   ln_magic;
@@ -161,9 +173,6 @@ struct lfsck_namespace {
        /* How many directories have been traversed. */
        __u64   ln_dirs_checked;
 
-       /* How many multiple-linked objects have been checked. */
-       __u64   ln_mlinked_checked;
-
        /* How many objects have been double scanned. */
        __u64   ln_objs_checked_phase2;
 
@@ -176,9 +185,6 @@ struct lfsck_namespace {
        /* How many objects with nlink fixed. */
        __u64   ln_objs_nlink_repaired;
 
-       /* How many objects were lost before, but found back now. */
-       __u64   ln_objs_lost_found;
-
        /* The latest object has been processed (failed) during double scan. */
        struct lu_fid   ln_fid_latest_scanned_phase2;
 
@@ -187,6 +193,39 @@ struct lfsck_namespace {
 
        /* How many linkEA entries have been repaired. */
        __u64   ln_linkea_repaired;
+
+       /* How many multiple-linked objects have been checked. */
+       __u64   ln_mul_linked_checked;
+
+       /* How many multiple-linked objects have been repaired. */
+       __u64   ln_mul_linked_repaired;
+
+       /* How many undefined inconsistencies have been found in phase2. */
+       __u64   ln_unknown_inconsistency;
+
+       /* How many unmatched pairs have been repaired. */
+       __u64   ln_unmatched_pairs_repaired;
+
+       /* How many dangling name entries have been found/repaired. */
+       __u64   ln_dangling_repaired;
+
+       /* How many multiple referenced name entries have been
+        * found/repaired. */
+       __u64   ln_mul_ref_repaired;
+
+       /* How many name entries with bad file type have been repaired. */
+       __u64   ln_bad_type_repaired;
+
+       /* How many lost name entries have been re-inserted. */
+       __u64   ln_lost_dirent_repaired;
+
+       /* The size of MDT targets bitmap with nbits. Such bitmap records
+        * the MDTs that contain non-verified MDT-objects. */
+       __u32   ln_bitmap_size;
+
+       __u32   ln_reserved_1;
+       /* For further using. 256-bytes aligned now. */
+       __u64   ln_reserved[25];
 };
 
 enum lfsck_layout_inconsistency_type {
@@ -258,8 +297,16 @@ struct lfsck_layout {
         * MDT(s)/OST(s) do not participate in the LFSCK */
        __u64   ll_objs_skipped;
 
+       /* The size of ll_ost_bitmap with nbits. */
+       __u32   ll_bitmap_size;
+
        /* For further using. 256-bytes aligned now. */
-       __u64   ll_reserved[12];
+       __u32   ll_reserved_1;
+       __u64   ll_reserved_2[11];
+
+       /* The OST targets bitmap to record the OSTs that contain
+        * non-verified OST-objects. */
+       __u8    ll_ost_bitmap[0];
 };
 
 struct lfsck_component;
@@ -289,19 +336,14 @@ struct lfsck_operations {
 
        int (*lfsck_exec_dir)(const struct lu_env *env,
                              struct lfsck_component *com,
-                             struct dt_object *obj,
-                             struct lu_dirent *ent);
+                             struct lu_dirent *ent,
+                             __u16 type);
 
        int (*lfsck_post)(const struct lu_env *env,
                          struct lfsck_component *com,
                          int result,
                          bool init);
 
-       int (*lfsck_interpret)(const struct lu_env *env,
-                              struct ptlrpc_request *req,
-                              void *args,
-                              int rc);
-
        int (*lfsck_dump)(const struct lu_env *env,
                          struct lfsck_component *com,
                          struct seq_file *m);
@@ -322,12 +364,6 @@ struct lfsck_operations {
        int (*lfsck_query)(const struct lu_env *env,
                           struct lfsck_component *com);
 
-       int (*lfsck_stop_notify)(const struct lu_env *env,
-                                struct lfsck_component *com,
-                                struct lfsck_tgt_descs *ltds,
-                                struct lfsck_tgt_desc *ltd,
-                                struct ptlrpc_request_set *set);
-
        int (*lfsck_join)(const struct lu_env *env,
                          struct lfsck_component *com,
                          struct lfsck_start_param *lsp);
@@ -343,11 +379,16 @@ struct lfsck_tgt_desc {
        struct obd_export *ltd_exp;
        struct list_head   ltd_layout_list;
        struct list_head   ltd_layout_phase_list;
+       struct list_head   ltd_namespace_list;
+       struct list_head   ltd_namespace_phase_list;
        atomic_t           ltd_ref;
        __u32              ltd_index;
        __u32              ltd_layout_gen;
+       __u32              ltd_namespace_gen;
        unsigned int       ltd_dead:1,
-                          ltd_layout_done:1;
+                          ltd_layout_done:1,
+                          ltd_namespace_done:1,
+                          ltd_namespace_failed:1;
 };
 
 struct lfsck_tgt_desc_idx {
@@ -414,7 +455,6 @@ struct lfsck_component {
        /* How many objects have been scanned since last sleep. */
        __u32                    lc_new_scanned;
 
-       unsigned int             lc_journal:1;
        __u16                    lc_type;
 };
 
@@ -464,6 +504,7 @@ struct lfsck_instance {
        struct lfsck_bookmark     li_bookmark_ram;
        struct lfsck_bookmark     li_bookmark_disk;
        struct lfsck_position     li_pos_current;
+       struct lfsck_position     li_pos_checkpoint;
 
        /* Obj for otable-based iteration */
        struct dt_object         *li_obj_oit;
@@ -514,19 +555,12 @@ struct lfsck_instance {
                                  li_start_unplug:1;
 };
 
-enum lfsck_linkea_flags {
-       /* The linkea entries does not match the object nlinks. */
-       LLF_UNMATCH_NLINKS      = 0x01,
-
-       /* Fail to repair the multiple-linked objects during the double scan. */
-       LLF_REPAIR_FAILED       = 0x02,
-};
-
 struct lfsck_async_interpret_args {
        struct lfsck_component          *laia_com;
        struct lfsck_tgt_descs          *laia_ltds;
        struct lfsck_tgt_desc           *laia_ltd;
        struct lfsck_request            *laia_lr;
+       atomic_t                        *laia_count;
        int                              laia_result;
        unsigned int                     laia_shared:1;
 };
@@ -538,16 +572,102 @@ struct lfsck_thread_args {
        struct lfsck_start_param        *lta_lsp;
 };
 
+struct lfsck_assistant_req {
+       struct list_head        lar_list;
+};
+
+struct lfsck_namespace_req {
+       struct lfsck_assistant_req       lnr_lar;
+       struct dt_object                *lnr_obj;
+       struct lu_fid                    lnr_fid;
+       __u64                            lnr_oit_cookie;
+       __u64                            lnr_dir_cookie;
+       __u32                            lnr_attr;
+       __u32                            lnr_size;
+       __u16                            lnr_type;
+       __u16                            lnr_namelen;
+       char                             lnr_name[0];
+};
+
+struct lfsck_assistant_operations {
+       int (*la_handler_p1)(const struct lu_env *env,
+                            struct lfsck_component *com,
+                            struct lfsck_assistant_req *lar);
+
+       int (*la_handler_p2)(const struct lu_env *env,
+                            struct lfsck_component *com);
+
+       void (*la_fill_pos)(const struct lu_env *env,
+                           struct lfsck_component *com,
+                           struct lfsck_position *pos);
+
+       int (*la_double_scan_result)(const struct lu_env *env,
+                                    struct lfsck_component *com,
+                                    int rc);
+
+       void (*la_req_fini)(const struct lu_env *env,
+                           struct lfsck_assistant_req *lar);
+
+       void (*la_sync_failures)(const struct lu_env *env,
+                                struct lfsck_component *com,
+                                struct lfsck_request *lr);
+};
+
+struct lfsck_assistant_data {
+       spinlock_t                               lad_lock;
+       struct list_head                         lad_req_list;
+
+       /* list for the ost targets involved in LFSCK. */
+       struct list_head                         lad_ost_list;
+
+       /* list for the ost targets in phase1 scanning. */
+       struct list_head                         lad_ost_phase1_list;
+
+       /* list for the ost targets in phase2 scanning. */
+       struct list_head                         lad_ost_phase2_list;
+
+       /* list for the mdt targets involved in LFSCK. */
+       struct list_head                         lad_mdt_list;
+
+       /* list for the mdt targets in phase1 scanning. */
+       struct list_head                         lad_mdt_phase1_list;
+
+       /* list for the mdt targets in phase2 scanning. */
+       struct list_head                         lad_mdt_phase2_list;
+
+       const char                              *lad_name;
+       struct ptlrpc_thread                     lad_thread;
+
+       struct lfsck_assistant_operations       *lad_ops;
+
+       cfs_bitmap_t                            *lad_bitmap;
+
+       __u32                                    lad_touch_gen;
+       int                                      lad_prefetched;
+       int                                      lad_assistant_status;
+       int                                      lad_post_result;
+       unsigned int                             lad_to_post:1,
+                                                lad_to_double_scan:1,
+                                                lad_in_double_scan:1,
+                                                lad_exit:1,
+                                                lad_incomplete:1;
+};
+
 #define LFSCK_TMPBUF_LEN       64
 
 struct lfsck_thread_info {
+       struct lu_name          lti_name_const;
        struct lu_name          lti_name;
+       struct lu_name          lti_name2;
        struct lu_buf           lti_buf;
        struct lu_buf           lti_linkea_buf;
+       struct lu_buf           lti_linkea_buf2;
        struct lu_buf           lti_big_buf;
        struct lu_fid           lti_fid;
        struct lu_fid           lti_fid2;
        struct lu_fid           lti_fid3;
+       struct lu_fid           lti_fid4;
+       struct lu_fid           lti_fid5;
        struct lu_attr          lti_la;
        struct lu_attr          lti_la2;
        struct lu_attr          lti_la3;
@@ -563,6 +683,7 @@ struct lfsck_thread_info {
        char                    lti_tmpbuf[LFSCK_TMPBUF_LEN];
        struct lfsck_request    lti_lr;
        struct lfsck_async_interpret_args lti_laia;
+       struct lfsck_async_interpret_args lti_laia2;
        struct lfsck_start      lti_start;
        struct lfsck_stop       lti_stop;
        ldlm_policy_data_t      lti_policy;
@@ -576,6 +697,7 @@ struct lfsck_thread_info {
        struct lov_user_md      lti_lum;
        struct dt_insert_rec    lti_dt_rec;
        struct lu_object_conf   lti_conf;
+       struct lu_seq_range     lti_range;
 };
 
 /* lfsck_lib.c */
@@ -585,6 +707,9 @@ int lfsck_ibits_lock(const struct lu_env *env, struct lfsck_instance *lfsck,
                     struct dt_object *obj, struct lustre_handle *lh,
                     __u64 bits, ldlm_mode_t mode);
 void lfsck_ibits_unlock(struct lustre_handle *lh, ldlm_mode_t mode);
+int lfsck_find_mdt_idx_by_fid(const struct lu_env *env,
+                             struct lfsck_instance *lfsck,
+                             const struct lu_fid *fid);
 int lfsck_create_lpf(const struct lu_env *env, struct lfsck_instance *lfsck);
 int lfsck_verify_lpf(const struct lu_env *env, struct lfsck_instance *lfsck);
 struct lfsck_instance *lfsck_instance_find(struct dt_device *key, bool ref,
@@ -606,18 +731,32 @@ void lfsck_pos_fill(const struct lu_env *env, struct lfsck_instance *lfsck,
 bool __lfsck_set_speed(struct lfsck_instance *lfsck, __u32 limit);
 void lfsck_control_speed(struct lfsck_instance *lfsck);
 void lfsck_control_speed_by_self(struct lfsck_component *com);
-struct lfsck_thread_args *lfsck_thread_args_init(struct lfsck_instance *lfsck,
-                                                struct lfsck_component *com,
-                                                struct lfsck_start_param *lsp);
 void lfsck_thread_args_fini(struct lfsck_thread_args *lta);
+struct lfsck_assistant_data *
+lfsck_assistant_data_init(struct lfsck_assistant_operations *lao,
+                         const char *name);
+int lfsck_async_interpret_common(const struct lu_env *env,
+                                struct ptlrpc_request *req,
+                                void *args, int rc);
 int lfsck_async_request(const struct lu_env *env, struct obd_export *exp,
                        struct lfsck_request *lr,
                        struct ptlrpc_request_set *set,
                        ptlrpc_interpterer_t interpterer,
                        void *args, int request);
+int lfsck_start_assistant(const struct lu_env *env, struct lfsck_component *com,
+                         struct lfsck_start_param *lsp);
+int lfsck_checkpoint_generic(const struct lu_env *env,
+                            struct lfsck_component *com);
+void lfsck_post_generic(const struct lu_env *env,
+                       struct lfsck_component *com, int *result);
+int lfsck_double_scan_generic(const struct lu_env *env,
+                             struct lfsck_component *com, int status);
+void lfsck_quit_generic(const struct lu_env *env,
+                       struct lfsck_component *com);
 
 /* lfsck_engine.c */
 int lfsck_master_engine(void *args);
+int lfsck_assistant_engine(void *args);
 
 /* lfsck_bookmark.c */
 void lfsck_bookmark_cpu_to_le(struct lfsck_bookmark *des,
@@ -630,6 +769,26 @@ int lfsck_set_param(const struct lu_env *env, struct lfsck_instance *lfsck,
                    struct lfsck_start *start, bool reset);
 
 /* lfsck_namespace.c */
+int lfsck_namespace_trace_update(const struct lu_env *env,
+                                struct lfsck_component *com,
+                                const struct lu_fid *fid,
+                                const __u8 flags, bool add);
+int __lfsck_links_read(const struct lu_env *env, struct dt_object *obj,
+                      struct linkea_data *ldata);
+int lfsck_namespace_rebuild_linkea(const struct lu_env *env,
+                                  struct lfsck_component *com,
+                                  struct dt_object *obj,
+                                  struct linkea_data *ldata);
+int lfsck_namespace_repair_dangling(const struct lu_env *env,
+                                   struct lfsck_component *com,
+                                   struct dt_object *child,
+                                   struct lfsck_namespace_req *lnr);
+int lfsck_namespace_repair_dirent(const struct lu_env *env,
+                                 struct lfsck_component *com,
+                                 struct dt_object *parent,
+                                 struct dt_object *child,
+                                 const char *name, const char *name2,
+                                 __u16 type, bool update, bool dec);
 int lfsck_verify_linkea(const struct lu_env *env, struct dt_device *dev,
                        struct dt_object *obj, const struct lu_name *cname,
                        const struct lu_fid *pfid);
@@ -649,6 +808,8 @@ int lfsck_namespace_setup(const struct lu_env *env,
 /* lfsck_layout.c */
 int lfsck_layout_setup(const struct lu_env *env, struct lfsck_instance *lfsck);
 
+extern const char dot[];
+extern const char dotdot[];
 extern const char *lfsck_flags_names[];
 extern const char *lfsck_param_names[];
 extern struct lu_context_key lfsck_thread_key;
@@ -673,7 +834,7 @@ lfsck_name_get_const(const struct lu_env *env, const void *area, ssize_t len)
 {
        struct lu_name *lname;
 
-       lname = &lfsck_env_info(env)->lti_name;
+       lname = &lfsck_env_info(env)->lti_name_const;
        lname->ln_name = area;
        lname->ln_namelen = len;
        return lname;
@@ -800,6 +961,11 @@ static inline void lfsck_object_put(const struct lu_env *env,
        lu_object_put(env, &obj->do_lu);
 }
 
+static inline u32 lfsck_dev_idx(struct dt_device *dev)
+{
+       return dev->dd_lu_dev.ld_site->ld_seq_site->ss_node_id;
+}
+
 static inline struct dt_object *
 lfsck_object_find_by_dev_nowait(const struct lu_env *env, struct dt_device *dev,
                                const struct lu_fid *fid)
@@ -835,6 +1001,32 @@ static inline struct dt_object *lfsck_object_find(const struct lu_env *env,
        return lfsck_object_find_by_dev(env, lfsck->li_next, fid);
 }
 
+static inline struct dt_object *
+lfsck_object_find_bottom(const struct lu_env *env, struct lfsck_instance *lfsck,
+                        const struct lu_fid *fid)
+{
+       struct dt_device *dev;
+       int               idx;
+
+       idx = lfsck_find_mdt_idx_by_fid(env, lfsck, fid);
+       if (idx < 0)
+               return ERR_PTR(idx);
+
+       if (idx == lfsck_dev_idx(lfsck->li_bottom)) {
+               dev = lfsck->li_bottom;
+       } else {
+               struct lfsck_tgt_desc *ltd;
+
+               ltd = LTD_TGT(&lfsck->li_mdt_descs, idx);
+               if (unlikely(ltd == NULL))
+                       return ERR_PTR(-ENODEV);
+
+               dev = ltd->ltd_tgt;
+       }
+
+       return lfsck_object_find_by_dev(env, dev, fid);
+}
+
 static inline struct lfsck_tgt_desc *lfsck_tgt_get(struct lfsck_tgt_descs *ltds,
                                                   __u32 index)
 {
@@ -896,9 +1088,49 @@ static inline void lfsck_instance_put(const struct lu_env *env,
                lfsck_instance_cleanup(env, lfsck);
 }
 
-static inline u32 lfsck_dev_idx(struct dt_device *dev)
+static inline bool lfsck_phase2_next_ready(struct lfsck_assistant_data *lad)
 {
-       return dev->dd_lu_dev.ld_site->ld_seq_site->ss_node_id;
+       return list_empty(&lad->lad_mdt_phase1_list) &&
+              (!list_empty(&lad->lad_ost_phase2_list) ||
+               list_empty(&lad->lad_ost_phase1_list));
+}
+
+static inline void lfsck_lad_set_bitmap(const struct lu_env *env,
+                                       struct lfsck_component *com,
+                                       __u32 index)
+{
+       struct lfsck_assistant_data     *lad    = com->lc_data;
+       cfs_bitmap_t                    *bitmap = lad->lad_bitmap;
+
+       LASSERT(com->lc_lfsck->li_master);
+       LASSERT(bitmap != NULL);
+       LASSERTF(bitmap->size > index, "invalid index: nbits %d, index %u\n",
+                bitmap->size, index);
+
+       cfs_bitmap_set(bitmap, index);
+       lad->lad_incomplete = 1;
+}
+
+static inline int lfsck_links_read(const struct lu_env *env,
+                                  struct dt_object *obj,
+                                  struct linkea_data *ldata)
+{
+       ldata->ld_buf =
+               lu_buf_check_and_alloc(&lfsck_env_info(env)->lti_linkea_buf,
+                                      PAGE_CACHE_SIZE);
+
+       return __lfsck_links_read(env, obj, ldata);
+}
+
+static inline int lfsck_links_read2(const struct lu_env *env,
+                                   struct dt_object *obj,
+                                   struct linkea_data *ldata)
+{
+       ldata->ld_buf =
+               lu_buf_check_and_alloc(&lfsck_env_info(env)->lti_linkea_buf2,
+                                      PAGE_CACHE_SIZE);
+
+       return __lfsck_links_read(env, obj, ldata);
 }
 
 #endif /* _LFSCK_INTERNAL_H */