Whamcloud - gitweb
LU-3118 lfsck: resume LFSCK from the last checkpoint
author Fan Yong <yong.fan@whamcloud.com>
Mon, 22 Apr 2013 01:58:42 +0000 (09:58 +0800)
committer Oleg Drokin <oleg.drokin@intel.com>
Thu, 25 Apr 2013 15:37:50 +0000 (11:37 -0400)
This is a miscellaneous patch that enables resuming LFSCK from the last
checkpoint: no object will be skipped, and the object(s) before the
checkpoint will not be scanned again.

Other fixes:
1) Simplify LFSCK checkpoint logic.
2) Add linkEA for .lustre itself, so that LFSCK will not be misled.
3) Set the LFSCK status to "failed" if an error is hit in the prepare phase.
4) osd_otable_it_store() should return the cursor position, instead
of the pre-load position.
5) Other code cleanup.

Test-Parameters: testlist=sanity-scrub,sanity-lfsck
Signed-off-by: Fan Yong <fan.yong@intel.com>
Change-Id: I3f6e988da323239ff2655ad4b13eae711e892ebe
Reviewed-on: http://review.whamcloud.com/6078
Tested-by: Hudson
Reviewed-by: Alex Zhuravlev <alexey.zhuravlev@intel.com>
Reviewed-by: Andreas Dilger <andreas.dilger@intel.com>
Tested-by: Maloo <whamcloud.maloo@gmail.com>
lustre/mdd/mdd_device.c
lustre/mdd/mdd_dir.c
lustre/mdd/mdd_lfsck.c
lustre/mdd/mdd_lfsck.h
lustre/osd-ldiskfs/osd_scrub.c
lustre/tests/sanity-lfsck.sh

index 9633cfd..e4f5b09 100644 (file)
@@ -562,10 +562,12 @@ static int obf_lookup(const struct lu_env *env, struct md_object *p,
                 GOTO(out, rc = -EINVAL);
         }
 
                 GOTO(out, rc = -EINVAL);
         }
 
-       if (!fid_is_norm(f)) {
+       if (!fid_is_norm(f) && !fid_is_igif(f)) {
                CWARN("%s: "DFID" is invalid, sequence should be "
                CWARN("%s: "DFID" is invalid, sequence should be "
-                     ">= "LPX64"\n", mdd2obd_dev(mdd)->obd_name, PFID(f),
-                     (__u64)FID_SEQ_NORMAL);
+                     ">= "LPX64" or within ["LPX64","LPX64"].\n",
+                     mdd2obd_dev(mdd)->obd_name, PFID(f),
+                     (__u64)FID_SEQ_NORMAL, (__u64)FID_SEQ_IGIF,
+                     (__u64)FID_SEQ_IGIF_MAX);
                GOTO(out, rc = -EINVAL);
        }
 
                GOTO(out, rc = -EINVAL);
        }
 
index a587939..9d45b30 100644 (file)
@@ -1716,9 +1716,7 @@ static int mdd_declare_object_initialize(const struct lu_env *env,
                                              dotdot, handle);
         }
 
                                              dotdot, handle);
         }
 
-       if (rc == 0 && (fid_is_norm(mdo2fid(child)) ||
-                       fid_is_dot_lustre(mdo2fid(child)) ||
-                       fid_is_root(mdo2fid(child))))
+       if (rc == 0)
                mdd_declare_links_add(env, child, handle, ldata);
 
        RETURN(rc);
                mdd_declare_links_add(env, child, handle, ldata);
 
        RETURN(rc);
@@ -1758,9 +1756,7 @@ static int mdd_object_initialize(const struct lu_env *env,
                         mdo_ref_del(env, child, handle);
         }
 
                         mdo_ref_del(env, child, handle);
         }
 
-       if (rc == 0 && (fid_is_norm(mdo2fid(child)) ||
-                       fid_is_dot_lustre(mdo2fid(child)) ||
-                       fid_is_root(mdo2fid(child))))
+       if (rc == 0)
                mdd_links_add(env, child, pfid, lname, handle, ldata, 1);
 
        RETURN(rc);
                mdd_links_add(env, child, pfid, lname, handle, ldata, 1);
 
        RETURN(rc);
index 9d7b54c..f34fbe5 100644 (file)
@@ -47,7 +47,6 @@
 
 #define HALF_SEC                       (CFS_HZ >> 1)
 #define LFSCK_CHECKPOINT_INTERVAL      60
 
 #define HALF_SEC                       (CFS_HZ >> 1)
 #define LFSCK_CHECKPOINT_INTERVAL      60
-#define MDS_DIR_DUMMY_START            0xffffffffffffffffULL
 
 #define LFSCK_NAMEENTRY_DEAD           1 /* The object has been unlinked. */
 #define LFSCK_NAMEENTRY_REMOVED        2 /* The entry has been removed. */
 
 #define LFSCK_NAMEENTRY_DEAD           1 /* The object has been unlinked. */
 #define LFSCK_NAMEENTRY_REMOVED        2 /* The entry has been removed. */
@@ -233,8 +232,7 @@ static int lfsck_pos_dump(char **buf, int *len, struct lfsck_position *pos,
 }
 
 static void mdd_lfsck_pos_fill(const struct lu_env *env, struct md_lfsck *lfsck,
 }
 
 static void mdd_lfsck_pos_fill(const struct lu_env *env, struct md_lfsck *lfsck,
-                              struct lfsck_position *pos, bool oit_processed,
-                              bool dir_processed)
+                              struct lfsck_position *pos, bool init)
 {
        const struct dt_it_ops *iops = &lfsck->ml_obj_oit->do_index_ops->dio_it;
 
 {
        const struct dt_it_ops *iops = &lfsck->ml_obj_oit->do_index_ops->dio_it;
 
@@ -246,28 +244,23 @@ static void mdd_lfsck_pos_fill(const struct lu_env *env, struct md_lfsck *lfsck,
        }
 
        pos->lp_oit_cookie = iops->store(env, lfsck->ml_di_oit);
        }
 
        pos->lp_oit_cookie = iops->store(env, lfsck->ml_di_oit);
+       if (!lfsck->ml_current_oit_processed && !init)
+               pos->lp_oit_cookie--;
 
        LASSERT(pos->lp_oit_cookie > 0);
 
 
        LASSERT(pos->lp_oit_cookie > 0);
 
-       if (!oit_processed)
-               pos->lp_oit_cookie--;
-
        if (lfsck->ml_di_dir != NULL) {
                struct dt_object *dto = lfsck->ml_obj_dir;
 
        if (lfsck->ml_di_dir != NULL) {
                struct dt_object *dto = lfsck->ml_obj_dir;
 
-               pos->lp_dir_parent = *lu_object_fid(&dto->do_lu);
                pos->lp_dir_cookie = dto->do_index_ops->dio_it.store(env,
                                                        lfsck->ml_di_dir);
 
                pos->lp_dir_cookie = dto->do_index_ops->dio_it.store(env,
                                                        lfsck->ml_di_dir);
 
-               LASSERT(pos->lp_dir_cookie != MDS_DIR_DUMMY_START);
-
-               if (pos->lp_dir_cookie >= MDS_DIR_END_OFF)
-                       pos->lp_dir_cookie = MDS_DIR_END_OFF;
-               else if (!dir_processed)
-                       /* For the dir which just to be processed,
-                        * lp_dir_cookie will become MDS_DIR_DUMMY_START,
-                        * which can be correctly handled by mdd_lfsck_prep. */
-                       pos->lp_dir_cookie--;
+               if (pos->lp_dir_cookie >= MDS_DIR_END_OFF) {
+                       fid_zero(&pos->lp_dir_parent);
+                       pos->lp_dir_cookie = 0;
+               } else {
+                       pos->lp_dir_parent = *lu_object_fid(&dto->do_lu);
+               }
        } else {
                fid_zero(&pos->lp_dir_parent);
                pos->lp_dir_cookie = 0;
        } else {
                fid_zero(&pos->lp_dir_parent);
                pos->lp_dir_cookie = 0;
@@ -1026,7 +1019,7 @@ out:
 
 static void
 mdd_lfsck_namespace_fail(const struct lu_env *env, struct lfsck_component *com,
 
 static void
 mdd_lfsck_namespace_fail(const struct lu_env *env, struct lfsck_component *com,
-                        bool oit, bool new_checked)
+                        bool new_checked)
 {
        struct lfsck_namespace *ns = (struct lfsck_namespace *)com->lc_file_ram;
 
 {
        struct lfsck_namespace *ns = (struct lfsck_namespace *)com->lc_file_ram;
 
@@ -1036,7 +1029,7 @@ mdd_lfsck_namespace_fail(const struct lu_env *env, struct lfsck_component *com,
        ns->ln_items_failed++;
        if (mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent))
                mdd_lfsck_pos_fill(env, com->lc_lfsck,
        ns->ln_items_failed++;
        if (mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent))
                mdd_lfsck_pos_fill(env, com->lc_lfsck,
-                                  &ns->ln_pos_first_inconsistent, oit, !oit);
+                                  &ns->ln_pos_first_inconsistent, false);
        up_write(&com->lc_sem);
 }
 
        up_write(&com->lc_sem);
 }
 
@@ -1054,11 +1047,10 @@ static int mdd_lfsck_namespace_checkpoint(const struct lu_env *env,
 
        down_write(&com->lc_sem);
 
 
        down_write(&com->lc_sem);
 
-       ns->ln_pos_last_checkpoint = lfsck->ml_pos_current;
        if (init) {
        if (init) {
-               ns->ln_time_last_checkpoint = ns->ln_time_latest_start;
                ns->ln_pos_latest_start = lfsck->ml_pos_current;
        } else {
                ns->ln_pos_latest_start = lfsck->ml_pos_current;
        } else {
+               ns->ln_pos_last_checkpoint = lfsck->ml_pos_current;
                ns->ln_run_time_phase1 += cfs_duration_sec(cfs_time_current() +
                                HALF_SEC - lfsck->ml_time_last_checkpoint);
                ns->ln_time_last_checkpoint = cfs_time_current_sec();
                ns->ln_run_time_phase1 += cfs_duration_sec(cfs_time_current() +
                                HALF_SEC - lfsck->ml_time_last_checkpoint);
                ns->ln_time_last_checkpoint = cfs_time_current_sec();
@@ -1132,13 +1124,6 @@ static int mdd_lfsck_namespace_prep(const struct lu_env *env,
                    mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent)) {
                        *pos = ns->ln_pos_last_checkpoint;
                        pos->lp_oit_cookie++;
                    mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent)) {
                        *pos = ns->ln_pos_last_checkpoint;
                        pos->lp_oit_cookie++;
-                       if (!fid_is_zero(&pos->lp_dir_parent)) {
-                               if (pos->lp_dir_cookie == MDS_DIR_END_OFF) {
-                                       fid_zero(&pos->lp_dir_parent);
-                               } else {
-                                       pos->lp_dir_cookie++;
-                               }
-                       }
                } else {
                        *pos = ns->ln_pos_first_inconsistent;
                }
                } else {
                        *pos = ns->ln_pos_first_inconsistent;
                }
@@ -1242,7 +1227,8 @@ static int mdd_lfsck_namespace_exec_dir(const struct lu_env *env,
 
        if (ent->lde_name[0] == '.' &&
            (ent->lde_namelen == 1 ||
 
        if (ent->lde_name[0] == '.' &&
            (ent->lde_namelen == 1 ||
-            (ent->lde_namelen == 2 && ent->lde_name[1] == '.')))
+            (ent->lde_namelen == 2 && ent->lde_name[1] == '.') ||
+            fid_is_dot_lustre(&ent->lde_fid)))
                GOTO(out, rc = 0);
 
        if (!(bk->lb_param & LPF_DRYRUN) &&
                GOTO(out, rc = 0);
 
        if (!(bk->lb_param & LPF_DRYRUN) &&
@@ -1400,7 +1386,7 @@ out:
                if (mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent))
                        mdd_lfsck_pos_fill(env, lfsck,
                                           &ns->ln_pos_first_inconsistent,
                if (mdd_lfsck_pos_is_zero(&ns->ln_pos_first_inconsistent))
                        mdd_lfsck_pos_fill(env, lfsck,
                                           &ns->ln_pos_first_inconsistent,
-                                          true, false);
+                                          false);
                if (!(bk->lb_param & LPF_FAILOUT))
                        rc = 0;
        } else {
                if (!(bk->lb_param & LPF_FAILOUT))
                        rc = 0;
        } else {
@@ -1416,7 +1402,7 @@ out:
 
 static int mdd_lfsck_namespace_post(const struct lu_env *env,
                                    struct lfsck_component *com,
 
 static int mdd_lfsck_namespace_post(const struct lu_env *env,
                                    struct lfsck_component *com,
-                                   int result)
+                                   int result, bool init)
 {
        struct md_lfsck         *lfsck = com->lc_lfsck;
        struct lfsck_namespace  *ns    =
 {
        struct md_lfsck         *lfsck = com->lc_lfsck;
        struct lfsck_namespace  *ns    =
@@ -1426,6 +1412,8 @@ static int mdd_lfsck_namespace_post(const struct lu_env *env,
        down_write(&com->lc_sem);
 
        spin_lock(&lfsck->ml_lock);
        down_write(&com->lc_sem);
 
        spin_lock(&lfsck->ml_lock);
+       if (!init)
+               ns->ln_pos_last_checkpoint = lfsck->ml_pos_current;
        if (result > 0) {
                ns->ln_status = LS_SCANNING_PHASE2;
                ns->ln_flags |= LF_SCANNED_ONCE;
        if (result > 0) {
                ns->ln_status = LS_SCANNING_PHASE2;
                ns->ln_flags |= LF_SCANNED_ONCE;
@@ -1450,11 +1438,13 @@ static int mdd_lfsck_namespace_post(const struct lu_env *env,
        }
        spin_unlock(&lfsck->ml_lock);
 
        }
        spin_unlock(&lfsck->ml_lock);
 
-       ns->ln_run_time_phase1 += cfs_duration_sec(cfs_time_current() +
+       if (!init) {
+               ns->ln_run_time_phase1 += cfs_duration_sec(cfs_time_current() +
                                HALF_SEC - lfsck->ml_time_last_checkpoint);
                                HALF_SEC - lfsck->ml_time_last_checkpoint);
-       ns->ln_time_last_checkpoint = cfs_time_current_sec();
-       ns->ln_items_checked += com->lc_new_checked;
-       com->lc_new_checked = 0;
+               ns->ln_time_last_checkpoint = cfs_time_current_sec();
+               ns->ln_items_checked += com->lc_new_checked;
+               com->lc_new_checked = 0;
+       }
 
        rc = mdd_lfsck_namespace_store(env, com, false);
 
 
        rc = mdd_lfsck_namespace_store(env, com, false);
 
@@ -1580,7 +1570,7 @@ mdd_lfsck_namespace_dump(const struct lu_env *env, struct lfsck_component *com,
 
                buf += rc;
                len -= rc;
 
                buf += rc;
                len -= rc;
-               mdd_lfsck_pos_fill(env, lfsck, &pos, true, true);
+               mdd_lfsck_pos_fill(env, lfsck, &pos, false);
                rc = lfsck_pos_dump(&buf, &len, &pos, "current_position");
                if (rc <= 0)
                        goto out;
                rc = lfsck_pos_dump(&buf, &len, &pos, "current_position");
                if (rc <= 0)
                        goto out;
@@ -1972,9 +1962,8 @@ out:
 
 /* helper functions for framework */
 
 
 /* helper functions for framework */
 
-static int object_is_client_visible(const struct lu_env *env,
-                                   struct mdd_device *mdd,
-                                   struct mdd_object *obj)
+static int object_needs_lfsck(const struct lu_env *env, struct mdd_device *mdd,
+                             struct mdd_object *obj)
 {
        struct lu_fid *fid   = &mdd_env_info(env)->mti_fid;
        int            depth = 0;
 {
        struct lu_fid *fid   = &mdd_env_info(env)->mti_fid;
        int            depth = 0;
@@ -1989,6 +1978,13 @@ static int object_is_client_visible(const struct lu_env *env,
                        return 1;
                }
 
                        return 1;
                }
 
+               /* .lustre doesn't contain "real" user objects, no need lfsck */
+               if (fid_is_dot_lustre(mdo2fid(obj))) {
+                       if (depth > 0)
+                               mdd_object_put(env, obj);
+                       return 0;
+               }
+
                mdd_read_lock(env, obj, MOR_TGT_CHILD);
                if (unlikely(mdd_is_dead_obj(obj))) {
                        mdd_read_unlock(env, obj);
                mdd_read_lock(env, obj, MOR_TGT_CHILD);
                if (unlikely(mdd_is_dead_obj(obj))) {
                        mdd_read_unlock(env, obj);
@@ -2061,17 +2057,17 @@ static void mdd_lfsck_unpack_ent(struct lu_dirent *ent)
 /* LFSCK wrap functions */
 
 static void mdd_lfsck_fail(const struct lu_env *env, struct md_lfsck *lfsck,
 /* LFSCK wrap functions */
 
 static void mdd_lfsck_fail(const struct lu_env *env, struct md_lfsck *lfsck,
-                          bool oit, bool new_checked)
+                          bool new_checked)
 {
        struct lfsck_component *com;
 
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
 {
        struct lfsck_component *com;
 
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
-               com->lc_ops->lfsck_fail(env, com, oit, new_checked);
+               com->lc_ops->lfsck_fail(env, com, new_checked);
        }
 }
 
 static int mdd_lfsck_checkpoint(const struct lu_env *env,
        }
 }
 
 static int mdd_lfsck_checkpoint(const struct lu_env *env,
-                               struct md_lfsck *lfsck, bool oit)
+                               struct md_lfsck *lfsck)
 {
        struct lfsck_component *com;
        int                     rc;
 {
        struct lfsck_component *com;
        int                     rc;
@@ -2080,7 +2076,7 @@ static int mdd_lfsck_checkpoint(const struct lu_env *env,
                                    lfsck->ml_time_next_checkpoint)))
                return 0;
 
                                    lfsck->ml_time_next_checkpoint)))
                return 0;
 
-       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, oit, !oit);
+       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, false);
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
                rc = com->lc_ops->lfsck_checkpoint(env, com, false);
                if (rc != 0)
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
                rc = com->lc_ops->lfsck_checkpoint(env, com, false);
                if (rc != 0)
@@ -2110,6 +2106,7 @@ static int mdd_lfsck_prep(struct lu_env *env, struct md_lfsck *lfsck)
        LASSERT(lfsck->ml_obj_dir == NULL);
        LASSERT(lfsck->ml_di_dir == NULL);
 
        LASSERT(lfsck->ml_obj_dir == NULL);
        LASSERT(lfsck->ml_di_dir == NULL);
 
+       lfsck->ml_current_oit_processed = 0;
        cfs_list_for_each_entry_safe(com, next, &lfsck->ml_list_scan, lc_link) {
                com->lc_new_checked = 0;
                if (lfsck->ml_bookmark_ram.lb_param & LPF_DRYRUN)
        cfs_list_for_each_entry_safe(com, next, &lfsck->ml_list_scan, lc_link) {
                com->lc_new_checked = 0;
                if (lfsck->ml_bookmark_ram.lb_param & LPF_DRYRUN)
@@ -2170,8 +2167,10 @@ static int mdd_lfsck_prep(struct lu_env *env, struct md_lfsck *lfsck)
        if (IS_ERR(di))
                GOTO(out, rc = PTR_ERR(di));
 
        if (IS_ERR(di))
                GOTO(out, rc = PTR_ERR(di));
 
+       LASSERT(pos->lp_dir_cookie < MDS_DIR_END_OFF);
+
        rc = iops->load(env, di, pos->lp_dir_cookie);
        rc = iops->load(env, di, pos->lp_dir_cookie);
-       if (rc == 0)
+       if ((rc == 0) || (rc > 0 && pos->lp_dir_cookie > 0))
                rc = iops->next(env, di);
        else if (rc > 0)
                rc = 0;
                rc = iops->next(env, di);
        else if (rc > 0)
                rc = 0;
@@ -2194,10 +2193,16 @@ out:
        if (obj != NULL)
                mdd_object_put(env, obj);
 
        if (obj != NULL)
                mdd_object_put(env, obj);
 
-       if (rc != 0)
-               return (rc > 0 ? 0 : rc);
+       if (rc < 0) {
+               cfs_list_for_each_entry_safe(com, next, &lfsck->ml_list_scan,
+                                            lc_link)
+                       com->lc_ops->lfsck_post(env, com, rc, true);
 
 
-       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, false, false);
+               return rc;
+       }
+
+       rc = 0;
+       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, true);
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
                rc = com->lc_ops->lfsck_checkpoint(env, com, true);
                if (rc != 0)
        cfs_list_for_each_entry(com, &lfsck->ml_list_scan, lc_link) {
                rc = com->lc_ops->lfsck_checkpoint(env, com, true);
                if (rc != 0)
@@ -2232,7 +2237,7 @@ static int mdd_lfsck_exec_oit(const struct lu_env *env, struct md_lfsck *lfsck,
            cfs_list_empty(&lfsck->ml_list_dir))
               RETURN(0);
 
            cfs_list_empty(&lfsck->ml_list_dir))
               RETURN(0);
 
-       rc = object_is_client_visible(env, mdd_lfsck2mdd(lfsck), obj);
+       rc = object_needs_lfsck(env, mdd_lfsck2mdd(lfsck), obj);
        if (rc <= 0)
                GOTO(out, rc);
 
        if (rc <= 0)
                GOTO(out, rc);
 
@@ -2270,7 +2275,7 @@ static int mdd_lfsck_exec_oit(const struct lu_env *env, struct md_lfsck *lfsck,
 
 out:
        if (rc < 0)
 
 out:
        if (rc < 0)
-               mdd_lfsck_fail(env, lfsck, false, false);
+               mdd_lfsck_fail(env, lfsck, false);
        return (rc > 0 ? 0 : rc);
 }
 
        return (rc > 0 ? 0 : rc);
 }
 
@@ -2295,9 +2300,9 @@ static int mdd_lfsck_post(const struct lu_env *env, struct md_lfsck *lfsck,
        struct lfsck_component *next;
        int                     rc;
 
        struct lfsck_component *next;
        int                     rc;
 
-       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, true, true);
+       mdd_lfsck_pos_fill(env, lfsck, &lfsck->ml_pos_current, false);
        cfs_list_for_each_entry_safe(com, next, &lfsck->ml_list_scan, lc_link) {
        cfs_list_for_each_entry_safe(com, next, &lfsck->ml_list_scan, lc_link) {
-               rc = com->lc_ops->lfsck_post(env, com, result);
+               rc = com->lc_ops->lfsck_post(env, com, result, false);
                if (rc != 0)
                        return rc;
        }
                if (rc != 0)
                        return rc;
        }
@@ -2362,7 +2367,7 @@ static int mdd_lfsck_dir_engine(const struct lu_env *env,
                rc = iops->rec(env, di, (struct dt_rec *)ent,
                               lfsck->ml_args_dir);
                if (rc != 0) {
                rc = iops->rec(env, di, (struct dt_rec *)ent,
                               lfsck->ml_args_dir);
                if (rc != 0) {
-                       mdd_lfsck_fail(env, lfsck, false, true);
+                       mdd_lfsck_fail(env, lfsck, true);
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(rc);
                        else
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(rc);
                        else
@@ -2378,7 +2383,7 @@ static int mdd_lfsck_dir_engine(const struct lu_env *env,
                if (child == NULL) {
                        goto checkpoint;
                } else if (IS_ERR(child)) {
                if (child == NULL) {
                        goto checkpoint;
                } else if (IS_ERR(child)) {
-                       mdd_lfsck_fail(env, lfsck, false, true);
+                       mdd_lfsck_fail(env, lfsck, true);
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(PTR_ERR(child));
                        else
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(PTR_ERR(child));
                        else
@@ -2393,7 +2398,7 @@ static int mdd_lfsck_dir_engine(const struct lu_env *env,
                        RETURN(rc);
 
 checkpoint:
                        RETURN(rc);
 
 checkpoint:
-               rc = mdd_lfsck_checkpoint(env, lfsck, false);
+               rc = mdd_lfsck_checkpoint(env, lfsck);
                if (rc != 0 && bk->lb_param & LPF_FAILOUT)
                        RETURN(rc);
 
                if (rc != 0 && bk->lb_param & LPF_FAILOUT)
                        RETURN(rc);
 
@@ -2458,10 +2463,11 @@ static int mdd_lfsck_oit_engine(const struct lu_env *env,
                if (OBD_FAIL_CHECK(OBD_FAIL_LFSCK_CRASH))
                        RETURN(0);
 
                if (OBD_FAIL_CHECK(OBD_FAIL_LFSCK_CRASH))
                        RETURN(0);
 
+               lfsck->ml_current_oit_processed = 1;
                lfsck->ml_new_scanned++;
                rc = iops->rec(env, di, (struct dt_rec *)fid, 0);
                if (rc != 0) {
                lfsck->ml_new_scanned++;
                rc = iops->rec(env, di, (struct dt_rec *)fid, 0);
                if (rc != 0) {
-                       mdd_lfsck_fail(env, lfsck, true, true);
+                       mdd_lfsck_fail(env, lfsck, true);
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(rc);
                        else
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(rc);
                        else
@@ -2472,7 +2478,7 @@ static int mdd_lfsck_oit_engine(const struct lu_env *env,
                if (target == NULL) {
                        goto checkpoint;
                } else if (IS_ERR(target)) {
                if (target == NULL) {
                        goto checkpoint;
                } else if (IS_ERR(target)) {
-                       mdd_lfsck_fail(env, lfsck, true, true);
+                       mdd_lfsck_fail(env, lfsck, true);
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(PTR_ERR(target));
                        else
                        if (bk->lb_param & LPF_FAILOUT)
                                RETURN(PTR_ERR(target));
                        else
@@ -2489,7 +2495,7 @@ static int mdd_lfsck_oit_engine(const struct lu_env *env,
                        RETURN(rc);
 
 checkpoint:
                        RETURN(rc);
 
 checkpoint:
-               rc = mdd_lfsck_checkpoint(env, lfsck, true);
+               rc = mdd_lfsck_checkpoint(env, lfsck);
                if (rc != 0 && bk->lb_param & LPF_FAILOUT)
                        RETURN(rc);
 
                if (rc != 0 && bk->lb_param & LPF_FAILOUT)
                        RETURN(rc);
 
@@ -2504,8 +2510,10 @@ checkpoint:
                }
 
                rc = iops->next(env, di);
                }
 
                rc = iops->next(env, di);
-               if (rc > 0)
+               if (unlikely(rc > 0))
                        lfsck->ml_oit_over = 1;
                        lfsck->ml_oit_over = 1;
+               else if (likely(rc == 0))
+                       lfsck->ml_current_oit_processed = 0;
 
                if (unlikely(!thread_is_running(thread)))
                        RETURN(0);
 
                if (unlikely(!thread_is_running(thread)))
                        RETURN(0);
@@ -2526,7 +2534,7 @@ static int mdd_lfsck_main(void *args)
        ENTRY;
 
        cfs_daemonize("lfsck");
        ENTRY;
 
        cfs_daemonize("lfsck");
-       rc = lu_env_init(&env, LCT_MD_THREAD);
+       rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
        if (rc != 0) {
                CERROR("%s: LFSCK, fail to init env, rc = %d\n",
                       mdd_lfsck2name(lfsck), rc);
        if (rc != 0) {
                CERROR("%s: LFSCK, fail to init env, rc = %d\n",
                       mdd_lfsck2name(lfsck), rc);
@@ -2741,7 +2749,8 @@ int mdd_lfsck_start(const struct lu_env *env, struct md_lfsck *lfsck,
                cfs_list_for_each_entry_safe(com, next,
                                             &lfsck->ml_list_scan, lc_link) {
                        if (!(com->lc_type & start->ls_active)) {
                cfs_list_for_each_entry_safe(com, next,
                                             &lfsck->ml_list_scan, lc_link) {
                        if (!(com->lc_type & start->ls_active)) {
-                               rc = com->lc_ops->lfsck_post(env, com, 0);
+                               rc = com->lc_ops->lfsck_post(env, com, 0,
+                                                            false);
                                if (rc != 0)
                                        GOTO(out, rc);
                        }
                                if (rc != 0)
                                        GOTO(out, rc);
                        }
index fc584c7..dcd91b2 100644 (file)
@@ -194,7 +194,7 @@ struct lfsck_operations {
 
        void (*lfsck_fail)(const struct lu_env *env,
                           struct lfsck_component *com,
 
        void (*lfsck_fail)(const struct lu_env *env,
                           struct lfsck_component *com,
-                          bool oit, bool new_checked);
+                          bool new_checked);
 
        int (*lfsck_checkpoint)(const struct lu_env *env,
                                struct lfsck_component *com,
 
        int (*lfsck_checkpoint)(const struct lu_env *env,
                                struct lfsck_component *com,
@@ -214,7 +214,7 @@ struct lfsck_operations {
 
        int (*lfsck_post)(const struct lu_env *env,
                          struct lfsck_component *com,
 
        int (*lfsck_post)(const struct lu_env *env,
                          struct lfsck_component *com,
-                         int result);
+                         int result, bool init);
 
        int (*lfsck_dump)(const struct lu_env *env,
                          struct lfsck_component *com,
 
        int (*lfsck_dump)(const struct lu_env *env,
                          struct lfsck_component *com,
@@ -309,7 +309,8 @@ struct md_lfsck {
        unsigned int             ml_paused:1, /* The lfsck is paused. */
                                 ml_oit_over:1, /* oit is finished. */
                                 ml_drop_dryrun:1, /* Ever dryrun, not now. */
        unsigned int             ml_paused:1, /* The lfsck is paused. */
                                 ml_oit_over:1, /* oit is finished. */
                                 ml_drop_dryrun:1, /* Ever dryrun, not now. */
-                                ml_initialized:1; /* lfsck_setup is called. */
+                                ml_initialized:1, /* lfsck_setup is called. */
+                                ml_current_oit_processed:1;
 };
 
 enum lfsck_linkea_flags {
 };
 
 enum lfsck_linkea_flags {
index 77acd9e..1954b12 100644 (file)
@@ -1005,7 +1005,6 @@ static int osd_scrub_main(void *args)
                if (unlikely(!thread_is_running(thread)))
                        GOTO(post, rc = 0);
 
                if (unlikely(!thread_is_running(thread)))
                        GOTO(post, rc = 0);
 
-               LASSERT(scrub->os_pos_current >= ooc->ooc_pos_preload);
                scrub->os_pos_current = ooc->ooc_pos_preload;
        }
 
                scrub->os_pos_current = ooc->ooc_pos_preload;
        }
 
@@ -1922,7 +1921,7 @@ static __u64 osd_otable_it_store(const struct lu_env *env,
        struct osd_otable_cache *ooc = &it->ooi_cache;
        __u64                    hash;
 
        struct osd_otable_cache *ooc = &it->ooi_cache;
        __u64                    hash;
 
-       if (it->ooi_user_ready)
+       if (!it->ooi_user_ready)
                hash = ooc->ooc_pos_preload;
        else if (likely(ooc->ooc_consumer_idx != -1))
                hash = ooc->ooc_cache[ooc->ooc_consumer_idx].oic_lid.oii_ino;
                hash = ooc->ooc_pos_preload;
        else if (likely(ooc->ooc_consumer_idx != -1))
                hash = ooc->ooc_cache[ooc->ooc_consumer_idx].oic_lid.oii_ino;
@@ -1951,10 +1950,7 @@ static int osd_otable_it_load(const struct lu_env *env,
        if (hash > OSD_OTABLE_MAX_HASH)
                hash = OSD_OTABLE_MAX_HASH;
 
        if (hash > OSD_OTABLE_MAX_HASH)
                hash = OSD_OTABLE_MAX_HASH;
 
-       /* Skip the one that has been processed last time. */
-       if (ooc->ooc_pos_preload > hash)
-               ooc->ooc_pos_preload = hash;
-
+       ooc->ooc_pos_preload = hash;
        if (ooc->ooc_pos_preload <= LDISKFS_FIRST_INO(osd_sb(dev)))
                ooc->ooc_pos_preload = LDISKFS_FIRST_INO(osd_sb(dev)) + 1;
 
        if (ooc->ooc_pos_preload <= LDISKFS_FIRST_INO(osd_sb(dev)))
                ooc->ooc_pos_preload = LDISKFS_FIRST_INO(osd_sb(dev)) + 1;
 
index 80655d9..510b798 100644 (file)
@@ -62,7 +62,7 @@ lfsck_prep() {
 
        echo "preparing... ${nfiles} * ${ndirs} files will be created."
        mkdir -p $DIR/$tdir
 
        echo "preparing... ${nfiles} * ${ndirs} files will be created."
        mkdir -p $DIR/$tdir
-       cp $LUSTRE/tests/*.sh $DIR/$tdir/
+       cp $LUSTRE/tests/*.sh $DIR/
        for ((i=0; i<${ndirs}; i++)); do
                mkdir $DIR/$tdir/d${i}
                touch $DIR/$tdir/f${i}
        for ((i=0; i<${ndirs}; i++)); do
                mkdir $DIR/$tdir/d${i}
                touch $DIR/$tdir/f${i}