Whamcloud - gitweb
3eb3a02aa24ae6c68f8da0690064d114e5c12336
[fs/lustre-release.git] / lustre / lfsck / lfsck_lib.c
1 /*
2  * GPL HEADER START
3  *
4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 only,
8  * as published by the Free Software Foundation.
9
10  * This program is distributed in the hope that it will be useful,
11  * but WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13  * GNU General Public License version 2 for more details.  A copy is
14  * included in the COPYING file that accompanied this code.
15
16  * You should have received a copy of the GNU General Public License
17  * along with this program; if not, write to the Free Software
18  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19  *
20  * GPL HEADER END
21  */
22 /*
23  * Copyright (c) 2012, 2013, Intel Corporation.
24  */
25 /*
26  * lustre/lfsck/lfsck_lib.c
27  *
28  * Author: Fan, Yong <fan.yong@intel.com>
29  */
30
31 #define DEBUG_SUBSYSTEM S_LFSCK
32
33 #include <libcfs/list.h>
34 #include <lu_object.h>
35 #include <dt_object.h>
36 #include <md_object.h>
37 #include <lustre_fld.h>
38 #include <lustre_lib.h>
39 #include <lustre_net.h>
40 #include <lustre_lfsck.h>
41 #include <lustre/lustre_lfsck_user.h>
42
43 #include "lfsck_internal.h"
44
45 /* define lfsck thread key */
46 LU_KEY_INIT(lfsck, struct lfsck_thread_info);
47
48 static void lfsck_key_fini(const struct lu_context *ctx,
49                            struct lu_context_key *key, void *data)
50 {
51         struct lfsck_thread_info *info = data;
52
53         lu_buf_free(&info->lti_linkea_buf);
54         OBD_FREE_PTR(info);
55 }
56
57 LU_CONTEXT_KEY_DEFINE(lfsck, LCT_MD_THREAD | LCT_DT_THREAD);
58 LU_KEY_INIT_GENERIC(lfsck);
59
/* Every LFSCK instance added by lfsck_instance_add(), linked via li_link. */
60 static CFS_LIST_HEAD(lfsck_instance_list);
/*
 * Target descriptors (OST / MDT) not yet attached to an instance.
 * lfsck_add_target_from_orphan() claims the entries whose ltd_key equals
 * the instance's li_bottom.
 * NOTE(review): these heads have no static initializer; they must be
 * INIT_LIST_HEAD()ed before first use - that code is not visible here.
 */
61 static struct list_head lfsck_ost_orphan_list;
62 static struct list_head lfsck_mdt_orphan_list;
/* Held around every walk or update of the three lists above in this file. */
63 static DEFINE_SPINLOCK(lfsck_instance_lock);
64
/*
 * Printable name for each enum lfsck_status value, indexed by the status
 * itself.  Read only through lfsck_status2names(), which range-checks the
 * index against LS_MAX first.
 */
65 static const char *lfsck_status_names[] = {
66         [LS_INIT]               = "init",
67         [LS_SCANNING_PHASE1]    = "scanning-phase1",
68         [LS_SCANNING_PHASE2]    = "scanning-phase2",
69         [LS_COMPLETED]          = "completed",
70         [LS_FAILED]             = "failed",
71         [LS_STOPPED]            = "stopped",
72         [LS_PAUSED]             = "paused",
73         [LS_CRASHED]            = "crashed",
74         [LS_PARTIAL]            = "partial",
75         [LS_CO_FAILED]          = "co-failed",
76         [LS_CO_STOPPED]         = "co-stopped",
77         [LS_CO_PAUSED]          = "co-paused"
78 };
79
/*
 * Printable names for flag bits, one slot per bit position (slot i names
 * bit i, which is how lfsck_bits_dump() indexes a names table).  The last
 * slot is an explicit NULL.
 */
const char *lfsck_flags_names[] = {
        [0] = "scanned-once",
        [1] = "inconsistent",
        [2] = "upgrade",
        [3] = "incomplete",
        [4] = "crashed_lastid",
        [5] = NULL
};
88
/*
 * Printable names for parameter bits, one slot per bit position.  Slot 0
 * is deliberately NULL (that bit has no printable name) and the last slot
 * is an explicit NULL as well.
 */
const char *lfsck_param_names[] = {
        [0] = NULL,
        [1] = "failout",
        [2] = "dryrun",
        [3] = "all_targets",
        [4] = NULL
};
96
97 const char *lfsck_status2names(enum lfsck_status status)
98 {
99         if (unlikely(status < 0 || status >= LS_MAX))
100                 return "unknown";
101
102         return lfsck_status_names[status];
103 }
104
105 static int lfsck_tgt_descs_init(struct lfsck_tgt_descs *ltds)
106 {
107         spin_lock_init(&ltds->ltd_lock);
108         init_rwsem(&ltds->ltd_rw_sem);
109         INIT_LIST_HEAD(&ltds->ltd_orphan);
110         ltds->ltd_tgts_bitmap = CFS_ALLOCATE_BITMAP(BITS_PER_LONG);
111         if (ltds->ltd_tgts_bitmap == NULL)
112                 return -ENOMEM;
113
114         return 0;
115 }
116
117 static void lfsck_tgt_descs_fini(struct lfsck_tgt_descs *ltds)
118 {
119         struct lfsck_tgt_desc   *ltd;
120         struct lfsck_tgt_desc   *next;
121         int                      idx;
122
123         down_write(&ltds->ltd_rw_sem);
124
125         list_for_each_entry_safe(ltd, next, &ltds->ltd_orphan,
126                                  ltd_orphan_list) {
127                 list_del_init(&ltd->ltd_orphan_list);
128                 lfsck_tgt_put(ltd);
129         }
130
131         if (unlikely(ltds->ltd_tgts_bitmap == NULL)) {
132                 up_write(&ltds->ltd_rw_sem);
133
134                 return;
135         }
136
137         cfs_foreach_bit(ltds->ltd_tgts_bitmap, idx) {
138                 ltd = LTD_TGT(ltds, idx);
139                 if (likely(ltd != NULL)) {
140                         LASSERT(list_empty(&ltd->ltd_layout_list));
141                         LASSERT(list_empty(&ltd->ltd_layout_phase_list));
142
143                         ltds->ltd_tgtnr--;
144                         cfs_bitmap_clear(ltds->ltd_tgts_bitmap, idx);
145                         LTD_TGT(ltds, idx) = NULL;
146                         lfsck_tgt_put(ltd);
147                 }
148         }
149
150         LASSERTF(ltds->ltd_tgtnr == 0, "tgt count unmatched: %d\n",
151                  ltds->ltd_tgtnr);
152
153         for (idx = 0; idx < TGT_PTRS; idx++) {
154                 if (ltds->ltd_tgts_idx[idx] != NULL) {
155                         OBD_FREE_PTR(ltds->ltd_tgts_idx[idx]);
156                         ltds->ltd_tgts_idx[idx] = NULL;
157                 }
158         }
159
160         CFS_FREE_BITMAP(ltds->ltd_tgts_bitmap);
161         ltds->ltd_tgts_bitmap = NULL;
162         up_write(&ltds->ltd_rw_sem);
163 }
164
165 static int __lfsck_add_target(const struct lu_env *env,
166                               struct lfsck_instance *lfsck,
167                               struct lfsck_tgt_desc *ltd,
168                               bool for_ost, bool locked)
169 {
170         struct lfsck_tgt_descs *ltds;
171         __u32                   index = ltd->ltd_index;
172         int                     rc    = 0;
173         ENTRY;
174
175         if (for_ost)
176                 ltds = &lfsck->li_ost_descs;
177         else
178                 ltds = &lfsck->li_mdt_descs;
179
180         if (!locked)
181                 down_write(&ltds->ltd_rw_sem);
182
183         LASSERT(ltds->ltd_tgts_bitmap != NULL);
184
185         if (index >= ltds->ltd_tgts_bitmap->size) {
186                 __u32 newsize = max((__u32)ltds->ltd_tgts_bitmap->size,
187                                     (__u32)BITS_PER_LONG);
188                 cfs_bitmap_t *old_bitmap = ltds->ltd_tgts_bitmap;
189                 cfs_bitmap_t *new_bitmap;
190
191                 while (newsize < index + 1)
192                         newsize <<= 1;
193
194                 new_bitmap = CFS_ALLOCATE_BITMAP(newsize);
195                 if (new_bitmap == NULL)
196                         GOTO(unlock, rc = -ENOMEM);
197
198                 if (ltds->ltd_tgtnr > 0)
199                         cfs_bitmap_copy(new_bitmap, old_bitmap);
200                 ltds->ltd_tgts_bitmap = new_bitmap;
201                 CFS_FREE_BITMAP(old_bitmap);
202         }
203
204         if (cfs_bitmap_check(ltds->ltd_tgts_bitmap, index)) {
205                 CERROR("%s: the device %s (%u) is registered already\n",
206                        lfsck_lfsck2name(lfsck),
207                        ltd->ltd_tgt->dd_lu_dev.ld_obd->obd_name, index);
208                 GOTO(unlock, rc = -EEXIST);
209         }
210
211         if (ltds->ltd_tgts_idx[index / TGT_PTRS_PER_BLOCK] == NULL) {
212                 OBD_ALLOC_PTR(ltds->ltd_tgts_idx[index / TGT_PTRS_PER_BLOCK]);
213                 if (ltds->ltd_tgts_idx[index / TGT_PTRS_PER_BLOCK] == NULL)
214                         GOTO(unlock, rc = -ENOMEM);
215         }
216
217         LTD_TGT(ltds, index) = ltd;
218         cfs_bitmap_set(ltds->ltd_tgts_bitmap, index);
219         ltds->ltd_tgtnr++;
220
221         GOTO(unlock, rc = 0);
222
223 unlock:
224         if (!locked)
225                 up_write(&ltds->ltd_rw_sem);
226
227         return rc;
228 }
229
230 static int lfsck_add_target_from_orphan(const struct lu_env *env,
231                                         struct lfsck_instance *lfsck)
232 {
233         struct lfsck_tgt_descs  *ltds    = &lfsck->li_ost_descs;
234         struct lfsck_tgt_desc   *ltd;
235         struct lfsck_tgt_desc   *next;
236         struct list_head        *head    = &lfsck_ost_orphan_list;
237         int                      rc;
238         bool                     for_ost = true;
239
240 again:
241         spin_lock(&lfsck_instance_lock);
242         list_for_each_entry_safe(ltd, next, head, ltd_orphan_list) {
243                 if (ltd->ltd_key == lfsck->li_bottom) {
244                         list_del_init(&ltd->ltd_orphan_list);
245                         list_add_tail(&ltd->ltd_orphan_list,
246                                       &ltds->ltd_orphan);
247                 }
248         }
249         spin_unlock(&lfsck_instance_lock);
250
251         down_write(&ltds->ltd_rw_sem);
252         while (!list_empty(&ltds->ltd_orphan)) {
253                 ltd = list_entry(ltds->ltd_orphan.next,
254                                  struct lfsck_tgt_desc,
255                                  ltd_orphan_list);
256                 list_del_init(&ltd->ltd_orphan_list);
257                 rc = __lfsck_add_target(env, lfsck, ltd, for_ost, true);
258                 /* Do not hold the semaphore for too long time. */
259                 up_write(&ltds->ltd_rw_sem);
260                 if (rc != 0)
261                         return rc;
262
263                 down_write(&ltds->ltd_rw_sem);
264         }
265         up_write(&ltds->ltd_rw_sem);
266
267         if (for_ost) {
268                 ltds = &lfsck->li_mdt_descs;
269                 head = &lfsck_mdt_orphan_list;
270                 for_ost = false;
271                 goto again;
272         }
273
274         return 0;
275 }
276
277 static inline struct lfsck_component *
278 __lfsck_component_find(struct lfsck_instance *lfsck, __u16 type, cfs_list_t *list)
279 {
280         struct lfsck_component *com;
281
282         cfs_list_for_each_entry(com, list, lc_link) {
283                 if (com->lc_type == type)
284                         return com;
285         }
286         return NULL;
287 }
288
289 static struct lfsck_component *
290 lfsck_component_find(struct lfsck_instance *lfsck, __u16 type)
291 {
292         struct lfsck_component *com;
293
294         spin_lock(&lfsck->li_lock);
295         com = __lfsck_component_find(lfsck, type, &lfsck->li_list_scan);
296         if (com != NULL)
297                 goto unlock;
298
299         com = __lfsck_component_find(lfsck, type,
300                                      &lfsck->li_list_double_scan);
301         if (com != NULL)
302                 goto unlock;
303
304         com = __lfsck_component_find(lfsck, type, &lfsck->li_list_idle);
305
306 unlock:
307         if (com != NULL)
308                 lfsck_component_get(com);
309         spin_unlock(&lfsck->li_lock);
310         return com;
311 }
312
313 void lfsck_component_cleanup(const struct lu_env *env,
314                              struct lfsck_component *com)
315 {
316         if (!cfs_list_empty(&com->lc_link))
317                 cfs_list_del_init(&com->lc_link);
318         if (!cfs_list_empty(&com->lc_link_dir))
319                 cfs_list_del_init(&com->lc_link_dir);
320
321         lfsck_component_put(env, com);
322 }
323
324 void lfsck_instance_cleanup(const struct lu_env *env,
325                             struct lfsck_instance *lfsck)
326 {
327         struct ptlrpc_thread    *thread = &lfsck->li_thread;
328         struct lfsck_component  *com;
329         ENTRY;
330
331         LASSERT(list_empty(&lfsck->li_link));
332         LASSERT(thread_is_init(thread) || thread_is_stopped(thread));
333
334         if (lfsck->li_obj_oit != NULL) {
335                 lu_object_put_nocache(env, &lfsck->li_obj_oit->do_lu);
336                 lfsck->li_obj_oit = NULL;
337         }
338
339         LASSERT(lfsck->li_obj_dir == NULL);
340
341         while (!cfs_list_empty(&lfsck->li_list_scan)) {
342                 com = cfs_list_entry(lfsck->li_list_scan.next,
343                                      struct lfsck_component,
344                                      lc_link);
345                 lfsck_component_cleanup(env, com);
346         }
347
348         LASSERT(cfs_list_empty(&lfsck->li_list_dir));
349
350         while (!cfs_list_empty(&lfsck->li_list_double_scan)) {
351                 com = cfs_list_entry(lfsck->li_list_double_scan.next,
352                                      struct lfsck_component,
353                                      lc_link);
354                 lfsck_component_cleanup(env, com);
355         }
356
357         while (!cfs_list_empty(&lfsck->li_list_idle)) {
358                 com = cfs_list_entry(lfsck->li_list_idle.next,
359                                      struct lfsck_component,
360                                      lc_link);
361                 lfsck_component_cleanup(env, com);
362         }
363
364         lfsck_tgt_descs_fini(&lfsck->li_ost_descs);
365         lfsck_tgt_descs_fini(&lfsck->li_mdt_descs);
366
367         if (lfsck->li_bookmark_obj != NULL) {
368                 lu_object_put_nocache(env, &lfsck->li_bookmark_obj->do_lu);
369                 lfsck->li_bookmark_obj = NULL;
370         }
371
372         if (lfsck->li_los != NULL) {
373                 local_oid_storage_fini(env, lfsck->li_los);
374                 lfsck->li_los = NULL;
375         }
376
377         OBD_FREE_PTR(lfsck);
378 }
379
380 static inline struct lfsck_instance *
381 __lfsck_instance_find(struct dt_device *key, bool ref, bool unlink)
382 {
383         struct lfsck_instance *lfsck;
384
385         cfs_list_for_each_entry(lfsck, &lfsck_instance_list, li_link) {
386                 if (lfsck->li_bottom == key) {
387                         if (ref)
388                                 lfsck_instance_get(lfsck);
389                         if (unlink)
390                                 list_del_init(&lfsck->li_link);
391
392                         return lfsck;
393                 }
394         }
395
396         return NULL;
397 }
398
399 static inline struct lfsck_instance *lfsck_instance_find(struct dt_device *key,
400                                                          bool ref, bool unlink)
401 {
402         struct lfsck_instance *lfsck;
403
404         spin_lock(&lfsck_instance_lock);
405         lfsck = __lfsck_instance_find(key, ref, unlink);
406         spin_unlock(&lfsck_instance_lock);
407
408         return lfsck;
409 }
410
411 static inline int lfsck_instance_add(struct lfsck_instance *lfsck)
412 {
413         struct lfsck_instance *tmp;
414
415         spin_lock(&lfsck_instance_lock);
416         cfs_list_for_each_entry(tmp, &lfsck_instance_list, li_link) {
417                 if (lfsck->li_bottom == tmp->li_bottom) {
418                         spin_unlock(&lfsck_instance_lock);
419                         return -EEXIST;
420                 }
421         }
422
423         cfs_list_add_tail(&lfsck->li_link, &lfsck_instance_list);
424         spin_unlock(&lfsck_instance_lock);
425         return 0;
426 }
427
/*
 * Format "<prefix>: name,name,...\n" for the bits set in \a bits.
 *
 * Bit i is printed as names[i]; bits whose name is NULL are consumed
 * silently.  When \a bits is zero the output is just "<prefix>:\n".
 * \a names must have an entry for every bit that may be set.
 *
 * \param[in,out] buf   output cursor, advanced past what was written
 * \param[in,out] len   space left at *buf, reduced by what was written
 * \param[in] bits      the bit mask to describe
 * \param[in] names     per-bit names, indexed by bit position
 * \param[in] prefix    label printed before the names
 *
 * \retval positive     number of characters written
 * \retval -ENOSPC      the output did not fit (or formatting failed);
 *                      *buf / *len never move past the buffer
 */
int lfsck_bits_dump(char **buf, int *len, int bits, const char *names[],
                    const char *prefix)
{
        /* Work on an unsigned copy: shifting into bit 31 of a signed int
         * is undefined. */
        unsigned int todo = (unsigned int)bits;
        unsigned int flag;
        int save = *len;
        int rc;
        int i;

        if (*len <= 0)
                return -ENOSPC;

        rc = snprintf(*buf, *len, "%s:%c", prefix, todo != 0 ? ' ' : '\n');
        /* snprintf() returns the length it wanted to write, so a value
         * >= the space left means the output was truncated. */
        if (rc <= 0 || rc >= *len)
                return -ENOSPC;

        *buf += rc;
        *len -= rc;
        for (i = 0; todo != 0; i++) {
                flag = 1U << i;
                if (!(todo & flag))
                        continue;

                todo &= ~flag;
                if (names[i] == NULL)
                        continue;

                rc = snprintf(*buf, *len, "%s%c", names[i],
                              todo != 0 ? ',' : '\n');
                if (rc <= 0 || rc >= *len)
                        return -ENOSPC;

                *buf += rc;
                *len -= rc;
        }

        return save - *len;
}
458
459 int lfsck_time_dump(char **buf, int *len, __u64 time, const char *prefix)
460 {
461         int rc;
462
463         if (time != 0)
464                 rc = snprintf(*buf, *len, "%s: "LPU64" seconds\n", prefix,
465                               cfs_time_current_sec() - time);
466         else
467                 rc = snprintf(*buf, *len, "%s: N/A\n", prefix);
468         if (rc <= 0)
469                 return -ENOSPC;
470
471         *buf += rc;
472         *len -= rc;
473         return rc;
474 }
475
476 int lfsck_pos_dump(char **buf, int *len, struct lfsck_position *pos,
477                    const char *prefix)
478 {
479         int rc;
480
481         if (fid_is_zero(&pos->lp_dir_parent)) {
482                 if (pos->lp_oit_cookie == 0)
483                         rc = snprintf(*buf, *len, "%s: N/A, N/A, N/A\n",
484                                       prefix);
485                 else
486                         rc = snprintf(*buf, *len, "%s: "LPU64", N/A, N/A\n",
487                                       prefix, pos->lp_oit_cookie);
488         } else {
489                 rc = snprintf(*buf, *len, "%s: "LPU64", "DFID", "LPU64"\n",
490                               prefix, pos->lp_oit_cookie,
491                               PFID(&pos->lp_dir_parent), pos->lp_dir_cookie);
492         }
493         if (rc <= 0)
494                 return -ENOSPC;
495
496         *buf += rc;
497         *len -= rc;
498         return rc;
499 }
500
501 void lfsck_pos_fill(const struct lu_env *env, struct lfsck_instance *lfsck,
502                     struct lfsck_position *pos, bool init)
503 {
504         const struct dt_it_ops *iops = &lfsck->li_obj_oit->do_index_ops->dio_it;
505
506         if (unlikely(lfsck->li_di_oit == NULL)) {
507                 memset(pos, 0, sizeof(*pos));
508                 return;
509         }
510
511         pos->lp_oit_cookie = iops->store(env, lfsck->li_di_oit);
512         if (!lfsck->li_current_oit_processed && !init)
513                 pos->lp_oit_cookie--;
514
515         LASSERT(pos->lp_oit_cookie > 0);
516
517         if (lfsck->li_di_dir != NULL) {
518                 struct dt_object *dto = lfsck->li_obj_dir;
519
520                 pos->lp_dir_cookie = dto->do_index_ops->dio_it.store(env,
521                                                         lfsck->li_di_dir);
522
523                 if (pos->lp_dir_cookie >= MDS_DIR_END_OFF) {
524                         fid_zero(&pos->lp_dir_parent);
525                         pos->lp_dir_cookie = 0;
526                 } else {
527                         pos->lp_dir_parent = *lfsck_dto2fid(dto);
528                 }
529         } else {
530                 fid_zero(&pos->lp_dir_parent);
531                 pos->lp_dir_cookie = 0;
532         }
533 }
534
535 static void __lfsck_set_speed(struct lfsck_instance *lfsck, __u32 limit)
536 {
537         lfsck->li_bookmark_ram.lb_speed_limit = limit;
538         if (limit != LFSCK_SPEED_NO_LIMIT) {
539                 if (limit > HZ) {
540                         lfsck->li_sleep_rate = limit / HZ;
541                         lfsck->li_sleep_jif = 1;
542                 } else {
543                         lfsck->li_sleep_rate = 1;
544                         lfsck->li_sleep_jif = HZ / limit;
545                 }
546         } else {
547                 lfsck->li_sleep_jif = 0;
548                 lfsck->li_sleep_rate = 0;
549         }
550 }
551
552 void lfsck_control_speed(struct lfsck_instance *lfsck)
553 {
554         struct ptlrpc_thread *thread = &lfsck->li_thread;
555         struct l_wait_info    lwi;
556
557         if (lfsck->li_sleep_jif > 0 &&
558             lfsck->li_new_scanned >= lfsck->li_sleep_rate) {
559                 lwi = LWI_TIMEOUT_INTR(lfsck->li_sleep_jif, NULL,
560                                        LWI_ON_SIGNAL_NOOP, NULL);
561
562                 l_wait_event(thread->t_ctl_waitq,
563                              !thread_is_running(thread),
564                              &lwi);
565                 lfsck->li_new_scanned = 0;
566         }
567 }
568
569 void lfsck_control_speed_by_self(struct lfsck_component *com)
570 {
571         struct lfsck_instance   *lfsck  = com->lc_lfsck;
572         struct ptlrpc_thread    *thread = &lfsck->li_thread;
573         struct l_wait_info       lwi;
574
575         if (lfsck->li_sleep_jif > 0 &&
576             com->lc_new_scanned >= lfsck->li_sleep_rate) {
577                 lwi = LWI_TIMEOUT_INTR(lfsck->li_sleep_jif, NULL,
578                                        LWI_ON_SIGNAL_NOOP, NULL);
579
580                 l_wait_event(thread->t_ctl_waitq,
581                              !thread_is_running(thread),
582                              &lwi);
583                 com->lc_new_scanned = 0;
584         }
585 }
586
587 static int lfsck_parent_fid(const struct lu_env *env, struct dt_object *obj,
588                             struct lu_fid *fid)
589 {
590         if (unlikely(!S_ISDIR(lfsck_object_type(obj)) ||
591                      !dt_try_as_dir(env, obj)))
592                 return -ENOTDIR;
593
594         return dt_lookup(env, obj, (struct dt_rec *)fid,
595                          (const struct dt_key *)"..", BYPASS_CAPA);
596 }
597
598 static int lfsck_needs_scan_dir(const struct lu_env *env,
599                                 struct lfsck_instance *lfsck,
600                                 struct dt_object *obj)
601 {
602         struct lu_fid *fid   = &lfsck_env_info(env)->lti_fid;
603         int            depth = 0;
604         int            rc;
605
606         if (!lfsck->li_master || !S_ISDIR(lfsck_object_type(obj)) ||
607             cfs_list_empty(&lfsck->li_list_dir))
608                RETURN(0);
609
610         while (1) {
611                 /* XXX: Currently, we do not scan the "/REMOTE_PARENT_DIR",
612                  *      which is the agent directory to manage the objects
613                  *      which name entries reside on remote MDTs. Related
614                  *      consistency verification will be processed in LFSCK
615                  *      phase III. */
616                 if (lu_fid_eq(lfsck_dto2fid(obj), &lfsck->li_global_root_fid)) {
617                         if (depth > 0)
618                                 lfsck_object_put(env, obj);
619                         return 1;
620                 }
621
622                 /* .lustre doesn't contain "real" user objects, no need lfsck */
623                 if (fid_is_dot_lustre(lfsck_dto2fid(obj))) {
624                         if (depth > 0)
625                                 lfsck_object_put(env, obj);
626                         return 0;
627                 }
628
629                 dt_read_lock(env, obj, MOR_TGT_CHILD);
630                 if (unlikely(lfsck_is_dead_obj(obj))) {
631                         dt_read_unlock(env, obj);
632                         if (depth > 0)
633                                 lfsck_object_put(env, obj);
634                         return 0;
635                 }
636
637                 rc = dt_xattr_get(env, obj,
638                                   lfsck_buf_get(env, NULL, 0), XATTR_NAME_LINK,
639                                   BYPASS_CAPA);
640                 dt_read_unlock(env, obj);
641                 if (rc >= 0) {
642                         if (depth > 0)
643                                 lfsck_object_put(env, obj);
644                         return 1;
645                 }
646
647                 if (rc < 0 && rc != -ENODATA) {
648                         if (depth > 0)
649                                 lfsck_object_put(env, obj);
650                         return rc;
651                 }
652
653                 rc = lfsck_parent_fid(env, obj, fid);
654                 if (depth > 0)
655                         lfsck_object_put(env, obj);
656                 if (rc != 0)
657                         return rc;
658
659                 if (unlikely(lu_fid_eq(fid, &lfsck->li_local_root_fid)))
660                         return 0;
661
662                 obj = lfsck_object_find(env, lfsck, fid);
663                 if (obj == NULL)
664                         return 0;
665                 else if (IS_ERR(obj))
666                         return PTR_ERR(obj);
667
668                 if (!dt_object_exists(obj)) {
669                         lfsck_object_put(env, obj);
670                         return 0;
671                 }
672
673                 /* Currently, only client visible directory can be remote. */
674                 if (dt_object_remote(obj)) {
675                         lfsck_object_put(env, obj);
676                         return 1;
677                 }
678
679                 depth++;
680         }
681         return 0;
682 }
683
684 struct lfsck_thread_args *lfsck_thread_args_init(struct lfsck_instance *lfsck,
685                                                  struct lfsck_component *com,
686                                                  struct lfsck_start_param *lsp)
687 {
688         struct lfsck_thread_args *lta;
689         int                       rc;
690
691         OBD_ALLOC_PTR(lta);
692         if (lta == NULL)
693                 return ERR_PTR(-ENOMEM);
694
695         rc = lu_env_init(&lta->lta_env, LCT_MD_THREAD | LCT_DT_THREAD);
696         if (rc != 0) {
697                 OBD_FREE_PTR(lta);
698                 return ERR_PTR(rc);
699         }
700
701         lta->lta_lfsck = lfsck_instance_get(lfsck);
702         if (com != NULL)
703                 lta->lta_com = lfsck_component_get(com);
704
705         lta->lta_lsp = lsp;
706
707         return lta;
708 }
709
710 void lfsck_thread_args_fini(struct lfsck_thread_args *lta)
711 {
712         if (lta->lta_com != NULL)
713                 lfsck_component_put(&lta->lta_env, lta->lta_com);
714         lfsck_instance_put(&lta->lta_env, lta->lta_lfsck);
715         lu_env_fini(&lta->lta_env);
716         OBD_FREE_PTR(lta);
717 }
718
719 /* LFSCK wrap functions */
720
721 void lfsck_fail(const struct lu_env *env, struct lfsck_instance *lfsck,
722                 bool new_checked)
723 {
724         struct lfsck_component *com;
725
726         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
727                 com->lc_ops->lfsck_fail(env, com, new_checked);
728         }
729 }
730
731 int lfsck_checkpoint(const struct lu_env *env, struct lfsck_instance *lfsck)
732 {
733         struct lfsck_component *com;
734         int                     rc  = 0;
735         int                     rc1 = 0;
736
737         if (likely(cfs_time_beforeq(cfs_time_current(),
738                                     lfsck->li_time_next_checkpoint)))
739                 return 0;
740
741         lfsck_pos_fill(env, lfsck, &lfsck->li_pos_current, false);
742         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
743                 rc = com->lc_ops->lfsck_checkpoint(env, com, false);
744                 if (rc != 0)
745                         rc1 = rc;
746         }
747
748         lfsck->li_time_last_checkpoint = cfs_time_current();
749         lfsck->li_time_next_checkpoint = lfsck->li_time_last_checkpoint +
750                                 cfs_time_seconds(LFSCK_CHECKPOINT_INTERVAL);
751         return rc1 != 0 ? rc1 : rc;
752 }
753
754 int lfsck_prep(const struct lu_env *env, struct lfsck_instance *lfsck,
755                struct lfsck_start_param *lsp)
756 {
757         struct dt_object       *obj     = NULL;
758         struct lfsck_component *com;
759         struct lfsck_component *next;
760         struct lfsck_position  *pos     = NULL;
761         const struct dt_it_ops *iops    =
762                                 &lfsck->li_obj_oit->do_index_ops->dio_it;
763         struct dt_it           *di;
764         int                     rc;
765         ENTRY;
766
767         LASSERT(lfsck->li_obj_dir == NULL);
768         LASSERT(lfsck->li_di_dir == NULL);
769
770         lfsck->li_current_oit_processed = 0;
771         cfs_list_for_each_entry_safe(com, next, &lfsck->li_list_scan, lc_link) {
772                 com->lc_new_checked = 0;
773                 if (lfsck->li_bookmark_ram.lb_param & LPF_DRYRUN)
774                         com->lc_journal = 0;
775
776                 rc = com->lc_ops->lfsck_prep(env, com, lsp);
777                 if (rc != 0)
778                         GOTO(out, rc);
779
780                 if ((pos == NULL) ||
781                     (!lfsck_pos_is_zero(&com->lc_pos_start) &&
782                      lfsck_pos_is_eq(pos, &com->lc_pos_start) > 0))
783                         pos = &com->lc_pos_start;
784         }
785
786         /* Init otable-based iterator. */
787         if (pos == NULL) {
788                 rc = iops->load(env, lfsck->li_di_oit, 0);
789                 if (rc > 0) {
790                         lfsck->li_oit_over = 1;
791                         rc = 0;
792                 }
793
794                 GOTO(out, rc);
795         }
796
797         rc = iops->load(env, lfsck->li_di_oit, pos->lp_oit_cookie);
798         if (rc < 0)
799                 GOTO(out, rc);
800         else if (rc > 0)
801                 lfsck->li_oit_over = 1;
802
803         if (!lfsck->li_master || fid_is_zero(&pos->lp_dir_parent))
804                 GOTO(out, rc = 0);
805
806         /* Find the directory for namespace-based traverse. */
807         obj = lfsck_object_find(env, lfsck, &pos->lp_dir_parent);
808         if (obj == NULL)
809                 GOTO(out, rc = 0);
810         else if (IS_ERR(obj))
811                 RETURN(PTR_ERR(obj));
812
813         /* XXX: Currently, skip remote object, the consistency for
814          *      remote object will be processed in LFSCK phase III. */
815         if (!dt_object_exists(obj) || dt_object_remote(obj) ||
816             unlikely(!S_ISDIR(lfsck_object_type(obj))))
817                 GOTO(out, rc = 0);
818
819         if (unlikely(!dt_try_as_dir(env, obj)))
820                 GOTO(out, rc = -ENOTDIR);
821
822         /* Init the namespace-based directory traverse. */
823         iops = &obj->do_index_ops->dio_it;
824         di = iops->init(env, obj, lfsck->li_args_dir, BYPASS_CAPA);
825         if (IS_ERR(di))
826                 GOTO(out, rc = PTR_ERR(di));
827
828         LASSERT(pos->lp_dir_cookie < MDS_DIR_END_OFF);
829
830         rc = iops->load(env, di, pos->lp_dir_cookie);
831         if ((rc == 0) || (rc > 0 && pos->lp_dir_cookie > 0))
832                 rc = iops->next(env, di);
833         else if (rc > 0)
834                 rc = 0;
835
836         if (rc != 0) {
837                 iops->put(env, di);
838                 iops->fini(env, di);
839                 GOTO(out, rc);
840         }
841
842         lfsck->li_obj_dir = lfsck_object_get(obj);
843         lfsck->li_cookie_dir = iops->store(env, di);
844         spin_lock(&lfsck->li_lock);
845         lfsck->li_di_dir = di;
846         spin_unlock(&lfsck->li_lock);
847
848         GOTO(out, rc = 0);
849
850 out:
851         if (obj != NULL)
852                 lfsck_object_put(env, obj);
853
854         if (rc < 0) {
855                 cfs_list_for_each_entry_safe(com, next, &lfsck->li_list_scan,
856                                              lc_link)
857                         com->lc_ops->lfsck_post(env, com, rc, true);
858
859                 return rc;
860         }
861
862         rc = 0;
863         lfsck_pos_fill(env, lfsck, &lfsck->li_pos_current, true);
864         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
865                 rc = com->lc_ops->lfsck_checkpoint(env, com, true);
866                 if (rc != 0)
867                         break;
868         }
869
870         lfsck->li_time_last_checkpoint = cfs_time_current();
871         lfsck->li_time_next_checkpoint = lfsck->li_time_last_checkpoint +
872                                 cfs_time_seconds(LFSCK_CHECKPOINT_INTERVAL);
873         return rc;
874 }
875
876 int lfsck_exec_oit(const struct lu_env *env, struct lfsck_instance *lfsck,
877                    struct dt_object *obj)
878 {
879         struct lfsck_component *com;
880         const struct dt_it_ops *iops;
881         struct dt_it           *di;
882         int                     rc;
883         ENTRY;
884
885         LASSERT(lfsck->li_obj_dir == NULL);
886
887         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
888                 rc = com->lc_ops->lfsck_exec_oit(env, com, obj);
889                 if (rc != 0)
890                         RETURN(rc);
891         }
892
893         rc = lfsck_needs_scan_dir(env, lfsck, obj);
894         if (rc <= 0)
895                 GOTO(out, rc);
896
897         if (unlikely(!dt_try_as_dir(env, obj)))
898                 GOTO(out, rc = -ENOTDIR);
899
900         iops = &obj->do_index_ops->dio_it;
901         di = iops->init(env, obj, lfsck->li_args_dir, BYPASS_CAPA);
902         if (IS_ERR(di))
903                 GOTO(out, rc = PTR_ERR(di));
904
905         rc = iops->load(env, di, 0);
906         if (rc == 0)
907                 rc = iops->next(env, di);
908         else if (rc > 0)
909                 rc = 0;
910
911         if (rc != 0) {
912                 iops->put(env, di);
913                 iops->fini(env, di);
914                 GOTO(out, rc);
915         }
916
917         lfsck->li_obj_dir = lfsck_object_get(obj);
918         lfsck->li_cookie_dir = iops->store(env, di);
919         spin_lock(&lfsck->li_lock);
920         lfsck->li_di_dir = di;
921         spin_unlock(&lfsck->li_lock);
922
923         GOTO(out, rc = 0);
924
925 out:
926         if (rc < 0)
927                 lfsck_fail(env, lfsck, false);
928         return (rc > 0 ? 0 : rc);
929 }
930
931 int lfsck_exec_dir(const struct lu_env *env, struct lfsck_instance *lfsck,
932                    struct dt_object *obj, struct lu_dirent *ent)
933 {
934         struct lfsck_component *com;
935         int                     rc;
936
937         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
938                 rc = com->lc_ops->lfsck_exec_dir(env, com, obj, ent);
939                 if (rc != 0)
940                         return rc;
941         }
942         return 0;
943 }
944
945 int lfsck_post(const struct lu_env *env, struct lfsck_instance *lfsck,
946                int result)
947 {
948         struct lfsck_component *com;
949         struct lfsck_component *next;
950         int                     rc  = 0;
951         int                     rc1 = 0;
952
953         lfsck_pos_fill(env, lfsck, &lfsck->li_pos_current, false);
954         cfs_list_for_each_entry_safe(com, next, &lfsck->li_list_scan, lc_link) {
955                 rc = com->lc_ops->lfsck_post(env, com, result, false);
956                 if (rc != 0)
957                         rc1 = rc;
958         }
959
960         lfsck->li_time_last_checkpoint = cfs_time_current();
961         lfsck->li_time_next_checkpoint = lfsck->li_time_last_checkpoint +
962                                 cfs_time_seconds(LFSCK_CHECKPOINT_INTERVAL);
963
964         /* Ignore some component post failure to make other can go ahead. */
965         return result;
966 }
967
968 int lfsck_double_scan(const struct lu_env *env, struct lfsck_instance *lfsck)
969 {
970         struct lfsck_component *com;
971         struct lfsck_component *next;
972         struct l_wait_info      lwi = { 0 };
973         int                     rc  = 0;
974         int                     rc1 = 0;
975
976         cfs_list_for_each_entry_safe(com, next, &lfsck->li_list_double_scan,
977                                      lc_link) {
978                 if (lfsck->li_bookmark_ram.lb_param & LPF_DRYRUN)
979                         com->lc_journal = 0;
980
981                 rc = com->lc_ops->lfsck_double_scan(env, com);
982                 if (rc != 0)
983                         rc1 = rc;
984         }
985
986         l_wait_event(lfsck->li_thread.t_ctl_waitq,
987                      atomic_read(&lfsck->li_double_scan_count) == 0,
988                      &lwi);
989
990         return rc1 != 0 ? rc1 : rc;
991 }
992
993 int lfsck_stop_notify(const struct lu_env *env, struct lfsck_instance *lfsck,
994                       struct lfsck_tgt_descs *ltds, struct lfsck_tgt_desc *ltd)
995 {
996         struct ptlrpc_request_set *set;
997         struct lfsck_component    *com;
998         int                        cnt = 0;
999         int                        rc  = 0;
1000         int                        rc1 = 0;
1001
1002         set = ptlrpc_prep_set();
1003         if (set == NULL)
1004                 return -ENOMEM;
1005
1006         list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
1007                 if (com->lc_ops->lfsck_stop_notify != NULL) {
1008                         rc = com->lc_ops->lfsck_stop_notify(env, com, ltds,
1009                                                             ltd, set);
1010                         if (rc != 0)
1011                                 rc1 = rc;
1012                         else
1013                                 cnt++;
1014                 }
1015         }
1016
1017         list_for_each_entry(com, &lfsck->li_list_double_scan, lc_link) {
1018                 if (com->lc_ops->lfsck_stop_notify != NULL) {
1019                         rc = com->lc_ops->lfsck_stop_notify(env, com, ltds,
1020                                                             ltd, set);
1021                         if (rc != 0)
1022                                 rc1 = rc;
1023                         else
1024                                 cnt++;
1025                 }
1026         }
1027
1028         if (cnt > 0)
1029                 rc = ptlrpc_set_wait(set);
1030         ptlrpc_set_destroy(set);
1031
1032         return rc1 != 0 ? rc1 : rc;
1033 }
1034
1035 void lfsck_quit(const struct lu_env *env, struct lfsck_instance *lfsck)
1036 {
1037         struct lfsck_component *com;
1038         struct lfsck_component *next;
1039
1040         list_for_each_entry_safe(com, next, &lfsck->li_list_scan,
1041                                  lc_link) {
1042                 if (com->lc_ops->lfsck_quit != NULL)
1043                         com->lc_ops->lfsck_quit(env, com);
1044         }
1045
1046         list_for_each_entry_safe(com, next, &lfsck->li_list_double_scan,
1047                                  lc_link) {
1048                 if (com->lc_ops->lfsck_quit != NULL)
1049                         com->lc_ops->lfsck_quit(env, com);
1050         }
1051 }
1052
1053 int lfsck_async_request(const struct lu_env *env, struct obd_export *exp,
1054                         struct lfsck_request *lr,
1055                         struct ptlrpc_request_set *set,
1056                         ptlrpc_interpterer_t interpreter,
1057                         void *args, int request)
1058 {
1059         struct lfsck_async_interpret_args *laia;
1060         struct ptlrpc_request             *req;
1061         struct lfsck_request              *tmp;
1062         struct req_format                 *format;
1063         int                                rc;
1064
1065         if (!(exp_connect_flags(exp) & OBD_CONNECT_LFSCK))
1066                 return -EOPNOTSUPP;
1067
1068         switch (request) {
1069         case LFSCK_NOTIFY:
1070                 format = &RQF_LFSCK_NOTIFY;
1071                 break;
1072         case LFSCK_QUERY:
1073                 format = &RQF_LFSCK_QUERY;
1074                 break;
1075         default:
1076                 CERROR("%s: unknown async request: opc = %d\n",
1077                        exp->exp_obd->obd_name, request);
1078                 return -EINVAL;
1079         }
1080
1081         req = ptlrpc_request_alloc(class_exp2cliimp(exp), format);
1082         if (req == NULL)
1083                 return -ENOMEM;
1084
1085         rc = ptlrpc_request_pack(req, LUSTRE_OBD_VERSION, request);
1086         if (rc != 0) {
1087                 ptlrpc_request_free(req);
1088
1089                 return rc;
1090         }
1091
1092         tmp = req_capsule_client_get(&req->rq_pill, &RMF_LFSCK_REQUEST);
1093         *tmp = *lr;
1094         ptlrpc_request_set_replen(req);
1095
1096         laia = ptlrpc_req_async_args(req);
1097         *laia = *(struct lfsck_async_interpret_args *)args;
1098         lfsck_component_get(laia->laia_com);
1099         req->rq_interpret_reply = interpreter;
1100         ptlrpc_set_add_req(set, req);
1101
1102         return 0;
1103 }
1104
1105 /* external interfaces */
1106
1107 int lfsck_get_speed(struct dt_device *key, void *buf, int len)
1108 {
1109         struct lu_env           env;
1110         struct lfsck_instance  *lfsck;
1111         int                     rc;
1112         ENTRY;
1113
1114         rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
1115         if (rc != 0)
1116                 RETURN(rc);
1117
1118         lfsck = lfsck_instance_find(key, true, false);
1119         if (likely(lfsck != NULL)) {
1120                 rc = snprintf(buf, len, "%u\n",
1121                               lfsck->li_bookmark_ram.lb_speed_limit);
1122                 lfsck_instance_put(&env, lfsck);
1123         } else {
1124                 rc = -ENODEV;
1125         }
1126
1127         lu_env_fini(&env);
1128
1129         RETURN(rc);
1130 }
1131 EXPORT_SYMBOL(lfsck_get_speed);
1132
1133 int lfsck_set_speed(struct dt_device *key, int val)
1134 {
1135         struct lu_env           env;
1136         struct lfsck_instance  *lfsck;
1137         int                     rc;
1138         ENTRY;
1139
1140         rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
1141         if (rc != 0)
1142                 RETURN(rc);
1143
1144         lfsck = lfsck_instance_find(key, true, false);
1145         if (likely(lfsck != NULL)) {
1146                 mutex_lock(&lfsck->li_mutex);
1147                 __lfsck_set_speed(lfsck, val);
1148                 rc = lfsck_bookmark_store(&env, lfsck);
1149                 mutex_unlock(&lfsck->li_mutex);
1150                 lfsck_instance_put(&env, lfsck);
1151         } else {
1152                 rc = -ENODEV;
1153         }
1154
1155         lu_env_fini(&env);
1156
1157         RETURN(rc);
1158 }
1159 EXPORT_SYMBOL(lfsck_set_speed);
1160
1161 int lfsck_get_windows(struct dt_device *key, void *buf, int len)
1162 {
1163         struct lu_env           env;
1164         struct lfsck_instance  *lfsck;
1165         int                     rc;
1166         ENTRY;
1167
1168         rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
1169         if (rc != 0)
1170                 RETURN(rc);
1171
1172         lfsck = lfsck_instance_find(key, true, false);
1173         if (likely(lfsck != NULL)) {
1174                 rc = snprintf(buf, len, "%u\n",
1175                               lfsck->li_bookmark_ram.lb_async_windows);
1176                 lfsck_instance_put(&env, lfsck);
1177         } else {
1178                 rc = -ENODEV;
1179         }
1180
1181         lu_env_fini(&env);
1182
1183         RETURN(rc);
1184 }
1185 EXPORT_SYMBOL(lfsck_get_windows);
1186
1187 int lfsck_set_windows(struct dt_device *key, int val)
1188 {
1189         struct lu_env           env;
1190         struct lfsck_instance  *lfsck;
1191         int                     rc;
1192         ENTRY;
1193
1194         rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
1195         if (rc != 0)
1196                 RETURN(rc);
1197
1198         lfsck = lfsck_instance_find(key, true, false);
1199         if (likely(lfsck != NULL)) {
1200                 if (val > LFSCK_ASYNC_WIN_MAX) {
1201                         CERROR("%s: Too large async windows size, which "
1202                                "may cause memory issues. The valid range "
1203                                "is [0 - %u]. If you do not want to restrict "
1204                                "the windows size for async requests pipeline, "
1205                                "just set it as 0.\n",
1206                                lfsck_lfsck2name(lfsck), LFSCK_ASYNC_WIN_MAX);
1207                         rc = -EINVAL;
1208                 } else if (lfsck->li_bookmark_ram.lb_async_windows != val) {
1209                         mutex_lock(&lfsck->li_mutex);
1210                         lfsck->li_bookmark_ram.lb_async_windows = val;
1211                         rc = lfsck_bookmark_store(&env, lfsck);
1212                         mutex_unlock(&lfsck->li_mutex);
1213                 }
1214                 lfsck_instance_put(&env, lfsck);
1215         } else {
1216                 rc = -ENODEV;
1217         }
1218
1219         lu_env_fini(&env);
1220
1221         RETURN(rc);
1222 }
1223 EXPORT_SYMBOL(lfsck_set_windows);
1224
1225 int lfsck_dump(struct dt_device *key, void *buf, int len, enum lfsck_type type)
1226 {
1227         struct lu_env           env;
1228         struct lfsck_instance  *lfsck;
1229         struct lfsck_component *com;
1230         int                     rc;
1231         ENTRY;
1232
1233         rc = lu_env_init(&env, LCT_MD_THREAD | LCT_DT_THREAD);
1234         if (rc != 0)
1235                 RETURN(rc);
1236
1237         lfsck = lfsck_instance_find(key, true, false);
1238         if (likely(lfsck != NULL)) {
1239                 com = lfsck_component_find(lfsck, type);
1240                 if (likely(com != NULL)) {
1241                         rc = com->lc_ops->lfsck_dump(&env, com, buf, len);
1242                         lfsck_component_put(&env, com);
1243                 } else {
1244                         rc = -ENOTSUPP;
1245                 }
1246
1247                 lfsck_instance_put(&env, lfsck);
1248         } else {
1249                 rc = -ENODEV;
1250         }
1251
1252         lu_env_fini(&env);
1253
1254         RETURN(rc);
1255 }
1256 EXPORT_SYMBOL(lfsck_dump);
1257
1258 int lfsck_start(const struct lu_env *env, struct dt_device *key,
1259                 struct lfsck_start_param *lsp)
1260 {
1261         struct lfsck_start              *start  = lsp->lsp_start;
1262         struct lfsck_instance           *lfsck;
1263         struct lfsck_bookmark           *bk;
1264         struct ptlrpc_thread            *thread;
1265         struct lfsck_component          *com;
1266         struct l_wait_info               lwi    = { 0 };
1267         struct lfsck_thread_args        *lta;
1268         bool                             dirty  = false;
1269         long                             rc     = 0;
1270         __u16                            valid  = 0;
1271         __u16                            flags  = 0;
1272         __u16                            type   = 1;
1273         ENTRY;
1274
1275         lfsck = lfsck_instance_find(key, true, false);
1276         if (unlikely(lfsck == NULL))
1277                 RETURN(-ENODEV);
1278
1279         /* start == NULL means auto trigger paused LFSCK. */
1280         if ((start == NULL) &&
1281             (cfs_list_empty(&lfsck->li_list_scan) ||
1282              OBD_FAIL_CHECK(OBD_FAIL_LFSCK_NO_AUTO)))
1283                 GOTO(put, rc = 0);
1284
1285         bk = &lfsck->li_bookmark_ram;
1286         thread = &lfsck->li_thread;
1287         mutex_lock(&lfsck->li_mutex);
1288         spin_lock(&lfsck->li_lock);
1289         if (!thread_is_init(thread) && !thread_is_stopped(thread)) {
1290                 rc = -EALREADY;
1291                 while (start->ls_active != 0) {
1292                         if (!(type & start->ls_active)) {
1293                                 type <<= 1;
1294                                 continue;
1295                         }
1296
1297                         com = __lfsck_component_find(lfsck, type,
1298                                                      &lfsck->li_list_scan);
1299                         if (com == NULL)
1300                                 com = __lfsck_component_find(lfsck, type,
1301                                                 &lfsck->li_list_double_scan);
1302                         if (com == NULL) {
1303                                 rc = -EOPNOTSUPP;
1304                                 break;
1305                         }
1306
1307                         if (com->lc_ops->lfsck_join != NULL) {
1308                                 rc = com->lc_ops->lfsck_join( env, com, lsp);
1309                                 if (rc != 0 && rc != -EALREADY)
1310                                         break;
1311                         }
1312                         start->ls_active &= ~type;
1313                         type <<= 1;
1314                 }
1315                 spin_unlock(&lfsck->li_lock);
1316                 GOTO(out, rc);
1317         }
1318         spin_unlock(&lfsck->li_lock);
1319
1320         lfsck->li_namespace = lsp->lsp_namespace;
1321         lfsck->li_status = 0;
1322         lfsck->li_oit_over = 0;
1323         lfsck->li_drop_dryrun = 0;
1324         lfsck->li_new_scanned = 0;
1325
1326         /* For auto trigger. */
1327         if (start == NULL)
1328                 goto trigger;
1329
1330         start->ls_version = bk->lb_version;
1331         if (start->ls_valid & LSV_SPEED_LIMIT) {
1332                 __lfsck_set_speed(lfsck, start->ls_speed_limit);
1333                 dirty = true;
1334         }
1335
1336         if (start->ls_valid & LSV_ASYNC_WINDOWS &&
1337             bk->lb_async_windows != start->ls_async_windows) {
1338                 bk->lb_async_windows = start->ls_async_windows;
1339                 dirty = true;
1340         }
1341
1342         if (start->ls_valid & LSV_ERROR_HANDLE) {
1343                 valid |= DOIV_ERROR_HANDLE;
1344                 if (start->ls_flags & LPF_FAILOUT)
1345                         flags |= DOIF_FAILOUT;
1346
1347                 if ((start->ls_flags & LPF_FAILOUT) &&
1348                     !(bk->lb_param & LPF_FAILOUT)) {
1349                         bk->lb_param |= LPF_FAILOUT;
1350                         dirty = true;
1351                 } else if (!(start->ls_flags & LPF_FAILOUT) &&
1352                            (bk->lb_param & LPF_FAILOUT)) {
1353                         bk->lb_param &= ~LPF_FAILOUT;
1354                         dirty = true;
1355                 }
1356         }
1357
1358         if (start->ls_valid & LSV_DRYRUN) {
1359                 valid |= DOIV_DRYRUN;
1360                 if (start->ls_flags & LPF_DRYRUN)
1361                         flags |= DOIF_DRYRUN;
1362
1363                 if ((start->ls_flags & LPF_DRYRUN) &&
1364                     !(bk->lb_param & LPF_DRYRUN)) {
1365                         bk->lb_param |= LPF_DRYRUN;
1366                         dirty = true;
1367                 } else if (!(start->ls_flags & LPF_DRYRUN) &&
1368                            (bk->lb_param & LPF_DRYRUN)) {
1369                         bk->lb_param &= ~LPF_DRYRUN;
1370                         lfsck->li_drop_dryrun = 1;
1371                         dirty = true;
1372                 }
1373         }
1374
1375         if (bk->lb_param & LPF_ALL_MDT &&
1376             !(start->ls_flags & LPF_ALL_MDT)) {
1377                 bk->lb_param &= ~LPF_ALL_MDT;
1378                 dirty = true;
1379         } else if (!(bk->lb_param & LPF_ALL_MDT) &&
1380                    start->ls_flags & LPF_ALL_MDT) {
1381                 bk->lb_param |= LPF_ALL_MDT;
1382                 dirty = true;
1383         }
1384
1385         if (dirty) {
1386                 rc = lfsck_bookmark_store(env, lfsck);
1387                 if (rc != 0)
1388                         GOTO(out, rc);
1389         }
1390
1391         if (start->ls_flags & LPF_RESET)
1392                 flags |= DOIF_RESET;
1393
1394         if (start->ls_active != 0) {
1395                 struct lfsck_component *next;
1396
1397                 if (start->ls_active == LFSCK_TYPES_ALL)
1398                         start->ls_active = LFSCK_TYPES_SUPPORTED;
1399
1400                 if (start->ls_active & ~LFSCK_TYPES_SUPPORTED) {
1401                         start->ls_active &= ~LFSCK_TYPES_SUPPORTED;
1402                         GOTO(out, rc = -ENOTSUPP);
1403                 }
1404
1405                 cfs_list_for_each_entry_safe(com, next,
1406                                              &lfsck->li_list_scan, lc_link) {
1407                         if (!(com->lc_type & start->ls_active)) {
1408                                 rc = com->lc_ops->lfsck_post(env, com, 0,
1409                                                              false);
1410                                 if (rc != 0)
1411                                         GOTO(out, rc);
1412                         }
1413                 }
1414
1415                 while (start->ls_active != 0) {
1416                         if (type & start->ls_active) {
1417                                 com = __lfsck_component_find(lfsck, type,
1418                                                         &lfsck->li_list_idle);
1419                                 if (com != NULL) {
1420                                         /* The component status will be updated
1421                                          * when its prep() is called later by
1422                                          * the LFSCK main engine. */
1423                                         cfs_list_del_init(&com->lc_link);
1424                                         cfs_list_add_tail(&com->lc_link,
1425                                                           &lfsck->li_list_scan);
1426                                 }
1427                                 start->ls_active &= ~type;
1428                         }
1429                         type <<= 1;
1430                 }
1431         }
1432
1433         cfs_list_for_each_entry(com, &lfsck->li_list_scan, lc_link) {
1434                 start->ls_active |= com->lc_type;
1435                 if (flags & DOIF_RESET) {
1436                         rc = com->lc_ops->lfsck_reset(env, com, false);
1437                         if (rc != 0)
1438                                 GOTO(out, rc);
1439                 }
1440         }
1441
1442 trigger:
1443         lfsck->li_args_dir = LUDA_64BITHASH | LUDA_VERIFY;
1444         if (bk->lb_param & LPF_DRYRUN) {
1445                 lfsck->li_args_dir |= LUDA_VERIFY_DRYRUN;
1446                 valid |= DOIV_DRYRUN;
1447                 flags |= DOIF_DRYRUN;
1448         }
1449
1450         if (bk->lb_param & LPF_FAILOUT) {
1451                 valid |= DOIV_ERROR_HANDLE;
1452                 flags |= DOIF_FAILOUT;
1453         }
1454
1455         if (!cfs_list_empty(&lfsck->li_list_scan))
1456                 flags |= DOIF_OUTUSED;
1457
1458         lfsck->li_args_oit = (flags << DT_OTABLE_IT_FLAGS_SHIFT) | valid;
1459         thread_set_flags(thread, 0);
1460         lta = lfsck_thread_args_init(lfsck, NULL, lsp);
1461         if (IS_ERR(lta))
1462                 GOTO(out, rc = PTR_ERR(lta));
1463
1464         rc = PTR_ERR(kthread_run(lfsck_master_engine, lta, "lfsck"));
1465         if (IS_ERR_VALUE(rc)) {
1466                 CERROR("%s: cannot start LFSCK thread: rc = %ld\n",
1467                        lfsck_lfsck2name(lfsck), rc);
1468                 lfsck_thread_args_fini(lta);
1469         } else {
1470                 rc = 0;
1471                 l_wait_event(thread->t_ctl_waitq,
1472                              thread_is_running(thread) ||
1473                              thread_is_stopped(thread),
1474                              &lwi);
1475         }
1476
1477         GOTO(out, rc);
1478
1479 out:
1480         mutex_unlock(&lfsck->li_mutex);
1481 put:
1482         lfsck_instance_put(env, lfsck);
1483         return (rc < 0 ? rc : 0);
1484 }
1485 EXPORT_SYMBOL(lfsck_start);
1486
1487 int lfsck_stop(const struct lu_env *env, struct dt_device *key,
1488                struct lfsck_stop *stop)
1489 {
1490         struct lfsck_instance   *lfsck;
1491         struct ptlrpc_thread    *thread;
1492         struct l_wait_info       lwi    = { 0 };
1493         int                      rc     = 0;
1494         ENTRY;
1495
1496         lfsck = lfsck_instance_find(key, true, false);
1497         if (unlikely(lfsck == NULL))
1498                 RETURN(-ENODEV);
1499
1500         thread = &lfsck->li_thread;
1501         mutex_lock(&lfsck->li_mutex);
1502         spin_lock(&lfsck->li_lock);
1503         if (thread_is_init(thread) || thread_is_stopped(thread)) {
1504                 spin_unlock(&lfsck->li_lock);
1505                 GOTO(out, rc = -EALREADY);
1506         }
1507
1508         if (stop != NULL) {
1509                 lfsck->li_status = stop->ls_status;
1510                 lfsck->li_flags = stop->ls_flags;
1511         } else {
1512                 lfsck->li_status = LS_STOPPED;
1513                 lfsck->li_flags = 0;
1514         }
1515
1516         thread_set_flags(thread, SVC_STOPPING);
1517         spin_unlock(&lfsck->li_lock);
1518
1519         wake_up_all(&thread->t_ctl_waitq);
1520         l_wait_event(thread->t_ctl_waitq,
1521                      thread_is_stopped(thread),
1522                      &lwi);
1523
1524         GOTO(out, rc = 0);
1525
1526 out:
1527         mutex_unlock(&lfsck->li_mutex);
1528         lfsck_instance_put(env, lfsck);
1529
1530         return rc;
1531 }
1532 EXPORT_SYMBOL(lfsck_stop);
1533
1534 int lfsck_in_notify(const struct lu_env *env, struct dt_device *key,
1535                     struct lfsck_request *lr)
1536 {
1537         struct lfsck_instance  *lfsck;
1538         struct lfsck_component *com;
1539         int                     rc;
1540         ENTRY;
1541
1542         switch (lr->lr_event) {
1543         case LE_STOP:
1544         case LE_PHASE1_DONE:
1545         case LE_PHASE2_DONE:
1546                 break;
1547         default:
1548                 RETURN(-EOPNOTSUPP);
1549         }
1550
1551         lfsck = lfsck_instance_find(key, true, false);
1552         if (unlikely(lfsck == NULL))
1553                 RETURN(-ENODEV);
1554
1555         com = lfsck_component_find(lfsck, lr->lr_active);
1556         if (likely(com != NULL)) {
1557                 rc = com->lc_ops->lfsck_in_notify(env, com, lr);
1558                 lfsck_component_put(env, com);
1559         } else {
1560                 rc = -ENOTSUPP;
1561         }
1562
1563         lfsck_instance_put(env, lfsck);
1564
1565         RETURN(rc);
1566 }
1567 EXPORT_SYMBOL(lfsck_in_notify);
1568
1569 int lfsck_query(const struct lu_env *env, struct dt_device *key,
1570                 struct lfsck_request *lr)
1571 {
1572         struct lfsck_instance  *lfsck;
1573         struct lfsck_component *com;
1574         int                     rc;
1575         ENTRY;
1576
1577         lfsck = lfsck_instance_find(key, true, false);
1578         if (unlikely(lfsck == NULL))
1579                 RETURN(-ENODEV);
1580
1581         com = lfsck_component_find(lfsck, lr->lr_active);
1582         if (likely(com != NULL)) {
1583                 rc = com->lc_ops->lfsck_query(env, com);
1584                 lfsck_component_put(env, com);
1585         } else {
1586                 rc = -ENOTSUPP;
1587         }
1588
1589         lfsck_instance_put(env, lfsck);
1590
1591         RETURN(rc);
1592 }
1593 EXPORT_SYMBOL(lfsck_query);
1594
1595 int lfsck_register(const struct lu_env *env, struct dt_device *key,
1596                    struct dt_device *next, struct obd_device *obd,
1597                    lfsck_out_notify notify, void *notify_data, bool master)
1598 {
1599         struct lfsck_instance   *lfsck;
1600         struct dt_object        *root  = NULL;
1601         struct dt_object        *obj;
1602         struct lu_fid           *fid   = &lfsck_env_info(env)->lti_fid;
1603         int                      rc;
1604         ENTRY;
1605
1606         lfsck = lfsck_instance_find(key, false, false);
1607         if (unlikely(lfsck != NULL))
1608                 RETURN(-EEXIST);
1609
1610         OBD_ALLOC_PTR(lfsck);
1611         if (lfsck == NULL)
1612                 RETURN(-ENOMEM);
1613
1614         mutex_init(&lfsck->li_mutex);
1615         spin_lock_init(&lfsck->li_lock);
1616         CFS_INIT_LIST_HEAD(&lfsck->li_link);
1617         CFS_INIT_LIST_HEAD(&lfsck->li_list_scan);
1618         CFS_INIT_LIST_HEAD(&lfsck->li_list_dir);
1619         CFS_INIT_LIST_HEAD(&lfsck->li_list_double_scan);
1620         CFS_INIT_LIST_HEAD(&lfsck->li_list_idle);
1621         atomic_set(&lfsck->li_ref, 1);
1622         atomic_set(&lfsck->li_double_scan_count, 0);
1623         init_waitqueue_head(&lfsck->li_thread.t_ctl_waitq);
1624         lfsck->li_out_notify = notify;
1625         lfsck->li_out_notify_data = notify_data;
1626         lfsck->li_next = next;
1627         lfsck->li_bottom = key;
1628         lfsck->li_obd = obd;
1629
1630         rc = lfsck_tgt_descs_init(&lfsck->li_ost_descs);
1631         if (rc != 0)
1632                 GOTO(out, rc);
1633
1634         rc = lfsck_tgt_descs_init(&lfsck->li_mdt_descs);
1635         if (rc != 0)
1636                 GOTO(out, rc);
1637
1638         fid->f_seq = FID_SEQ_LOCAL_NAME;
1639         fid->f_oid = 1;
1640         fid->f_ver = 0;
1641         rc = local_oid_storage_init(env, lfsck->li_bottom, fid, &lfsck->li_los);
1642         if (rc != 0)
1643                 GOTO(out, rc);
1644
1645         rc = dt_root_get(env, key, fid);
1646         if (rc != 0)
1647                 GOTO(out, rc);
1648
1649         root = dt_locate(env, lfsck->li_bottom, fid);
1650         if (IS_ERR(root))
1651                 GOTO(out, rc = PTR_ERR(root));
1652
1653         if (unlikely(!dt_try_as_dir(env, root)))
1654                 GOTO(out, rc = -ENOTDIR);
1655
1656         lfsck->li_local_root_fid = *fid;
1657         if (master) {
1658                 lfsck->li_master = 1;
1659                 if (lfsck_dev_idx(lfsck->li_bottom) == 0) {
1660                         rc = dt_lookup(env, root,
1661                                 (struct dt_rec *)(&lfsck->li_global_root_fid),
1662                                 (const struct dt_key *)"ROOT", BYPASS_CAPA);
1663                         if (rc != 0)
1664                                 GOTO(out, rc);
1665                 }
1666         }
1667
1668         fid->f_seq = FID_SEQ_LOCAL_FILE;
1669         fid->f_oid = OTABLE_IT_OID;
1670         fid->f_ver = 0;
1671         obj = dt_locate(env, lfsck->li_bottom, fid);
1672         if (IS_ERR(obj))
1673                 GOTO(out, rc = PTR_ERR(obj));
1674
1675         lfsck->li_obj_oit = obj;
1676         rc = obj->do_ops->do_index_try(env, obj, &dt_otable_features);
1677         if (rc != 0) {
1678                 if (rc == -ENOTSUPP)
1679                         GOTO(add, rc = 0);
1680
1681                 GOTO(out, rc);
1682         }
1683
1684         rc = lfsck_bookmark_setup(env, lfsck);
1685         if (rc != 0)
1686                 GOTO(out, rc);
1687
1688         if (master) {
1689                 rc = lfsck_namespace_setup(env, lfsck);
1690                 if (rc < 0)
1691                         GOTO(out, rc);
1692         }
1693
1694         rc = lfsck_layout_setup(env, lfsck);
1695         if (rc < 0)
1696                 GOTO(out, rc);
1697
1698         /* XXX: more LFSCK components initialization to be added here. */
1699
1700 add:
1701         rc = lfsck_instance_add(lfsck);
1702         if (rc == 0)
1703                 rc = lfsck_add_target_from_orphan(env, lfsck);
1704 out:
1705         if (root != NULL && !IS_ERR(root))
1706                 lu_object_put(env, &root->do_lu);
1707         if (rc != 0)
1708                 lfsck_instance_cleanup(env, lfsck);
1709         return rc;
1710 }
1711 EXPORT_SYMBOL(lfsck_register);
1712
1713 void lfsck_degister(const struct lu_env *env, struct dt_device *key)
1714 {
1715         struct lfsck_instance *lfsck;
1716
1717         lfsck = lfsck_instance_find(key, false, true);
1718         if (lfsck != NULL)
1719                 lfsck_instance_put(env, lfsck);
1720 }
1721 EXPORT_SYMBOL(lfsck_degister);
1722
1723 int lfsck_add_target(const struct lu_env *env, struct dt_device *key,
1724                      struct dt_device *tgt, struct obd_export *exp,
1725                      __u32 index, bool for_ost)
1726 {
1727         struct lfsck_instance   *lfsck;
1728         struct lfsck_tgt_desc   *ltd;
1729         int                      rc;
1730         ENTRY;
1731
1732         OBD_ALLOC_PTR(ltd);
1733         if (ltd == NULL)
1734                 RETURN(-ENOMEM);
1735
1736         ltd->ltd_tgt = tgt;
1737         ltd->ltd_key = key;
1738         ltd->ltd_exp = exp;
1739         INIT_LIST_HEAD(&ltd->ltd_orphan_list);
1740         INIT_LIST_HEAD(&ltd->ltd_layout_list);
1741         INIT_LIST_HEAD(&ltd->ltd_layout_phase_list);
1742         atomic_set(&ltd->ltd_ref, 1);
1743         ltd->ltd_index = index;
1744
1745         spin_lock(&lfsck_instance_lock);
1746         lfsck = __lfsck_instance_find(key, true, false);
1747         if (lfsck == NULL) {
1748                 if (for_ost)
1749                         list_add_tail(&ltd->ltd_orphan_list,
1750                                       &lfsck_ost_orphan_list);
1751                 else
1752                         list_add_tail(&ltd->ltd_orphan_list,
1753                                       &lfsck_mdt_orphan_list);
1754                 spin_unlock(&lfsck_instance_lock);
1755
1756                 RETURN(0);
1757         }
1758         spin_unlock(&lfsck_instance_lock);
1759
1760         rc = __lfsck_add_target(env, lfsck, ltd, for_ost, false);
1761         if (rc != 0)
1762                 lfsck_tgt_put(ltd);
1763
1764         lfsck_instance_put(env, lfsck);
1765
1766         RETURN(rc);
1767 }
1768 EXPORT_SYMBOL(lfsck_add_target);
1769
1770 void lfsck_del_target(const struct lu_env *env, struct dt_device *key,
1771                       struct dt_device *tgt, __u32 index, bool for_ost)
1772 {
1773         struct lfsck_instance   *lfsck;
1774         struct lfsck_tgt_descs  *ltds;
1775         struct lfsck_tgt_desc   *ltd;
1776         struct list_head        *head;
1777         bool                     found = false;
1778         bool                     stop  = false;
1779
1780         if (for_ost)
1781                 head = &lfsck_ost_orphan_list;
1782         else
1783                 head = &lfsck_mdt_orphan_list;
1784
1785         spin_lock(&lfsck_instance_lock);
1786         list_for_each_entry(ltd, head, ltd_orphan_list) {
1787                 if (ltd->ltd_tgt == tgt) {
1788                         list_del_init(&ltd->ltd_orphan_list);
1789                         spin_unlock(&lfsck_instance_lock);
1790                         lfsck_tgt_put(ltd);
1791
1792                         return;
1793                 }
1794         }
1795
1796         lfsck = __lfsck_instance_find(key, true, false);
1797         spin_unlock(&lfsck_instance_lock);
1798         if (unlikely(lfsck == NULL))
1799                 return;
1800
1801         if (for_ost)
1802                 ltds = &lfsck->li_ost_descs;
1803         else
1804                 ltds = &lfsck->li_mdt_descs;
1805
1806         down_write(&ltds->ltd_rw_sem);
1807
1808         LASSERT(ltds->ltd_tgts_bitmap != NULL);
1809
1810         if (unlikely(index >= ltds->ltd_tgts_bitmap->size))
1811                 goto unlock;
1812
1813         ltd = LTD_TGT(ltds, index);
1814         if (unlikely(ltd == NULL))
1815                 goto unlock;
1816
1817         found = true;
1818         spin_lock(&ltds->ltd_lock);
1819         ltd->ltd_dead = 1;
1820         if (!list_empty(&ltd->ltd_layout_list)) {
1821                 list_del_init(&ltd->ltd_layout_phase_list);
1822                 list_del_init(&ltd->ltd_layout_list);
1823                 stop = true;
1824         } else {
1825                 LASSERT(list_empty(&ltd->ltd_layout_phase_list));
1826         }
1827         spin_unlock(&ltds->ltd_lock);
1828
1829         if (stop && lfsck->li_master)
1830                 lfsck_stop_notify(env, lfsck, ltds, ltd);
1831
1832         LASSERT(ltds->ltd_tgtnr > 0);
1833
1834         ltds->ltd_tgtnr--;
1835         cfs_bitmap_clear(ltds->ltd_tgts_bitmap, index);
1836         LTD_TGT(ltds, index) = NULL;
1837         lfsck_tgt_put(ltd);
1838
1839 unlock:
1840         if (!found) {
1841                 if (for_ost)
1842                         head = &lfsck->li_ost_descs.ltd_orphan;
1843                 else
1844                         head = &lfsck->li_ost_descs.ltd_orphan;
1845
1846                 list_for_each_entry(ltd, head, ltd_orphan_list) {
1847                         if (ltd->ltd_tgt == tgt) {
1848                                 list_del_init(&ltd->ltd_orphan_list);
1849                                 lfsck_tgt_put(ltd);
1850                                 break;
1851                         }
1852                 }
1853         }
1854
1855         up_write(&ltds->ltd_rw_sem);
1856         lfsck_instance_put(env, lfsck);
1857 }
1858 EXPORT_SYMBOL(lfsck_del_target);
1859
1860 static int __init lfsck_init(void)
1861 {
1862         int rc;
1863
1864         INIT_LIST_HEAD(&lfsck_ost_orphan_list);
1865         INIT_LIST_HEAD(&lfsck_mdt_orphan_list);
1866         lfsck_key_init_generic(&lfsck_thread_key, NULL);
1867         rc = lu_context_key_register(&lfsck_thread_key);
1868         if (rc == 0) {
1869                 tgt_register_lfsck_start(lfsck_start);
1870                 tgt_register_lfsck_in_notify(lfsck_in_notify);
1871                 tgt_register_lfsck_query(lfsck_query);
1872         }
1873
1874         return rc;
1875 }
1876
1877 static void __exit lfsck_exit(void)
1878 {
1879         struct lfsck_tgt_desc *ltd;
1880         struct lfsck_tgt_desc *next;
1881
1882         LASSERT(cfs_list_empty(&lfsck_instance_list));
1883
1884         list_for_each_entry_safe(ltd, next, &lfsck_ost_orphan_list,
1885                                  ltd_orphan_list) {
1886                 list_del_init(&ltd->ltd_orphan_list);
1887                 lfsck_tgt_put(ltd);
1888         }
1889
1890         list_for_each_entry_safe(ltd, next, &lfsck_mdt_orphan_list,
1891                                  ltd_orphan_list) {
1892                 list_del_init(&ltd->ltd_orphan_list);
1893                 lfsck_tgt_put(ltd);
1894         }
1895
1896         lu_context_key_degister(&lfsck_thread_key);
1897 }
1898
1899 MODULE_AUTHOR("Intel Corporation <http://www.intel.com/>");
1900 MODULE_DESCRIPTION("LFSCK");
1901 MODULE_LICENSE("GPL");
1902
1903 cfs_module(lfsck, LUSTRE_VERSION_STRING, lfsck_init, lfsck_exit);