4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License version 2 for more details. A copy is
14 * included in the COPYING file that accompanied this code.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * Copyright (c) 2013, 2014, Intel Corporation.
26 * lustre/lfsck/lfsck_internal.h
28 * Shared definitions and declarations for the LFSCK.
30 * Author: Fan, Yong <fan.yong@intel.com>
33 #ifndef _LFSCK_INTERNAL_H
34 # define _LFSCK_INTERNAL_H
36 #include <lustre/lustre_lfsck_user.h>
37 #include <lustre/lustre_user.h>
38 #include <lustre/lustre_idl.h>
39 #include <lustre_lfsck.h>
41 #include <lu_object.h>
42 #include <dt_object.h>
43 #include <md_object.h>
44 #include <lustre_net.h>
45 #include <lustre_dlm.h>
46 #include <lustre_fid.h>
47 #include <md_object.h>
48 #include <lustre_linkea.h>
/* Half a second, expressed in jiffies. */
50 #define HALF_SEC msecs_to_jiffies(MSEC_PER_SEC >> 1)
/* Interval between LFSCK checkpoints.
 * NOTE(review): the unit is presumably seconds - confirm at the use site. */
51 #define LFSCK_CHECKPOINT_INTERVAL 60
54 /* The first scanning cycle has finished. */
55 LF_SCANNED_ONCE = 0x00000001ULL,
57 /* There is some namespace inconsistency. */
58 LF_INCONSISTENT = 0x00000002ULL,
60 /* The device is upgraded from 1.8 format. */
61 LF_UPGRADE = 0x00000004ULL,
63 /* The server was restarted during the LFSCK, so the check/repair of
64 * some objects may have been missed. */
65 LF_INCOMPLETE = 0x00000008ULL,
67 /* The LAST_ID (file) crashed. */
68 LF_CRASHED_LASTID = 0x00000010ULL,
/* A scan position: the object-table iteration position combined with the
 * directory traversal position (parent directory FID plus the position
 * under that directory). */
71 struct lfsck_position {
72 /* low layer object table-based iteration position. */
75 /* parent FID for directory traversal. */
76 struct lu_fid lp_dir_parent;
78 /* namespace-based directory traversal position. */
/* LFSCK bookmark: run parameters plus the FIDs the LFSCK has to remember.
 * struct lfsck_instance keeps two copies of it, li_bookmark_ram and
 * li_bookmark_disk. */
82 struct lfsck_bookmark {
83 /* Magic number to detect that this struct contains valid data. */
86 /* For compatibility with old versions. */
89 /* See 'enum lfsck_param_flags' */
92 /* How many items can be scanned at most per second. */
95 /* The window size for the async requests pipeline. */
96 __u16 lb_async_windows;
98 /* For 64-bit alignment. */
101 /* The FID for .lustre/lost+found/MDTxxxx */
102 struct lu_fid lb_lpf_fid;
104 /* The FID for the last MDT-object created by the LFSCK repairing. */
105 struct lu_fid lb_last_fid;
107 /* Reserved for future use. */
108 __u64 lb_reserved[2];
/* Namespace trace flags; each value is a distinct bit.
 * NOTE(review): presumably these are the 'flags' byte accepted by
 * lfsck_namespace_trace_update() - confirm against the callers. */
111 enum lfsck_namespace_trace_flags {
112 LNTF_CHECK_LINKEA = 0x01,
113 LNTF_CHECK_PARENT = 0x02,
114 LNTF_SKIP_NLINK = 0x04,
115 LNTF_CHECK_ORPHAN = 0x08,
116 LNTF_UNCERTAIN_LMV = 0x10,
117 LNTF_RECHECK_NAME_HASH = 0x20,
/* Types of namespace inconsistency. */
121 enum lfsck_namespace_inconsistency_type {
124 LNIT_UNMATCHED_PAIRS = 2,
/* State and statistics of the namespace LFSCK.
 * NOTE(review): the magic number and the reserved padding suggest this is a
 * stored (persistent) record - confirm before changing the layout. */
131 struct lfsck_namespace {
132 /* Magic number to detect that this struct contains valid data. */
135 /* See 'enum lfsck_status'. */
138 /* See 'enum lfsck_flags'. */
141 /* How many completed LFSCK runs on the device. */
142 __u32 ln_success_count;
144 /* How long the LFSCK phase1 has run in seconds. */
145 __u32 ln_run_time_phase1;
147 /* How long the LFSCK phase2 has run in seconds. */
148 __u32 ln_run_time_phase2;
150 /* Time when the last LFSCK completed, in seconds since epoch. */
151 __u64 ln_time_last_complete;
153 /* Time when the latest LFSCK started, in seconds since epoch. */
154 __u64 ln_time_latest_start;
156 /* Time of the last LFSCK checkpoint, in seconds since epoch. */
157 __u64 ln_time_last_checkpoint;
159 /* Position the latest LFSCK started from. */
160 struct lfsck_position ln_pos_latest_start;
162 /* Position of the last LFSCK checkpoint. */
163 struct lfsck_position ln_pos_last_checkpoint;
165 /* Position of the first object that should be updated. */
166 struct lfsck_position ln_pos_first_inconsistent;
168 /* How many items (including dir) have been checked. */
169 __u64 ln_items_checked;
171 /* How many items have been repaired. */
172 __u64 ln_items_repaired;
174 /* How many items failed to be processed. */
175 __u64 ln_items_failed;
177 /* How many directories have been traversed. */
178 __u64 ln_dirs_checked;
180 /* How many objects have been double scanned. */
181 __u64 ln_objs_checked_phase2;
183 /* How many objects have been repaired during double scan. */
184 __u64 ln_objs_repaired_phase2;
186 /* How many objects failed to be processed during double scan. */
187 __u64 ln_objs_failed_phase2;
189 /* How many objects with nlink fixed. */
190 __u64 ln_objs_nlink_repaired;
192 /* The latest object has been processed (failed) during double scan. */
193 struct lu_fid ln_fid_latest_scanned_phase2;
195 /* How many FID-in-dirent entries have been repaired. */
196 __u64 ln_dirent_repaired;
198 /* How many linkEA entries have been repaired. */
199 __u64 ln_linkea_repaired;
201 /* How many multiple-linked objects have been checked. */
202 __u64 ln_mul_linked_checked;
204 /* How many multiple-linked objects have been repaired. */
205 __u64 ln_mul_linked_repaired;
207 /* How many undefined inconsistency found in phase2. */
208 __u64 ln_unknown_inconsistency;
210 /* How many unmatched pairs have been repaired. */
211 __u64 ln_unmatched_pairs_repaired;
213 /* How many dangling name entries have been found/repaired. */
214 __u64 ln_dangling_repaired;
216 /* How many multiple referenced name entries have been
218 __u64 ln_mul_ref_repaired;
220 /* How many name entries with bad file type have been repaired. */
221 __u64 ln_bad_type_repaired;
223 /* How many lost name entries have been re-inserted. */
224 __u64 ln_lost_dirent_repaired;
226 /* How many objects under /lost+found have been scanned. */
227 __u64 ln_local_lpf_scanned;
229 /* How many objects under /lost+found have been moved to
230 * namespace visible directory. */
231 __u64 ln_local_lpf_moved;
233 /* How many objects under /lost+found have been skipped. */
234 __u64 ln_local_lpf_skipped;
236 /* How many objects under /lost+found failed to be processed. */
237 __u64 ln_local_lpf_failed;
239 /* How many striped directories (master) have been scanned. */
240 __u64 ln_striped_dirs_scanned;
242 /* How many striped directories (master) have been repaired. */
243 __u64 ln_striped_dirs_repaired;
245 /* How many striped directories (master) failed verification. */
246 __u64 ln_striped_dirs_failed;
248 /* How many striped directories (master) have been disabled. */
249 __u64 ln_striped_dirs_disabled;
251 /* How many striped directories (master) have been skipped
252 * (for shards verification) because of lost master LMV EA. */
253 __u64 ln_striped_dirs_skipped;
255 /* How many striped directory's shards (slave) have been scanned. */
256 __u64 ln_striped_shards_scanned;
258 /* How many striped directory's shards (slave) have been repaired. */
259 __u64 ln_striped_shards_repaired;
261 /* How many striped directory's shards (slave) failed verification. */
262 __u64 ln_striped_shards_failed;
264 /* How many striped directory's shards (slave) have been skipped
265 * (for name hash verification) because it is unknown whether the slave
266 * LMV EA is valid or not. */
267 __u64 ln_striped_shards_skipped;
269 /* How many name entries under striped directory with bad name
270 * hash have been repaired. */
271 __u64 ln_name_hash_repaired;
273 /* The size of MDT targets bitmap with nbits. Such bitmap records
274 * the MDTs that contain non-verified MDT-objects. */
275 __u32 ln_bitmap_size;
278 /* Reserved for future use. 256-bytes aligned now. */
279 __u64 ln_reserved[15];
/* Types of layout inconsistency. LLIT_MAX aliases LLIT_OTHERS and sizes the
 * lfsck_layout::ll_objs_repaired[] array, which is indexed by (type - 1). */
282 enum lfsck_layout_inconsistency_type {
285 LLIT_UNMATCHED_PAIR = 2,
286 LLIT_MULTIPLE_REFERENCED = 3,
288 LLIT_INCONSISTENT_OWNER = 5,
290 LLIT_MAX = LLIT_OTHERS
/* State and statistics of the layout LFSCK, followed by a variable-length
 * OST bitmap (ll_ost_bitmap) whose size in bits is ll_bitmap_size.
 * NOTE(review): the magic number and the reserved padding suggest this is a
 * stored (persistent) record - confirm before changing the layout. */
293 struct lfsck_layout {
294 /* Magic number to detect that this struct contains valid data. */
297 /* See 'enum lfsck_status'. */
300 /* See 'enum lfsck_flags'. */
303 /* How many completed LFSCK runs on the device. */
304 __u32 ll_success_count;
306 /* How long the LFSCK phase1 has run in seconds. */
307 __u32 ll_run_time_phase1;
309 /* How long the LFSCK phase2 has run in seconds. */
310 __u32 ll_run_time_phase2;
312 /* Time when the last LFSCK completed, in seconds since epoch. */
313 __u64 ll_time_last_complete;
315 /* Time when the latest LFSCK started, in seconds since epoch. */
316 __u64 ll_time_latest_start;
318 /* Time of the last LFSCK checkpoint, in seconds since epoch. */
319 __u64 ll_time_last_checkpoint;
321 /* Position the latest LFSCK started from. */
322 __u64 ll_pos_latest_start;
324 /* Position of the last LFSCK checkpoint. */
325 __u64 ll_pos_last_checkpoint;
327 /* Position of the first object to be fixed or that
328 * failed to be checked in phase1. */
329 __u64 ll_pos_first_inconsistent;
331 /* How many objects have been checked. */
332 __u64 ll_objs_checked_phase1;
334 /* How many objects failed to be processed. */
335 __u64 ll_objs_failed_phase1;
337 /* How many objects have been double scanned. */
338 __u64 ll_objs_checked_phase2;
340 /* How many objects failed to be processed during double scan. */
341 __u64 ll_objs_failed_phase2;
343 /* Per-type counters of inconsistencies that have been or are to be
344 * repaired. ll_objs_repaired[type - 1] is the count for the given @type. */
345 __u64 ll_objs_repaired[LLIT_MAX];
347 /* How many objects have been skipped because the related
348 * MDT(s)/OST(s) do not participate in the LFSCK */
349 __u64 ll_objs_skipped;
351 /* The size of ll_ost_bitmap with nbits. */
352 __u32 ll_bitmap_size;
354 /* Reserved for future use. 256-bytes aligned now. */
356 __u64 ll_reserved_2[11];
358 /* The OST targets bitmap to record the OSTs that contain
359 * non-verified OST-objects. Zero-length trailing array. */
360 __u8 ll_ost_bitmap[0];
/* Description of an object used by the LFSCK assistant code: its FID, the
 * object-table iteration cookie, its attributes and some state bits.
 * Referenced through lfsck_assistant_req::lar_parent. */
363 struct lfsck_assistant_object {
364 struct lu_fid lso_fid;
365 __u64 lso_oit_cookie;
366 struct lu_attr lso_attr;
368 unsigned int lso_dead:1,
372 struct lfsck_component;
373 struct lfsck_tgt_descs;
374 struct lfsck_tgt_desc;
/* Callback table of an LFSCK component. struct lfsck_component points to its
 * table through lc_ops; every callback receives the environment and the
 * component it is invoked for. */
376 struct lfsck_operations {
377 int (*lfsck_reset)(const struct lu_env *env,
378 struct lfsck_component *com,
381 void (*lfsck_fail)(const struct lu_env *env,
382 struct lfsck_component *com,
385 void (*lfsck_close_dir)(const struct lu_env *env,
386 struct lfsck_component *com);
388 int (*lfsck_open_dir)(const struct lu_env *env,
389 struct lfsck_component *com);
391 int (*lfsck_checkpoint)(const struct lu_env *env,
392 struct lfsck_component *com,
395 int (*lfsck_prep)(const struct lu_env *env,
396 struct lfsck_component *com,
397 struct lfsck_start_param *lsp);
399 int (*lfsck_exec_oit)(const struct lu_env *env,
400 struct lfsck_component *com,
401 struct dt_object *obj);
403 int (*lfsck_exec_dir)(const struct lu_env *env,
404 struct lfsck_component *com,
405 struct lfsck_assistant_object *lso,
406 struct lu_dirent *ent,
409 int (*lfsck_post)(const struct lu_env *env,
410 struct lfsck_component *com,
414 int (*lfsck_dump)(const struct lu_env *env,
415 struct lfsck_component *com,
418 int (*lfsck_double_scan)(const struct lu_env *env,
419 struct lfsck_component *com);
421 void (*lfsck_data_release)(const struct lu_env *env,
422 struct lfsck_component *com);
424 void (*lfsck_quit)(const struct lu_env *env,
425 struct lfsck_component *com);
427 int (*lfsck_in_notify)(const struct lu_env *env,
428 struct lfsck_component *com,
429 struct lfsck_request *lr,
432 int (*lfsck_query)(const struct lu_env *env,
433 struct lfsck_component *com);
435 int (*lfsck_join)(const struct lu_env *env,
436 struct lfsck_component *com,
437 struct lfsck_start_param *lsp);
/* Target descriptors are kept in a two-level table: TGT_PTRS first-level
 * slots (lfsck_tgt_descs::ltd_tgts_idx), each pointing to a block of
 * TGT_PTRS_PER_BLOCK descriptor pointers (lfsck_tgt_desc_idx::ldi_tgts). */
440 #define TGT_PTRS 256 /* number of pointers at 1st level */
441 #define TGT_PTRS_PER_BLOCK 256 /* number of pointers at 2nd level */
/* Descriptor of one target known to the LFSCK. It is linked into separate
 * lists for the layout and the namespace LFSCK (overall list and per-phase
 * list each) and carries a generation counter and status bits for both. */
443 struct lfsck_tgt_desc {
444 struct list_head ltd_orphan_list;
445 struct dt_device *ltd_tgt;
446 struct dt_device *ltd_key;
447 struct obd_export *ltd_exp;
448 struct list_head ltd_layout_list;
449 struct list_head ltd_layout_phase_list;
450 struct list_head ltd_namespace_list;
451 struct list_head ltd_namespace_phase_list;
454 __u32 ltd_layout_gen;
455 __u32 ltd_namespace_gen;
456 unsigned int ltd_dead:1,
458 ltd_namespace_done:1,
459 ltd_synced_failures:1;
/* Second-level block of the target table: TGT_PTRS_PER_BLOCK descriptor
 * pointers, selected by (index % TGT_PTRS_PER_BLOCK) in LTD_TGT(). */
462 struct lfsck_tgt_desc_idx {
463 struct lfsck_tgt_desc *ldi_tgts[TGT_PTRS_PER_BLOCK];
/* Table of target descriptors. struct lfsck_instance embeds one for the OSTs
 * (li_ost_descs) and one for the MDTs (li_mdt_descs). */
466 struct lfsck_tgt_descs {
467 /* list of known TGTs */
468 struct lfsck_tgt_desc_idx *ltd_tgts_idx[TGT_PTRS];
470 /* bitmap of TGTs available */
471 cfs_bitmap_t *ltd_tgts_bitmap;
473 /* for lfsck_tgt_desc::ltd_xxx_list */
476 /* for tgts table accessing and changes */
477 struct rw_semaphore ltd_rw_sem;
479 /* Temporary list for orphan targets. */
480 struct list_head ltd_orphan;
482 /* number of registered TGTs */
/*
 * Look up the descriptor pointer slot for target @index in the two-level
 * table @ltd: the first level is selected by index / TGT_PTRS_PER_BLOCK and
 * the second level by index % TGT_PTRS_PER_BLOCK.
 *
 * The first-level block pointer is dereferenced without a NULL check, and
 * @index is evaluated twice, so pass an expression without side effects.
 */
#define LTD_TGT(ltd, index) \
	((ltd)->ltd_tgts_idx[(index) / TGT_PTRS_PER_BLOCK]->\
	 ldi_tgts[(index) % TGT_PTRS_PER_BLOCK])

/*
 * Same lookup in the OST / MDT table embedded in the LFSCK instance @lfsck.
 * @lfsck is parenthesized so that any pointer-valued expression can be
 * passed, not just a plain identifier.
 */
#define OST_TGT(lfsck, index) LTD_TGT(&(lfsck)->li_ost_descs, index)
#define MDT_TGT(lfsck, index) LTD_TGT(&(lfsck)->li_mdt_descs, index)
493 #define LFSCK_STF_BITS 4
494 /* LFSCK_STF_COUNT is derived from LFSCK_STF_BITS; to adjust the count,
 * change LFSCK_STF_BITS. It sizes lfsck_component::lc_sub_trace_objs[]. */
495 #define LFSCK_STF_COUNT (1 << LFSCK_STF_BITS)
/* One slot of lfsck_component::lc_sub_trace_objs[]: a trace object together
 * with a mutex.
 * NOTE(review): the mutex presumably serializes access to lsto_obj - confirm. */
497 struct lfsck_sub_trace_obj {
498 struct dt_object *lsto_obj;
499 struct mutex lsto_mutex;
/* One LFSCK component. It holds a pointer to its LFSCK instance (lc_lfsck),
 * its callback table (lc_ops), LFSCK_STF_COUNT sub-trace objects, and the
 * checkpoint/scan bookkeeping documented on the fields below. */
502 struct lfsck_component {
503 /* into lfsck_instance::li_list_{scan,double_scan,idle} */
504 struct list_head lc_link;
506 /* into lfsck_instance::li_list_dir */
507 struct list_head lc_link_dir;
509 struct rw_semaphore lc_sem;
512 struct lfsck_position lc_pos_start;
513 struct lfsck_instance *lc_lfsck;
514 struct dt_object *lc_obj;
515 struct lfsck_sub_trace_obj lc_sub_trace_objs[LFSCK_STF_COUNT];
516 struct lfsck_operations *lc_ops;
520 struct lu_fid lc_fid_latest_scanned_phase2;
522 /* The time for last checkpoint, jiffies */
523 cfs_time_t lc_time_last_checkpoint;
525 /* The time for next checkpoint, jiffies */
526 cfs_time_t lc_time_next_checkpoint;
530 /* How many objects have been checked since last checkpoint. */
531 __u32 lc_new_checked;
533 /* How many objects have been scanned since last sleep. */
534 __u32 lc_new_scanned;
/* Stripe counts used by the striped directory (LMV) handling: the maximum is
 * LMV_MAX_STRIPE_COUNT.
 * NOTE(review): DEF is presumably the default/initial number of stripe
 * record slots - confirm at the use site. */
539 #define LFSCK_LMV_MAX_STRIPES LMV_MAX_STRIPE_COUNT
540 #define LFSCK_LMV_DEF_STRIPES 4
542 /* Warning: do NOT change the order of the lfsck_slave_lmv_flags members,
543 * otherwise lfsck_record_lmv() may go wrong. */
544 enum lfsck_slave_lmv_flags {
552 /* When the namespace LFSCK scans a striped directory, it records all
553 * the known shards' information in the structure "lfsck_slave_lmv_rec",
554 * including the shard's FID, index, slave LMV EA, and so on. Each shard
555 * takes one lfsck_slave_lmv_rec slot. After the 1st cycle of scanning
556 * the striped directory, the LFSCK has all the information about
557 * whether there is some inconsistency, and then it can repair it in
558 * the 2nd cycle of scanning. */
559 struct lfsck_slave_lmv_rec {
560 struct lu_fid lslr_fid;
561 __u32 lslr_stripe_count;
562 __u32 lslr_index; /* the index in name or in slave lmv */
563 __u32 lslr_hash_type;
568 struct lmv_mds_md_v1 ll_lmv;
/* NOTE(review): presumably the number of ll_lslr slots allocated and the
 * number of them in use - confirm. */
570 int ll_stripes_allocated;
571 int ll_stripes_filled;
573 __u32 ll_max_stripe_count;
574 __u32 ll_max_filled_off;
576 unsigned int ll_lmv_master:1,
/* Per-shard records, see struct lfsck_slave_lmv_rec. */
583 struct lfsck_slave_lmv_rec *ll_lslr;
586 /* If the namespace LFSCK finds that the master MDT-object of a striped
587 * directory lost its master LMV EA, it will re-generate the master LMV
588 * EA and notify the LFSCK instance on the MDT on which the striped dir
589 * master MDT-object resides to rescan the striped directory. To do that,
590 * the notify handler will insert a "lfsck_lmv_unit" structure into the
591 * lfsck::li_list_lmv. The LFSCK instance will scan such list from time
592 * to time to check whether it needs to rescan some striped directories. */
593 struct lfsck_lmv_unit {
594 struct list_head llu_link;
595 struct lfsck_lmv llu_lmv;
596 struct dt_object *llu_obj;
597 struct lfsck_instance *llu_lfsck;
/* A saved (FID, LMV EA) pair. struct lfsck_instance keeps an array of
 * LFSCK_REC_LMV_MAX_DEPTH of these in li_rec_lmv_save[]. */
600 struct lfsck_rec_lmv_save {
601 struct lu_fid lrls_fid;
602 struct lmv_mds_md_v1 lrls_lmv;
605 /* Allow lfsck_record_lmv() to be called recursively at most three times.
 * Also the number of slots in lfsck_instance::li_rec_lmv_save[]. */
606 #define LFSCK_REC_LMV_MAX_DEPTH 3
/* One LFSCK instance. It owns the component lists (scanning, directory
 * traversal, double scan, idle), the iteration objects/iterators, the OST and
 * MDT target tables, the RAM and disk copies of the bookmark, and the current
 * and checkpoint scan positions. */
608 struct lfsck_instance {
609 struct mutex li_mutex;
612 /* Link into the lfsck_instance_list. */
613 struct list_head li_link;
615 /* For the components in (first) scanning via otable-based iteration. */
616 struct list_head li_list_scan;
618 /* For the components in scanning via directory traversal. Because
619 * directory traversal cannot guarantee that all the objects are scanned,
620 * a component in the li_list_dir must also be in li_list_scan. */
621 struct list_head li_list_dir;
623 /* For the components in double scanning. */
624 struct list_head li_list_double_scan;
626 /* For the components that are not scanning now. */
627 struct list_head li_list_idle;
629 /* For the lfsck_lmv_unit to be handled. */
630 struct list_head li_list_lmv;
633 atomic_t li_double_scan_count;
634 struct ptlrpc_thread li_thread;
636 /* The time for last checkpoint, jiffies */
637 cfs_time_t li_time_last_checkpoint;
639 /* The time for next checkpoint, jiffies */
640 cfs_time_t li_time_next_checkpoint;
642 lfsck_out_notify li_out_notify;
643 void *li_out_notify_data;
644 struct dt_device *li_next;
645 struct dt_device *li_bottom;
646 struct obd_device *li_obd;
647 struct ldlm_namespace *li_namespace;
648 struct local_oid_storage *li_los;
649 struct lu_fid li_local_root_fid; /* backend root "/" */
650 struct lu_fid li_global_root_fid; /* /ROOT */
651 struct dt_object *li_lfsck_dir;
652 struct dt_object *li_bookmark_obj;
653 struct dt_object *li_lpf_obj;
654 struct dt_object *li_lpf_root_obj;
655 struct lu_client_seq *li_seq;
656 struct lfsck_bookmark li_bookmark_ram;
657 struct lfsck_bookmark li_bookmark_disk;
658 struct lfsck_position li_pos_current;
659 struct lfsck_position li_pos_checkpoint;
661 struct lfsck_lmv *li_lmv;
663 /* Obj for otable-based iteration */
664 struct dt_object *li_obj_oit;
666 /* Obj for directory traversal */
667 struct dt_object *li_obj_dir;
669 /* It for otable-based iteration */
670 struct dt_it *li_di_oit;
672 /* It for directory traversal */
673 struct dt_it *li_di_dir;
675 /* Description of OST */
676 struct lfsck_tgt_descs li_ost_descs;
678 /* Description of MDT */
679 struct lfsck_tgt_descs li_mdt_descs;
681 /* namespace-based directory traversal position. */
684 /* Arguments for low layer otable-based iteration. */
687 /* Arguments for namespace-based directory traversal. */
690 /* Schedule for every N objects. */
693 /* Sleep N jiffies for each schedule. */
696 /* How many objects have been scanned since last sleep. */
697 __u32 li_new_scanned;
699 /* The status when the LFSCK stopped or paused. */
702 /* The flags when the LFSCK stopped or paused. */
705 unsigned int li_oit_over:1, /* oit is finished. */
706 li_drop_dryrun:1, /* Ever dryrun, not now. */
707 li_master:1, /* Master instance or not. */
708 li_current_oit_processed:1,
710 struct lfsck_rec_lmv_save li_rec_lmv_save[LFSCK_REC_LMV_MAX_DEPTH];
/* Argument bundle for the interpret callback of an async LFSCK request: the
 * component, the target table and target involved, the request, and a
 * pointer to an atomic counter.
 * NOTE(review): presumably passed as 'args' to lfsck_async_request() -
 * confirm. */
713 struct lfsck_async_interpret_args {
714 struct lfsck_component *laia_com;
715 struct lfsck_tgt_descs *laia_ltds;
716 struct lfsck_tgt_desc *laia_ltd;
717 struct lfsck_request *laia_lr;
718 atomic_t *laia_count;
720 unsigned int laia_shared:1;
/* Arguments bundled for an LFSCK thread: an embedded environment, the LFSCK
 * instance, an optional component and the start parameters. Released with
 * lfsck_thread_args_fini(). */
723 struct lfsck_thread_args {
724 struct lu_env lta_env;
725 struct lfsck_instance *lta_lfsck;
726 struct lfsck_component *lta_com;
727 struct lfsck_start_param *lta_lsp;
/* Common header of a request handled by the LFSCK assistant; embedded as the
 * first member of lfsck_namespace_req (lnr_lar) and lfsck_layout_req
 * (llr_lar). */
730 struct lfsck_assistant_req {
731 struct list_head lar_list;
732 struct lfsck_assistant_object *lar_parent;
/* Assistant request of the namespace LFSCK: the common request header plus
 * the LMV context, a FID and a directory cookie. */
735 struct lfsck_namespace_req {
736 struct lfsck_assistant_req lnr_lar;
737 struct lfsck_lmv *lnr_lmv;
738 struct lu_fid lnr_fid;
739 __u64 lnr_dir_cookie;
/* Assistant request of the layout LFSCK: the common request header plus the
 * child object and its offset in the LOV EA. */
747 struct lfsck_layout_req {
748 struct lfsck_assistant_req llr_lar;
749 struct dt_object *llr_child;
751 __u32 llr_lov_idx; /* offset in LOV EA */
/* Callback table used by the LFSCK assistant; lfsck_assistant_data points to
 * one through lad_ops. The names suggest la_handler_p1/p2 are the phase1 and
 * phase2 handlers - NOTE(review): confirm against the implementations. */
754 struct lfsck_assistant_operations {
755 int (*la_handler_p1)(const struct lu_env *env,
756 struct lfsck_component *com,
757 struct lfsck_assistant_req *lar);
759 int (*la_handler_p2)(const struct lu_env *env,
760 struct lfsck_component *com);
762 void (*la_fill_pos)(const struct lu_env *env,
763 struct lfsck_component *com,
764 struct lfsck_position *pos);
766 int (*la_double_scan_result)(const struct lu_env *env,
767 struct lfsck_component *com,
770 void (*la_req_fini)(const struct lu_env *env,
771 struct lfsck_assistant_req *lar);
773 void (*la_sync_failures)(const struct lu_env *env,
774 struct lfsck_component *com,
775 struct lfsck_request *lr);
/* State of the LFSCK assistant: the request list, the OST/MDT target lists
 * (overall, phase1 and phase2), the assistant thread, its callback table and
 * status bits. */
778 struct lfsck_assistant_data {
780 struct list_head lad_req_list;
782 /* list for the ost targets involve LFSCK. */
783 struct list_head lad_ost_list;
785 /* list for the ost targets in phase1 scanning. */
786 struct list_head lad_ost_phase1_list;
788 /* list for the ost targets in phase2 scanning. */
789 struct list_head lad_ost_phase2_list;
791 /* list for the mdt targets involve LFSCK. */
792 struct list_head lad_mdt_list;
794 /* list for the mdt targets in phase1 scanning. */
795 struct list_head lad_mdt_phase1_list;
797 /* list for the mdt targets in phase2 scanning. */
798 struct list_head lad_mdt_phase2_list;
800 const char *lad_name;
801 struct ptlrpc_thread lad_thread;
803 struct lfsck_assistant_operations *lad_ops;
805 cfs_bitmap_t *lad_bitmap;
809 int lad_assistant_status;
811 unsigned int lad_to_post:1,
812 lad_to_double_scan:1,
813 lad_in_double_scan:1,
816 bool lad_advance_lock;
/* Size of the lti_tmpbuf / lti_tmpbuf2 scratch buffers in
 * struct lfsck_thread_info. */
819 #define LFSCK_TMPBUF_LEN 64
/* A pair of lock handles with their modes, filled by lfsck_lock() and
 * released by lfsck_unlock().
 * NOTE(review): "pdo" presumably is the parallel-directory-operations lock
 * and "reg" the regular lock - confirm. */
821 struct lfsck_lock_handle {
822 struct lustre_handle llh_pdo_lh;
823 struct lustre_handle llh_reg_lh;
824 ldlm_mode_t llh_pdo_mode;
825 ldlm_mode_t llh_reg_mode;
/* Scratch area stored in the environment context and fetched with
 * lfsck_env_info() (key: lfsck_thread_key). The members are reusable
 * temporaries (names, buffers, FIDs, attributes, EAs, requests, ...), so a
 * value placed here is only valid until the same member is used again. */
828 struct lfsck_thread_info {
829 struct lu_name lti_name_const;
830 struct lu_name lti_name;
831 struct lu_name lti_name2;
832 struct lu_buf lti_buf;
833 struct lu_buf lti_linkea_buf;
834 struct lu_buf lti_linkea_buf2;
835 struct lu_buf lti_big_buf;
836 struct lu_fid lti_fid;
837 struct lu_fid lti_fid2;
838 struct lu_fid lti_fid3;
839 struct lu_attr lti_la;
840 struct lu_attr lti_la2;
841 struct ost_id lti_oi;
843 struct lustre_mdt_attrs lti_lma;
844 /* old LMA for compatibility */
845 char lti_lma_old[LMA_OLD_SIZE];
847 struct dt_object_format lti_dof;
848 /* There will be '\0' at the end of the name. */
849 char lti_key[sizeof(struct lu_dirent) + NAME_MAX + 1];
850 char lti_tmpbuf[LFSCK_TMPBUF_LEN];
851 char lti_tmpbuf2[LFSCK_TMPBUF_LEN];
852 struct lfsck_request lti_lr;
853 struct lfsck_async_interpret_args lti_laia;
854 struct lfsck_async_interpret_args lti_laia2;
855 struct lfsck_start lti_start;
856 struct lfsck_stop lti_stop;
857 ldlm_policy_data_t lti_policy;
858 struct ldlm_enqueue_info lti_einfo;
859 struct ldlm_res_id lti_resid;
861 struct filter_fid_old lti_old_pfid;
862 struct filter_fid lti_new_pfid;
864 struct dt_allocation_hint lti_hint;
865 struct lu_orphan_rec lti_rec;
866 struct lov_user_md lti_lum;
867 struct dt_insert_rec lti_dt_rec;
868 struct lu_object_conf lti_conf;
869 struct lu_seq_range lti_range;
870 struct lmv_mds_md_v1 lti_lmv;
871 struct lmv_mds_md_v1 lti_lmv2;
872 struct lmv_mds_md_v1 lti_lmv3;
873 struct lmv_mds_md_v1 lti_lmv4;
874 struct lfsck_lock_handle lti_llh;
878 int lfsck_fid_alloc(const struct lu_env *env, struct lfsck_instance *lfsck,
879 struct lu_fid *fid, bool locked);
880 int lfsck_ibits_lock(const struct lu_env *env, struct lfsck_instance *lfsck,
881 struct dt_object *obj, struct lustre_handle *lh,
882 __u64 bits, ldlm_mode_t mode);
883 void lfsck_ibits_unlock(struct lustre_handle *lh, ldlm_mode_t mode);
884 int lfsck_lock(const struct lu_env *env, struct lfsck_instance *lfsck,
885 struct dt_object *obj, const char *name,
886 struct lfsck_lock_handle *llh, __u64 bits, ldlm_mode_t mode);
887 void lfsck_unlock(struct lfsck_lock_handle *llh);
888 int lfsck_find_mdt_idx_by_fid(const struct lu_env *env,
889 struct lfsck_instance *lfsck,
890 const struct lu_fid *fid);
891 int lfsck_verify_lpf(const struct lu_env *env, struct lfsck_instance *lfsck);
892 struct lfsck_instance *lfsck_instance_find(struct dt_device *key, bool ref,
894 struct lfsck_component *lfsck_component_find(struct lfsck_instance *lfsck,
896 const char *lfsck_status2names(enum lfsck_status status);
897 void lfsck_component_cleanup(const struct lu_env *env,
898 struct lfsck_component *com);
899 void lfsck_instance_cleanup(const struct lu_env *env,
900 struct lfsck_instance *lfsck);
901 int lfsck_bits_dump(struct seq_file *m, int bits, const char *names[],
903 int lfsck_time_dump(struct seq_file *m, __u64 time, const char *name);
904 int lfsck_pos_dump(struct seq_file *m, struct lfsck_position *pos,
906 void lfsck_pos_fill(const struct lu_env *env, struct lfsck_instance *lfsck,
907 struct lfsck_position *pos, bool init);
908 bool __lfsck_set_speed(struct lfsck_instance *lfsck, __u32 limit);
909 void lfsck_control_speed(struct lfsck_instance *lfsck);
910 void lfsck_control_speed_by_self(struct lfsck_component *com);
911 void lfsck_thread_args_fini(struct lfsck_thread_args *lta);
912 struct lfsck_assistant_data *
913 lfsck_assistant_data_init(struct lfsck_assistant_operations *lao,
915 struct lfsck_assistant_object *
916 lfsck_assistant_object_init(const struct lu_env *env, const struct lu_fid *fid,
917 const struct lu_attr *attr, __u64 cookie,
920 lfsck_assistant_object_load(const struct lu_env *env,
921 struct lfsck_instance *lfsck,
922 struct lfsck_assistant_object *lso);
923 int lfsck_async_interpret_common(const struct lu_env *env,
924 struct ptlrpc_request *req,
926 int lfsck_async_request(const struct lu_env *env, struct obd_export *exp,
927 struct lfsck_request *lr,
928 struct ptlrpc_request_set *set,
929 ptlrpc_interpterer_t interpterer,
930 void *args, int request);
931 int lfsck_start_assistant(const struct lu_env *env, struct lfsck_component *com,
932 struct lfsck_start_param *lsp);
933 int lfsck_checkpoint_generic(const struct lu_env *env,
934 struct lfsck_component *com);
935 void lfsck_post_generic(const struct lu_env *env,
936 struct lfsck_component *com, int *result);
937 int lfsck_double_scan_generic(const struct lu_env *env,
938 struct lfsck_component *com, int status);
939 void lfsck_quit_generic(const struct lu_env *env,
940 struct lfsck_component *com);
943 int lfsck_unpack_ent(struct lu_dirent *ent, __u64 *cookie, __u16 *type);
944 void lfsck_close_dir(const struct lu_env *env,
945 struct lfsck_instance *lfsck, int result);
946 int lfsck_open_dir(const struct lu_env *env,
947 struct lfsck_instance *lfsck, __u64 cookie);
948 int lfsck_master_engine(void *args);
949 int lfsck_assistant_engine(void *args);
951 /* lfsck_bookmark.c */
952 void lfsck_bookmark_cpu_to_le(struct lfsck_bookmark *des,
953 struct lfsck_bookmark *src);
954 int lfsck_bookmark_store(const struct lu_env *env,
955 struct lfsck_instance *lfsck);
956 int lfsck_bookmark_setup(const struct lu_env *env,
957 struct lfsck_instance *lfsck);
958 int lfsck_set_param(const struct lu_env *env, struct lfsck_instance *lfsck,
959 struct lfsck_start *start, bool reset);
961 /* lfsck_namespace.c */
962 int lfsck_namespace_trace_update(const struct lu_env *env,
963 struct lfsck_component *com,
964 const struct lu_fid *fid,
965 const __u8 flags, bool add);
966 int lfsck_namespace_check_exist(const struct lu_env *env,
967 struct dt_object *dir,
968 struct dt_object *obj, const char *name);
969 int __lfsck_links_read(const struct lu_env *env, struct dt_object *obj,
970 struct linkea_data *ldata);
971 int lfsck_namespace_rebuild_linkea(const struct lu_env *env,
972 struct lfsck_component *com,
973 struct dt_object *obj,
974 struct linkea_data *ldata);
975 int lfsck_namespace_repair_dangling(const struct lu_env *env,
976 struct lfsck_component *com,
977 struct dt_object *parent,
978 struct dt_object *child,
979 struct lfsck_namespace_req *lnr);
980 int lfsck_namespace_repair_dirent(const struct lu_env *env,
981 struct lfsck_component *com,
982 struct dt_object *parent,
983 struct dt_object *child,
984 const char *name, const char *name2,
985 __u16 type, bool update, bool dec);
986 int lfsck_verify_linkea(const struct lu_env *env, struct dt_object *obj,
987 const struct lu_name *cname, const struct lu_fid *pfid);
988 int lfsck_links_get_first(const struct lu_env *env, struct dt_object *obj,
989 char *name, struct lu_fid *pfid);
990 int lfsck_update_name_entry(const struct lu_env *env,
991 struct lfsck_instance *lfsck,
992 struct dt_object *dir, const char *name,
993 const struct lu_fid *fid, __u32 type);
994 int lfsck_namespace_setup(const struct lu_env *env,
995 struct lfsck_instance *lfsck);
997 /* lfsck_striped_dir.c */
998 void lfsck_lmv_put(const struct lu_env *env, struct lfsck_lmv *llmv);
999 int lfsck_read_stripe_lmv(const struct lu_env *env, struct dt_object *obj,
1000 struct lmv_mds_md_v1 *lmv);
1001 int lfsck_shard_name_to_index(const struct lu_env *env, const char *name,
1002 int namelen, __u16 type,
1003 const struct lu_fid *fid);
1004 bool lfsck_is_valid_slave_name_entry(const struct lu_env *env,
1005 struct lfsck_lmv *llmv,
1006 const char *name, int namelen);
1007 int lfsck_namespace_check_name(const struct lu_env *env,
1008 struct dt_object *parent,
1009 struct dt_object *child,
1010 const struct lu_name *cname);
1011 int lfsck_namespace_update_lmv(const struct lu_env *env,
1012 struct lfsck_component *com,
1013 struct dt_object *obj,
1014 struct lmv_mds_md_v1 *lmv, bool locked);
1015 int lfsck_namespace_verify_stripe_slave(const struct lu_env *env,
1016 struct lfsck_component *com,
1017 struct dt_object *obj,
1018 struct lfsck_lmv *llmv);
1019 int lfsck_namespace_scan_shard(const struct lu_env *env,
1020 struct lfsck_component *com,
1021 struct dt_object *child);
1022 int lfsck_namespace_notify_lmv_master_local(const struct lu_env *env,
1023 struct lfsck_component *com,
1024 struct dt_object *obj);
1025 int lfsck_namespace_repair_bad_name_hash(const struct lu_env *env,
1026 struct lfsck_component *com,
1027 struct dt_object *shard,
1028 struct lfsck_lmv *llmv,
1030 int lfsck_namespace_striped_dir_rescan(const struct lu_env *env,
1031 struct lfsck_component *com,
1032 struct lfsck_namespace_req *lnr);
1033 int lfsck_namespace_handle_striped_master(const struct lu_env *env,
1034 struct lfsck_component *com,
1035 struct lfsck_namespace_req *lnr);
1037 /* lfsck_layout.c */
1038 int lfsck_layout_setup(const struct lu_env *env, struct lfsck_instance *lfsck);
1040 extern const char dot[];
1041 extern const char dotdot[];
1042 extern const char *lfsck_flags_names[];
1043 extern const char *lfsck_param_names[];
1044 extern struct lu_context_key lfsck_thread_key;
/**
 * Tell whether a name is the "." or ".." directory entry.
 *
 * Only the first @namelen bytes of @name are examined, so @name does not
 * have to be NUL-terminated.
 *
 * \param[in] name	the name bytes
 * \param[in] namelen	the number of valid bytes in @name
 *
 * \retval		true if the name is exactly "." or ".."
 * \retval		false otherwise (including any @namelen other than
 *			1 or 2)
 */
static inline bool name_is_dot_or_dotdot(const char *name, int namelen)
{
	/* Check the length first so that no byte beyond @namelen is read,
	 * not even name[0] when the name is empty. */
	if (namelen != 1 && namelen != 2)
		return false;

	if (name[0] != '.')
		return false;

	return namelen == 1 || name[1] == '.';
}
1052 static inline struct dt_device *lfsck_obj2dev(struct dt_object *obj)
1054 return container_of0(obj->do_lu.lo_dev, struct dt_device, dd_lu_dev);
/* Fetch the struct lfsck_thread_info stored in the context of @env under
 * lfsck_thread_key; asserts that it exists. */
1057 static inline struct lfsck_thread_info *
1058 lfsck_env_info(const struct lu_env *env)
1060 struct lfsck_thread_info *info;
1062 info = lu_context_key_get(&env->le_ctx, &lfsck_thread_key);
1063 LASSERT(info != NULL);
/* Fill the scratch lu_name of @env (lfsck_thread_info::lti_name_const) with
 * the name @area of length @len. The same scratch slot is used on every
 * call, so a later call with the same @env overwrites the earlier name. */
1067 static inline const struct lu_name *
1068 lfsck_name_get_const(const struct lu_env *env, const void *area, ssize_t len)
1070 struct lu_name *lname;
1072 lname = &lfsck_env_info(env)->lti_name_const;
1073 lname->ln_name = area;
1074 lname->ln_namelen = len;
1079 lfsck_buf_init(struct lu_buf *buf, void *area, ssize_t len)
/* Works on the scratch lu_buf of @env (lfsck_thread_info::lti_buf), the same
 * slot that lfsck_buf_get_const() uses.
 * NOTE(review): presumably points it at @area/@len and returns it - confirm. */
1085 static inline struct lu_buf *
1086 lfsck_buf_get(const struct lu_env *env, void *area, ssize_t len)
1090 buf = &lfsck_env_info(env)->lti_buf;
/* Point the scratch lu_buf of @env (lfsck_thread_info::lti_buf, shared with
 * lfsck_buf_get()) at the read-only area @area. */
1096 static inline const struct lu_buf *
1097 lfsck_buf_get_const(const struct lu_env *env, const void *area, ssize_t len)
1101 buf = &lfsck_env_info(env)->lti_buf;
/* lb_buf is not const-qualified, hence the cast that drops const. */
1102 buf->lb_buf = (void *)area;
1107 static inline char *lfsck_lfsck2name(struct lfsck_instance *lfsck)
1109 return lfsck->li_bottom->dd_lu_dev.ld_obd->obd_name;
1112 static inline const struct lu_fid *lfsck_dto2fid(const struct dt_object *obj)
1114 return lu_object_fid(&obj->do_lu);
1117 static inline void lfsck_pos_set_zero(struct lfsck_position *pos)
1119 memset(pos, 0, sizeof(*pos));
1122 static inline int lfsck_pos_is_zero(const struct lfsck_position *pos)
1124 return pos->lp_oit_cookie == 0 && fid_is_zero(&pos->lp_dir_parent);
/* Compare two LFSCK positions.  Despite the "is_eq" name the tests below
 * are ordered comparisons, applied in this priority:
 *   1. lp_oit_cookie,
 *   2. whether lp_dir_parent is the zero FID,
 *   3. lp_dir_cookie (only reached when both parents are non-zero).
 * NOTE(review): the return statement of every branch is missing from this
 * listing; presumably a three-way result (negative / 0 / positive) --
 * confirm against the full source before relying on the sign. */
1127 static inline int lfsck_pos_is_eq(const struct lfsck_position *pos1,
1128 const struct lfsck_position *pos2)
/* Step 1: order by the object-table iteration cookie. */
1130 if (pos1->lp_oit_cookie < pos2->lp_oit_cookie)
1133 if (pos1->lp_oit_cookie > pos2->lp_oit_cookie)
/* Step 2: same OIT cookie; only pos2 has a directory parent. */
1136 if (fid_is_zero(&pos1->lp_dir_parent) &&
1137 !fid_is_zero(&pos2->lp_dir_parent))
/* Only pos1 has a directory parent. */
1140 if (!fid_is_zero(&pos1->lp_dir_parent) &&
1141 fid_is_zero(&pos2->lp_dir_parent))
/* Neither position has a directory parent. */
1144 if (fid_is_zero(&pos1->lp_dir_parent) &&
1145 fid_is_zero(&pos2->lp_dir_parent))
/* Both parents are set: with equal OIT cookies they are asserted to be
 * the same directory. */
1148 LASSERT(lu_fid_eq(&pos1->lp_dir_parent, &pos2->lp_dir_parent));
/* Step 3: order by the cookie inside that directory. */
1150 if (pos1->lp_dir_cookie < pos2->lp_dir_cookie)
1153 if (pos1->lp_dir_cookie > pos2->lp_dir_cookie)
1159 static void inline lfsck_position_le_to_cpu(struct lfsck_position *des,
1160 struct lfsck_position *src)
1162 des->lp_oit_cookie = le64_to_cpu(src->lp_oit_cookie);
1163 fid_le_to_cpu(&des->lp_dir_parent, &src->lp_dir_parent);
1164 des->lp_dir_cookie = le64_to_cpu(src->lp_dir_cookie);
1167 static void inline lfsck_position_cpu_to_le(struct lfsck_position *des,
1168 struct lfsck_position *src)
1170 des->lp_oit_cookie = cpu_to_le64(src->lp_oit_cookie);
1171 fid_cpu_to_le(&des->lp_dir_parent, &src->lp_dir_parent);
1172 des->lp_dir_cookie = cpu_to_le64(src->lp_dir_cookie);
1175 static inline umode_t lfsck_object_type(const struct dt_object *obj)
1177 return lu_object_attr(&obj->do_lu);
1180 static inline int lfsck_is_dead_obj(const struct dt_object *obj)
1182 struct lu_object_header *loh = obj->do_lu.lo_header;
1184 return !!test_bit(LU_OBJECT_HEARD_BANSHEE, &loh->loh_flags);
1187 static inline struct dt_object *lfsck_object_get(struct dt_object *obj)
1189 lu_object_get(&obj->do_lu);
1193 static inline void lfsck_object_put(const struct lu_env *env,
1194 struct dt_object *obj)
1196 lu_object_put(env, &obj->do_lu);
1199 static inline struct seq_server_site
1200 *lfsck_dev_site(struct lfsck_instance *lfsck)
1202 return lu_site2seq(lfsck->li_bottom->dd_lu_dev.ld_site);
1205 static inline u32 lfsck_dev_idx(struct lfsck_instance *lfsck)
1207 return lfsck_dev_site(lfsck)->ss_node_id;
1210 static inline struct dt_object *
1211 lfsck_object_find_by_dev_nowait(const struct lu_env *env, struct dt_device *dev,
1212 const struct lu_fid *fid)
1214 struct lu_object_conf *conf = &lfsck_env_info(env)->lti_conf;
1216 conf->loc_flags = LOC_F_NOWAIT;
1217 return lu2dt(lu_object_find_slice(env, dt2lu_dev(dev), fid, conf));
/**
 * Look up the slice of object \a fid on \a dev with no lookup
 * configuration (NULL conf).
 *
 * \param[in] env	execution environment
 * \param[in] dev	device to search on
 * \param[in] fid	FID of the wanted object
 *
 * \return		lu2dt() of whatever lu_object_find_slice() returned
 */
static inline struct dt_object *
lfsck_object_find_by_dev(const struct lu_env *env, struct dt_device *dev,
			 const struct lu_fid *fid)
{
	struct lu_device *lu_dev = dt2lu_dev(dev);

	return lu2dt(lu_object_find_slice(env, lu_dev, fid, NULL));
}
/* Choose the dt_device to use for @fid.
 *
 * A non-master instance always answers with li_bottom.  On the master the
 * MDT index of @fid is looked up: the local index maps to li_bottom, any
 * other index is resolved through the li_mdt_descs table.
 *
 * Visible error results: ERR_PTR(idx) for a failed index lookup and
 * ERR_PTR(-ENODEV) when the table has no descriptor for the index.
 * NOTE(review): the declaration of idx, the test guarding ERR_PTR(idx),
 * the "else", the assignment of dev from the descriptor and the final
 * return are not visible in this listing. */
1227 static inline struct dt_device *
1228 lfsck_find_dev_by_fid(const struct lu_env *env, struct lfsck_instance *lfsck,
1229 const struct lu_fid *fid)
1231 struct dt_device *dev;
/* Nothing to resolve unless this instance is the master. */
1234 if (!lfsck->li_master)
1235 return lfsck->li_bottom;
1237 idx = lfsck_find_mdt_idx_by_fid(env, lfsck, fid);
/* Presumably taken only when idx is negative -- the condition line is
 * missing. */
1239 return ERR_PTR(idx);
/* The FID lives on the local MDT. */
1241 if (idx == lfsck_dev_idx(lfsck)) {
1242 dev = lfsck->li_bottom;
1244 struct lfsck_tgt_desc *ltd;
/* Remote MDT: find its descriptor; no reference is taken on it in the
 * visible lines. */
1246 ltd = LTD_TGT(&lfsck->li_mdt_descs, idx);
1247 if (unlikely(ltd == NULL))
1248 return ERR_PTR(-ENODEV);
/* Find object @fid on the device selected by lfsck_find_dev_by_fid().
 * NOTE(review): the condition guarding the first return is missing from
 * this listing; presumably an IS_ERR(dev) test, so that the error pointer
 * is passed through re-typed as a dt_object pointer -- confirm. */
1256 static inline struct dt_object *
1257 lfsck_object_find_bottom(const struct lu_env *env, struct lfsck_instance *lfsck,
1258 const struct lu_fid *fid)
1260 struct dt_device *dev;
1262 dev = lfsck_find_dev_by_fid(env, lfsck, fid);
/* The cast only changes the pointer type, not the value. */
1264 return (struct dt_object *)dev;
1266 return lfsck_object_find_by_dev(env, dev, fid);
/* Same as lfsck_object_find_bottom(), but the lookup goes through
 * lfsck_object_find_by_dev_nowait(), which sets LOC_F_NOWAIT.
 * NOTE(review): the condition guarding the first return is missing from
 * this listing; presumably an IS_ERR(dev) test -- confirm. */
1269 static inline struct dt_object *
1270 lfsck_object_find_bottom_nowait(const struct lu_env *env,
1271 struct lfsck_instance *lfsck,
1272 const struct lu_fid *fid)
1274 struct dt_device *dev;
1276 dev = lfsck_find_dev_by_fid(env, lfsck, fid);
/* The cast only changes the pointer type, not the value. */
1278 return (struct dt_object *)dev;
1280 return lfsck_object_find_by_dev_nowait(env, dev, fid);
/* Find the slice of @obj that belongs to @dev.
 *
 * When @obj already sits on @dev no search is needed; otherwise the
 * object's header is searched with lu_object_locate() for the slice whose
 * device type is dev's ld_type, and ERR_PTR(-ENOENT) is returned when
 * there is none.
 * NOTE(review): both success returns (and the "else") are missing from
 * this listing; presumably @obj itself and the dt view of lo -- confirm. */
1283 static inline struct dt_object *
1284 lfsck_object_locate(struct dt_device *dev, struct dt_object *obj)
1286 if (lfsck_obj2dev(obj) == dev) {
1289 struct lu_object *lo;
1291 lo = lu_object_locate(obj->do_lu.lo_header,
1292 dev->dd_lu_dev.ld_type);
1293 if (unlikely(lo == NULL))
1294 return ERR_PTR(-ENOENT);
/* Look up the target descriptor for @index in @ltds with LTD_TGT() and
 * increment its ltd_ref.
 * NOTE(review): the second parameter line (type of index), any NULL check
 * in front of the increment and the return statement are not visible in
 * this listing. */
1300 static inline struct lfsck_tgt_desc *lfsck_tgt_get(struct lfsck_tgt_descs *ltds,
1303 struct lfsck_tgt_desc *ltd;
1305 ltd = LTD_TGT(ltds, index);
1307 atomic_inc(&ltd->ltd_ref);
/* Drop one reference on a target descriptor.
 * NOTE(review): the statement executed when ltd_ref reaches zero is not
 * visible in this listing. */
1312 static inline void lfsck_tgt_put(struct lfsck_tgt_desc *ltd)
1314 if (atomic_dec_and_test(&ltd->ltd_ref))
1318 static inline struct lfsck_component *
1319 lfsck_component_get(struct lfsck_component *com)
1321 atomic_inc(&com->lc_ref);
/* Drop one reference on @com.  When the last reference goes away the
 * resources hanging off the component are released in the order below.
 * NOTE(review): the declaration of i and whatever follows the lc_data
 * release (e.g. freeing com itself) are not visible in this listing. */
1326 static inline void lfsck_component_put(const struct lu_env *env,
1327 struct lfsck_component *com)
1329 if (atomic_dec_and_test(&com->lc_ref)) {
1330 struct lfsck_sub_trace_obj *lsto;
/* Release every sub-trace object that was actually set up. */
1333 for (i = 0, lsto = &com->lc_sub_trace_objs[0];
1334 i < LFSCK_STF_COUNT; i++, lsto++) {
1335 if (lsto->lsto_obj != NULL)
1336 lfsck_object_put(env, lsto->lsto_obj);
1339 if (com->lc_obj != NULL)
1340 lfsck_object_put(env, com->lc_obj);
/* Both file images are freed with the same size, lc_file_size. */
1341 if (com->lc_file_ram != NULL)
1342 OBD_FREE(com->lc_file_ram, com->lc_file_size);
1343 if (com->lc_file_disk != NULL)
1344 OBD_FREE(com->lc_file_disk, com->lc_file_size);
/* Component-private data is released through the component's own
 * lfsck_data_release method, which must exist when lc_data is set. */
1345 if (com->lc_data != NULL) {
1346 LASSERT(com->lc_ops->lfsck_data_release != NULL);
1348 com->lc_ops->lfsck_data_release(env, com);
1355 static inline struct lfsck_instance *
1356 lfsck_instance_get(struct lfsck_instance *lfsck)
1358 atomic_inc(&lfsck->li_ref);
1363 static inline void lfsck_instance_put(const struct lu_env *env,
1364 struct lfsck_instance *lfsck)
1366 if (atomic_dec_and_test(&lfsck->li_ref))
1367 lfsck_instance_cleanup(env, lfsck);
1370 static inline bool lfsck_phase2_next_ready(struct lfsck_assistant_data *lad)
1372 return list_empty(&lad->lad_mdt_phase1_list) &&
1373 (!list_empty(&lad->lad_ost_phase2_list) ||
1374 list_empty(&lad->lad_ost_phase1_list));
/* Record target @index in the assistant's bitmap and flag the assistant
 * data as incomplete.  Only valid on the master, and only when the bitmap
 * exists (both are asserted).
 * NOTE(review): the line declaring the index parameter is missing from
 * this listing, so its type cannot be stated here. */
1377 static inline void lfsck_lad_set_bitmap(const struct lu_env *env,
1378 struct lfsck_component *com,
1381 struct lfsck_assistant_data *lad = com->lc_data;
1382 cfs_bitmap_t *bitmap = lad->lad_bitmap;
1384 LASSERT(com->lc_lfsck->li_master);
1385 LASSERT(bitmap != NULL);
/* Expected case: the index fits into the bitmap. */
1387 if (likely(bitmap->size > index)) {
1388 cfs_bitmap_set(bitmap, index);
1389 lad->lad_incomplete = 1;
/* Index beyond the bitmap: a namespace component falls back to setting
 * LF_INCOMPLETE in its in-RAM file; other component types record nothing
 * in the visible code. */
1390 } else if (com->lc_type == LFSCK_TYPE_NAMESPACE) {
1391 struct lfsck_namespace *ns = com->lc_file_ram;
1393 ns->ln_flags |= LF_INCOMPLETE;
/* Read the link EA of @obj into @ldata, using the per-thread
 * lti_linkea_buf as backing buffer, then delegate to __lfsck_links_read()
 * and return its result.
 * NOTE(review): the line that receives the result of
 * lu_buf_check_and_alloc() and the line with its size argument are missing
 * from this listing; presumably the buffer is stored in @ldata -- confirm. */
1397 static inline int lfsck_links_read(const struct lu_env *env,
1398 struct dt_object *obj,
1399 struct linkea_data *ldata)
1402 lu_buf_check_and_alloc(&lfsck_env_info(env)->lti_linkea_buf,
1405 return __lfsck_links_read(env, obj, ldata);
/* Variant of lfsck_links_read() that is backed by the second per-thread
 * buffer, lti_linkea_buf2, instead of lti_linkea_buf.
 * NOTE(review): the line that receives the result of
 * lu_buf_check_and_alloc() and the line with its size argument are missing
 * from this listing. */
1408 static inline int lfsck_links_read2(const struct lu_env *env,
1409 struct dt_object *obj,
1410 struct linkea_data *ldata)
1413 lu_buf_check_and_alloc(&lfsck_env_info(env)->lti_linkea_buf2,
1416 return __lfsck_links_read(env, obj, ldata);
/* Take a reference on @llmv (ll_ref is incremented).
 * NOTE(review): one line in front of the increment and the return
 * statement are missing from this listing; presumably a NULL guard and
 * "return llmv" -- confirm. */
1419 static inline struct lfsck_lmv *lfsck_lmv_get(struct lfsck_lmv *llmv)
1422 atomic_inc(&llmv->ll_ref);
1427 static inline int lfsck_sub_trace_file_fid2idx(const struct lu_fid *fid)
1429 return fid->f_oid & (LFSCK_STF_COUNT - 1);
1432 static inline void lfsck_lmv_header_le_to_cpu(struct lmv_mds_md_v1 *dst,
1433 const struct lmv_mds_md_v1 *src)
1435 dst->lmv_magic = le32_to_cpu(src->lmv_magic);
1436 dst->lmv_stripe_count = le32_to_cpu(src->lmv_stripe_count);
1437 dst->lmv_master_mdt_index = le32_to_cpu(src->lmv_master_mdt_index);
1438 dst->lmv_hash_type = le32_to_cpu(src->lmv_hash_type);
1439 dst->lmv_layout_version = le32_to_cpu(src->lmv_layout_version);
1442 static inline void lfsck_lmv_header_cpu_to_le(struct lmv_mds_md_v1 *dst,
1443 const struct lmv_mds_md_v1 *src)
1445 dst->lmv_magic = cpu_to_le32(src->lmv_magic);
1446 dst->lmv_stripe_count = cpu_to_le32(src->lmv_stripe_count);
1447 dst->lmv_master_mdt_index = cpu_to_le32(src->lmv_master_mdt_index);
1448 dst->lmv_hash_type = cpu_to_le32(src->lmv_hash_type);
1449 dst->lmv_layout_version = cpu_to_le32(src->lmv_layout_version);
1452 static inline struct lfsck_assistant_object *
1453 lfsck_assistant_object_get(struct lfsck_assistant_object *lso)
1455 atomic_inc(&lso->lso_ref);
/* Drop one reference on an assistant object.
 * NOTE(review): the return-type line and the statement executed when
 * lso_ref reaches zero are not visible in this listing; @env is not used
 * by the visible lines. */
1461 lfsck_assistant_object_put(const struct lu_env *env,
1462 struct lfsck_assistant_object *lso)
1464 if (atomic_dec_and_test(&lso->lso_ref))
1467 #endif /* _LFSCK_INTERNAL_H */