Whamcloud - gitweb
e2fsck: copy fs when using multi-thread fsck
[tools/e2fsprogs.git] / e2fsck / pass1.c
1 /*
2  * pass1.c -- pass #1 of e2fsck: sequential scan of the inode table
3  *
4  * Copyright (C) 1993, 1994, 1995, 1996, 1997 Theodore Ts'o.
5  *
6  * %Begin-Header%
7  * This file may be redistributed under the terms of the GNU Public
8  * License.
9  * %End-Header%
10  *
11  * Pass 1 of e2fsck iterates over all the inodes in the filesystems,
12  * and applies the following tests to each inode:
13  *
14  *      - The mode field of the inode must be legal.
15  *      - The size and block count fields of the inode are correct.
16  *      - A data block must not be used by another inode
17  *
18  * Pass 1 also collects the following information:
19  *
20  *      - A bitmap of which inodes are in use.          (inode_used_map)
21  *      - A bitmap of which inodes are directories.     (inode_dir_map)
22  *      - A bitmap of which inodes are regular files.   (inode_reg_map)
23  *      - A bitmap of which inodes have bad fields.     (inode_bad_map)
24  *      - A bitmap of which inodes are in bad blocks.   (inode_bb_map)
25  *      - A bitmap of which inodes are imagic inodes.   (inode_imagic_map)
26  *      - A bitmap of which inodes are casefolded.      (inode_casefold_map)
27  *      - A bitmap of which blocks are in use.          (block_found_map)
28  *      - A bitmap of which blocks are in use by two inodes     (block_dup_map)
29  *      - The data blocks of the directory inodes.      (dir_map)
30  *      - Ref counts for ea_inodes.                     (ea_inode_refs)
31  *      - The encryption policy ID of each encrypted inode. (encrypted_files)
32  *
33  * Pass 1 is designed to stash away enough information so that the
34  * other passes should not need to read in the inode information
35  * during the normal course of a filesystem check.  (Although if an
36  * inconsistency is detected, other passes may need to read in an
37  * inode to fix it.)
38  *
39  * Note that pass 1B will be invoked if there are any duplicate blocks
40  * found.
41  */
42
43 #define _GNU_SOURCE 1 /* get strnlen() */
44 #include "config.h"
45 #include <string.h>
46 #include <time.h>
47 #ifdef HAVE_ERRNO_H
48 #include <errno.h>
49 #endif
50
51 #include "e2fsck.h"
52 #include <ext2fs/ext2_ext_attr.h>
53 /* todo remove this finally */
54 #include <ext2fs/ext2fsP.h>
55 #include <e2p/e2p.h>
56
57 #include "problem.h"
58
/* _INLINE_ expands to `inline`, or to nothing when NO_INLINE_FUNCS is defined. */
59 #ifdef NO_INLINE_FUNCS
60 #define _INLINE_
61 #else
62 #define _INLINE_ inline
63 #endif
64
65 #undef DEBUG
66
/*
 * Quota usage attributed to extended attributes whose values are stored
 * in separate EA inodes (accumulated by check_ea_in_inode()).
 */
67 struct ea_quota {
68         blk64_t blocks;         /* blocks charged for EA-inode values */
69         __u64 inodes;           /* number of EA-inode references counted */
70 };
71
/*
 * Forward declarations of file-local (static) helpers.  Their definitions
 * are not in this part of the file.
 */
72 static int process_block(ext2_filsys fs, blk64_t        *blocknr,
73                          e2_blkcnt_t blockcnt, blk64_t ref_blk,
74                          int ref_offset, void *priv_data);
75 static int process_bad_block(ext2_filsys fs, blk64_t *block_nr,
76                              e2_blkcnt_t blockcnt, blk64_t ref_blk,
77                              int ref_offset, void *priv_data);
78 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
79                          char *block_buf,
80                          const struct ea_quota *ea_ibody_quota);
81 static void mark_table_blocks(e2fsck_t ctx);
82 static void alloc_bb_map(e2fsck_t ctx);
83 static void alloc_imagic_map(e2fsck_t ctx);
84 static void mark_inode_bad(e2fsck_t ctx, ino_t ino);
85 static void add_casefolded_dir(e2fsck_t ctx, ino_t ino);
86 static void handle_fs_bad_blocks(e2fsck_t ctx);
87 static void process_inodes(e2fsck_t ctx, char *block_buf);
88 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b);
89 static errcode_t scan_callback(ext2_filsys fs, ext2_inode_scan scan,
90                                   dgrp_t group, void * priv_data);
91 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
92                                     char *block_buf, int adjust_sign);
93 /* static char *describe_illegal_block(ext2_filsys fs, blk64_t block); */
94
/*
 * Per-inode state for block processing.
 * NOTE(review): presumably this is what process_block() and
 * process_bad_block() receive through their void *priv_data argument;
 * confirm at the call sites, which are outside this part of the file.
 */
95 struct process_block_struct {
96         ext2_ino_t      ino;            /* inode number being processed */
97         unsigned        is_dir:1, is_reg:1, clear:1, suppress:1,
98                                 fragmented:1, compressed:1, bbcheck:1,
99                                 inode_modified:1;       /* one-bit status flags */
100         blk64_t         num_blocks;
101         blk64_t         max_blocks;
102         blk64_t         last_block;
103         e2_blkcnt_t     last_init_lblock;
104         e2_blkcnt_t     last_db_block;
105         int             num_illegal_blocks;
106         blk64_t         previous_block;
107         struct ext2_inode *inode;       /* inode the blocks belong to */
108         struct problem_context *pctx;   /* problem-reporting context */
109         ext2fs_block_bitmap fs_meta_blocks;
110         e2fsck_t        ctx;            /* owning e2fsck context */
111         blk64_t         next_lblock;
112         struct extent_tree_info eti;
113 };
114
/*
 * Element type of the inodes_to_process list: an inode number, the quota
 * attributed to its in-body EAs, and a copy of the inode in its large form.
 */
115 struct process_inode_block {
116         ext2_ino_t ino;
117         struct ea_quota ea_ibody_quota;
118         struct ext2_inode_large inode;
119 };
120
/*
 * Bundles the e2fsck context with a block buffer.
 * NOTE(review): presumably passed to scan_callback() as its priv_data;
 * confirm where the callback is registered.
 */
121 struct scan_callback_struct {
122         e2fsck_t        ctx;
123         char            *block_buf;
124 };
125
126 /*
127  * For the inodes to process list.
       *
       * NOTE(review): these are file-scope mutable objects.  If pass 1 is ever
       * run from more than one thread they are shared between the threads;
       * confirm how the multi-thread fsck work handles that.
128  */
129 static struct process_inode_block *inodes_to_process;  /* the list itself */
130 static int process_inode_count;         /* presumably the number of entries queued; verify */
131
/* One slot per block-size log2 value, EXT2_MIN_BLOCK_LOG_SIZE through EXT2_MAX_BLOCK_LOG_SIZE inclusive. */
132 static __u64 ext2_max_sizes[EXT2_MAX_BLOCK_LOG_SIZE -
133                             EXT2_MIN_BLOCK_LOG_SIZE + 1];
134
135 /*
136  * Check to make sure a device inode is real.  Returns 1 if the device
137  * checks out, 0 if not.
138  *
139  * Note: this routine is now also used to check FIFO's and Sockets,
140  * since they have the same requirement; the i_block fields should be
141  * zero.
142  */
143 int e2fsck_pass1_check_device_inode(ext2_filsys fs EXT2FS_ATTR((unused)),
144                                     struct ext2_inode *inode)
145 {
146         int     i;
147
148         /*
149          * If the index or extents flag is set, then this is a bogus
150          * device/fifo/socket
151          */
152         if (inode->i_flags & (EXT2_INDEX_FL | EXT4_EXTENTS_FL))
153                 return 0;
154
155         /*
156          * We should be able to do the test below all the time, but
157          * because the kernel doesn't forcibly clear the device
158          * inode's additional i_block fields, there are some rare
159          * occasions when a legitimate device inode will have non-zero
160          * additional i_block fields.  So for now, we only complain
161          * when the immutable flag is set, which should never happen
162          * for devices.  (And that's when the problem is caused, since
163          * you can't set or clear immutable flags for devices.)  Once
164          * the kernel has been fixed we can change this...
165          */
166         if (inode->i_flags & (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)) {
167                 for (i=4; i < EXT2_N_BLOCKS; i++)
168                         if (inode->i_block[i])
169                                 return 0;
170         }
171         return 1;
172 }
173
174 /*
175  * Check to make sure a symlink inode is real.  Returns 1 if the symlink
176  * checks out, 0 if not.
177  */
178 int e2fsck_pass1_check_symlink(ext2_filsys fs, ext2_ino_t ino,
179                                struct ext2_inode *inode, char *buf)
180 {
181         unsigned int buflen;
182         unsigned int len;
183
184         if ((inode->i_size_high || inode->i_size == 0) ||
185             (inode->i_flags & EXT2_INDEX_FL))
186                 return 0;
187
188         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
189                 size_t inline_size;
190
191                 if (inode->i_flags & EXT4_EXTENTS_FL)
192                         return 0;
193                 if (ext2fs_inline_data_size(fs, ino, &inline_size))
194                         return 0;
195                 if (inode->i_size != inline_size)
196                         return 0;
197
198                 return 1;
199         }
200
201         if (ext2fs_is_fast_symlink(inode)) {
202                 if (inode->i_flags & EXT4_EXTENTS_FL)
203                         return 0;
204                 buf = (char *)inode->i_block;
205                 buflen = sizeof(inode->i_block);
206         } else {
207                 ext2_extent_handle_t    handle;
208                 struct ext2_extent_info info;
209                 struct ext2fs_extent    extent;
210                 blk64_t blk;
211                 int i;
212
213                 if (inode->i_flags & EXT4_EXTENTS_FL) {
214                         if (ext2fs_extent_open2(fs, ino, inode, &handle))
215                                 return 0;
216                         if (ext2fs_extent_get_info(handle, &info) ||
217                             (info.num_entries != 1) ||
218                             (info.max_depth != 0)) {
219                                 ext2fs_extent_free(handle);
220                                 return 0;
221                         }
222                         if (ext2fs_extent_get(handle, EXT2_EXTENT_ROOT,
223                                               &extent) ||
224                             (extent.e_lblk != 0) ||
225                             (extent.e_len != 1)) {
226                                 ext2fs_extent_free(handle);
227                                 return 0;
228                         }
229                         blk = extent.e_pblk;
230                         ext2fs_extent_free(handle);
231                 } else {
232                         blk = inode->i_block[0];
233
234                         for (i = 1; i < EXT2_N_BLOCKS; i++)
235                                 if (inode->i_block[i])
236                                         return 0;
237                 }
238
239                 if (blk < fs->super->s_first_data_block ||
240                     blk >= ext2fs_blocks_count(fs->super))
241                         return 0;
242
243                 if (io_channel_read_blk64(fs->io, blk, 1, buf))
244                         return 0;
245
246                 buflen = fs->blocksize;
247         }
248
249         if (inode->i_flags & EXT4_ENCRYPT_FL)
250                 len = ext2fs_le16_to_cpu(*(__u16 *)buf) + 2;
251         else
252                 len = strnlen(buf, buflen);
253
254         if (len >= buflen)
255                 return 0;
256
257         if (len != inode->i_size)
258                 return 0;
259         return 1;
260 }
261
262 /*
263  * If the extents or inlinedata flags are set on the inode, offer to clear 'em.
264  */
265 #define BAD_SPECIAL_FLAGS (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)
266 static void check_extents_inlinedata(e2fsck_t ctx,
267                                      struct problem_context *pctx)
268 {
269         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
270                 return;
271
272         if (!fix_problem(ctx, PR_1_SPECIAL_EXTENTS_IDATA, pctx))
273                 return;
274
275         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
276         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
277 }
278 #undef BAD_SPECIAL_FLAGS
279
280 /*
281  * If the immutable (or append-only) flag is set on the inode, offer
282  * to clear it.
283  */
284 #define BAD_SPECIAL_FLAGS (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)
285 static void check_immutable(e2fsck_t ctx, struct problem_context *pctx)
286 {
287         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
288                 return;
289
290         if (!fix_problem(ctx, PR_1_SET_IMMUTABLE, pctx))
291                 return;
292
293         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
294         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
295 }
296
297 /*
298  * If device, fifo or socket, check size is zero -- if not offer to
299  * clear it
300  */
301 static void check_size(e2fsck_t ctx, struct problem_context *pctx)
302 {
303         struct ext2_inode *inode = pctx->inode;
304
305         if (EXT2_I_SIZE(inode) == 0)
306                 return;
307
308         if (!fix_problem(ctx, PR_1_SET_NONZSIZE, pctx))
309                 return;
310
311         ext2fs_inode_size_set(ctx->fs, inode, 0);
312         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
313 }
314
315 /*
316  * For a given size, calculate how many blocks would be charged towards quota.
317  */
318 static blk64_t size_to_quota_blocks(ext2_filsys fs, size_t size)
319 {
320         blk64_t clusters;
321
322         clusters = DIV_ROUND_UP(size, fs->blocksize << fs->cluster_ratio_bits);
323         return EXT2FS_C2B(fs, clusters);
324 }
325
326 /*
327  * Check validity of EA inode. Return 0 if EA inode is valid, otherwise return
328  * the problem code.
329  */
330 static problem_t check_large_ea_inode(e2fsck_t ctx,
331                                       struct ext2_ext_attr_entry *entry,
332                                       struct problem_context *pctx,
333                                       blk64_t *quota_blocks)
334 {
335         struct ext2_inode inode;
336         __u32 hash;
337         errcode_t retval;
338
339         /* Check if inode is within valid range */
340         if ((entry->e_value_inum < EXT2_FIRST_INODE(ctx->fs->super)) ||
341             (entry->e_value_inum > ctx->fs->super->s_inodes_count)) {
342                 pctx->num = entry->e_value_inum;
343                 return PR_1_ATTR_VALUE_EA_INODE;
344         }
345
346         e2fsck_read_inode(ctx, entry->e_value_inum, &inode, "pass1");
347
348         retval = ext2fs_ext_attr_hash_entry2(ctx->fs, entry, NULL, &hash);
349         if (retval) {
350                 com_err("check_large_ea_inode", retval,
351                         _("while hashing entry with e_value_inum = %u"),
352                         entry->e_value_inum);
353                 fatal_error(ctx, 0);
354         }
355
356         if (hash == entry->e_hash) {
357                 *quota_blocks = size_to_quota_blocks(ctx->fs,
358                                                      entry->e_value_size);
359         } else {
360                 /* This might be an old Lustre-style ea_inode reference. */
361                 if (inode.i_mtime == pctx->ino &&
362                     inode.i_generation == pctx->inode->i_generation) {
363                         *quota_blocks = 0;
364                 } else {
365                         /* If target inode is also missing EA_INODE flag,
366                          * this is likely to be a bad reference.
367                          */
368                         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
369                                 pctx->num = entry->e_value_inum;
370                                 return PR_1_ATTR_VALUE_EA_INODE;
371                         } else {
372                                 pctx->num = entry->e_hash;
373                                 return PR_1_ATTR_HASH;
374                         }
375                 }
376         }
377
378         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
379                 pctx->num = entry->e_value_inum;
380                 if (fix_problem(ctx, PR_1_ATTR_SET_EA_INODE_FL, pctx)) {
381                         inode.i_flags |= EXT4_EA_INODE_FL;
382                         ext2fs_write_inode(ctx->fs, entry->e_value_inum,
383                                            &inode);
384                 } else {
385                         return PR_1_ATTR_NO_EA_INODE_FL;
386                 }
387         }
388         return 0;
389 }
390
391 static void inc_ea_inode_refs(e2fsck_t ctx, struct problem_context *pctx,
392                               struct ext2_ext_attr_entry *first, void *end)
393 {
394         struct ext2_ext_attr_entry *entry;
395
396         for (entry = first;
397              (void *)entry < end && !EXT2_EXT_IS_LAST_ENTRY(entry);
398              entry = EXT2_EXT_ATTR_NEXT(entry)) {
399                 if (!entry->e_value_inum)
400                         continue;
401                 if (!ctx->ea_inode_refs) {
402                         pctx->errcode = ea_refcount_create(0,
403                                                            &ctx->ea_inode_refs);
404                         if (pctx->errcode) {
405                                 pctx->num = 4;
406                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
407                                 ctx->flags |= E2F_FLAG_ABORT;
408                                 return;
409                         }
410                 }
411                 ea_refcount_increment(ctx->ea_inode_refs, entry->e_value_inum,
412                                       0);
413         }
414 }
415
/*
 * Validate the extended attributes stored in the body of the inode in
 * pctx->inode.
 *
 * The EA area starts right after the fixed 128-byte inode plus
 * i_extra_isize: first a __u32 header word, then the entry table.  Each
 * entry's name length, value size, value placement and hash are checked;
 * entries whose value lives in an EA inode are checked with
 * check_large_ea_inode() and accounted in *ea_ibody_quota.
 *
 * If a problem is found and the fix is accepted, the header word is
 * zeroed (dropping all in-body EAs), the inode is written back and the
 * quota is reset to zero.  If no problem is found, or the fix is
 * declined, the EAs are left alone and their EA-inode references are
 * counted with inc_ea_inode_refs().
 *
 * If the region tracker cannot be allocated, E2F_FLAG_ABORT is set on the
 * context and the function returns without checking anything.
 */
416 static void check_ea_in_inode(e2fsck_t ctx, struct problem_context *pctx,
417                               struct ea_quota *ea_ibody_quota)
418 {
419         struct ext2_super_block *sb = ctx->fs->super;
420         struct ext2_inode_large *inode;
421         struct ext2_ext_attr_entry *entry;
422         char *start, *header, *end;
423         unsigned int storage_size, remain;
424         problem_t problem = 0;
425         region_t region = 0;
426
427         ea_ibody_quota->blocks = 0;
428         ea_ibody_quota->inodes = 0;
429
430         inode = (struct ext2_inode_large *) pctx->inode;
            /* storage_size: bytes of the on-disk inode left after the fixed part and i_extra_isize */
431         storage_size = EXT2_INODE_SIZE(ctx->fs->super) - EXT2_GOOD_OLD_INODE_SIZE -
432                 inode->i_extra_isize;
            /* header: first byte of the EA area (the __u32 header word) */
433         header = ((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
434                  inode->i_extra_isize;
435         end = header + storage_size;
436         start = header + sizeof(__u32);         /* entry table begins after the header word */
437         entry = (struct ext2_ext_attr_entry *) start;
438
439         /* scan all entry's headers first */
440
441         /* take finish entry 0UL into account */
442         remain = storage_size - sizeof(__u32);
443
            /*
             * Each entry header and each value is registered in "region",
             * using offsets relative to "header"; a non-zero return from
             * region_allocate() is reported as an allocation collision.
             */
444         region = region_create(0, storage_size);
445         if (!region) {
446                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
447                 problem = 0;    /* NOTE(review): no effect, the function returns just below */
448                 ctx->flags |= E2F_FLAG_ABORT;
449                 return;
450         }
451         if (region_allocate(region, 0, sizeof(__u32))) {        /* the header word itself */
452                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
453                 goto fix;
454         }
455
456         while (remain >= sizeof(struct ext2_ext_attr_entry) &&
457                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
458                 __u32 hash;
459
460                 if (region_allocate(region, (char *)entry - (char *)header,
461                                     EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
462                         problem = PR_1_INODE_EA_ALLOC_COLLISION;
463                         goto fix;
464                 }
465
466                 /* header eats this space */
467                 remain -= sizeof(struct ext2_ext_attr_entry);
468
469                 /* is attribute name valid? */
470                 if (EXT2_EXT_ATTR_SIZE(entry->e_name_len) > remain) {
471                         pctx->num = entry->e_name_len;
472                         problem = PR_1_ATTR_NAME_LEN;
473                         goto fix;
474                 }
475
476                 /* attribute len eats this space */
477                 remain -= EXT2_EXT_ATTR_SIZE(entry->e_name_len);
478
479                 if (entry->e_value_inum == 0) {
                            /* value is stored in the inode body */
480                         /* check value size */
481                         if (entry->e_value_size > remain) {
482                                 pctx->num = entry->e_value_size;
483                                 problem = PR_1_ATTR_VALUE_SIZE;
484                                 goto fix;
485                         }
486
                            /*
                             * e_value_offs is relative to "start", while the
                             * region is relative to "header", hence the extra
                             * sizeof(__u32).
                             */
487                         if (entry->e_value_size &&
488                             region_allocate(region,
489                                             sizeof(__u32) + entry->e_value_offs,
490                                             EXT2_EXT_ATTR_SIZE(
491                                                 entry->e_value_size))) {
492                                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
493                                 goto fix;
494                         }
495
496                         hash = ext2fs_ext_attr_hash_entry(entry,
497                                                           start + entry->e_value_offs);
498
499                         /* e_hash may be 0 in older inode's ea */
500                         if (entry->e_hash != 0 && entry->e_hash != hash) {
501                                 pctx->num = entry->e_hash;
502                                 problem = PR_1_ATTR_HASH;
503                                 goto fix;
504                         }
505                 } else {
                            /* value is stored in a separate EA inode */
506                         blk64_t quota_blocks;
507
508                         problem = check_large_ea_inode(ctx, entry, pctx,
509                                                        &quota_blocks);
510                         if (problem != 0)
511                                 goto fix;
512
513                         ea_ibody_quota->blocks += quota_blocks;
514                         ea_ibody_quota->inodes++;
515                 }
516
517                 /* If EA value is stored in external inode then it does not
518                  * consume space here */
519                 if (entry->e_value_inum == 0)
520                         remain -= entry->e_value_size;
521
522                 entry = EXT2_EXT_ATTR_NEXT(entry);
523         }
524
            /* account for the __u32 at the position where the scan stopped */
525         if (region_allocate(region, (char *)entry - (char *)header,
526                             sizeof(__u32))) {
527                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
528                 goto fix;
529         }
530 fix:
            /* every path that gets here, with or without a problem, frees the region */
531         if (region)
532                 region_free(region);
533         /*
534          * it seems like a corruption. it's very unlikely we could repair
535          * EA(s) in automatic fashion -bzzz
536          */
            /* nothing wrong, or the fix was declined: keep the EAs and count their EA-inode references */
537         if (problem == 0 || !fix_problem(ctx, problem, pctx)) {
538                 inc_ea_inode_refs(ctx, pctx,
539                                   (struct ext2_ext_attr_entry *)start, end);
540                 return;
541         }
542
543         /* simply remove all possible EA(s) */
            /* check_inode_extra_space() only calls this function when this word equals EXT2_EXT_ATTR_MAGIC */
544         *((__u32 *)header) = 0UL;
545         e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
546                                 EXT2_INODE_SIZE(sb), "pass1");
547         ea_ibody_quota->blocks = 0;
548         ea_ibody_quota->inodes = 0;
549 }
550
551 static int check_inode_extra_negative_epoch(__u32 xtime, __u32 extra) {
552         return (xtime & (1U << 31)) != 0 &&
553                 (extra & EXT4_EPOCH_MASK) == EXT4_EPOCH_MASK;
554 }
555
/*
 * Apply check_inode_extra_negative_epoch() to one timestamp of a large
 * inode: "xtime" is the field stem (atime, ctime, crtime or mtime), and
 * the i_<xtime> / i_<xtime>_extra pair is tested.  The inode argument is
 * parenthesized so that any pointer expression can be passed.
 */
#define CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, xtime) \
	check_inode_extra_negative_epoch((inode)->i_##xtime, \
					 (inode)->i_##xtime##_extra)

/* When today's date is earlier than 2242, we assume that atimes,
 * ctimes, crtimes, and mtimes with years in the range 2310..2378 are
 * actually pre-1970 dates mis-encoded.
 *
 * The value is 2 * 2^32 seconds.  The expansion is fully parenthesized
 * so that it behaves as a single operand wherever it is used.
 */
#define EXT4_EXTRA_NEGATIVE_DATE_CUTOFF (2 * (1LL << 32))
565
566 static void check_inode_extra_space(e2fsck_t ctx, struct problem_context *pctx,
567                                     struct ea_quota *ea_ibody_quota)
568 {
569         struct ext2_super_block *sb = ctx->fs->super;
570         struct ext2_inode_large *inode;
571         __u32 *eamagic;
572         int min, max;
573
574         ea_ibody_quota->blocks = 0;
575         ea_ibody_quota->inodes = 0;
576
577         inode = (struct ext2_inode_large *) pctx->inode;
578         if (EXT2_INODE_SIZE(sb) == EXT2_GOOD_OLD_INODE_SIZE) {
579                 /* this isn't large inode. so, nothing to check */
580                 return;
581         }
582
583 #if 0
584         printf("inode #%u, i_extra_size %d\n", pctx->ino,
585                         inode->i_extra_isize);
586 #endif
587         /* i_extra_isize must cover i_extra_isize + i_checksum_hi at least */
588         min = sizeof(inode->i_extra_isize) + sizeof(inode->i_checksum_hi);
589         max = EXT2_INODE_SIZE(sb) - EXT2_GOOD_OLD_INODE_SIZE;
590         /*
591          * For now we will allow i_extra_isize to be 0, but really
592          * implementations should never allow i_extra_isize to be 0
593          */
594         if (inode->i_extra_isize &&
595             (inode->i_extra_isize < min || inode->i_extra_isize > max ||
596              inode->i_extra_isize & 3)) {
597                 if (!fix_problem(ctx, PR_1_EXTRA_ISIZE, pctx))
598                         return;
599                 if (inode->i_extra_isize < min || inode->i_extra_isize > max)
600                         inode->i_extra_isize = sb->s_want_extra_isize;
601                 else
602                         inode->i_extra_isize = (inode->i_extra_isize + 3) & ~3;
603                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
604                                         EXT2_INODE_SIZE(sb), "pass1");
605         }
606
607         /* check if there is no place for an EA header */
608         if (inode->i_extra_isize >= max - sizeof(__u32))
609                 return;
610
611         eamagic = (__u32 *) (((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
612                         inode->i_extra_isize);
613         if (*eamagic == EXT2_EXT_ATTR_MAGIC) {
614                 /* it seems inode has an extended attribute(s) in body */
615                 check_ea_in_inode(ctx, pctx, ea_ibody_quota);
616         }
617
618         /*
619          * If the inode's extended atime (ctime, crtime, mtime) is stored in
620          * the old, invalid format, repair it.
621          */
622         if (((sizeof(time_t) <= 4) ||
623              (((sizeof(time_t) > 4) &&
624                ctx->now < EXT4_EXTRA_NEGATIVE_DATE_CUTOFF))) &&
625             (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime) ||
626              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime) ||
627              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime) ||
628              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))) {
629
630                 if (!fix_problem(ctx, PR_1_EA_TIME_OUT_OF_RANGE, pctx))
631                         return;
632
633                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime))
634                         inode->i_atime_extra &= ~EXT4_EPOCH_MASK;
635                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime))
636                         inode->i_ctime_extra &= ~EXT4_EPOCH_MASK;
637                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime))
638                         inode->i_crtime_extra &= ~EXT4_EPOCH_MASK;
639                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))
640                         inode->i_mtime_extra &= ~EXT4_EPOCH_MASK;
641                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
642                                         EXT2_INODE_SIZE(sb), "pass1");
643         }
644
645 }
646
647 /*
648  * Check to see if the inode might really be a directory, despite i_mode
649  *
650  * This is a lot of complexity for something for which I'm not really
651  * convinced happens frequently in the wild.  If for any reason this
652  * causes any problems, take this code out.
653  * [tytso:20070331.0827EDT]
654  */
655 static void check_is_really_dir(e2fsck_t ctx, struct problem_context *pctx,
656                                 char *buf)
657 {
658         struct ext2_inode *inode = pctx->inode;
659         struct ext2_dir_entry   *dirent;
660         errcode_t               retval;
661         blk64_t                 blk;
662         unsigned int            i, rec_len, not_device = 0;
663         int                     extent_fs;
664         int                     inlinedata_fs;
665
666         /*
667          * If the mode looks OK, we believe it.  If the first block in
668          * the i_block array is 0, this cannot be a directory. If the
669          * inode is extent-mapped, it is still the case that the latter
670          * cannot be 0 - the magic number in the extent header would make
671          * it nonzero.
672          */
673         if (LINUX_S_ISDIR(inode->i_mode) || LINUX_S_ISREG(inode->i_mode) ||
674             LINUX_S_ISLNK(inode->i_mode) || inode->i_block[0] == 0)
675                 return;
676
677         /* 
678          * Check the block numbers in the i_block array for validity:
679          * zero blocks are skipped (but the first one cannot be zero -
680          * see above), other blocks are checked against the first and
681          * max data blocks (from the superblock) and against the
682          * block bitmap. Any invalid block found means this cannot be
683          * a directory.
684          * 
685          * If there are non-zero blocks past the fourth entry, then
686          * this cannot be a device file: we remember that for the next
687          * check.
688          *
689          * For extent mapped files, we don't do any sanity checking:
690          * just try to get the phys block of logical block 0 and run
691          * with it.
692          *
693          * For inline data files, we just try to get the size of inline
694          * data.  If it's true, we will treat it as a directory.
695          */
696
697         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
698         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
699         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL)) {
700                 size_t size;
701                 __u32 dotdot;
702                 unsigned int rec_len2;
703                 struct ext2_dir_entry de;
704
705                 if (ext2fs_inline_data_size(ctx->fs, pctx->ino, &size))
706                         return;
707                 /*
708                  * If the size isn't a multiple of 4, it's probably not a
709                  * directory??
710                  */
711                 if (size & 3)
712                         return;
713                 /*
714                  * If the first 10 bytes don't look like a directory entry,
715                  * it's probably not a directory.
716                  */
717                 memcpy(&dotdot, inode->i_block, sizeof(dotdot));
718                 memcpy(&de, ((char *)inode->i_block) + EXT4_INLINE_DATA_DOTDOT_SIZE,
719                        EXT2_DIR_REC_LEN(0));
720                 dotdot = ext2fs_le32_to_cpu(dotdot);
721                 de.inode = ext2fs_le32_to_cpu(de.inode);
722                 de.rec_len = ext2fs_le16_to_cpu(de.rec_len);
723                 ext2fs_get_rec_len(ctx->fs, &de, &rec_len2);
724                 if (dotdot >= ctx->fs->super->s_inodes_count ||
725                     (dotdot < EXT2_FIRST_INO(ctx->fs->super) &&
726                      dotdot != EXT2_ROOT_INO) ||
727                     de.inode >= ctx->fs->super->s_inodes_count ||
728                     (de.inode < EXT2_FIRST_INO(ctx->fs->super) &&
729                      de.inode != 0) ||
730                     rec_len2 > EXT4_MIN_INLINE_DATA_SIZE -
731                               EXT4_INLINE_DATA_DOTDOT_SIZE)
732                         return;
733                 /* device files never have a "system.data" entry */
734                 goto isdir;
735         } else if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) {
736                 /* extent mapped */
737                 if  (ext2fs_bmap2(ctx->fs, pctx->ino, inode, 0, 0, 0, 0,
738                                  &blk))
739                         return;
740                 /* device files are never extent mapped */
741                 not_device++;
742         } else {
743                 for (i=0; i < EXT2_N_BLOCKS; i++) {
744                         blk = inode->i_block[i];
745                         if (!blk)
746                                 continue;
747                         if (i >= 4)
748                                 not_device++;
749
750                         if (blk < ctx->fs->super->s_first_data_block ||
751                             blk >= ext2fs_blocks_count(ctx->fs->super) ||
752                             ext2fs_fast_test_block_bitmap2(ctx->block_found_map,
753                                                            blk))
754                                 return; /* Invalid block, can't be dir */
755                 }
756                 blk = inode->i_block[0];
757         }
758
759         /*
760          * If the mode says this is a device file and the i_links_count field
761          * is sane and we have not ruled it out as a device file previously,
762          * we declare it a device file, not a directory.
763          */
764         if ((LINUX_S_ISCHR(inode->i_mode) || LINUX_S_ISBLK(inode->i_mode)) &&
765             (inode->i_links_count == 1) && !not_device)
766                 return;
767
768         /* read the first block */
769         ehandler_operation(_("reading directory block"));
770         retval = ext2fs_read_dir_block4(ctx->fs, blk, buf, 0, pctx->ino);
771         ehandler_operation(0);
772         if (retval)
773                 return;
774
775         dirent = (struct ext2_dir_entry *) buf;
776         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
777         if (retval)
778                 return;
779         if ((ext2fs_dirent_name_len(dirent) != 1) ||
780             (dirent->name[0] != '.') ||
781             (dirent->inode != pctx->ino) ||
782             (rec_len < 12) ||
783             (rec_len % 4) ||
784             (rec_len >= ctx->fs->blocksize - 12))
785                 return;
786
787         dirent = (struct ext2_dir_entry *) (buf + rec_len);
788         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
789         if (retval)
790                 return;
791         if ((ext2fs_dirent_name_len(dirent) != 2) ||
792             (dirent->name[0] != '.') ||
793             (dirent->name[1] != '.') ||
794             (rec_len < 12) ||
795             (rec_len % 4))
796                 return;
797
798 isdir:
799         if (fix_problem(ctx, PR_1_TREAT_AS_DIRECTORY, pctx)) {
800                 inode->i_mode = (inode->i_mode & 07777) | LINUX_S_IFDIR;
801                 e2fsck_write_inode_full(ctx, pctx->ino, inode,
802                                         EXT2_INODE_SIZE(ctx->fs->super),
803                                         "check_is_really_dir");
804         }
805 }
806
807 extern errcode_t e2fsck_setup_icount(e2fsck_t ctx, const char *icount_name,
808                                      int flags, ext2_icount_t hint,
809                                      ext2_icount_t *ret)
810 {
811         unsigned int            threshold;
812         unsigned int            save_type;
813         ext2_ino_t              num_dirs;
814         errcode_t               retval;
815         char                    *tdb_dir;
816         int                     enable;
817
818         *ret = 0;
819
820         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
821                            &tdb_dir);
822         profile_get_uint(ctx->profile, "scratch_files",
823                          "numdirs_threshold", 0, 0, &threshold);
824         profile_get_boolean(ctx->profile, "scratch_files",
825                             "icount", 0, 1, &enable);
826
827         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
828         if (retval)
829                 num_dirs = 1024;        /* Guess */
830
831         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
832             (!threshold || num_dirs > threshold)) {
833                 retval = ext2fs_create_icount_tdb(ctx->fs, tdb_dir,
834                                                   flags, ret);
835                 if (retval == 0)
836                         return 0;
837         }
838         e2fsck_set_bitmap_type(ctx->fs, EXT2FS_BMAP64_RBTREE, icount_name,
839                                &save_type);
840         if (ctx->options & E2F_OPT_ICOUNT_FULLMAP)
841                 flags |= EXT2_ICOUNT_OPT_FULLMAP;
842         retval = ext2fs_create_icount2(ctx->fs, flags, 0, hint, ret);
843         ctx->fs->default_bitmap_type = save_type;
844         return retval;
845 }
846
847 static errcode_t recheck_bad_inode_checksum(ext2_filsys fs, ext2_ino_t ino,
848                                             e2fsck_t ctx,
849                                             struct problem_context *pctx)
850 {
851         errcode_t retval;
852         struct ext2_inode_large inode;
853
854         /*
855          * Reread inode.  If we don't see checksum error, then this inode
856          * has been fixed elsewhere.
857          */
858         ctx->stashed_ino = 0;
859         retval = ext2fs_read_inode_full(fs, ino, (struct ext2_inode *)&inode,
860                                         sizeof(inode));
861         if (retval && retval != EXT2_ET_INODE_CSUM_INVALID)
862                 return retval;
863         if (!retval)
864                 return 0;
865
866         /*
867          * Checksum still doesn't match.  That implies that the inode passes
868          * all the sanity checks, so maybe the checksum is simply corrupt.
869          * See if the user will go for fixing that.
870          */
871         if (!fix_problem(ctx, PR_1_INODE_ONLY_CSUM_INVALID, pctx))
872                 return 0;
873
874         retval = ext2fs_write_inode_full(fs, ino, (struct ext2_inode *)&inode,
875                                          sizeof(inode));
876         return retval;
877 }
878
879 static void reserve_block_for_root_repair(e2fsck_t ctx)
880 {
881         blk64_t         blk = 0;
882         errcode_t       err;
883         ext2_filsys     fs = ctx->fs;
884
885         ctx->root_repair_block = 0;
886         if (ext2fs_test_inode_bitmap2(ctx->inode_used_map, EXT2_ROOT_INO))
887                 return;
888
889         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
890         if (err)
891                 return;
892         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
893         ctx->root_repair_block = blk;
894 }
895
896 static void reserve_block_for_lnf_repair(e2fsck_t ctx)
897 {
898         blk64_t         blk = 0;
899         errcode_t       err;
900         ext2_filsys     fs = ctx->fs;
901         static const char name[] = "lost+found";
902         ext2_ino_t      ino;
903
904         ctx->lnf_repair_block = 0;
905         if (!ext2fs_lookup(fs, EXT2_ROOT_INO, name, sizeof(name)-1, 0, &ino))
906                 return;
907
908         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
909         if (err)
910                 return;
911         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
912         ctx->lnf_repair_block = blk;
913 }
914
915 static errcode_t get_inline_data_ea_size(ext2_filsys fs, ext2_ino_t ino,
916                                          size_t *sz)
917 {
918         void *p;
919         struct ext2_xattr_handle *handle;
920         errcode_t retval;
921
922         retval = ext2fs_xattrs_open(fs, ino, &handle);
923         if (retval)
924                 return retval;
925
926         retval = ext2fs_xattrs_read(handle);
927         if (retval)
928                 goto err;
929
930         retval = ext2fs_xattr_get(handle, "system.data", &p, sz);
931         if (retval)
932                 goto err;
933         ext2fs_free_mem(&p);
934 err:
935         (void) ext2fs_xattrs_close(&handle);
936         return retval;
937 }
938
939 static void finish_processing_inode(e2fsck_t ctx, ext2_ino_t ino,
940                                     struct problem_context *pctx,
941                                     int failed_csum)
942 {
943         if (!failed_csum)
944                 return;
945
946         /*
947          * If the inode failed the checksum and the user didn't
948          * clear the inode, test the checksum again -- if it still
949          * fails, ask the user if the checksum should be corrected.
950          */
951         pctx->errcode = recheck_bad_inode_checksum(ctx->fs, ino, ctx, pctx);
952         if (pctx->errcode)
953                 ctx->flags |= E2F_FLAG_ABORT;
954 }
/*
 * Call finish_processing_inode() and then return from the enclosing
 * function if E2F_FLAG_ABORT is set on the context.
 */
#define FINISH_INODE_LOOP(ctx, ino, pctx, failed_csum)                  \
        do {                                                            \
                finish_processing_inode((ctx), (ino), (pctx),           \
                                        (failed_csum));                 \
                if (((ctx)->flags & E2F_FLAG_ABORT) != 0)               \
                        return;                                         \
        } while (0)
961
962 static int could_be_block_map(ext2_filsys fs, struct ext2_inode *inode)
963 {
964         __u32 x;
965         int i;
966
967         for (i = 0; i < EXT2_N_BLOCKS; i++) {
968                 x = inode->i_block[i];
969 #ifdef WORDS_BIGENDIAN
970                 x = ext2fs_swab32(x);
971 #endif
972                 if (x >= ext2fs_blocks_count(fs->super))
973                         return 0;
974         }
975
976         return 1;
977 }
978
979 /*
980  * Figure out what to do with an inode that has both extents and inline data
981  * inode flags set.  Returns -1 if we decide to erase the inode, 0 otherwise.
982  */
983 static int fix_inline_data_extents_file(e2fsck_t ctx,
984                                         ext2_ino_t ino,
985                                         struct ext2_inode *inode,
986                                         int inode_size,
987                                         struct problem_context *pctx)
988 {
989         size_t max_inline_ea_size;
990         ext2_filsys fs = ctx->fs;
991         int dirty = 0;
992
993         /* Both feature flags not set?  Just run the regular checks */
994         if (!ext2fs_has_feature_extents(fs->super) &&
995             !ext2fs_has_feature_inline_data(fs->super))
996                 return 0;
997
998         /* Clear both flags if it's a special file */
999         if (LINUX_S_ISCHR(inode->i_mode) ||
1000             LINUX_S_ISBLK(inode->i_mode) ||
1001             LINUX_S_ISFIFO(inode->i_mode) ||
1002             LINUX_S_ISSOCK(inode->i_mode)) {
1003                 check_extents_inlinedata(ctx, pctx);
1004                 return 0;
1005         }
1006
1007         /* If it looks like an extent tree, try to clear inlinedata */
1008         if (ext2fs_extent_header_verify(inode->i_block,
1009                                  sizeof(inode->i_block)) == 0 &&
1010             fix_problem(ctx, PR_1_CLEAR_INLINE_DATA_FOR_EXTENT, pctx)) {
1011                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1012                 dirty = 1;
1013                 goto out;
1014         }
1015
1016         /* If it looks short enough to be inline data, try to clear extents */
1017         if (inode_size > EXT2_GOOD_OLD_INODE_SIZE)
1018                 max_inline_ea_size = inode_size -
1019                                      (EXT2_GOOD_OLD_INODE_SIZE +
1020                                       ((struct ext2_inode_large *)inode)->i_extra_isize);
1021         else
1022                 max_inline_ea_size = 0;
1023         if (EXT2_I_SIZE(inode) <
1024             EXT4_MIN_INLINE_DATA_SIZE + max_inline_ea_size &&
1025             fix_problem(ctx, PR_1_CLEAR_EXTENT_FOR_INLINE_DATA, pctx)) {
1026                 inode->i_flags &= ~EXT4_EXTENTS_FL;
1027                 dirty = 1;
1028                 goto out;
1029         }
1030
1031         /*
1032          * Too big for inline data, but no evidence of extent tree -
1033          * maybe it's a block map file?  If the mappings all look valid?
1034          */
1035         if (could_be_block_map(fs, inode) &&
1036             fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_FLAGS, pctx)) {
1037 #ifdef WORDS_BIGENDIAN
1038                 int i;
1039
1040                 for (i = 0; i < EXT2_N_BLOCKS; i++)
1041                         inode->i_block[i] = ext2fs_swab32(inode->i_block[i]);
1042 #endif
1043
1044                 inode->i_flags &= ~(EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL);
1045                 dirty = 1;
1046                 goto out;
1047         }
1048
1049         /* Oh well, just clear the busted inode. */
1050         if (fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_INODE, pctx)) {
1051                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1052                 return -1;
1053         }
1054
1055 out:
1056         if (dirty)
1057                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1058
1059         return 0;
1060 }
1061
1062 static void pass1_readahead(e2fsck_t ctx, dgrp_t *group, ext2_ino_t *next_ino)
1063 {
1064         ext2_ino_t inodes_in_group = 0, inodes_per_block, inodes_per_buffer;
1065         dgrp_t start = *group, grp;
1066         blk64_t blocks_to_read = 0;
1067         errcode_t err = EXT2_ET_INVALID_ARGUMENT;
1068
1069         if (ctx->readahead_kb == 0)
1070                 goto out;
1071
1072         /* Keep iterating groups until we have enough to readahead */
1073         inodes_per_block = EXT2_INODES_PER_BLOCK(ctx->fs->super);
1074         for (grp = start; grp < ctx->fs->group_desc_count; grp++) {
1075                 if (ext2fs_bg_flags_test(ctx->fs, grp, EXT2_BG_INODE_UNINIT))
1076                         continue;
1077                 inodes_in_group = ctx->fs->super->s_inodes_per_group -
1078                                         ext2fs_bg_itable_unused(ctx->fs, grp);
1079                 blocks_to_read += (inodes_in_group + inodes_per_block - 1) /
1080                                         inodes_per_block;
1081                 if (blocks_to_read * ctx->fs->blocksize >
1082                     ctx->readahead_kb * 1024)
1083                         break;
1084         }
1085
1086         err = e2fsck_readahead(ctx->fs, E2FSCK_READA_ITABLE, start,
1087                                grp - start + 1);
1088         if (err == EAGAIN) {
1089                 ctx->readahead_kb /= 2;
1090                 err = 0;
1091         }
1092
1093 out:
1094         if (err) {
1095                 /* Error; disable itable readahead */
1096                 *group = ctx->fs->group_desc_count;
1097                 *next_ino = ctx->fs->super->s_inodes_count;
1098         } else {
1099                 /*
1100                  * Don't do more readahead until we've reached the first inode
1101                  * of the last inode scan buffer block for the last group.
1102                  */
1103                 *group = grp + 1;
1104                 inodes_per_buffer = (ctx->inode_buffer_blocks ?
1105                                      ctx->inode_buffer_blocks :
1106                                      EXT2_INODE_SCAN_DEFAULT_BUFFER_BLOCKS) *
1107                                     ctx->fs->blocksize /
1108                                     EXT2_INODE_SIZE(ctx->fs->super);
1109                 inodes_in_group--;
1110                 *next_ino = inodes_in_group -
1111                             (inodes_in_group % inodes_per_buffer) + 1 +
1112                             (grp * ctx->fs->super->s_inodes_per_group);
1113         }
1114 }
1115
1116 /*
1117  * Check if the passed ino is one of the used superblock quota inodes.
1118  *
1119  * Before the quota inodes were journaled, older superblock quota inodes
1120  * were just regular files in the filesystem and not reserved inodes.  This
1121  * checks if the passed ino is one of the s_*_quota_inum superblock fields,
1122  * which may not always be the same as the EXT4_*_QUOTA_INO fields.
1123  */
1124 static int quota_inum_is_super(struct ext2_super_block *sb, ext2_ino_t ino)
1125 {
1126         enum quota_type qtype;
1127
1128         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1129                 if (*quota_sb_inump(sb, qtype) == ino)
1130                         return 1;
1131
1132         return 0;
1133 }
1134
1135 /*
1136  * Check if the passed ino is one of the reserved quota inodes.
1137  * This checks if the inode number is one of the reserved EXT4_*_QUOTA_INO
1138  * inodes.  These inodes may or may not be in use by the quota feature.
1139  */
1140 static int quota_inum_is_reserved(ext2_filsys fs, ext2_ino_t ino)
1141 {
1142         enum quota_type qtype;
1143
1144         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1145                 if (quota_type2inum(qtype, fs->super) == ino)
1146                         return 1;
1147
1148         return 0;
1149 }
1150
1151 static int e2fsck_should_abort(e2fsck_t ctx)
1152 {
1153         e2fsck_t global_ctx;
1154
1155         if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1156                 return 1;
1157
1158         if (ctx->global_ctx) {
1159                 global_ctx = ctx->global_ctx;
1160                 if (global_ctx->flags & E2F_FLAG_SIGNAL_MASK)
1161                         return 1;
1162         }
1163         return 0;
1164 }
1165
1166 void e2fsck_pass1_thread(e2fsck_t ctx)
1167 {
1168         int     i;
1169         __u64   max_sizes;
1170         ext2_filsys fs = ctx->fs;
1171         ext2_ino_t      ino = 0;
1172         struct ext2_inode *inode = NULL;
1173         ext2_inode_scan scan = NULL;
1174         char            *block_buf = NULL;
1175 #ifdef RESOURCE_TRACK
1176         struct resource_track   rtrack;
1177 #endif
1178         unsigned char   frag, fsize;
1179         struct          problem_context pctx;
1180         struct          scan_callback_struct scan_struct;
1181         struct ext2_super_block *sb = ctx->fs->super;
1182         const char      *old_op;
1183         const char      *eop_next_inode = _("getting next inode from scan");
1184         int             imagic_fs, extent_fs, inlinedata_fs, casefold_fs;
1185         int             low_dtime_check = 1;
1186         unsigned int    inode_size = EXT2_INODE_SIZE(fs->super);
1187         unsigned int    bufsize;
1188         int             failed_csum = 0;
1189         ext2_ino_t      ino_threshold = 0;
1190         dgrp_t          ra_group = 0;
1191         struct ea_quota ea_ibody_quota;
1192
1193         init_resource_track(&rtrack, ctx->fs->io);
1194         clear_problem_context(&pctx);
1195
1196         /* If we can do readahead, figure out how many groups to pull in. */
1197         if (!e2fsck_can_readahead(ctx->fs))
1198                 ctx->readahead_kb = 0;
1199         else if (ctx->readahead_kb == ~0ULL)
1200                 ctx->readahead_kb = e2fsck_guess_readahead(ctx->fs);
1201         pass1_readahead(ctx, &ra_group, &ino_threshold);
1202
1203         if (!(ctx->options & E2F_OPT_PREEN))
1204                 fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1205
1206         if (ext2fs_has_feature_dir_index(fs->super) &&
1207             !(ctx->options & E2F_OPT_NO)) {
1208                 if (ext2fs_u32_list_create(&ctx->dirs_to_hash, 50))
1209                         ctx->dirs_to_hash = 0;
1210         }
1211
1212 #ifdef MTRACE
1213         mtrace_print("Pass 1");
1214 #endif
1215
1216 #define EXT2_BPP(bits) (1ULL << ((bits) - 2))
1217
1218         for (i = EXT2_MIN_BLOCK_LOG_SIZE; i <= EXT2_MAX_BLOCK_LOG_SIZE; i++) {
1219                 max_sizes = EXT2_NDIR_BLOCKS + EXT2_BPP(i);
1220                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i);
1221                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i) * EXT2_BPP(i);
1222                 max_sizes = (max_sizes * (1UL << i));
1223                 ext2_max_sizes[i - EXT2_MIN_BLOCK_LOG_SIZE] = max_sizes;
1224         }
1225 #undef EXT2_BPP
1226
1227         imagic_fs = ext2fs_has_feature_imagic_inodes(sb);
1228         extent_fs = ext2fs_has_feature_extents(sb);
1229         inlinedata_fs = ext2fs_has_feature_inline_data(sb);
1230         casefold_fs = ext2fs_has_feature_casefold(sb);
1231
1232         /*
1233          * Allocate bitmaps structures
1234          */
1235         pctx.errcode = e2fsck_allocate_inode_bitmap(fs, _("in-use inode map"),
1236                                                     EXT2FS_BMAP64_RBTREE,
1237                                                     "inode_used_map",
1238                                                     &ctx->inode_used_map);
1239         if (pctx.errcode) {
1240                 pctx.num = 1;
1241                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1242                 ctx->flags |= E2F_FLAG_ABORT;
1243                 return;
1244         }
1245         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1246                         _("directory inode map"),
1247                         EXT2FS_BMAP64_AUTODIR,
1248                         "inode_dir_map", &ctx->inode_dir_map);
1249         if (pctx.errcode) {
1250                 pctx.num = 2;
1251                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1252                 ctx->flags |= E2F_FLAG_ABORT;
1253                 return;
1254         }
1255         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1256                         _("regular file inode map"), EXT2FS_BMAP64_RBTREE,
1257                         "inode_reg_map", &ctx->inode_reg_map);
1258         if (pctx.errcode) {
1259                 pctx.num = 6;
1260                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1261                 ctx->flags |= E2F_FLAG_ABORT;
1262                 return;
1263         }
1264         pctx.errcode = e2fsck_allocate_subcluster_bitmap(fs,
1265                         _("in-use block map"), EXT2FS_BMAP64_RBTREE,
1266                         "block_found_map", &ctx->block_found_map);
1267         if (pctx.errcode) {
1268                 pctx.num = 1;
1269                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1270                 ctx->flags |= E2F_FLAG_ABORT;
1271                 return;
1272         }
1273         pctx.errcode = e2fsck_allocate_block_bitmap(fs,
1274                         _("metadata block map"), EXT2FS_BMAP64_RBTREE,
1275                         "block_metadata_map", &ctx->block_metadata_map);
1276         if (pctx.errcode) {
1277                 pctx.num = 1;
1278                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1279                 ctx->flags |= E2F_FLAG_ABORT;
1280                 return;
1281         }
1282         if (casefold_fs) {
1283                 pctx.errcode =
1284                         e2fsck_allocate_inode_bitmap(fs,
1285                                                      _("inode casefold map"),
1286                                                      EXT2FS_BMAP64_RBTREE,
1287                                                      "inode_casefold_map",
1288                                                      &ctx->inode_casefold_map);
1289                 if (pctx.errcode) {
1290                         pctx.num = 1;
1291                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1292                         ctx->flags |= E2F_FLAG_ABORT;
1293                         return;
1294                 }
1295         }
1296         pctx.errcode = e2fsck_setup_icount(ctx, "inode_link_info", 0, NULL,
1297                                            &ctx->inode_link_info);
1298         if (pctx.errcode) {
1299                 fix_problem(ctx, PR_1_ALLOCATE_ICOUNT, &pctx);
1300                 ctx->flags |= E2F_FLAG_ABORT;
1301                 return;
1302         }
1303         bufsize = inode_size;
1304         if (bufsize < sizeof(struct ext2_inode_large))
1305                 bufsize = sizeof(struct ext2_inode_large);
1306         inode = (struct ext2_inode *)
1307                 e2fsck_allocate_memory(ctx, bufsize, "scratch inode");
1308
1309         inodes_to_process = (struct process_inode_block *)
1310                 e2fsck_allocate_memory(ctx,
1311                                        (ctx->process_inode_size *
1312                                         sizeof(struct process_inode_block)),
1313                                        "array of inodes to process");
1314         process_inode_count = 0;
1315
1316         pctx.errcode = ext2fs_init_dblist(fs, 0);
1317         if (pctx.errcode) {
1318                 fix_problem(ctx, PR_1_ALLOCATE_DBCOUNT, &pctx);
1319                 ctx->flags |= E2F_FLAG_ABORT;
1320                 goto endit;
1321         }
1322
1323         /*
1324          * If the last orphan field is set, clear it, since the pass1
1325          * processing will automatically find and clear the orphans.
1326          * In the future, we may want to try using the last_orphan
1327          * linked list ourselves, but for now, we clear it so that the
1328          * ext3 mount code won't get confused.
1329          */
1330         if (!(ctx->options & E2F_OPT_READONLY)) {
1331                 if (fs->super->s_last_orphan) {
1332                         fs->super->s_last_orphan = 0;
1333                         ext2fs_mark_super_dirty(fs);
1334                 }
1335         }
1336
1337         mark_table_blocks(ctx);
1338         pctx.errcode = ext2fs_convert_subcluster_bitmap(fs,
1339                                                 &ctx->block_found_map);
1340         if (pctx.errcode) {
1341                 fix_problem(ctx, PR_1_CONVERT_SUBCLUSTER, &pctx);
1342                 ctx->flags |= E2F_FLAG_ABORT;
1343                 goto endit;
1344         }
1345         block_buf = (char *) e2fsck_allocate_memory(ctx, fs->blocksize * 3,
1346                                                     "block interate buffer");
1347         if (EXT2_INODE_SIZE(fs->super) == EXT2_GOOD_OLD_INODE_SIZE)
1348                 e2fsck_use_inode_shortcuts(ctx, 1);
1349         e2fsck_intercept_block_allocations(ctx);
1350         old_op = ehandler_operation(_("opening inode scan"));
1351         pctx.errcode = ext2fs_open_inode_scan(fs, ctx->inode_buffer_blocks,
1352                                               &scan);
1353         ehandler_operation(old_op);
1354         if (pctx.errcode) {
1355                 fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1356                 ctx->flags |= E2F_FLAG_ABORT;
1357                 goto endit;
1358         }
1359         ext2fs_inode_scan_flags(scan, EXT2_SF_SKIP_MISSING_ITABLE |
1360                                       EXT2_SF_WARN_GARBAGE_INODES, 0);
1361         ctx->stashed_inode = inode;
1362         scan_struct.ctx = ctx;
1363         scan_struct.block_buf = block_buf;
1364         ext2fs_set_inode_callback(scan, scan_callback, &scan_struct);
1365         if (ctx->progress && ((ctx->progress)(ctx, 1, 0,
1366                                               ctx->fs->group_desc_count)))
1367                 goto endit;
1368         if ((fs->super->s_wtime &&
1369              fs->super->s_wtime < fs->super->s_inodes_count) ||
1370             (fs->super->s_mtime &&
1371              fs->super->s_mtime < fs->super->s_inodes_count) ||
1372             (fs->super->s_mkfs_time &&
1373              fs->super->s_mkfs_time < fs->super->s_inodes_count))
1374                 low_dtime_check = 0;
1375
1376         if (ext2fs_has_feature_mmp(fs->super) &&
1377             fs->super->s_mmp_block > fs->super->s_first_data_block &&
1378             fs->super->s_mmp_block < ext2fs_blocks_count(fs->super))
1379                 ext2fs_mark_block_bitmap2(ctx->block_found_map,
1380                                           fs->super->s_mmp_block);
1381
1382         /* Set up ctx->lost_and_found if possible */
1383         (void) e2fsck_get_lost_and_found(ctx, 0);
1384
1385         while (1) {
1386                 if (ino % (fs->super->s_inodes_per_group * 4) == 1) {
1387                         if (e2fsck_mmp_update(fs))
1388                                 fatal_error(ctx, 0);
1389                 }
1390                 old_op = ehandler_operation(eop_next_inode);
1391                 pctx.errcode = ext2fs_get_next_inode_full(scan, &ino,
1392                                                           inode, inode_size);
1393                 if (ino > ino_threshold)
1394                         pass1_readahead(ctx, &ra_group, &ino_threshold);
1395                 ehandler_operation(old_op);
1396                 if (e2fsck_should_abort(ctx))
1397                         goto endit;
1398                 if (pctx.errcode == EXT2_ET_BAD_BLOCK_IN_INODE_TABLE) {
1399                         /*
1400                          * If badblocks says badblocks is bad, offer to clear
1401                          * the list, update the in-core bb list, and restart
1402                          * the inode scan.
1403                          */
1404                         if (ino == EXT2_BAD_INO &&
1405                             fix_problem(ctx, PR_1_BADBLOCKS_IN_BADBLOCKS,
1406                                         &pctx)) {
1407                                 errcode_t err;
1408
1409                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1410                                 ext2fs_badblocks_list_free(ctx->fs->badblocks);
1411                                 ctx->fs->badblocks = NULL;
1412                                 err = ext2fs_read_bb_inode(ctx->fs,
1413                                                         &ctx->fs->badblocks);
1414                                 if (err) {
1415                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1416                                                     &pctx);
1417                                         ctx->flags |= E2F_FLAG_ABORT;
1418                                 } else
1419                                         ctx->flags |= E2F_FLAG_RESTART;
1420                                 goto endit;
1421                         }
1422                         if (!ctx->inode_bb_map)
1423                                 alloc_bb_map(ctx);
1424                         ext2fs_mark_inode_bitmap2(ctx->inode_bb_map, ino);
1425                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1426                         continue;
1427                 }
1428                 if (pctx.errcode &&
1429                     pctx.errcode != EXT2_ET_INODE_CSUM_INVALID &&
1430                     pctx.errcode != EXT2_ET_INODE_IS_GARBAGE) {
1431                         fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1432                         ctx->flags |= E2F_FLAG_ABORT;
1433                         goto endit;
1434                 }
1435                 if (!ino)
1436                         break;
1437                 pctx.ino = ino;
1438                 pctx.inode = inode;
1439                 ctx->stashed_ino = ino;
1440
1441                 /* Clear trashed inode? */
1442                 if (pctx.errcode == EXT2_ET_INODE_IS_GARBAGE &&
1443                     inode->i_links_count > 0 &&
1444                     fix_problem(ctx, PR_1_INODE_IS_GARBAGE, &pctx)) {
1445                         pctx.errcode = 0;
1446                         e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1447                 }
1448                 failed_csum = pctx.errcode != 0;
1449
1450                 /*
1451                  * Check for inodes who might have been part of the
1452                  * orphaned list linked list.  They should have gotten
1453                  * dealt with by now, unless the list had somehow been
1454                  * corrupted.
1455                  *
1456                  * FIXME: In the future, inodes which are still in use
1457                  * (and which are therefore) pending truncation should
1458                  * be handled specially.  Right now we just clear the
1459                  * dtime field, and the normal e2fsck handling of
1460                  * inodes where i_size and the inode blocks are
1461                  * inconsistent is to fix i_size, instead of releasing
1462                  * the extra blocks.  This won't catch the inodes that
1463                  * was at the end of the orphan list, but it's better
1464                  * than nothing.  The right answer is that there
1465                  * shouldn't be any bugs in the orphan list handling.  :-)
1466                  */
1467                 if (inode->i_dtime && low_dtime_check &&
1468                     inode->i_dtime < ctx->fs->super->s_inodes_count) {
1469                         if (fix_problem(ctx, PR_1_LOW_DTIME, &pctx)) {
1470                                 inode->i_dtime = inode->i_links_count ?
1471                                         0 : ctx->now;
1472                                 e2fsck_write_inode(ctx, ino, inode,
1473                                                    "pass1");
1474                                 failed_csum = 0;
1475                         }
1476                 }
1477
1478                 if (inode->i_links_count) {
1479                         pctx.errcode = ext2fs_icount_store(ctx->inode_link_info,
1480                                            ino, inode->i_links_count);
1481                         if (pctx.errcode) {
1482                                 pctx.num = inode->i_links_count;
1483                                 fix_problem(ctx, PR_1_ICOUNT_STORE, &pctx);
1484                                 ctx->flags |= E2F_FLAG_ABORT;
1485                                 goto endit;
1486                         }
1487                 } else if ((ino >= EXT2_FIRST_INODE(fs->super)) &&
1488                            !quota_inum_is_reserved(fs, ino)) {
1489                         if (!inode->i_dtime && inode->i_mode) {
1490                                 if (fix_problem(ctx,
1491                                             PR_1_ZERO_DTIME, &pctx)) {
1492                                         inode->i_dtime = ctx->now;
1493                                         e2fsck_write_inode(ctx, ino, inode,
1494                                                            "pass1");
1495                                         failed_csum = 0;
1496                                 }
1497                         }
1498                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1499                         continue;
1500                 }
1501
1502                 if ((inode->i_flags & EXT4_CASEFOLD_FL) &&
1503                     ((!LINUX_S_ISDIR(inode->i_mode) &&
1504                       fix_problem(ctx, PR_1_CASEFOLD_NONDIR, &pctx)) ||
1505                      (!casefold_fs &&
1506                       fix_problem(ctx, PR_1_CASEFOLD_FEATURE, &pctx)))) {
1507                         inode->i_flags &= ~EXT4_CASEFOLD_FL;
1508                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1509                 }
1510
1511                 /* Conflicting inlinedata/extents inode flags? */
1512                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) &&
1513                     (inode->i_flags & EXT4_EXTENTS_FL)) {
1514                         int res = fix_inline_data_extents_file(ctx, ino, inode,
1515                                                                inode_size,
1516                                                                &pctx);
1517                         if (res < 0) {
1518                                 /* skip FINISH_INODE_LOOP */
1519                                 continue;
1520                         }
1521                 }
1522
1523                 /* Test for incorrect inline_data flags settings. */
1524                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && !inlinedata_fs &&
1525                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1526                         size_t size = 0;
1527
1528                         pctx.errcode = get_inline_data_ea_size(fs, ino, &size);
1529                         if (!pctx.errcode &&
1530                             fix_problem(ctx, PR_1_INLINE_DATA_FEATURE, &pctx)) {
1531                                 ext2fs_set_feature_inline_data(sb);
1532                                 ext2fs_mark_super_dirty(fs);
1533                                 inlinedata_fs = 1;
1534                         } else if (fix_problem(ctx, PR_1_INLINE_DATA_SET, &pctx)) {
1535                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1536                                 /* skip FINISH_INODE_LOOP */
1537                                 continue;
1538                         }
1539                 }
1540
1541                 /* Test for inline data flag but no attr */
1542                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && inlinedata_fs &&
1543                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1544                         size_t size = 0;
1545                         errcode_t err;
1546                         int flags;
1547
1548                         flags = fs->flags;
1549                         if (failed_csum)
1550                                 fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
1551                         err = get_inline_data_ea_size(fs, ino, &size);
1552                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
1553                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
1554
1555                         switch (err) {
1556                         case 0:
1557                                 /* Everything is awesome... */
1558                                 break;
1559                         case EXT2_ET_BAD_EA_BLOCK_NUM:
1560                         case EXT2_ET_BAD_EA_HASH:
1561                         case EXT2_ET_BAD_EA_HEADER:
1562                         case EXT2_ET_EA_BAD_NAME_LEN:
1563                         case EXT2_ET_EA_BAD_VALUE_SIZE:
1564                         case EXT2_ET_EA_KEY_NOT_FOUND:
1565                         case EXT2_ET_EA_NO_SPACE:
1566                         case EXT2_ET_MISSING_EA_FEATURE:
1567                         case EXT2_ET_INLINE_DATA_CANT_ITERATE:
1568                         case EXT2_ET_INLINE_DATA_NO_BLOCK:
1569                         case EXT2_ET_INLINE_DATA_NO_SPACE:
1570                         case EXT2_ET_NO_INLINE_DATA:
1571                         case EXT2_ET_EXT_ATTR_CSUM_INVALID:
1572                         case EXT2_ET_EA_BAD_VALUE_OFFSET:
1573                         case EXT2_ET_EA_INODE_CORRUPTED:
1574                                 /* broken EA or no system.data EA; truncate */
1575                                 if (fix_problem(ctx, PR_1_INLINE_DATA_NO_ATTR,
1576                                                 &pctx)) {
1577                                         err = ext2fs_inode_size_set(fs, inode, 0);
1578                                         if (err) {
1579                                                 pctx.errcode = err;
1580                                                 ctx->flags |= E2F_FLAG_ABORT;
1581                                                 goto endit;
1582                                         }
1583                                         inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1584                                         memset(&inode->i_block, 0,
1585                                                sizeof(inode->i_block));
1586                                         e2fsck_write_inode(ctx, ino, inode,
1587                                                            "pass1");
1588                                         failed_csum = 0;
1589                                 }
1590                                 break;
1591                         default:
1592                                 /* Some other kind of non-xattr error? */
1593                                 pctx.errcode = err;
1594                                 ctx->flags |= E2F_FLAG_ABORT;
1595                                 goto endit;
1596                         }
1597                 }
1598
1599                 /*
1600                  * Test for incorrect extent flag settings.
1601                  *
1602                  * On big-endian machines we must be careful:
1603                  * When the inode is read, the i_block array is not swapped
1604                  * if the extent flag is set.  Therefore if we are testing
1605                  * for or fixing a wrongly-set flag, we must potentially
1606                  * (un)swap before testing, or after fixing.
1607                  */
1608
1609                 /*
1610                  * In this case the extents flag was set when read, so
1611                  * extent_header_verify is ok.  If the inode is cleared,
1612                  * no need to swap... so no extra swapping here.
1613                  */
1614                 if ((inode->i_flags & EXT4_EXTENTS_FL) && !extent_fs &&
1615                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1616                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO))) {
1617                         if ((ext2fs_extent_header_verify(inode->i_block,
1618                                                  sizeof(inode->i_block)) == 0) &&
1619                             fix_problem(ctx, PR_1_EXTENT_FEATURE, &pctx)) {
1620                                 ext2fs_set_feature_extents(sb);
1621                                 ext2fs_mark_super_dirty(fs);
1622                                 extent_fs = 1;
1623                         } else if (fix_problem(ctx, PR_1_EXTENTS_SET, &pctx)) {
1624                         clear_inode:
1625                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1626                                 if (ino == EXT2_BAD_INO)
1627                                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map,
1628                                                                  ino);
1629                                 /* skip FINISH_INODE_LOOP */
1630                                 continue;
1631                         }
1632                 }
1633
1634                 /*
1635                  * For big-endian machines:
1636                  * If the inode didn't have the extents flag set when it
1637                  * was read, then the i_blocks array was swapped.  To test
1638                  * as an extents header, we must swap it back first.
1639                  * IF we then set the extents flag, the entire i_block
1640                  * array must be un/re-swapped to make it proper extents data.
1641                  */
1642                 if (extent_fs && !(inode->i_flags & EXT4_EXTENTS_FL) &&
1643                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1644                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO)) &&
1645                     (LINUX_S_ISREG(inode->i_mode) ||
1646                      LINUX_S_ISDIR(inode->i_mode))) {
1647                         void *ehp;
1648 #ifdef WORDS_BIGENDIAN
1649                         __u32 tmp_block[EXT2_N_BLOCKS];
1650
1651                         for (i = 0; i < EXT2_N_BLOCKS; i++)
1652                                 tmp_block[i] = ext2fs_swab32(inode->i_block[i]);
1653                         ehp = tmp_block;
1654 #else
1655                         ehp = inode->i_block;
1656 #endif
1657                         if ((ext2fs_extent_header_verify(ehp,
1658                                          sizeof(inode->i_block)) == 0) &&
1659                             (fix_problem(ctx, PR_1_UNSET_EXTENT_FL, &pctx))) {
1660                                 inode->i_flags |= EXT4_EXTENTS_FL;
1661 #ifdef WORDS_BIGENDIAN
1662                                 memcpy(inode->i_block, tmp_block,
1663                                        sizeof(inode->i_block));
1664 #endif
1665                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1666                                 failed_csum = 0;
1667                         }
1668                 }
1669
1670                 if (ino == EXT2_BAD_INO) {
1671                         struct process_block_struct pb;
1672
1673                         if ((failed_csum || inode->i_mode || inode->i_uid ||
1674                              inode->i_gid || inode->i_links_count ||
1675                              (inode->i_flags & EXT4_INLINE_DATA_FL) ||
1676                              inode->i_file_acl) &&
1677                             fix_problem(ctx, PR_1_INVALID_BAD_INODE, &pctx)) {
1678                                 memset(inode, 0, sizeof(struct ext2_inode));
1679                                 e2fsck_write_inode(ctx, ino, inode,
1680                                                    "clear bad inode");
1681                                 failed_csum = 0;
1682                         }
1683
1684                         pctx.errcode = ext2fs_copy_bitmap(ctx->block_found_map,
1685                                                           &pb.fs_meta_blocks);
1686                         if (pctx.errcode) {
1687                                 pctx.num = 4;
1688                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1689                                 ctx->flags |= E2F_FLAG_ABORT;
1690                                 goto endit;
1691                         }
1692                         pb.ino = EXT2_BAD_INO;
1693                         pb.num_blocks = pb.last_block = 0;
1694                         pb.last_db_block = -1;
1695                         pb.num_illegal_blocks = 0;
1696                         pb.suppress = 0; pb.clear = 0; pb.is_dir = 0;
1697                         pb.is_reg = 0; pb.fragmented = 0; pb.bbcheck = 0;
1698                         pb.inode = inode;
1699                         pb.pctx = &pctx;
1700                         pb.ctx = ctx;
1701                         pctx.errcode = ext2fs_block_iterate3(fs, ino, 0,
1702                                      block_buf, process_bad_block, &pb);
1703                         ext2fs_free_block_bitmap(pb.fs_meta_blocks);
1704                         if (pctx.errcode) {
1705                                 fix_problem(ctx, PR_1_BLOCK_ITERATE, &pctx);
1706                                 ctx->flags |= E2F_FLAG_ABORT;
1707                                 goto endit;
1708                         }
1709                         if (pb.bbcheck)
1710                                 if (!fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK_PROMPT, &pctx)) {
1711                                 ctx->flags |= E2F_FLAG_ABORT;
1712                                 goto endit;
1713                         }
1714                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1715                         clear_problem_context(&pctx);
1716                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1717                         continue;
1718                 } else if (ino == EXT2_ROOT_INO) {
1719                         /*
1720                          * Make sure the root inode is a directory; if
1721                          * not, offer to clear it.  It will be
1722                          * regenerated in pass #3.
1723                          */
1724                         if (!LINUX_S_ISDIR(inode->i_mode)) {
1725                                 if (fix_problem(ctx, PR_1_ROOT_NO_DIR, &pctx))
1726                                         goto clear_inode;
1727                         }
1728                         /*
1729                          * If dtime is set, offer to clear it.  mke2fs
1730                          * version 0.2b created filesystems with the
1731                          * dtime field set for the root and lost+found
1732                          * directories.  We won't worry about
1733                          * /lost+found, since that can be regenerated
1734                          * easily.  But we will fix the root directory
1735                          * as a special case.
1736                          */
1737                         if (inode->i_dtime && inode->i_links_count) {
1738                                 if (fix_problem(ctx, PR_1_ROOT_DTIME, &pctx)) {
1739                                         inode->i_dtime = 0;
1740                                         e2fsck_write_inode(ctx, ino, inode,
1741                                                            "pass1");
1742                                         failed_csum = 0;
1743                                 }
1744                         }
1745                 } else if (ino == EXT2_JOURNAL_INO) {
1746                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1747                         if (fs->super->s_journal_inum == EXT2_JOURNAL_INO) {
1748                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1749                                     fix_problem(ctx, PR_1_JOURNAL_BAD_MODE,
1750                                                 &pctx)) {
1751                                         inode->i_mode = LINUX_S_IFREG;
1752                                         e2fsck_write_inode(ctx, ino, inode,
1753                                                            "pass1");
1754                                         failed_csum = 0;
1755                                 }
1756                                 check_blocks(ctx, &pctx, block_buf, NULL);
1757                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1758                                 continue;
1759                         }
1760                         if ((inode->i_links_count ||
1761                              inode->i_blocks || inode->i_block[0]) &&
1762                             fix_problem(ctx, PR_1_JOURNAL_INODE_NOT_CLEAR,
1763                                         &pctx)) {
1764                                 memset(inode, 0, inode_size);
1765                                 ext2fs_icount_store(ctx->inode_link_info,
1766                                                     ino, 0);
1767                                 e2fsck_write_inode_full(ctx, ino, inode,
1768                                                         inode_size, "pass1");
1769                                 failed_csum = 0;
1770                         }
1771                 } else if (quota_inum_is_reserved(fs, ino)) {
1772                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1773                         if (ext2fs_has_feature_quota(fs->super) &&
1774                             quota_inum_is_super(fs->super, ino)) {
1775                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1776                                     fix_problem(ctx, PR_1_QUOTA_BAD_MODE,
1777                                                         &pctx)) {
1778                                         inode->i_mode = LINUX_S_IFREG;
1779                                         e2fsck_write_inode(ctx, ino, inode,
1780                                                         "pass1");
1781                                         failed_csum = 0;
1782                                 }
1783                                 check_blocks(ctx, &pctx, block_buf, NULL);
1784                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1785                                 continue;
1786                         }
1787                         if ((inode->i_links_count ||
1788                              inode->i_blocks || inode->i_block[0]) &&
1789                             fix_problem(ctx, PR_1_QUOTA_INODE_NOT_CLEAR,
1790                                         &pctx)) {
1791                                 memset(inode, 0, inode_size);
1792                                 ext2fs_icount_store(ctx->inode_link_info,
1793                                                     ino, 0);
1794                                 e2fsck_write_inode_full(ctx, ino, inode,
1795                                                         inode_size, "pass1");
1796                                 failed_csum = 0;
1797                         }
1798                 } else if (ino < EXT2_FIRST_INODE(fs->super)) {
1799                         problem_t problem = 0;
1800
1801                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1802                         if (ino == EXT2_BOOT_LOADER_INO) {
1803                                 if (LINUX_S_ISDIR(inode->i_mode))
1804                                         problem = PR_1_RESERVED_BAD_MODE;
1805                         } else if (ino == EXT2_RESIZE_INO) {
1806                                 if (inode->i_mode &&
1807                                     !LINUX_S_ISREG(inode->i_mode))
1808                                         problem = PR_1_RESERVED_BAD_MODE;
1809                         } else {
1810                                 if (inode->i_mode != 0)
1811                                         problem = PR_1_RESERVED_BAD_MODE;
1812                         }
1813                         if (problem) {
1814                                 if (fix_problem(ctx, problem, &pctx)) {
1815                                         inode->i_mode = 0;
1816                                         e2fsck_write_inode(ctx, ino, inode,
1817                                                            "pass1");
1818                                         failed_csum = 0;
1819                                 }
1820                         }
1821                         check_blocks(ctx, &pctx, block_buf, NULL);
1822                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1823                         continue;
1824                 }
1825
1826                 if (!inode->i_links_count) {
1827                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1828                         continue;
1829                 }
1830                 /*
1831                  * n.b.  0.3c ext2fs code didn't clear i_links_count for
1832                  * deleted files.  Oops.
1833                  *
1834                  * Since all new ext2 implementations get this right,
1835                  * we now assume that the case of non-zero
1836                  * i_links_count and non-zero dtime means that we
1837                  * should keep the file, not delete it.
1838                  *
1839                  */
1840                 if (inode->i_dtime) {
1841                         if (fix_problem(ctx, PR_1_SET_DTIME, &pctx)) {
1842                                 inode->i_dtime = 0;
1843                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1844                                 failed_csum = 0;
1845                         }
1846                 }
1847
1848                 ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1849                 switch (fs->super->s_creator_os) {
1850                     case EXT2_OS_HURD:
1851                         frag = inode->osd2.hurd2.h_i_frag;
1852                         fsize = inode->osd2.hurd2.h_i_fsize;
1853                         break;
1854                     default:
1855                         frag = fsize = 0;
1856                 }
1857
1858                 if (inode->i_faddr || frag || fsize ||
1859                     (!ext2fs_has_feature_largedir(fs->super) &&
1860                     (LINUX_S_ISDIR(inode->i_mode) && inode->i_size_high)))
1861                         mark_inode_bad(ctx, ino);
1862                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1863                     !ext2fs_has_feature_64bit(fs->super) &&
1864                     inode->osd2.linux2.l_i_file_acl_high != 0)
1865                         mark_inode_bad(ctx, ino);
1866                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1867                     !ext2fs_has_feature_huge_file(fs->super) &&
1868                     (inode->osd2.linux2.l_i_blocks_hi != 0))
1869                         mark_inode_bad(ctx, ino);
1870                 if (inode->i_flags & EXT2_IMAGIC_FL) {
1871                         if (imagic_fs) {
1872                                 if (!ctx->inode_imagic_map)
1873                                         alloc_imagic_map(ctx);
1874                                 ext2fs_mark_inode_bitmap2(ctx->inode_imagic_map,
1875                                                          ino);
1876                         } else {
1877                                 if (fix_problem(ctx, PR_1_SET_IMAGIC, &pctx)) {
1878                                         inode->i_flags &= ~EXT2_IMAGIC_FL;
1879                                         e2fsck_write_inode(ctx, ino,
1880                                                            inode, "pass1");
1881                                         failed_csum = 0;
1882                                 }
1883                         }
1884                 }
1885
1886                 check_inode_extra_space(ctx, &pctx, &ea_ibody_quota);
1887                 check_is_really_dir(ctx, &pctx, block_buf);
1888
1889                 /*
1890                  * ext2fs_inode_has_valid_blocks2 does not actually look
1891                  * at i_block[] values, so not endian-sensitive here.
1892                  */
1893                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL) &&
1894                     LINUX_S_ISLNK(inode->i_mode) &&
1895                     !ext2fs_inode_has_valid_blocks2(fs, inode) &&
1896                     fix_problem(ctx, PR_1_FAST_SYMLINK_EXTENT_FL, &pctx)) {
1897                         inode->i_flags &= ~EXT4_EXTENTS_FL;
1898                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1899                         failed_csum = 0;
1900                 }
1901
1902                 if ((inode->i_flags & EXT4_ENCRYPT_FL) &&
1903                     add_encrypted_file(ctx, &pctx) < 0)
1904                         goto clear_inode;
1905
1906                 if (casefold_fs && inode->i_flags & EXT4_CASEFOLD_FL)
1907                         ext2fs_mark_inode_bitmap2(ctx->inode_casefold_map, ino);
1908
1909                 if (LINUX_S_ISDIR(inode->i_mode)) {
1910                         ext2fs_mark_inode_bitmap2(ctx->inode_dir_map, ino);
1911                         e2fsck_add_dir_info(ctx, ino, 0);
1912                         ctx->fs_directory_count++;
1913                         if (inode->i_flags & EXT4_CASEFOLD_FL)
1914                                 add_casefolded_dir(ctx, ino);
1915                 } else if (LINUX_S_ISREG (inode->i_mode)) {
1916                         ext2fs_mark_inode_bitmap2(ctx->inode_reg_map, ino);
1917                         ctx->fs_regular_count++;
1918                 } else if (LINUX_S_ISCHR (inode->i_mode) &&
1919                            e2fsck_pass1_check_device_inode(fs, inode)) {
1920                         check_extents_inlinedata(ctx, &pctx);
1921                         check_immutable(ctx, &pctx);
1922                         check_size(ctx, &pctx);
1923                         ctx->fs_chardev_count++;
1924                 } else if (LINUX_S_ISBLK (inode->i_mode) &&
1925                            e2fsck_pass1_check_device_inode(fs, inode)) {
1926                         check_extents_inlinedata(ctx, &pctx);
1927                         check_immutable(ctx, &pctx);
1928                         check_size(ctx, &pctx);
1929                         ctx->fs_blockdev_count++;
1930                 } else if (LINUX_S_ISLNK (inode->i_mode) &&
1931                            e2fsck_pass1_check_symlink(fs, ino, inode,
1932                                                       block_buf)) {
1933                         check_immutable(ctx, &pctx);
1934                         ctx->fs_symlinks_count++;
1935                         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
1936                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1937                                 continue;
1938                         } else if (ext2fs_is_fast_symlink(inode)) {
1939                                 ctx->fs_fast_symlinks_count++;
1940                                 check_blocks(ctx, &pctx, block_buf,
1941                                              &ea_ibody_quota);
1942                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1943                                 continue;
1944                         }
1945                 }
1946                 else if (LINUX_S_ISFIFO (inode->i_mode) &&
1947                          e2fsck_pass1_check_device_inode(fs, inode)) {
1948                         check_extents_inlinedata(ctx, &pctx);
1949                         check_immutable(ctx, &pctx);
1950                         check_size(ctx, &pctx);
1951                         ctx->fs_fifo_count++;
1952                 } else if ((LINUX_S_ISSOCK (inode->i_mode)) &&
1953                            e2fsck_pass1_check_device_inode(fs, inode)) {
1954                         check_extents_inlinedata(ctx, &pctx);
1955                         check_immutable(ctx, &pctx);
1956                         check_size(ctx, &pctx);
1957                         ctx->fs_sockets_count++;
1958                 } else
1959                         mark_inode_bad(ctx, ino);
1960                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1961                     !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
1962                         if (inode->i_block[EXT2_IND_BLOCK])
1963                                 ctx->fs_ind_count++;
1964                         if (inode->i_block[EXT2_DIND_BLOCK])
1965                                 ctx->fs_dind_count++;
1966                         if (inode->i_block[EXT2_TIND_BLOCK])
1967                                 ctx->fs_tind_count++;
1968                 }
1969                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1970                     !(inode->i_flags & EXT4_INLINE_DATA_FL) &&
1971                     (inode->i_block[EXT2_IND_BLOCK] ||
1972                      inode->i_block[EXT2_DIND_BLOCK] ||
1973                      inode->i_block[EXT2_TIND_BLOCK] ||
1974                      ext2fs_file_acl_block(fs, inode))) {
1975                         struct process_inode_block *itp;
1976
1977                         itp = &inodes_to_process[process_inode_count];
1978                         itp->ino = ino;
1979                         itp->ea_ibody_quota = ea_ibody_quota;
1980                         if (inode_size < sizeof(struct ext2_inode_large))
1981                                 memcpy(&itp->inode, inode, inode_size);
1982                         else
1983                                 memcpy(&itp->inode, inode, sizeof(itp->inode));
1984                         process_inode_count++;
1985                 } else
1986                         check_blocks(ctx, &pctx, block_buf, &ea_ibody_quota);
1987
1988                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1989
1990                 if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1991                         goto endit;
1992
1993                 if (process_inode_count >= ctx->process_inode_size) {
1994                         process_inodes(ctx, block_buf);
1995
1996                         if (e2fsck_should_abort(ctx))
1997                                 goto endit;
1998                 }
1999         }
2000         process_inodes(ctx, block_buf);
2001         ext2fs_close_inode_scan(scan);
2002         scan = NULL;
2003
2004         reserve_block_for_root_repair(ctx);
2005         reserve_block_for_lnf_repair(ctx);
2006
2007         /*
2008          * If any extended attribute blocks' reference counts need to
2009          * be adjusted, either up (ctx->refcount_extra), or down
2010          * (ctx->refcount), then fix them.
2011          */
2012         if (ctx->refcount) {
2013                 adjust_extattr_refcount(ctx, ctx->refcount, block_buf, -1);
2014                 ea_refcount_free(ctx->refcount);
2015                 ctx->refcount = 0;
2016         }
2017         if (ctx->refcount_extra) {
2018                 adjust_extattr_refcount(ctx, ctx->refcount_extra,
2019                                         block_buf, +1);
2020                 ea_refcount_free(ctx->refcount_extra);
2021                 ctx->refcount_extra = 0;
2022         }
2023
2024         if (ctx->ea_block_quota_blocks) {
2025                 ea_refcount_free(ctx->ea_block_quota_blocks);
2026                 ctx->ea_block_quota_blocks = 0;
2027         }
2028
2029         if (ctx->ea_block_quota_inodes) {
2030                 ea_refcount_free(ctx->ea_block_quota_inodes);
2031                 ctx->ea_block_quota_inodes = 0;
2032         }
2033
2034         if (ctx->invalid_bitmaps)
2035                 handle_fs_bad_blocks(ctx);
2036
2037         /* We don't need the block_ea_map any more */
2038         if (ctx->block_ea_map) {
2039                 ext2fs_free_block_bitmap(ctx->block_ea_map);
2040                 ctx->block_ea_map = 0;
2041         }
2042
2043         /* We don't need the encryption policy => ID map any more */
2044         destroy_encryption_policy_map(ctx);
2045
2046         if (ctx->flags & E2F_FLAG_RESIZE_INODE) {
2047                 clear_problem_context(&pctx);
2048                 pctx.errcode = ext2fs_create_resize_inode(fs);
2049                 if (pctx.errcode) {
2050                         if (!fix_problem(ctx, PR_1_RESIZE_INODE_CREATE,
2051                                          &pctx)) {
2052                                 ctx->flags |= E2F_FLAG_ABORT;
2053                                 goto endit;
2054                         }
2055                         pctx.errcode = 0;
2056                 }
2057                 if (!pctx.errcode) {
2058                         e2fsck_read_inode(ctx, EXT2_RESIZE_INO, inode,
2059                                           "recreate inode");
2060                         inode->i_mtime = ctx->now;
2061                         e2fsck_write_inode(ctx, EXT2_RESIZE_INO, inode,
2062                                            "recreate inode");
2063                 }
2064                 ctx->flags &= ~E2F_FLAG_RESIZE_INODE;
2065         }
2066
2067         if (ctx->flags & E2F_FLAG_RESTART) {
2068                 /*
2069                  * Only the master copy of the superblock and block
2070                  * group descriptors are going to be written during a
2071                  * restart, so set the superblock to be used to be the
2072                  * master superblock.
2073                  */
2074                 ctx->use_superblock = 0;
2075                 goto endit;
2076         }
2077
2078         if (ctx->large_dirs && !ext2fs_has_feature_largedir(fs->super)) {
2079                 if (fix_problem(ctx, PR_2_FEATURE_LARGE_DIRS, &pctx)) {
2080                         ext2fs_set_feature_largedir(fs->super);
2081                         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
2082                         ext2fs_mark_super_dirty(fs);
2083                 }
2084                 if (fs->super->s_rev_level == EXT2_GOOD_OLD_REV &&
2085                     fix_problem(ctx, PR_1_FS_REV_LEVEL, &pctx)) {
2086                         ext2fs_update_dynamic_rev(fs);
2087                         ext2fs_mark_super_dirty(fs);
2088                 }
2089         }
2090
2091         if (ctx->block_dup_map) {
2092                 if (ctx->options & E2F_OPT_PREEN) {
2093                         clear_problem_context(&pctx);
2094                         fix_problem(ctx, PR_1_DUP_BLOCKS_PREENSTOP, &pctx);
2095                 }
2096                 e2fsck_pass1_dupblocks(ctx, block_buf);
2097         }
2098         ctx->flags |= E2F_FLAG_ALLOC_OK;
2099 endit:
2100         e2fsck_use_inode_shortcuts(ctx, 0);
2101         ext2fs_free_mem(&inodes_to_process);
2102         inodes_to_process = 0;
2103
2104         if (scan)
2105                 ext2fs_close_inode_scan(scan);
2106         if (block_buf)
2107                 ext2fs_free_mem(&block_buf);
2108         if (inode)
2109                 ext2fs_free_mem(&inode);
2110
2111         /*
2112          * The l+f inode may have been cleared, so zap it now and
2113          * later passes will recalculate it if necessary
2114          */
2115         ctx->lost_and_found = 0;
2116
2117         if ((ctx->flags & E2F_FLAG_SIGNAL_MASK) == 0)
2118                 print_resource_track(ctx, _("Pass 1"), &rtrack, ctx->fs->io);
2119         else
2120                 ctx->invalid_bitmaps++;
2121 }
2122
2123 static void e2fsck_pass1_copy_fs(ext2_filsys dest, ext2_filsys src)
2124 {
2125         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2126         if (dest->dblist)
2127                 dest->dblist->fs = dest;
2128         if (dest->inode_map)
2129                 dest->inode_map->fs = dest;
2130         if (dest->block_map)
2131                 dest->block_map->fs = dest;
2132 }
2133
2134 static errcode_t e2fsck_pass1_thread_prepare(e2fsck_t global_ctx, e2fsck_t *thread_ctx)
2135 {
2136         errcode_t       retval;
2137         e2fsck_t        thread_context;
2138         ext2_filsys     thread_fs;
2139         ext2_filsys     global_fs = global_ctx->fs;
2140
2141         retval = ext2fs_get_mem(sizeof(struct e2fsck_struct), &thread_context);
2142         if (retval) {
2143                 com_err(global_ctx->program_name, retval, "while allocating memory");
2144                 return retval;
2145         }
2146         memcpy(thread_context, global_ctx, sizeof(struct e2fsck_struct));
2147         thread_context->global_ctx = global_ctx;
2148
2149         retval = ext2fs_get_mem(sizeof(struct struct_ext2_filsys), &thread_fs);
2150         if (retval) {
2151                 com_err(global_ctx->program_name, retval, "while allocating memory");
2152                 goto out_context;
2153         }
2154
2155         e2fsck_pass1_copy_fs(thread_fs, global_fs);
2156         thread_fs->priv_data = thread_context;
2157
2158         thread_context->fs = thread_fs;
2159         *thread_ctx = thread_context;
2160         return 0;
2161 out_context:
2162         ext2fs_free_mem(&thread_context);
2163         return retval;
2164 }
2165
2166 static int e2fsck_pass1_thread_join(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2167 {
2168         int             flags = global_ctx->flags;
2169         ext2_filsys     thread_fs = thread_ctx->fs;
2170         ext2_filsys     global_fs = global_ctx->fs;
2171 #ifdef HAVE_SETJMP_H
2172         jmp_buf         old_jmp;
2173
2174         memcpy(old_jmp, global_ctx->abort_loc, sizeof(jmp_buf));
2175 #endif
2176         memcpy(global_ctx, thread_ctx, sizeof(struct e2fsck_struct));
2177 #ifdef HAVE_SETJMP_H
2178         memcpy(global_ctx->abort_loc, old_jmp, sizeof(jmp_buf));
2179 #endif
2180         /* Keep the global singal flags*/
2181         global_ctx->flags |= (flags & E2F_FLAG_SIGNAL_MASK) |
2182                              (global_ctx->flags & E2F_FLAG_SIGNAL_MASK);
2183
2184         e2fsck_pass1_copy_fs(global_fs, thread_fs);
2185         global_fs->priv_data = global_ctx;
2186         global_ctx->fs = global_fs;
2187
2188         ext2fs_free_mem(&thread_ctx->fs);
2189         ext2fs_free_mem(&thread_ctx);
2190         return 0;
2191 }
2192
2193 void e2fsck_pass1_multithread(e2fsck_t ctx)
2194 {
2195         errcode_t       retval;
2196         e2fsck_t        thread_ctx;
2197
2198         retval = e2fsck_pass1_thread_prepare(ctx, &thread_ctx);
2199         if (retval) {
2200                 com_err(ctx->program_name, 0,
2201                         _("while preparing pass1 thread\n"));
2202                 ctx->flags |= E2F_FLAG_ABORT;
2203                 return;
2204         }
2205
2206 #ifdef HAVE_SETJMP_H
2207         /*
2208          * When fatal_error() happens, jump to here. The thread
2209          * context's flags will be saved, but its abort_loc will
2210          * be overwritten by original jump buffer for the later
2211          * tests.
2212          */
2213         if (setjmp(thread_ctx->abort_loc)) {
2214                 thread_ctx->flags &= ~E2F_FLAG_SETJMP_OK;
2215                 e2fsck_pass1_thread_join(ctx, thread_ctx);
2216                 return;
2217         }
2218         thread_ctx->flags |= E2F_FLAG_SETJMP_OK;
2219 #endif
2220
2221         e2fsck_pass1_thread(thread_ctx);
2222         retval = e2fsck_pass1_thread_join(ctx, thread_ctx);
2223         if (retval) {
2224                 com_err(ctx->program_name, 0,
2225                         _("while joining pass1 thread\n"));
2226                 ctx->flags |= E2F_FLAG_ABORT;
2227                 return;
2228         }
2229 }
2230
2231 void e2fsck_pass1(e2fsck_t ctx)
2232 {
2233         e2fsck_pass1_multithread(ctx);
2234 }
2235
2236 #undef FINISH_INODE_LOOP
2237
2238 /*
2239  * When the inode_scan routines call this callback at the end of the
2240  * glock group, call process_inodes.
2241  */
2242 static errcode_t scan_callback(ext2_filsys fs,
2243                                ext2_inode_scan scan EXT2FS_ATTR((unused)),
2244                                dgrp_t group, void * priv_data)
2245 {
2246         struct scan_callback_struct *scan_struct;
2247         e2fsck_t ctx;
2248
2249         scan_struct = (struct scan_callback_struct *) priv_data;
2250         ctx = scan_struct->ctx;
2251
2252         process_inodes((e2fsck_t) fs->priv_data, scan_struct->block_buf);
2253
2254         if (ctx->progress)
2255                 if ((ctx->progress)(ctx, 1, group+1,
2256                                     ctx->fs->group_desc_count))
2257                         return EXT2_ET_CANCEL_REQUESTED;
2258
2259         return 0;
2260 }
2261
2262 /*
2263  * Process the inodes in the "inodes to process" list.
2264  */
2265 static void process_inodes(e2fsck_t ctx, char *block_buf)
2266 {
2267         int                     i;
2268         struct ext2_inode       *old_stashed_inode;
2269         ext2_ino_t              old_stashed_ino;
2270         const char              *old_operation;
2271         char                    buf[80];
2272         struct problem_context  pctx;
2273
2274 #if 0
2275         printf("begin process_inodes: ");
2276 #endif
2277         if (process_inode_count == 0)
2278                 return;
2279         old_operation = ehandler_operation(0);
2280         old_stashed_inode = ctx->stashed_inode;
2281         old_stashed_ino = ctx->stashed_ino;
2282         qsort(inodes_to_process, process_inode_count,
2283                       sizeof(struct process_inode_block), process_inode_cmp);
2284         clear_problem_context(&pctx);
2285         for (i=0; i < process_inode_count; i++) {
2286                 pctx.inode = ctx->stashed_inode =
2287                         (struct ext2_inode *) &inodes_to_process[i].inode;
2288                 pctx.ino = ctx->stashed_ino = inodes_to_process[i].ino;
2289
2290 #if 0
2291                 printf("%u ", pctx.ino);
2292 #endif
2293                 sprintf(buf, _("reading indirect blocks of inode %u"),
2294                         pctx.ino);
2295                 ehandler_operation(buf);
2296                 check_blocks(ctx, &pctx, block_buf,
2297                              &inodes_to_process[i].ea_ibody_quota);
2298                 if (e2fsck_should_abort(ctx))
2299                         break;
2300         }
2301         ctx->stashed_inode = old_stashed_inode;
2302         ctx->stashed_ino = old_stashed_ino;
2303         process_inode_count = 0;
2304 #if 0
2305         printf("end process inodes\n");
2306 #endif
2307         ehandler_operation(old_operation);
2308 }
2309
2310 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b)
2311 {
2312         const struct process_inode_block *ib_a =
2313                 (const struct process_inode_block *) a;
2314         const struct process_inode_block *ib_b =
2315                 (const struct process_inode_block *) b;
2316         int     ret;
2317
2318         ret = (ib_a->inode.i_block[EXT2_IND_BLOCK] -
2319                ib_b->inode.i_block[EXT2_IND_BLOCK]);
2320         if (ret == 0)
2321                 /*
2322                  * We only call process_inodes() for non-extent
2323                  * inodes, so it's OK to pass NULL to
2324                  * ext2fs_file_acl_block() here.
2325                  */
2326                 ret = ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_a->inode)) -
2327                         ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_b->inode));
2328         if (ret == 0)
2329                 ret = ib_a->ino - ib_b->ino;
2330         return ret;
2331 }
2332
2333 /*
2334  * Mark an inode as being bad in some what
2335  */
2336 static void mark_inode_bad(e2fsck_t ctx, ino_t ino)
2337 {
2338         struct          problem_context pctx;
2339
2340         if (!ctx->inode_bad_map) {
2341                 clear_problem_context(&pctx);
2342
2343                 pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
2344                                 _("bad inode map"), EXT2FS_BMAP64_RBTREE,
2345                                 "inode_bad_map", &ctx->inode_bad_map);
2346                 if (pctx.errcode) {
2347                         pctx.num = 3;
2348                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
2349                         /* Should never get here */
2350                         ctx->flags |= E2F_FLAG_ABORT;
2351                         return;
2352                 }
2353         }
2354         ext2fs_mark_inode_bitmap2(ctx->inode_bad_map, ino);
2355 }
2356
2357 static void add_casefolded_dir(e2fsck_t ctx, ino_t ino)
2358 {
2359         struct          problem_context pctx;
2360
2361         if (!ctx->casefolded_dirs) {
2362                 pctx.errcode = ext2fs_u32_list_create(&ctx->casefolded_dirs, 0);
2363                 if (pctx.errcode)
2364                         goto error;
2365         }
2366         pctx.errcode = ext2fs_u32_list_add(ctx->casefolded_dirs, ino);
2367         if (pctx.errcode == 0)
2368                 return;
2369 error:
2370         fix_problem(ctx, PR_1_ALLOCATE_CASEFOLDED_DIRLIST, &pctx);
2371         /* Should never get here */
2372         ctx->flags |= E2F_FLAG_ABORT;
2373 }
2374
2375 /*
2376  * This procedure will allocate the inode "bb" (badblock) map table
2377  */
2378 static void alloc_bb_map(e2fsck_t ctx)
2379 {
2380         struct          problem_context pctx;
2381
2382         clear_problem_context(&pctx);
2383         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
2384                         _("inode in bad block map"), EXT2FS_BMAP64_RBTREE,
2385                         "inode_bb_map", &ctx->inode_bb_map);
2386         if (pctx.errcode) {
2387                 pctx.num = 4;
2388                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
2389                 /* Should never get here */
2390                 ctx->flags |= E2F_FLAG_ABORT;
2391                 return;
2392         }
2393 }
2394
2395 /*
2396  * This procedure will allocate the inode imagic table
2397  */
2398 static void alloc_imagic_map(e2fsck_t ctx)
2399 {
2400         struct          problem_context pctx;
2401
2402         clear_problem_context(&pctx);
2403         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
2404                         _("imagic inode map"), EXT2FS_BMAP64_RBTREE,
2405                         "inode_imagic_map", &ctx->inode_imagic_map);
2406         if (pctx.errcode) {
2407                 pctx.num = 5;
2408                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
2409                 /* Should never get here */
2410                 ctx->flags |= E2F_FLAG_ABORT;
2411                 return;
2412         }
2413 }
2414
2415 /*
2416  * Marks a block as in use, setting the dup_map if it's been set
2417  * already.  Called by process_block and process_bad_block.
2418  *
2419  * WARNING: Assumes checks have already been done to make sure block
2420  * is valid.  This is true in both process_block and process_bad_block.
2421  */
2422 static _INLINE_ void mark_block_used(e2fsck_t ctx, blk64_t block)
2423 {
2424         struct          problem_context pctx;
2425
2426         clear_problem_context(&pctx);
2427
2428         if (ext2fs_fast_test_block_bitmap2(ctx->block_found_map, block)) {
2429                 if (ext2fs_has_feature_shared_blocks(ctx->fs->super) &&
2430                     !(ctx->options & E2F_OPT_UNSHARE_BLOCKS)) {
2431                         return;
2432                 }
2433                 if (!ctx->block_dup_map) {
2434                         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
2435                                         _("multiply claimed block map"),
2436                                         EXT2FS_BMAP64_RBTREE, "block_dup_map",
2437                                         &ctx->block_dup_map);
2438                         if (pctx.errcode) {
2439                                 pctx.num = 3;
2440                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR,
2441                                             &pctx);
2442                                 /* Should never get here */
2443                                 ctx->flags |= E2F_FLAG_ABORT;
2444                                 return;
2445                         }
2446                 }
2447                 ext2fs_fast_mark_block_bitmap2(ctx->block_dup_map, block);
2448         } else {
2449                 ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, block);
2450         }
2451 }
2452
2453 /*
2454  * When cluster size is greater than one block, it is caller's responsibility
2455  * to make sure block parameter starts at a cluster boundary.
2456  */
2457 static _INLINE_ void mark_blocks_used(e2fsck_t ctx, blk64_t block,
2458                                       unsigned int num)
2459 {
2460         if (ext2fs_test_block_bitmap_range2(ctx->block_found_map, block, num))
2461                 ext2fs_mark_block_bitmap_range2(ctx->block_found_map, block, num);
2462         else {
2463                 unsigned int i;
2464
2465                 for (i = 0; i < num; i += EXT2FS_CLUSTER_RATIO(ctx->fs))
2466                         mark_block_used(ctx, block + i);
2467         }
2468 }
2469
2470 /*
2471  * Adjust the extended attribute block's reference counts at the end
2472  * of pass 1, either by subtracting out references for EA blocks that
2473  * are still referenced in ctx->refcount, or by adding references for
2474  * EA blocks that had extra references as accounted for in
2475  * ctx->refcount_extra.
2476  */
2477 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
2478                                     char *block_buf, int adjust_sign)
2479 {
2480         struct ext2_ext_attr_header     *header;
2481         struct problem_context          pctx;
2482         ext2_filsys                     fs = ctx->fs;
2483         blk64_t                         blk;
2484         __u32                           should_be;
2485         ea_value_t                      count;
2486
2487         clear_problem_context(&pctx);
2488
2489         ea_refcount_intr_begin(refcount);
2490         while (1) {
2491                 if ((blk = ea_refcount_intr_next(refcount, &count)) == 0)
2492                         break;
2493                 pctx.blk = blk;
2494                 pctx.errcode = ext2fs_read_ext_attr3(fs, blk, block_buf,
2495                                                      pctx.ino);
2496                 if (pctx.errcode) {
2497                         fix_problem(ctx, PR_1_EXTATTR_READ_ABORT, &pctx);
2498                         return;
2499                 }
2500                 header = (struct ext2_ext_attr_header *) block_buf;
2501                 pctx.blkcount = header->h_refcount;
2502                 should_be = header->h_refcount + adjust_sign * (int)count;
2503                 pctx.num = should_be;
2504                 if (fix_problem(ctx, PR_1_EXTATTR_REFCOUNT, &pctx)) {
2505                         header->h_refcount = should_be;
2506                         pctx.errcode = ext2fs_write_ext_attr3(fs, blk,
2507                                                              block_buf,
2508                                                              pctx.ino);
2509                         if (pctx.errcode) {
2510                                 fix_problem(ctx, PR_1_EXTATTR_WRITE_ABORT,
2511                                             &pctx);
2512                                 continue;
2513                         }
2514                 }
2515         }
2516 }
2517
2518 /*
2519  * Handle processing the extended attribute blocks
2520  */
2521 static int check_ext_attr(e2fsck_t ctx, struct problem_context *pctx,
2522                            char *block_buf, struct ea_quota *ea_block_quota)
2523 {
2524         ext2_filsys fs = ctx->fs;
2525         ext2_ino_t      ino = pctx->ino;
2526         struct ext2_inode *inode = pctx->inode;
2527         blk64_t         blk;
2528         char *          end;
2529         struct ext2_ext_attr_header *header;
2530         struct ext2_ext_attr_entry *first, *entry;
2531         blk64_t         quota_blocks = EXT2FS_C2B(fs, 1);
2532         __u64           quota_inodes = 0;
2533         region_t        region = 0;
2534         int             failed_csum = 0;
2535
2536         ea_block_quota->blocks = 0;
2537         ea_block_quota->inodes = 0;
2538
2539         blk = ext2fs_file_acl_block(fs, inode);
2540         if (blk == 0)
2541                 return 0;
2542
2543         /*
2544          * If the Extended attribute flag isn't set, then a non-zero
2545          * file acl means that the inode is corrupted.
2546          *
2547          * Or if the extended attribute block is an invalid block,
2548          * then the inode is also corrupted.
2549          */
2550         if (!ext2fs_has_feature_xattr(fs->super) ||
2551             (blk < fs->super->s_first_data_block) ||
2552             (blk >= ext2fs_blocks_count(fs->super))) {
2553                 mark_inode_bad(ctx, ino);
2554                 return 0;
2555         }
2556
2557         /* If ea bitmap hasn't been allocated, create it */
2558         if (!ctx->block_ea_map) {
2559                 pctx->errcode = e2fsck_allocate_block_bitmap(fs,
2560                                         _("ext attr block map"),
2561                                         EXT2FS_BMAP64_RBTREE, "block_ea_map",
2562                                         &ctx->block_ea_map);
2563                 if (pctx->errcode) {
2564                         pctx->num = 2;
2565                         fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, pctx);
2566                         ctx->flags |= E2F_FLAG_ABORT;
2567                         return 0;
2568                 }
2569         }
2570
2571         /* Create the EA refcount structure if necessary */
2572         if (!ctx->refcount) {
2573                 pctx->errcode = ea_refcount_create(0, &ctx->refcount);
2574                 if (pctx->errcode) {
2575                         pctx->num = 1;
2576                         fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
2577                         ctx->flags |= E2F_FLAG_ABORT;
2578                         return 0;
2579                 }
2580         }
2581
2582 #if 0
2583         /* Debugging text */
2584         printf("Inode %u has EA block %u\n", ino, blk);
2585 #endif
2586
2587         /* Have we seen this EA block before? */
2588         if (ext2fs_fast_test_block_bitmap2(ctx->block_ea_map, blk)) {
2589                 ea_block_quota->blocks = EXT2FS_C2B(fs, 1);
2590                 ea_block_quota->inodes = 0;
2591
2592                 if (ctx->ea_block_quota_blocks) {
2593                         ea_refcount_fetch(ctx->ea_block_quota_blocks, blk,
2594                                           &quota_blocks);
2595                         if (quota_blocks)
2596                                 ea_block_quota->blocks = quota_blocks;
2597                 }
2598
2599                 if (ctx->ea_block_quota_inodes)
2600                         ea_refcount_fetch(ctx->ea_block_quota_inodes, blk,
2601                                           &ea_block_quota->inodes);
2602
2603                 if (ea_refcount_decrement(ctx->refcount, blk, 0) == 0)
2604                         return 1;
2605                 /* Ooops, this EA was referenced more than it stated */
2606                 if (!ctx->refcount_extra) {
2607                         pctx->errcode = ea_refcount_create(0,
2608                                            &ctx->refcount_extra);
2609                         if (pctx->errcode) {
2610                                 pctx->num = 2;
2611                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
2612                                 ctx->flags |= E2F_FLAG_ABORT;
2613                                 return 0;
2614                         }
2615                 }
2616                 ea_refcount_increment(ctx->refcount_extra, blk, 0);
2617                 return 1;
2618         }
2619
2620         /*
2621          * OK, we haven't seen this EA block yet.  So we need to
2622          * validate it
2623          */
2624         pctx->blk = blk;
2625         pctx->errcode = ext2fs_read_ext_attr3(fs, blk, block_buf, pctx->ino);
2626         if (pctx->errcode == EXT2_ET_EXT_ATTR_CSUM_INVALID) {
2627                 pctx->errcode = 0;
2628                 failed_csum = 1;
2629         } else if (pctx->errcode == EXT2_ET_BAD_EA_HEADER)
2630                 pctx->errcode = 0;
2631
2632         if (pctx->errcode &&
2633             fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx)) {
2634                 pctx->errcode = 0;
2635                 goto clear_extattr;
2636         }
2637         header = (struct ext2_ext_attr_header *) block_buf;
2638         pctx->blk = ext2fs_file_acl_block(fs, inode);
2639         if (((ctx->ext_attr_ver == 1) &&
2640              (header->h_magic != EXT2_EXT_ATTR_MAGIC_v1)) ||
2641             ((ctx->ext_attr_ver == 2) &&
2642              (header->h_magic != EXT2_EXT_ATTR_MAGIC))) {
2643                 if (fix_problem(ctx, PR_1_BAD_EA_BLOCK, pctx))
2644                         goto clear_extattr;
2645         }
2646
2647         if (header->h_blocks != 1) {
2648                 if (fix_problem(ctx, PR_1_EA_MULTI_BLOCK, pctx))
2649                         goto clear_extattr;
2650         }
2651
2652         if (pctx->errcode && fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx))
2653                 goto clear_extattr;
2654
2655         region = region_create(0, fs->blocksize);
2656         if (!region) {
2657                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
2658                 ctx->flags |= E2F_FLAG_ABORT;
2659                 return 0;
2660         }
2661         if (region_allocate(region, 0, sizeof(struct ext2_ext_attr_header))) {
2662                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
2663                         goto clear_extattr;
2664         }
2665
2666         first = (struct ext2_ext_attr_entry *)(header+1);
2667         end = block_buf + fs->blocksize;
2668         entry = first;
2669         while ((char *)entry < end && *(__u32 *)entry) {
2670                 __u32 hash;
2671
2672                 if (region_allocate(region, (char *)entry - (char *)header,
2673                                    EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
2674                         if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
2675                                 goto clear_extattr;
2676                         break;
2677                 }
2678                 if ((ctx->ext_attr_ver == 1 &&
2679                      (entry->e_name_len == 0 || entry->e_name_index != 0)) ||
2680                     (ctx->ext_attr_ver == 2 &&
2681                      entry->e_name_index == 0)) {
2682                         if (fix_problem(ctx, PR_1_EA_BAD_NAME, pctx))
2683                                 goto clear_extattr;
2684                         break;
2685                 }
2686                 if (entry->e_value_inum == 0) {
2687                         if (entry->e_value_offs + entry->e_value_size >
2688                             fs->blocksize) {
2689                                 if (fix_problem(ctx, PR_1_EA_BAD_VALUE, pctx))
2690                                         goto clear_extattr;
2691                                 break;
2692                         }
2693                         if (entry->e_value_size &&
2694                             region_allocate(region, entry->e_value_offs,
2695                                             EXT2_EXT_ATTR_SIZE(entry->e_value_size))) {
2696                                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION,
2697                                                 pctx))
2698                                         goto clear_extattr;
2699                         }
2700
2701                         hash = ext2fs_ext_attr_hash_entry(entry, block_buf +
2702                                                           entry->e_value_offs);
2703
2704                         if (entry->e_hash != hash) {
2705                                 pctx->num = entry->e_hash;
2706                                 if (fix_problem(ctx, PR_1_ATTR_HASH, pctx))
2707                                         goto clear_extattr;
2708                                 entry->e_hash = hash;
2709                         }
2710                 } else {
2711                         problem_t problem;
2712                         blk64_t entry_quota_blocks;
2713
2714                         problem = check_large_ea_inode(ctx, entry, pctx,
2715                                                        &entry_quota_blocks);
2716                         if (problem && fix_problem(ctx, problem, pctx))
2717                                 goto clear_extattr;
2718
2719                         quota_blocks += entry_quota_blocks;
2720                         quota_inodes++;
2721                 }
2722
2723                 entry = EXT2_EXT_ATTR_NEXT(entry);
2724         }
2725         if (region_allocate(region, (char *)entry - (char *)header, 4)) {
2726                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
2727                         goto clear_extattr;
2728         }
2729         region_free(region);
2730
2731         /*
2732          * We only get here if there was no other errors that were fixed.
2733          * If there was a checksum fail, ask to correct it.
2734          */
2735         if (failed_csum &&
2736             fix_problem(ctx, PR_1_EA_BLOCK_ONLY_CSUM_INVALID, pctx)) {
2737                 pctx->errcode = ext2fs_write_ext_attr3(fs, blk, block_buf,
2738                                                        pctx->ino);
2739                 if (pctx->errcode)
2740                         return 0;
2741         }
2742
2743         if (quota_blocks != EXT2FS_C2B(fs, 1U)) {
2744                 if (!ctx->ea_block_quota_blocks) {
2745                         pctx->errcode = ea_refcount_create(0,
2746                                                 &ctx->ea_block_quota_blocks);
2747                         if (pctx->errcode) {
2748                                 pctx->num = 3;
2749                                 goto refcount_fail;
2750                         }
2751                 }
2752                 ea_refcount_store(ctx->ea_block_quota_blocks, blk,
2753                                   quota_blocks);
2754         }
2755
2756         if (quota_inodes) {
2757                 if (!ctx->ea_block_quota_inodes) {
2758                         pctx->errcode = ea_refcount_create(0,
2759                                                 &ctx->ea_block_quota_inodes);
2760                         if (pctx->errcode) {
2761                                 pctx->num = 4;
2762 refcount_fail:
2763                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
2764                                 ctx->flags |= E2F_FLAG_ABORT;
2765                                 return 0;
2766                         }
2767                 }
2768
2769                 ea_refcount_store(ctx->ea_block_quota_inodes, blk,
2770                                   quota_inodes);
2771         }
2772         ea_block_quota->blocks = quota_blocks;
2773         ea_block_quota->inodes = quota_inodes;
2774
2775         inc_ea_inode_refs(ctx, pctx, first, end);
2776         ea_refcount_store(ctx->refcount, blk, header->h_refcount - 1);
2777         mark_block_used(ctx, blk);
2778         ext2fs_fast_mark_block_bitmap2(ctx->block_ea_map, blk);
2779         return 1;
2780
2781 clear_extattr:
2782         if (region)
2783                 region_free(region);
2784         ext2fs_file_acl_block_set(fs, inode, 0);
2785         e2fsck_write_inode(ctx, ino, inode, "check_ext_attr");
2786         return 0;
2787 }
2788
2789 /* Returns 1 if bad htree, 0 if OK */
2790 static int handle_htree(e2fsck_t ctx, struct problem_context *pctx,
2791                         ext2_ino_t ino, struct ext2_inode *inode,
2792                         char *block_buf)
2793 {
2794         struct ext2_dx_root_info        *root;
2795         ext2_filsys                     fs = ctx->fs;
2796         errcode_t                       retval;
2797         blk64_t                         blk;
2798
2799         if ((!LINUX_S_ISDIR(inode->i_mode) &&
2800              fix_problem(ctx, PR_1_HTREE_NODIR, pctx)) ||
2801             (!ext2fs_has_feature_dir_index(fs->super) &&
2802              fix_problem(ctx, PR_1_HTREE_SET, pctx)))
2803                 return 1;
2804
2805         pctx->errcode = ext2fs_bmap2(fs, ino, inode, 0, 0, 0, 0, &blk);
2806
2807         if ((pctx->errcode) ||
2808             (blk == 0) ||
2809             (blk < fs->super->s_first_data_block) ||
2810             (blk >= ext2fs_blocks_count(fs->super))) {
2811                 if (fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
2812                         return 1;
2813                 else
2814                         return 0;
2815         }
2816
2817         retval = io_channel_read_blk64(fs->io, blk, 1, block_buf);
2818         if (retval && fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
2819                 return 1;
2820
2821         /* XXX should check that beginning matches a directory */
2822         root = (struct ext2_dx_root_info *) (block_buf + 24);
2823
2824         if ((root->reserved_zero || root->info_length < 8) &&
2825             fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
2826                 return 1;
2827
2828         pctx->num = root->hash_version;
2829         if ((root->hash_version != EXT2_HASH_LEGACY) &&
2830             (root->hash_version != EXT2_HASH_HALF_MD4) &&
2831             (root->hash_version != EXT2_HASH_TEA) &&
2832             (root->hash_version != EXT2_HASH_SIPHASH) &&
2833             fix_problem(ctx, PR_1_HTREE_HASHV, pctx))
2834                 return 1;
2835
2836         if (ext4_hash_in_dirent(inode)) {
2837                 if (root->hash_version != EXT2_HASH_SIPHASH &&
2838                     fix_problem(ctx, PR_1_HTREE_NEEDS_SIPHASH, pctx))
2839                         return 1;
2840         } else {
2841                 if (root->hash_version == EXT2_HASH_SIPHASH &&
2842                    fix_problem(ctx, PR_1_HTREE_CANNOT_SIPHASH, pctx))
2843                         return 1;
2844         }
2845
2846         if ((root->unused_flags & EXT2_HASH_FLAG_INCOMPAT) &&
2847             fix_problem(ctx, PR_1_HTREE_INCOMPAT, pctx))
2848                 return 1;
2849
2850         pctx->num = root->indirect_levels;
2851         /* if htree level is clearly too high, consider it to be broken */
2852         if (root->indirect_levels > EXT4_HTREE_LEVEL &&
2853             fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
2854                 return 1;
2855
2856         /* if level is only maybe too high, LARGE_DIR feature could be unset */
2857         if (root->indirect_levels > ext2_dir_htree_level(fs) &&
2858             !ext2fs_has_feature_largedir(fs->super)) {
2859                 int blockbits = EXT2_BLOCK_SIZE_BITS(fs->super) + 10;
2860                 unsigned idx_pb = 1 << (blockbits - 3);
2861
2862                 /* compare inode size/blocks vs. max-sized 2-level htree */
2863                 if (EXT2_I_SIZE(pctx->inode) <
2864                     (idx_pb - 1) * (idx_pb - 2) << blockbits &&
2865                     pctx->inode->i_blocks <
2866                     (idx_pb - 1) * (idx_pb - 2) << (blockbits - 9) &&
2867                     fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
2868                         return 1;
2869         }
2870
2871         if (root->indirect_levels > EXT4_HTREE_LEVEL_COMPAT ||
2872             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
2873                 ctx->large_dirs++;
2874
2875         return 0;
2876 }
2877
2878 void e2fsck_clear_inode(e2fsck_t ctx, ext2_ino_t ino,
2879                         struct ext2_inode *inode, int restart_flag,
2880                         const char *source)
2881 {
2882         inode->i_flags = 0;
2883         inode->i_links_count = 0;
2884         ext2fs_icount_store(ctx->inode_link_info, ino, 0);
2885         inode->i_dtime = ctx->now;
2886
2887         /*
2888          * If a special inode has such rotten block mappings that we
2889          * want to clear the whole inode, be sure to actually zap
2890          * the block maps because i_links_count isn't checked for
2891          * special inodes, and we'll end up right back here the next
2892          * time we run fsck.
2893          */
2894         if (ino < EXT2_FIRST_INODE(ctx->fs->super))
2895                 memset(inode->i_block, 0, sizeof(inode->i_block));
2896
2897         ext2fs_unmark_inode_bitmap2(ctx->inode_dir_map, ino);
2898         ext2fs_unmark_inode_bitmap2(ctx->inode_used_map, ino);
2899         if (ctx->inode_reg_map)
2900                 ext2fs_unmark_inode_bitmap2(ctx->inode_reg_map, ino);
2901         if (ctx->inode_bad_map)
2902                 ext2fs_unmark_inode_bitmap2(ctx->inode_bad_map, ino);
2903
2904         /*
2905          * If the inode was partially accounted for before processing
2906          * was aborted, we need to restart the pass 1 scan.
2907          */
2908         ctx->flags |= restart_flag;
2909
2910         if (ino == EXT2_BAD_INO)
2911                 memset(inode, 0, sizeof(struct ext2_inode));
2912
2913         e2fsck_write_inode(ctx, ino, inode, source);
2914 }
2915
2916 /*
2917  * Use the multiple-blocks reclamation code to fix alignment problems in
2918  * a bigalloc filesystem.  We want a logical cluster to map to *only* one
2919  * physical cluster, and we want the block offsets within that cluster to
2920  * line up.
2921  */
2922 static int has_unaligned_cluster_map(e2fsck_t ctx,
2923                                      blk64_t last_pblk, blk64_t last_lblk,
2924                                      blk64_t pblk, blk64_t lblk)
2925 {
2926         blk64_t cluster_mask;
2927
2928         if (!ctx->fs->cluster_ratio_bits)
2929                 return 0;
2930         cluster_mask = EXT2FS_CLUSTER_MASK(ctx->fs);
2931
2932         /*
2933          * If the block in the logical cluster doesn't align with the block in
2934          * the physical cluster...
2935          */
2936         if ((lblk & cluster_mask) != (pblk & cluster_mask))
2937                 return 1;
2938
2939         /*
2940          * If we cross a physical cluster boundary within a logical cluster...
2941          */
2942         if (last_pblk && (lblk & cluster_mask) != 0 &&
2943             EXT2FS_B2C(ctx->fs, lblk) == EXT2FS_B2C(ctx->fs, last_lblk) &&
2944             EXT2FS_B2C(ctx->fs, pblk) != EXT2FS_B2C(ctx->fs, last_pblk))
2945                 return 1;
2946
2947         return 0;
2948 }
2949
2950 static void scan_extent_node(e2fsck_t ctx, struct problem_context *pctx,
2951                              struct process_block_struct *pb,
2952                              blk64_t start_block, blk64_t end_block,
2953                              blk64_t eof_block,
2954                              ext2_extent_handle_t ehandle,
2955                              int try_repairs)
2956 {
2957         struct ext2fs_extent    extent;
2958         blk64_t                 blk, last_lblk;
2959         unsigned int            i, n;
2960         int                     is_dir, is_leaf;
2961         problem_t               problem;
2962         struct ext2_extent_info info;
2963         int                     failed_csum = 0;
2964
2965         if (pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID)
2966                 failed_csum = 1;
2967
2968         pctx->errcode = ext2fs_extent_get_info(ehandle, &info);
2969         if (pctx->errcode)
2970                 return;
2971         if (!(ctx->options & E2F_OPT_FIXES_ONLY) &&
2972             !pb->eti.force_rebuild) {
2973                 struct extent_tree_level *etl;
2974
2975                 etl = pb->eti.ext_info + info.curr_level;
2976                 etl->num_extents += info.num_entries;
2977                 etl->max_extents += info.max_entries;
2978                 /*
2979                  * Implementation wart: Splitting extent blocks when appending
2980                  * will leave the old block with one free entry.  Therefore
2981                  * unless the node is totally full, pretend that a non-root
2982                  * extent block can hold one fewer entry than it actually does,
2983                  * so that we don't repeatedly rebuild the extent tree.
2984                  */
2985                 if (info.curr_level && info.num_entries < info.max_entries)
2986                         etl->max_extents--;
2987         }
2988
2989         pctx->errcode = ext2fs_extent_get(ehandle, EXT2_EXTENT_FIRST_SIB,
2990                                           &extent);
2991         while ((pctx->errcode == 0 ||
2992                 pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID) &&
2993                info.num_entries-- > 0) {
2994                 is_leaf = extent.e_flags & EXT2_EXTENT_FLAGS_LEAF;
2995                 is_dir = LINUX_S_ISDIR(pctx->inode->i_mode);
2996                 last_lblk = extent.e_lblk + extent.e_len - 1;
2997
2998                 problem = 0;
2999                 pctx->blk = extent.e_pblk;
3000                 pctx->blk2 = extent.e_lblk;
3001                 pctx->num = extent.e_len;
3002                 pctx->blkcount = extent.e_lblk + extent.e_len;
3003
3004                 if (extent.e_pblk == 0 ||
3005                     extent.e_pblk < ctx->fs->super->s_first_data_block ||
3006                     extent.e_pblk >= ext2fs_blocks_count(ctx->fs->super))
3007                         problem = PR_1_EXTENT_BAD_START_BLK;
3008                 else if (extent.e_lblk < start_block)
3009                         problem = PR_1_OUT_OF_ORDER_EXTENTS;
3010                 else if ((end_block && last_lblk > end_block) &&
3011                          !(last_lblk > eof_block &&
3012                            ((extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) ||
3013                             (pctx->inode->i_flags & EXT4_VERITY_FL))))
3014                         problem = PR_1_EXTENT_END_OUT_OF_BOUNDS;
3015                 else if (is_leaf && extent.e_len == 0)
3016                         problem = PR_1_EXTENT_LENGTH_ZERO;
3017                 else if (is_leaf &&
3018                          (extent.e_pblk + extent.e_len) >
3019                          ext2fs_blocks_count(ctx->fs->super))
3020                         problem = PR_1_EXTENT_ENDS_BEYOND;
3021                 else if (is_leaf && is_dir && !pctx->inode->i_size_high &&
3022                          !ext2fs_has_feature_largedir(ctx->fs->super) &&
3023                          ((extent.e_lblk + extent.e_len) >
3024                           (1U << (21 - ctx->fs->super->s_log_block_size))))
3025                         problem = PR_1_TOOBIG_DIR;
3026
3027                 if (is_leaf && problem == 0 && extent.e_len > 0) {
3028 #if 0
3029                         printf("extent_region(ino=%u, expect=%llu, "
3030                                "lblk=%llu, len=%u)\n", pb->ino,
3031                                (unsigned long long) pb->next_lblock,
3032                                (unsigned long long) extent.e_lblk,
3033                                extent.e_len);
3034 #endif
3035                         if (extent.e_lblk < pb->next_lblock)
3036                                 problem = PR_1_EXTENT_COLLISION;
3037                         else if (extent.e_lblk + extent.e_len > pb->next_lblock)
3038                                 pb->next_lblock = extent.e_lblk + extent.e_len;
3039                 }
3040
3041                 /*
3042                  * Uninitialized blocks in a directory?  Clear the flag and
3043                  * we'll interpret the blocks later.
3044                  */
3045                 if (try_repairs && is_dir && problem == 0 &&
3046                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3047                     fix_problem(ctx, PR_1_UNINIT_DBLOCK, pctx)) {
3048                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3049                         pb->inode_modified = 1;
3050                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3051                                                               &extent);
3052                         if (pctx->errcode)
3053                                 return;
3054                         failed_csum = 0;
3055                 }
3056 #ifdef CONFIG_DEVELOPER_FEATURES
3057                 if (try_repairs && !is_dir && problem == 0 &&
3058                     (ctx->options & E2F_OPT_CLEAR_UNINIT) &&
3059                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3060                     fix_problem(ctx, PR_1_CLEAR_UNINIT_EXTENT, pctx)) {
3061                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3062                         pb->inode_modified = 1;
3063                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3064                                                               &extent);
3065                         if (pctx->errcode)
3066                                 return;
3067                         failed_csum = 0;
3068                 }
3069 #endif
3070                 if (try_repairs && problem) {
3071 report_problem:
3072                         if (fix_problem(ctx, problem, pctx)) {
3073                                 if (ctx->invalid_bitmaps) {
3074                                         /*
3075                                          * If fsck knows the bitmaps are bad,
3076                                          * skip to the next extent and
3077                                          * try to clear this extent again
3078                                          * after fixing the bitmaps, by
3079                                          * restarting fsck.
3080                                          */
3081                                         pctx->errcode = ext2fs_extent_get(
3082                                                           ehandle,
3083                                                           EXT2_EXTENT_NEXT_SIB,
3084                                                           &extent);
3085                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3086                                         if (pctx->errcode ==
3087                                                     EXT2_ET_NO_CURRENT_NODE) {
3088                                                 pctx->errcode = 0;
3089                                                 break;
3090                                         }
3091                                         continue;
3092                                 }
3093                                 e2fsck_read_bitmaps(ctx);
3094                                 pb->inode_modified = 1;
3095                                 pctx->errcode =
3096                                         ext2fs_extent_delete(ehandle, 0);
3097                                 if (pctx->errcode) {
3098                                         pctx->str = "ext2fs_extent_delete";
3099                                         return;
3100                                 }
3101                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
3102                                 if (pctx->errcode &&
3103                                     pctx->errcode != EXT2_ET_NO_CURRENT_NODE) {
3104                                         pctx->str = "ext2fs_extent_fix_parents";
3105                                         return;
3106                                 }
3107                                 pctx->errcode = ext2fs_extent_get(ehandle,
3108                                                                   EXT2_EXTENT_CURRENT,
3109                                                                   &extent);
3110                                 if (pctx->errcode == EXT2_ET_NO_CURRENT_NODE) {
3111                                         pctx->errcode = 0;
3112                                         break;
3113                                 }
3114                                 failed_csum = 0;
3115                                 continue;
3116                         }
3117                         goto next;
3118                 }
3119
3120                 if (!is_leaf) {
3121                         blk64_t lblk = extent.e_lblk;
3122                         int next_try_repairs = 1;
3123
3124                         blk = extent.e_pblk;
3125
3126                         /*
3127                          * If this lower extent block collides with critical
3128                          * metadata, don't try to repair the damage.  Pass 1b
3129                          * will reallocate the block; then we can try again.
3130                          */
3131                         if (pb->ino != EXT2_RESIZE_INO &&
3132                             extent.e_pblk < ctx->fs->super->s_blocks_count &&
3133                             ext2fs_test_block_bitmap2(ctx->block_metadata_map,
3134                                                       extent.e_pblk)) {
3135                                 next_try_repairs = 0;
3136                                 pctx->blk = blk;
3137                                 fix_problem(ctx,
3138                                             PR_1_CRITICAL_METADATA_COLLISION,
3139                                             pctx);
3140                                 if ((ctx->options & E2F_OPT_NO) == 0)
3141                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3142                         }
3143                         pctx->errcode = ext2fs_extent_get(ehandle,
3144                                                   EXT2_EXTENT_DOWN, &extent);
3145                         if (pctx->errcode &&
3146                             pctx->errcode != EXT2_ET_EXTENT_CSUM_INVALID) {
3147                                 pctx->str = "EXT2_EXTENT_DOWN";
3148                                 problem = PR_1_EXTENT_HEADER_INVALID;
3149                                 if (!next_try_repairs)
3150                                         return;
3151                                 if (pctx->errcode == EXT2_ET_EXTENT_HEADER_BAD)
3152                                         goto report_problem;
3153                                 return;
3154                         }
3155                         /* The next extent should match this index's logical start */
3156                         if (extent.e_lblk != lblk) {
3157                                 struct ext2_extent_info e_info;
3158
3159                                 pctx->errcode = ext2fs_extent_get_info(ehandle,
3160                                                                        &e_info);
3161                                 if (pctx->errcode) {
3162                                         pctx->str = "ext2fs_extent_get_info";
3163                                         return;
3164                                 }
3165                                 pctx->blk = lblk;
3166                                 pctx->blk2 = extent.e_lblk;
3167                                 pctx->num = e_info.curr_level - 1;
3168                                 problem = PR_1_EXTENT_INDEX_START_INVALID;
3169                                 if (fix_problem(ctx, problem, pctx)) {
3170                                         pb->inode_modified = 1;
3171                                         pctx->errcode =
3172                                                 ext2fs_extent_fix_parents(ehandle);
3173                                         if (pctx->errcode) {
3174                                                 pctx->str = "ext2fs_extent_fix_parents";
3175                                                 return;
3176                                         }
3177                                 }
3178                         }
3179                         scan_extent_node(ctx, pctx, pb, extent.e_lblk,
3180                                          last_lblk, eof_block, ehandle,
3181                                          next_try_repairs);
3182                         if (pctx->errcode)
3183                                 return;
3184                         pctx->errcode = ext2fs_extent_get(ehandle,
3185                                                   EXT2_EXTENT_UP, &extent);
3186                         if (pctx->errcode) {
3187                                 pctx->str = "EXT2_EXTENT_UP";
3188                                 return;
3189                         }
3190                         mark_block_used(ctx, blk);
3191                         pb->num_blocks++;
3192                         goto next;
3193                 }
3194
3195                 if ((pb->previous_block != 0) &&
3196                     (pb->previous_block+1 != extent.e_pblk)) {
3197                         if (ctx->options & E2F_OPT_FRAGCHECK) {
3198                                 char type = '?';
3199
3200                                 if (pb->is_dir)
3201                                         type = 'd';
3202                                 else if (pb->is_reg)
3203                                         type = 'f';
3204
3205                                 printf(("%6lu(%c): expecting %6lu "
3206                                         "actual extent "
3207                                         "phys %6lu log %lu len %lu\n"),
3208                                        (unsigned long) pctx->ino, type,
3209                                        (unsigned long) pb->previous_block+1,
3210                                        (unsigned long) extent.e_pblk,
3211                                        (unsigned long) extent.e_lblk,
3212                                        (unsigned long) extent.e_len);
3213                         }
3214                         pb->fragmented = 1;
3215                 }
3216                 /*
3217                  * If we notice a gap in the logical block mappings of an
3218                  * extent-mapped directory, offer to close the hole by
3219                  * moving the logical block down, otherwise we'll go mad in
3220                  * pass 3 allocating empty directory blocks to fill the hole.
3221                  */
3222                 if (try_repairs && is_dir &&
3223                     pb->last_block + 1 < extent.e_lblk) {
3224                         blk64_t new_lblk;
3225
3226                         new_lblk = pb->last_block + 1;
3227                         if (EXT2FS_CLUSTER_RATIO(ctx->fs) > 1)
3228                                 new_lblk = ((new_lblk +
3229                                              EXT2FS_CLUSTER_RATIO(ctx->fs) - 1) &
3230                                             ~EXT2FS_CLUSTER_MASK(ctx->fs)) |
3231                                            (extent.e_pblk &
3232                                             EXT2FS_CLUSTER_MASK(ctx->fs));
3233                         pctx->blk = extent.e_lblk;
3234                         pctx->blk2 = new_lblk;
3235                         if (fix_problem(ctx, PR_1_COLLAPSE_DBLOCK, pctx)) {
3236                                 extent.e_lblk = new_lblk;
3237                                 pb->inode_modified = 1;
3238                                 pctx->errcode = ext2fs_extent_replace(ehandle,
3239                                                                 0, &extent);
3240                                 if (pctx->errcode) {
3241                                         pctx->errcode = 0;
3242                                         goto alloc_later;
3243                                 }
3244                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
3245                                 if (pctx->errcode)
3246                                         goto failed_add_dir_block;
3247                                 pctx->errcode = ext2fs_extent_goto(ehandle,
3248                                                                 extent.e_lblk);
3249                                 if (pctx->errcode)
3250                                         goto failed_add_dir_block;
3251                                 last_lblk = extent.e_lblk + extent.e_len - 1;
3252                                 failed_csum = 0;
3253                         }
3254                 }
3255 alloc_later:
3256                 if (is_dir) {
3257                         while (++pb->last_db_block <
3258                                (e2_blkcnt_t) extent.e_lblk) {
3259                                 pctx->errcode = ext2fs_add_dir_block2(
3260                                                         ctx->fs->dblist,
3261                                                         pb->ino, 0,
3262                                                         pb->last_db_block);
3263                                 if (pctx->errcode) {
3264                                         pctx->blk = 0;
3265                                         pctx->num = pb->last_db_block;
3266                                         goto failed_add_dir_block;
3267                                 }
3268                         }
3269
3270                         for (i = 0; i < extent.e_len; i++) {
3271                                 pctx->errcode = ext2fs_add_dir_block2(
3272                                                         ctx->fs->dblist,
3273                                                         pctx->ino,
3274                                                         extent.e_pblk + i,
3275                                                         extent.e_lblk + i);
3276                                 if (pctx->errcode) {
3277                                         pctx->blk = extent.e_pblk + i;
3278                                         pctx->num = extent.e_lblk + i;
3279                                 failed_add_dir_block:
3280                                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
3281                                         /* Should never get here */
3282                                         ctx->flags |= E2F_FLAG_ABORT;
3283                                         return;
3284                                 }
3285                         }
3286                         if (extent.e_len > 0)
3287                                 pb->last_db_block = extent.e_lblk + extent.e_len - 1;
3288                 }
3289                 if (has_unaligned_cluster_map(ctx, pb->previous_block,
3290                                               pb->last_block,
3291                                               extent.e_pblk,
3292                                               extent.e_lblk)) {
3293                         for (i = 0; i < extent.e_len; i++) {
3294                                 pctx->blk = extent.e_lblk + i;
3295                                 pctx->blk2 = extent.e_pblk + i;
3296                                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
3297                                 mark_block_used(ctx, extent.e_pblk + i);
3298                                 mark_block_used(ctx, extent.e_pblk + i);
3299                         }
3300                 }
3301
3302                 /*
3303                  * Check whether first cluster got marked in previous iteration.
3304                  */
3305                 if (ctx->fs->cluster_ratio_bits &&
3306                     pb->previous_block &&
3307                     (EXT2FS_B2C(ctx->fs, extent.e_pblk) ==
3308                      EXT2FS_B2C(ctx->fs, pb->previous_block)))
3309                         /* Set blk to the beginning of next cluster. */
3310                         blk = EXT2FS_C2B(
3311                                 ctx->fs,
3312                                 EXT2FS_B2C(ctx->fs, extent.e_pblk) + 1);
3313                 else
3314                         /* Set blk to the beginning of current cluster. */
3315                         blk = EXT2FS_C2B(ctx->fs,
3316                                          EXT2FS_B2C(ctx->fs, extent.e_pblk));
3317
3318                 if (blk < extent.e_pblk + extent.e_len) {
3319                         mark_blocks_used(ctx, blk,
3320                                          extent.e_pblk + extent.e_len - blk);
3321                         n = DIV_ROUND_UP(extent.e_pblk + extent.e_len - blk,
3322                                          EXT2FS_CLUSTER_RATIO(ctx->fs));
3323                         pb->num_blocks += n;
3324                 }
3325                 pb->last_block = extent.e_lblk + extent.e_len - 1;
3326                 pb->previous_block = extent.e_pblk + extent.e_len - 1;
3327                 start_block = pb->last_block = last_lblk;
3328                 if (is_leaf && !is_dir &&
3329                     !(extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT))
3330                         pb->last_init_lblock = last_lblk;
3331         next:
3332                 pctx->errcode = ext2fs_extent_get(ehandle,
3333                                                   EXT2_EXTENT_NEXT_SIB,
3334                                                   &extent);
3335         }
3336
3337         /* Failed csum but passes checks?  Ask to fix checksum. */
3338         if (failed_csum &&
3339             fix_problem(ctx, PR_1_EXTENT_ONLY_CSUM_INVALID, pctx)) {
3340                 pb->inode_modified = 1;
3341                 pctx->errcode = ext2fs_extent_replace(ehandle, 0, &extent);
3342                 if (pctx->errcode)
3343                         return;
3344         }
3345
3346         if (pctx->errcode == EXT2_ET_EXTENT_NO_NEXT)
3347                 pctx->errcode = 0;
3348 }
3349
3350 static void check_blocks_extents(e2fsck_t ctx, struct problem_context *pctx,
3351                                  struct process_block_struct *pb)
3352 {
3353         struct ext2_extent_info info;
3354         struct ext2_inode       *inode = pctx->inode;
3355         ext2_extent_handle_t    ehandle;
3356         ext2_filsys             fs = ctx->fs;
3357         ext2_ino_t              ino = pctx->ino;
3358         errcode_t               retval;
3359         blk64_t                 eof_lblk;
3360         struct ext3_extent_header       *eh;
3361
3362         /* Check for a proper extent header... */
3363         eh = (struct ext3_extent_header *) &inode->i_block[0];
3364         retval = ext2fs_extent_header_verify(eh, sizeof(inode->i_block));
3365         if (retval) {
3366                 if (fix_problem(ctx, PR_1_MISSING_EXTENT_HEADER, pctx))
3367                         e2fsck_clear_inode(ctx, ino, inode, 0,
3368                                            "check_blocks_extents");
3369                 pctx->errcode = 0;
3370                 return;
3371         }
3372
3373         /* ...since this function doesn't fail if i_block is zeroed. */
3374         pctx->errcode = ext2fs_extent_open2(fs, ino, inode, &ehandle);
3375         if (pctx->errcode) {
3376                 if (fix_problem(ctx, PR_1_READ_EXTENT, pctx))
3377                         e2fsck_clear_inode(ctx, ino, inode, 0,
3378                                            "check_blocks_extents");
3379                 pctx->errcode = 0;
3380                 return;
3381         }
3382
3383         retval = ext2fs_extent_get_info(ehandle, &info);
3384         if (retval == 0) {
3385                 int max_depth = info.max_depth;
3386
3387                 if (max_depth >= MAX_EXTENT_DEPTH_COUNT)
3388                         max_depth = MAX_EXTENT_DEPTH_COUNT-1;
3389                 ctx->extent_depth_count[max_depth]++;
3390         }
3391
3392         /* Check maximum extent depth */
3393         pctx->blk = info.max_depth;
3394         pctx->blk2 = ext2fs_max_extent_depth(ehandle);
3395         if (pctx->blk2 < pctx->blk &&
3396             fix_problem(ctx, PR_1_EXTENT_BAD_MAX_DEPTH, pctx))
3397                 pb->eti.force_rebuild = 1;
3398
3399         /* Can we collect extent tree level stats? */
3400         pctx->blk = MAX_EXTENT_DEPTH_COUNT;
3401         if (pctx->blk2 > pctx->blk)
3402                 fix_problem(ctx, PR_1E_MAX_EXTENT_TREE_DEPTH, pctx);
3403         memset(pb->eti.ext_info, 0, sizeof(pb->eti.ext_info));
3404         pb->eti.ino = pb->ino;
3405
3406         pb->next_lblock = 0;
3407
3408         eof_lblk = ((EXT2_I_SIZE(inode) + fs->blocksize - 1) >>
3409                 EXT2_BLOCK_SIZE_BITS(fs->super)) - 1;
3410         scan_extent_node(ctx, pctx, pb, 0, 0, eof_lblk, ehandle, 1);
3411         if (pctx->errcode &&
3412             fix_problem(ctx, PR_1_EXTENT_ITERATE_FAILURE, pctx)) {
3413                 pb->num_blocks = 0;
3414                 inode->i_blocks = 0;
3415                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
3416                                    "check_blocks_extents");
3417                 pctx->errcode = 0;
3418         }
3419         ext2fs_extent_free(ehandle);
3420
3421         /* Rebuild unless it's a dir and we're rehashing it */
3422         if (LINUX_S_ISDIR(inode->i_mode) &&
3423             e2fsck_dir_will_be_rehashed(ctx, ino))
3424                 return;
3425
3426         if (ctx->options & E2F_OPT_CONVERT_BMAP)
3427                 e2fsck_rebuild_extents_later(ctx, ino);
3428         else
3429                 e2fsck_should_rebuild_extents(ctx, pctx, &pb->eti, &info);
3430 }
3431
3432 /*
3433  * In fact we don't need to check blocks for an inode with inline data
3434  * because this inode doesn't have any blocks.  In this function all
3435  * we need to do is add this inode into dblist when it is a directory.
3436  */
3437 static void check_blocks_inline_data(e2fsck_t ctx, struct problem_context *pctx,
3438                                      struct process_block_struct *pb)
3439 {
3440         int     flags;
3441         size_t  inline_data_size = 0;
3442
3443         if (!pb->is_dir) {
3444                 pctx->errcode = 0;
3445                 return;
3446         }
3447
3448         /* Process the dirents in i_block[] as the "first" block. */
3449         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 0);
3450         if (pctx->errcode)
3451                 goto err;
3452
3453         /* Process the dirents in the EA as a "second" block. */
3454         flags = ctx->fs->flags;
3455         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
3456         pctx->errcode = ext2fs_inline_data_size(ctx->fs, pb->ino,
3457                                                 &inline_data_size);
3458         ctx->fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
3459                          (ctx->fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
3460         if (pctx->errcode) {
3461                 pctx->errcode = 0;
3462                 return;
3463         }
3464
3465         if (inline_data_size <= EXT4_MIN_INLINE_DATA_SIZE)
3466                 return;
3467
3468         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 1);
3469         if (pctx->errcode)
3470                 goto err;
3471
3472         return;
3473 err:
3474         pctx->blk = 0;
3475         pctx->num = 0;
3476         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
3477         ctx->flags |= E2F_FLAG_ABORT;
3478 }
3479
3480 /*
3481  * This subroutine is called on each inode to account for all of the
3482  * blocks used by that inode.
3483  */
3484 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
3485                          char *block_buf, const struct ea_quota *ea_ibody_quota)
3486 {
3487         ext2_filsys fs = ctx->fs;
3488         struct process_block_struct pb;
3489         ext2_ino_t      ino = pctx->ino;
3490         struct ext2_inode *inode = pctx->inode;
3491         unsigned        bad_size = 0;
3492         int             dirty_inode = 0;
3493         int             extent_fs;
3494         int             inlinedata_fs;
3495         __u64           size;
3496         struct ea_quota ea_block_quota;
3497
3498         pb.ino = ino;
3499         pb.num_blocks = EXT2FS_B2C(ctx->fs,
3500                                    ea_ibody_quota ? ea_ibody_quota->blocks : 0);
3501         pb.last_block = ~0;
3502         pb.last_init_lblock = -1;
3503         pb.last_db_block = -1;
3504         pb.num_illegal_blocks = 0;
3505         pb.suppress = 0; pb.clear = 0;
3506         pb.fragmented = 0;
3507         pb.compressed = 0;
3508         pb.previous_block = 0;
3509         pb.is_dir = LINUX_S_ISDIR(inode->i_mode);
3510         pb.is_reg = LINUX_S_ISREG(inode->i_mode);
3511         pb.max_blocks = 1U << (31 - fs->super->s_log_block_size);
3512         pb.inode = inode;
3513         pb.pctx = pctx;
3514         pb.ctx = ctx;
3515         pb.inode_modified = 0;
3516         pb.eti.force_rebuild = 0;
3517         pctx->ino = ino;
3518         pctx->errcode = 0;
3519
3520         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
3521         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
3522
3523         if (check_ext_attr(ctx, pctx, block_buf, &ea_block_quota)) {
3524                 if (e2fsck_should_abort(ctx))
3525                         goto out;
3526                 pb.num_blocks += EXT2FS_B2C(ctx->fs, ea_block_quota.blocks);
3527         }
3528
3529         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL))
3530                 check_blocks_inline_data(ctx, pctx, &pb);
3531         else if (ext2fs_inode_has_valid_blocks2(fs, inode)) {
3532                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL))
3533                         check_blocks_extents(ctx, pctx, &pb);
3534                 else {
3535                         int flags;
3536                         /*
3537                          * If we've modified the inode, write it out before
3538                          * iterate() tries to use it.
3539                          */
3540                         if (dirty_inode) {
3541                                 e2fsck_write_inode(ctx, ino, inode,
3542                                                    "check_blocks");
3543                                 dirty_inode = 0;
3544                         }
3545                         flags = fs->flags;
3546                         fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
3547                         pctx->errcode = ext2fs_block_iterate3(fs, ino,
3548                                                 pb.is_dir ? BLOCK_FLAG_HOLE : 0,
3549                                                 block_buf, process_block, &pb);
3550                         /*
3551                          * We do not have uninitialized extents in non extent
3552                          * files.
3553                          */
3554                         pb.last_init_lblock = pb.last_block;
3555                         /*
3556                          * If iterate() changed a block mapping, we have to
3557                          * re-read the inode.  If we decide to clear the
3558                          * inode after clearing some stuff, we'll re-write the
3559                          * bad mappings into the inode!
3560                          */
3561                         if (pb.inode_modified)
3562                                 e2fsck_read_inode(ctx, ino, inode,
3563                                                   "check_blocks");
3564                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
3565                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
3566
3567                         if (ctx->options & E2F_OPT_CONVERT_BMAP) {
3568 #ifdef DEBUG
3569                                 printf("bmap rebuild ino=%d\n", ino);
3570 #endif
3571                                 if (!LINUX_S_ISDIR(inode->i_mode) ||
3572                                     !e2fsck_dir_will_be_rehashed(ctx, ino))
3573                                         e2fsck_rebuild_extents_later(ctx, ino);
3574                         }
3575                 }
3576         }
3577         end_problem_latch(ctx, PR_LATCH_BLOCK);
3578         end_problem_latch(ctx, PR_LATCH_TOOBIG);
3579         if (e2fsck_should_abort(ctx))
3580                 goto out;
3581         if (pctx->errcode)
3582                 fix_problem(ctx, PR_1_BLOCK_ITERATE, pctx);
3583
3584         if (pb.fragmented && pb.num_blocks < fs->super->s_blocks_per_group) {
3585                 if (LINUX_S_ISDIR(inode->i_mode))
3586                         ctx->fs_fragmented_dir++;
3587                 else
3588                         ctx->fs_fragmented++;
3589         }
3590
3591         if (pb.clear) {
3592                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
3593                                    "check_blocks");
3594                 return;
3595         }
3596
3597         if (inode->i_flags & EXT2_INDEX_FL) {
3598                 if (handle_htree(ctx, pctx, ino, inode, block_buf)) {
3599                         inode->i_flags &= ~EXT2_INDEX_FL;
3600                         dirty_inode++;
3601                 } else {
3602                         e2fsck_add_dx_dir(ctx, ino, inode, pb.last_block+1);
3603                 }
3604         }
3605
3606         if (!pb.num_blocks && pb.is_dir &&
3607             !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
3608                 if (fix_problem(ctx, PR_1_ZERO_LENGTH_DIR, pctx)) {
3609                         e2fsck_clear_inode(ctx, ino, inode, 0, "check_blocks");
3610                         ctx->fs_directory_count--;
3611                         return;
3612                 }
3613         }
3614
3615         if (ino != quota_type2inum(PRJQUOTA, fs->super) &&
3616             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INODE(ctx->fs->super)) &&
3617             !(inode->i_flags & EXT4_EA_INODE_FL)) {
3618                 quota_data_add(ctx->qctx, (struct ext2_inode_large *) inode,
3619                                ino,
3620                                pb.num_blocks * EXT2_CLUSTER_SIZE(fs->super));
3621                 quota_data_inodes(ctx->qctx, (struct ext2_inode_large *) inode,
3622                                   ino, (ea_ibody_quota ?
3623                                         ea_ibody_quota->inodes : 0) +
3624                                                 ea_block_quota.inodes + 1);
3625         }
3626
3627         if (!ext2fs_has_feature_huge_file(fs->super) ||
3628             !(inode->i_flags & EXT4_HUGE_FILE_FL))
3629                 pb.num_blocks *= (fs->blocksize / 512);
3630         pb.num_blocks *= EXT2FS_CLUSTER_RATIO(fs);
3631 #if 0
3632         printf("inode %u, i_size = %u, last_block = %llu, i_blocks=%llu, num_blocks = %llu\n",
3633                ino, inode->i_size, (unsigned long long) pb.last_block,
3634                (unsigned long long) ext2fs_inode_i_blocks(fs, inode),
3635                (unsigned long long) pb.num_blocks);
3636 #endif
3637         size = EXT2_I_SIZE(inode);
3638         if (pb.is_dir) {
3639                 unsigned nblock = size >> EXT2_BLOCK_SIZE_BITS(fs->super);
3640                 if (inode->i_flags & EXT4_INLINE_DATA_FL) {
3641                         int flags;
3642                         size_t sz = 0;
3643                         errcode_t err;
3644
3645                         flags = ctx->fs->flags;
3646                         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
3647                         err = ext2fs_inline_data_size(ctx->fs, pctx->ino,
3648                                                       &sz);
3649                         ctx->fs->flags = (flags &
3650                                           EXT2_FLAG_IGNORE_CSUM_ERRORS) |
3651                                          (ctx->fs->flags &
3652                                           ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
3653                         if (err || sz != size) {
3654                                 bad_size = 7;
3655                                 pctx->num = sz;
3656                         }
3657                 } else if (size & (fs->blocksize - 1))
3658                         bad_size = 5;
3659                 else if (nblock > (pb.last_block + 1))
3660                         bad_size = 1;
3661                 else if (nblock < (pb.last_block + 1)) {
3662                         if (((pb.last_block + 1) - nblock) >
3663                             fs->super->s_prealloc_dir_blocks)
3664                                 bad_size = 2;
3665                 }
3666         } else {
3667                 if ((pb.last_init_lblock >= 0) &&
3668                     /* Do not allow initialized allocated blocks past i_size*/
3669                     (size < (__u64)pb.last_init_lblock * fs->blocksize) &&
3670                     !(inode->i_flags & EXT4_VERITY_FL))
3671                         bad_size = 3;
3672                 else if (!(extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
3673                          size > ext2_max_sizes[fs->super->s_log_block_size])
3674                         /* too big for a direct/indirect-mapped file */
3675                         bad_size = 4;
3676                 else if ((extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
3677                          size >
3678                          ((1ULL << (32 + EXT2_BLOCK_SIZE_BITS(fs->super))) - 1))
3679                         /* too big for an extent-based file - 32bit ee_block */
3680                         bad_size = 6;
3681         }
3682         /* i_size for symlinks is checked elsewhere */
3683         if (bad_size && !LINUX_S_ISLNK(inode->i_mode)) {
3684                 /* Did inline_data set pctx->num earlier? */
3685                 if (bad_size != 7)
3686                         pctx->num = (pb.last_block + 1) * fs->blocksize;
3687                 pctx->group = bad_size;
3688                 if (fix_problem(ctx, PR_1_BAD_I_SIZE, pctx)) {
3689                         ext2fs_inode_size_set(fs, inode, pctx->num);
3690                         if (EXT2_I_SIZE(inode) == 0 &&
3691                             (inode->i_flags & EXT4_INLINE_DATA_FL)) {
3692                                 memset(inode->i_block, 0,
3693                                        sizeof(inode->i_block));
3694                                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
3695                         }
3696                         dirty_inode++;
3697                 }
3698                 pctx->num = 0;
3699         }
3700         if (LINUX_S_ISREG(inode->i_mode) &&
3701             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
3702                 ctx->large_files++;
3703         if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
3704             ((pb.num_blocks != ext2fs_inode_i_blocks(fs, inode)) ||
3705              (ext2fs_has_feature_huge_file(fs->super) &&
3706               (inode->i_flags & EXT4_HUGE_FILE_FL) &&
3707               (inode->osd2.linux2.l_i_blocks_hi != 0)))) {
3708                 pctx->num = pb.num_blocks;
3709                 if (fix_problem(ctx, PR_1_BAD_I_BLOCKS, pctx)) {
3710                         inode->i_blocks = pb.num_blocks;
3711                         inode->osd2.linux2.l_i_blocks_hi = pb.num_blocks >> 32;
3712                         dirty_inode++;
3713                 }
3714                 pctx->num = 0;
3715         }
3716
3717         /*
3718          * The kernel gets mad if we ask it to allocate bigalloc clusters to
3719          * a block mapped file, so rebuild it as an extent file.  We can skip
3720          * symlinks because they're never rewritten.
3721          */
3722         if (ext2fs_has_feature_bigalloc(fs->super) &&
3723             (LINUX_S_ISREG(inode->i_mode) || LINUX_S_ISDIR(inode->i_mode)) &&
3724             ext2fs_inode_data_blocks2(fs, inode) > 0 &&
3725             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INO(fs->super)) &&
3726             !(inode->i_flags & (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)) &&
3727             fix_problem(ctx, PR_1_NO_BIGALLOC_BLOCKMAP_FILES, pctx)) {
3728                 pctx->errcode = e2fsck_rebuild_extents_later(ctx, ino);
3729                 if (pctx->errcode)
3730                         goto out;
3731         }
3732
3733         if (ctx->dirs_to_hash && pb.is_dir &&
3734             !(ctx->lost_and_found && ctx->lost_and_found == ino) &&
3735             !(inode->i_flags & EXT2_INDEX_FL) &&
3736             ((inode->i_size / fs->blocksize) >= 3))
3737                 e2fsck_rehash_dir_later(ctx, ino);
3738
3739 out:
3740         if (dirty_inode)
3741                 e2fsck_write_inode(ctx, ino, inode, "check_blocks");
3742 }
3743
#if 0
/*
 * Helper function called by process block when an illegal block is
 * found.  It returns a description about why the block is illegal.
 *
 * fs    - the filesystem the block belongs to
 * block - the offending block number
 *
 * The returned string lives in a static buffer: it is overwritten by the
 * next call and must not be freed.  All writes into the buffer are bounded
 * by its size, and block numbers are printed as 64-bit values.
 *
 * (Currently compiled out.)
 */
static char *describe_illegal_block(ext2_filsys fs, blk64_t block)
{
        blk64_t super;
        int     i;
        static char     problem[80];

        super = fs->super->s_first_data_block;
        snprintf(problem, sizeof(problem), "%s",
                 "PROGRAMMING ERROR: Unknown reason for illegal block");
        if (block < super) {
                snprintf(problem, sizeof(problem), "< FIRSTBLOCK (%llu)",
                         (unsigned long long) super);
                return(problem);
        } else if (block >= ext2fs_blocks_count(fs->super)) {
                snprintf(problem, sizeof(problem), "> BLOCKS (%llu)",
                         (unsigned long long) ext2fs_blocks_count(fs->super));
                return(problem);
        }
        /* "super" tracks the first block of group i as the loop advances. */
        for (i = 0; i < fs->group_desc_count; i++) {
                if (block == super) {
                        snprintf(problem, sizeof(problem),
                                 "is the superblock in group %d", i);
                        break;
                }
                if (block > super &&
                    block <= (super + fs->desc_blocks)) {
                        snprintf(problem, sizeof(problem),
                                 "is in the group descriptors "
                                 "of group %d", i);
                        break;
                }
                if (block == ext2fs_block_bitmap_loc(fs, i)) {
                        snprintf(problem, sizeof(problem),
                                 "is the block bitmap of group %d", i);
                        break;
                }
                if (block == ext2fs_inode_bitmap_loc(fs, i)) {
                        snprintf(problem, sizeof(problem),
                                 "is the inode bitmap of group %d", i);
                        break;
                }
                if (block >= ext2fs_inode_table_loc(fs, i) &&
                    (block < ext2fs_inode_table_loc(fs, i)
                     + fs->inode_blocks_per_group)) {
                        snprintf(problem, sizeof(problem),
                                 "is in the inode table of group %d",
                                 i);
                        break;
                }
                super += fs->super->s_blocks_per_group;
        }
        return(problem);
}
#endif
3795
3796 /*
3797  * This is a helper function for check_blocks().
3798  */
3799 static int process_block(ext2_filsys fs,
3800                   blk64_t       *block_nr,
3801                   e2_blkcnt_t blockcnt,
3802                   blk64_t ref_block EXT2FS_ATTR((unused)),
3803                   int ref_offset EXT2FS_ATTR((unused)),
3804                   void *priv_data)
3805 {
3806         struct process_block_struct *p;
3807         struct problem_context *pctx;
3808         blk64_t blk = *block_nr;
3809         int     ret_code = 0;
3810         problem_t       problem = 0;
3811         e2fsck_t        ctx;
3812
3813         p = (struct process_block_struct *) priv_data;
3814         pctx = p->pctx;
3815         ctx = p->ctx;
3816
3817         /*
3818          * For a directory, add logical block zero for processing even if it's
3819          * not mapped or we'll be perennially stuck with broken "." and ".."
3820          * entries.
3821          */
3822         if (p->is_dir && blockcnt == 0 && blk == 0) {
3823                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino, 0, 0);
3824                 if (pctx->errcode) {
3825                         pctx->blk = blk;
3826                         pctx->num = blockcnt;
3827                         goto failed_add_dir_block;
3828                 }
3829                 p->last_db_block++;
3830         }
3831
3832         if (blk == 0)
3833                 return 0;
3834
3835 #if 0
3836         printf("Process_block, inode %lu, block %u, #%d\n", p->ino, blk,
3837                blockcnt);
3838 #endif
3839
3840         /*
3841          * Simplistic fragmentation check.  We merely require that the
3842          * file be contiguous.  (Which can never be true for really
3843          * big files that are greater than a block group.)
3844          */
3845         if (p->previous_block && p->ino != EXT2_RESIZE_INO) {
3846                 if (p->previous_block+1 != blk) {
3847                         if (ctx->options & E2F_OPT_FRAGCHECK) {
3848                                 char type = '?';
3849
3850                                 if (p->is_dir)
3851                                         type = 'd';
3852                                 else if (p->is_reg)
3853                                         type = 'f';
3854
3855                                 printf(_("%6lu(%c): expecting %6lu "
3856                                          "got phys %6lu (blkcnt %lld)\n"),
3857                                        (unsigned long) pctx->ino, type,
3858                                        (unsigned long) p->previous_block+1,
3859                                        (unsigned long) blk,
3860                                        (long long) blockcnt);
3861                         }
3862                         p->fragmented = 1;
3863                 }
3864         }
3865
3866         if (p->is_dir && !ext2fs_has_feature_largedir(fs->super) &&
3867             !pctx->inode->i_size_high &&
3868             blockcnt > (1 << (21 - fs->super->s_log_block_size)))
3869                 problem = PR_1_TOOBIG_DIR;
3870         if (p->is_dir && p->num_blocks + 1 >= p->max_blocks)
3871                 problem = PR_1_TOOBIG_DIR;
3872         if (p->is_reg && p->num_blocks + 1 >= p->max_blocks)
3873                 problem = PR_1_TOOBIG_REG;
3874         if (!p->is_dir && !p->is_reg && blockcnt > 0)
3875                 problem = PR_1_TOOBIG_SYMLINK;
3876
3877         if (blk < fs->super->s_first_data_block ||
3878             blk >= ext2fs_blocks_count(fs->super))
3879                 problem = PR_1_ILLEGAL_BLOCK_NUM;
3880
3881         /*
3882          * If this IND/DIND/TIND block is squatting atop some critical metadata
3883          * (group descriptors, superblock, bitmap, inode table), any write to
3884          * "fix" mapping problems will destroy the metadata.  We'll let pass 1b
3885          * fix that and restart fsck.
3886          */
3887         if (blockcnt < 0 &&
3888             p->ino != EXT2_RESIZE_INO &&
3889             blk < ctx->fs->super->s_blocks_count &&
3890             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk)) {
3891                 pctx->blk = blk;
3892                 fix_problem(ctx, PR_1_CRITICAL_METADATA_COLLISION, pctx);
3893                 if ((ctx->options & E2F_OPT_NO) == 0)
3894                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3895         }
3896
3897         if (problem) {
3898                 p->num_illegal_blocks++;
3899                 /*
3900                  * A bit of subterfuge here -- we're trying to fix a block
3901                  * mapping, but the IND/DIND/TIND block could have collided
3902                  * with some critical metadata.  So, fix the in-core mapping so
3903                  * iterate won't go insane, but return 0 instead of
3904                  * BLOCK_CHANGED so that it won't write the remapping out to
3905                  * our multiply linked block.
3906                  *
3907                  * Even if we previously determined that an *IND block
3908                  * conflicts with critical metadata, we must still try to
3909                  * iterate the *IND block as if it is an *IND block to find and
3910                  * mark the blocks it points to.  Better to be overly cautious
3911                  * with the used_blocks map so that we don't move the *IND
3912                  * block to a block that's really in use!
3913                  */
3914                 if (p->ino != EXT2_RESIZE_INO &&
3915                     ref_block != 0 &&
3916                     ext2fs_test_block_bitmap2(ctx->block_metadata_map,
3917                                               ref_block)) {
3918                         *block_nr = 0;
3919                         return 0;
3920                 }
3921                 if (!p->suppress && (p->num_illegal_blocks % 12) == 0) {
3922                         if (fix_problem(ctx, PR_1_TOO_MANY_BAD_BLOCKS, pctx)) {
3923                                 p->clear = 1;
3924                                 return BLOCK_ABORT;
3925                         }
3926                         if (fix_problem(ctx, PR_1_SUPPRESS_MESSAGES, pctx)) {
3927                                 p->suppress = 1;
3928                                 set_latch_flags(PR_LATCH_BLOCK,
3929                                                 PRL_SUPPRESS, 0);
3930                         }
3931                 }
3932                 pctx->blk = blk;
3933                 pctx->blkcount = blockcnt;
3934                 if (fix_problem(ctx, problem, pctx)) {
3935                         blk = *block_nr = 0;
3936                         ret_code = BLOCK_CHANGED;
3937                         p->inode_modified = 1;
3938                         /*
3939                          * If the directory block is too big and is beyond the
3940                          * end of the FS, don't bother trying to add it for
3941                          * processing -- the kernel would never have created a
3942                          * directory this large, and we risk an ENOMEM abort.
3943                          * In any case, the toobig handler for extent-based
3944                          * directories also doesn't feed toobig blocks to
3945                          * pass 2.
3946                          */
3947                         if (problem == PR_1_TOOBIG_DIR)
3948                                 return ret_code;
3949                         goto mark_dir;
3950                 } else
3951                         return 0;
3952         }
3953
3954         if (p->ino == EXT2_RESIZE_INO) {
3955                 /*
3956                  * The resize inode has already be sanity checked
3957                  * during pass #0 (the superblock checks).  All we
3958                  * have to do is mark the double indirect block as
3959                  * being in use; all of the other blocks are handled
3960                  * by mark_table_blocks()).
3961                  */
3962                 if (blockcnt == BLOCK_COUNT_DIND)
3963                         mark_block_used(ctx, blk);
3964                 p->num_blocks++;
3965         } else if (!(ctx->fs->cluster_ratio_bits &&
3966                      p->previous_block &&
3967                      (EXT2FS_B2C(ctx->fs, blk) ==
3968                       EXT2FS_B2C(ctx->fs, p->previous_block)) &&
3969                      (blk & EXT2FS_CLUSTER_MASK(ctx->fs)) ==
3970                      ((unsigned) blockcnt & EXT2FS_CLUSTER_MASK(ctx->fs)))) {
3971                 mark_block_used(ctx, blk);
3972                 p->num_blocks++;
3973         } else if (has_unaligned_cluster_map(ctx, p->previous_block,
3974                                              p->last_block, blk, blockcnt)) {
3975                 pctx->blk = blockcnt;
3976                 pctx->blk2 = blk;
3977                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
3978                 mark_block_used(ctx, blk);
3979                 mark_block_used(ctx, blk);
3980         }
3981         if (blockcnt >= 0)
3982                 p->last_block = blockcnt;
3983         p->previous_block = blk;
3984 mark_dir:
3985         if (p->is_dir && (blockcnt >= 0)) {
3986                 while (++p->last_db_block < blockcnt) {
3987                         pctx->errcode = ext2fs_add_dir_block2(fs->dblist,
3988                                                               p->ino, 0,
3989                                                               p->last_db_block);
3990                         if (pctx->errcode) {
3991                                 pctx->blk = 0;
3992                                 pctx->num = p->last_db_block;
3993                                 goto failed_add_dir_block;
3994                         }
3995                 }
3996                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino,
3997                                                       blk, blockcnt);
3998                 if (pctx->errcode) {
3999                         pctx->blk = blk;
4000                         pctx->num = blockcnt;
4001                 failed_add_dir_block:
4002                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4003                         /* Should never get here */
4004                         ctx->flags |= E2F_FLAG_ABORT;
4005                         return BLOCK_ABORT;
4006                 }
4007         }
4008         return ret_code;
4009 }
4010
4011 static int process_bad_block(ext2_filsys fs,
4012                       blk64_t *block_nr,
4013                       e2_blkcnt_t blockcnt,
4014                       blk64_t ref_block EXT2FS_ATTR((unused)),
4015                       int ref_offset EXT2FS_ATTR((unused)),
4016                       void *priv_data)
4017 {
4018         struct process_block_struct *p;
4019         blk64_t         blk = *block_nr;
4020         blk64_t         first_block;
4021         dgrp_t          i;
4022         struct problem_context *pctx;
4023         e2fsck_t        ctx;
4024
4025         if (!blk)
4026                 return 0;
4027
4028         p = (struct process_block_struct *) priv_data;
4029         ctx = p->ctx;
4030         pctx = p->pctx;
4031
4032         pctx->ino = EXT2_BAD_INO;
4033         pctx->blk = blk;
4034         pctx->blkcount = blockcnt;
4035
4036         if ((blk < fs->super->s_first_data_block) ||
4037             (blk >= ext2fs_blocks_count(fs->super))) {
4038                 if (fix_problem(ctx, PR_1_BB_ILLEGAL_BLOCK_NUM, pctx)) {
4039                         *block_nr = 0;
4040                         return BLOCK_CHANGED;
4041                 } else
4042                         return 0;
4043         }
4044
4045         if (blockcnt < 0) {
4046                 if (ext2fs_test_block_bitmap2(p->fs_meta_blocks, blk)) {
4047                         p->bbcheck = 1;
4048                         if (fix_problem(ctx, PR_1_BB_FS_BLOCK, pctx)) {
4049                                 *block_nr = 0;
4050                                 return BLOCK_CHANGED;
4051                         }
4052                 } else if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4053                                                     blk)) {
4054                         p->bbcheck = 1;
4055                         if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK,
4056                                         pctx)) {
4057                                 *block_nr = 0;
4058                                 return BLOCK_CHANGED;
4059                         }
4060                         if (e2fsck_should_abort(ctx))
4061                                 return BLOCK_ABORT;
4062                 } else
4063                         mark_block_used(ctx, blk);
4064                 return 0;
4065         }
4066 #if 0
4067         printf ("DEBUG: Marking %u as bad.\n", blk);
4068 #endif
4069         ctx->fs_badblocks_count++;
4070         /*
4071          * If the block is not used, then mark it as used and return.
4072          * If it is already marked as found, this must mean that
4073          * there's an overlap between the filesystem table blocks
4074          * (bitmaps and inode table) and the bad block list.
4075          */
4076         if (!ext2fs_test_block_bitmap2(ctx->block_found_map, blk)) {
4077                 ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
4078                 return 0;
4079         }
4080         /*
4081          * Try to find the where the filesystem block was used...
4082          */
4083         first_block = fs->super->s_first_data_block;
4084
4085         for (i = 0; i < fs->group_desc_count; i++ ) {
4086                 pctx->group = i;
4087                 pctx->blk = blk;
4088                 if (!ext2fs_bg_has_super(fs, i))
4089                         goto skip_super;
4090                 if (blk == first_block) {
4091                         if (i == 0) {
4092                                 if (fix_problem(ctx,
4093                                                 PR_1_BAD_PRIMARY_SUPERBLOCK,
4094                                                 pctx)) {
4095                                         *block_nr = 0;
4096                                         return BLOCK_CHANGED;
4097                                 }
4098                                 return 0;
4099                         }
4100                         fix_problem(ctx, PR_1_BAD_SUPERBLOCK, pctx);
4101                         return 0;
4102                 }
4103                 if ((blk > first_block) &&
4104                     (blk <= first_block + fs->desc_blocks)) {
4105                         if (i == 0) {
4106                                 pctx->blk = *block_nr;
4107                                 if (fix_problem(ctx,
4108                         PR_1_BAD_PRIMARY_GROUP_DESCRIPTOR, pctx)) {
4109                                         *block_nr = 0;
4110                                         return BLOCK_CHANGED;
4111                                 }
4112                                 return 0;
4113                         }
4114                         fix_problem(ctx, PR_1_BAD_GROUP_DESCRIPTORS, pctx);
4115                         return 0;
4116                 }
4117         skip_super:
4118                 if (blk == ext2fs_block_bitmap_loc(fs, i)) {
4119                         if (fix_problem(ctx, PR_1_BB_BAD_BLOCK, pctx)) {
4120                                 ctx->invalid_block_bitmap_flag[i]++;
4121                                 ctx->invalid_bitmaps++;
4122                         }
4123                         return 0;
4124                 }
4125                 if (blk == ext2fs_inode_bitmap_loc(fs, i)) {
4126                         if (fix_problem(ctx, PR_1_IB_BAD_BLOCK, pctx)) {
4127                                 ctx->invalid_inode_bitmap_flag[i]++;
4128                                 ctx->invalid_bitmaps++;
4129                         }
4130                         return 0;
4131                 }
4132                 if ((blk >= ext2fs_inode_table_loc(fs, i)) &&
4133                     (blk < (ext2fs_inode_table_loc(fs, i) +
4134                             fs->inode_blocks_per_group))) {
4135                         /*
4136                          * If there are bad blocks in the inode table,
4137                          * the inode scan code will try to do
4138                          * something reasonable automatically.
4139                          */
4140                         return 0;
4141                 }
4142                 first_block += fs->super->s_blocks_per_group;
4143         }
4144         /*
4145          * If we've gotten to this point, then the only
4146          * possibility is that the bad block inode meta data
4147          * is using a bad block.
4148          */
4149         if ((blk == p->inode->i_block[EXT2_IND_BLOCK]) ||
4150             (blk == p->inode->i_block[EXT2_DIND_BLOCK]) ||
4151             (blk == p->inode->i_block[EXT2_TIND_BLOCK])) {
4152                 p->bbcheck = 1;
4153                 if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK, pctx)) {
4154                         *block_nr = 0;
4155                         return BLOCK_CHANGED;
4156                 }
4157                 if (e2fsck_should_abort(ctx))
4158                         return BLOCK_ABORT;
4159                 return 0;
4160         }
4161
4162         pctx->group = -1;
4163
4164         /* Warn user that the block wasn't claimed */
4165         fix_problem(ctx, PR_1_PROGERR_CLAIMED_BLOCK, pctx);
4166
4167         return 0;
4168 }
4169
4170 static void new_table_block(e2fsck_t ctx, blk64_t first_block, dgrp_t group,
4171                             const char *name, int num, blk64_t *new_block)
4172 {
4173         ext2_filsys fs = ctx->fs;
4174         dgrp_t          last_grp;
4175         blk64_t         old_block = *new_block;
4176         blk64_t         last_block;
4177         dgrp_t          flexbg;
4178         unsigned        flexbg_size;
4179         int             i, is_flexbg;
4180         char            *buf;
4181         struct problem_context  pctx;
4182
4183         clear_problem_context(&pctx);
4184
4185         pctx.group = group;
4186         pctx.blk = old_block;
4187         pctx.str = name;
4188
4189         /*
4190          * For flex_bg filesystems, first try to allocate the metadata
4191          * within the flex_bg, and if that fails then try finding the
4192          * space anywhere in the filesystem.
4193          */
4194         is_flexbg = ext2fs_has_feature_flex_bg(fs->super);
4195         if (is_flexbg) {
4196                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
4197                 flexbg = group / flexbg_size;
4198                 first_block = ext2fs_group_first_block2(fs,
4199                                                         flexbg_size * flexbg);
4200                 last_grp = group | (flexbg_size - 1);
4201                 if (last_grp >= fs->group_desc_count)
4202                         last_grp = fs->group_desc_count - 1;
4203                 last_block = ext2fs_group_last_block2(fs, last_grp);
4204         } else
4205                 last_block = ext2fs_group_last_block2(fs, group);
4206         pctx.errcode = ext2fs_get_free_blocks2(fs, first_block, last_block,
4207                                                num, ctx->block_found_map,
4208                                                new_block);
4209         if (is_flexbg && (pctx.errcode == EXT2_ET_BLOCK_ALLOC_FAIL))
4210                 pctx.errcode = ext2fs_get_free_blocks2(fs,
4211                                 fs->super->s_first_data_block,
4212                                 ext2fs_blocks_count(fs->super),
4213                                 num, ctx->block_found_map, new_block);
4214         if (pctx.errcode) {
4215                 pctx.num = num;
4216                 fix_problem(ctx, PR_1_RELOC_BLOCK_ALLOCATE, &pctx);
4217                 ext2fs_unmark_valid(fs);
4218                 ctx->flags |= E2F_FLAG_ABORT;
4219                 return;
4220         }
4221         pctx.errcode = ext2fs_get_mem(fs->blocksize, &buf);
4222         if (pctx.errcode) {
4223                 fix_problem(ctx, PR_1_RELOC_MEMORY_ALLOCATE, &pctx);
4224                 ext2fs_unmark_valid(fs);
4225                 ctx->flags |= E2F_FLAG_ABORT;
4226                 return;
4227         }
4228         ext2fs_mark_super_dirty(fs);
4229         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
4230         pctx.blk2 = *new_block;
4231         fix_problem(ctx, (old_block ? PR_1_RELOC_FROM_TO :
4232                           PR_1_RELOC_TO), &pctx);
4233         pctx.blk2 = 0;
4234         for (i = 0; i < num; i++) {
4235                 pctx.blk = i;
4236                 ext2fs_mark_block_bitmap2(ctx->block_found_map, (*new_block)+i);
4237                 if (old_block) {
4238                         pctx.errcode = io_channel_read_blk64(fs->io,
4239                                    old_block + i, 1, buf);
4240                         if (pctx.errcode)
4241                                 fix_problem(ctx, PR_1_RELOC_READ_ERR, &pctx);
4242                         pctx.blk = (*new_block) + i;
4243                         pctx.errcode = io_channel_write_blk64(fs->io, pctx.blk,
4244                                                               1, buf);
4245                 } else {
4246                         pctx.blk = (*new_block) + i;
4247                         pctx.errcode = ext2fs_zero_blocks2(fs, pctx.blk, 1,
4248                                                            NULL, NULL);
4249                 }
4250
4251                 if (pctx.errcode)
4252                         fix_problem(ctx, PR_1_RELOC_WRITE_ERR, &pctx);
4253         }
4254         ext2fs_free_mem(&buf);
4255 }
4256
4257 /*
4258  * This routine gets called at the end of pass 1 if bad blocks are
4259  * detected in the superblock, group descriptors, inode_bitmaps, or
4260  * block bitmaps.  At this point, all of the blocks have been mapped
4261  * out, so we can try to allocate new block(s) to replace the bad
4262  * blocks.
4263  */
4264 static void handle_fs_bad_blocks(e2fsck_t ctx)
4265 {
4266         ext2_filsys fs = ctx->fs;
4267         dgrp_t          i;
4268         blk64_t         first_block;
4269         blk64_t         new_blk;
4270
4271         for (i = 0; i < fs->group_desc_count; i++) {
4272                 first_block = ext2fs_group_first_block2(fs, i);
4273
4274                 if (ctx->invalid_block_bitmap_flag[i]) {
4275                         new_blk = ext2fs_block_bitmap_loc(fs, i);
4276                         new_table_block(ctx, first_block, i, _("block bitmap"),
4277                                         1, &new_blk);
4278                         ext2fs_block_bitmap_loc_set(fs, i, new_blk);
4279                 }
4280                 if (ctx->invalid_inode_bitmap_flag[i]) {
4281                         new_blk = ext2fs_inode_bitmap_loc(fs, i);
4282                         new_table_block(ctx, first_block, i, _("inode bitmap"),
4283                                         1, &new_blk);
4284                         ext2fs_inode_bitmap_loc_set(fs, i, new_blk);
4285                 }
4286                 if (ctx->invalid_inode_table_flag[i]) {
4287                         new_blk = ext2fs_inode_table_loc(fs, i);
4288                         new_table_block(ctx, first_block, i, _("inode table"),
4289                                         fs->inode_blocks_per_group,
4290                                         &new_blk);
4291                         ext2fs_inode_table_loc_set(fs, i, new_blk);
4292                         ctx->flags |= E2F_FLAG_RESTART;
4293                 }
4294         }
4295         ctx->invalid_bitmaps = 0;
4296 }
4297
4298 /*
4299  * This routine marks all blocks which are used by the superblock,
4300  * group descriptors, inode bitmaps, and block bitmaps.
4301  */
4302 static void mark_table_blocks(e2fsck_t ctx)
4303 {
4304         ext2_filsys fs = ctx->fs;
4305         blk64_t b;
4306         dgrp_t  i;
4307         unsigned int    j;
4308         struct problem_context pctx;
4309
4310         clear_problem_context(&pctx);
4311
4312         for (i = 0; i < fs->group_desc_count; i++) {
4313                 pctx.group = i;
4314
4315                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_found_map);
4316                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_metadata_map);
4317
4318                 /*
4319                  * Mark the blocks used for the inode table
4320                  */
4321                 if (ext2fs_inode_table_loc(fs, i)) {
4322                         for (j = 0, b = ext2fs_inode_table_loc(fs, i);
4323                              j < fs->inode_blocks_per_group;
4324                              j++, b++) {
4325                                 if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4326                                                              b)) {
4327                                         pctx.blk = b;
4328                                         if (!ctx->invalid_inode_table_flag[i] &&
4329                                             fix_problem(ctx,
4330                                                 PR_1_ITABLE_CONFLICT, &pctx)) {
4331                                                 ctx->invalid_inode_table_flag[i]++;
4332                                                 ctx->invalid_bitmaps++;
4333                                         }
4334                                 } else {
4335                                     ext2fs_mark_block_bitmap2(
4336                                                 ctx->block_found_map, b);
4337                                     ext2fs_mark_block_bitmap2(
4338                                                 ctx->block_metadata_map, b);
4339                                 }
4340                         }
4341                 }
4342
4343                 /*
4344                  * Mark block used for the block bitmap
4345                  */
4346                 if (ext2fs_block_bitmap_loc(fs, i)) {
4347                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4348                                      ext2fs_block_bitmap_loc(fs, i))) {
4349                                 pctx.blk = ext2fs_block_bitmap_loc(fs, i);
4350                                 if (fix_problem(ctx, PR_1_BB_CONFLICT, &pctx)) {
4351                                         ctx->invalid_block_bitmap_flag[i]++;
4352                                         ctx->invalid_bitmaps++;
4353                                 }
4354                         } else {
4355                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
4356                                      ext2fs_block_bitmap_loc(fs, i));
4357                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
4358                                      ext2fs_block_bitmap_loc(fs, i));
4359                         }
4360                 }
4361                 /*
4362                  * Mark block used for the inode bitmap
4363                  */
4364                 if (ext2fs_inode_bitmap_loc(fs, i)) {
4365                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4366                                      ext2fs_inode_bitmap_loc(fs, i))) {
4367                                 pctx.blk = ext2fs_inode_bitmap_loc(fs, i);
4368                                 if (fix_problem(ctx, PR_1_IB_CONFLICT, &pctx)) {
4369                                         ctx->invalid_inode_bitmap_flag[i]++;
4370                                         ctx->invalid_bitmaps++;
4371                                 }
4372                         } else {
4373                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
4374                                      ext2fs_inode_bitmap_loc(fs, i));
4375                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
4376                                      ext2fs_inode_bitmap_loc(fs, i));
4377                         }
4378                 }
4379         }
4380 }
4381
4382 /*
4383  * These subroutines short circuits ext2fs_get_blocks and
4384  * ext2fs_check_directory; we use them since we already have the inode
4385  * structure, so there's no point in letting the ext2fs library read
4386  * the inode again.
4387  */
4388 static errcode_t pass1_get_blocks(ext2_filsys fs, ext2_ino_t ino,
4389                                   blk_t *blocks)
4390 {
4391         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4392         int     i;
4393
4394         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
4395                 return EXT2_ET_CALLBACK_NOTHANDLED;
4396
4397         for (i=0; i < EXT2_N_BLOCKS; i++)
4398                 blocks[i] = ctx->stashed_inode->i_block[i];
4399         return 0;
4400 }
4401
4402 static errcode_t pass1_read_inode(ext2_filsys fs, ext2_ino_t ino,
4403                                   struct ext2_inode *inode)
4404 {
4405         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4406
4407         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
4408                 return EXT2_ET_CALLBACK_NOTHANDLED;
4409         *inode = *ctx->stashed_inode;
4410         return 0;
4411 }
4412
4413 static errcode_t pass1_write_inode(ext2_filsys fs, ext2_ino_t ino,
4414                             struct ext2_inode *inode)
4415 {
4416         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4417
4418         if ((ino == ctx->stashed_ino) && ctx->stashed_inode &&
4419                 (inode != ctx->stashed_inode))
4420                 *ctx->stashed_inode = *inode;
4421         return EXT2_ET_CALLBACK_NOTHANDLED;
4422 }
4423
4424 static errcode_t pass1_check_directory(ext2_filsys fs, ext2_ino_t ino)
4425 {
4426         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4427
4428         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
4429                 return EXT2_ET_CALLBACK_NOTHANDLED;
4430
4431         if (!LINUX_S_ISDIR(ctx->stashed_inode->i_mode))
4432                 return EXT2_ET_NO_DIRECTORY;
4433         return 0;
4434 }
4435
4436 static errcode_t e2fsck_get_alloc_block(ext2_filsys fs, blk64_t goal,
4437                                         blk64_t *ret)
4438 {
4439         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4440         errcode_t       retval;
4441         blk64_t         new_block;
4442
4443         if (ctx->block_found_map) {
4444                 retval = ext2fs_new_block2(fs, goal, ctx->block_found_map,
4445                                            &new_block);
4446                 if (retval)
4447                         return retval;
4448                 if (fs->block_map) {
4449                         ext2fs_mark_block_bitmap2(fs->block_map, new_block);
4450                         ext2fs_mark_bb_dirty(fs);
4451                 }
4452         } else {
4453                 if (!fs->block_map) {
4454                         retval = ext2fs_read_block_bitmap(fs);
4455                         if (retval)
4456                                 return retval;
4457                 }
4458
4459                 retval = ext2fs_new_block2(fs, goal, fs->block_map, &new_block);
4460                 if (retval)
4461                         return retval;
4462         }
4463
4464         *ret = new_block;
4465         return (0);
4466 }
4467
4468 static errcode_t e2fsck_new_range(ext2_filsys fs, int flags, blk64_t goal,
4469                                   blk64_t len, blk64_t *pblk, blk64_t *plen)
4470 {
4471         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4472         errcode_t       retval;
4473
4474         if (ctx->block_found_map)
4475                 return ext2fs_new_range(fs, flags, goal, len,
4476                                         ctx->block_found_map, pblk, plen);
4477
4478         if (!fs->block_map) {
4479                 retval = ext2fs_read_block_bitmap(fs);
4480                 if (retval)
4481                         return retval;
4482         }
4483
4484         return ext2fs_new_range(fs, flags, goal, len, fs->block_map,
4485                                 pblk, plen);
4486 }
4487
4488 static void e2fsck_block_alloc_stats(ext2_filsys fs, blk64_t blk, int inuse)
4489 {
4490         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4491
4492         /* Never free a critical metadata block */
4493         if (ctx->block_found_map &&
4494             ctx->block_metadata_map &&
4495             inuse < 0 &&
4496             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk))
4497                 return;
4498
4499         if (ctx->block_found_map) {
4500                 if (inuse > 0)
4501                         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
4502                 else
4503                         ext2fs_unmark_block_bitmap2(ctx->block_found_map, blk);
4504         }
4505 }
4506
4507 static void e2fsck_block_alloc_stats_range(ext2_filsys fs, blk64_t blk,
4508                                            blk_t num, int inuse)
4509 {
4510         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
4511
4512         /* Never free a critical metadata block */
4513         if (ctx->block_found_map &&
4514             ctx->block_metadata_map &&
4515             inuse < 0 &&
4516             ext2fs_test_block_bitmap_range2(ctx->block_metadata_map, blk, num))
4517                 return;
4518
4519         if (ctx->block_found_map) {
4520                 if (inuse > 0)
4521                         ext2fs_mark_block_bitmap_range2(ctx->block_found_map,
4522                                                         blk, num);
4523                 else
4524                         ext2fs_unmark_block_bitmap_range2(ctx->block_found_map,
4525                                                         blk, num);
4526         }
4527 }
4528
4529 void e2fsck_use_inode_shortcuts(e2fsck_t ctx, int use_shortcuts)
4530 {
4531         ext2_filsys fs = ctx->fs;
4532
4533         if (use_shortcuts) {
4534                 fs->get_blocks = pass1_get_blocks;
4535                 fs->check_directory = pass1_check_directory;
4536                 fs->read_inode = pass1_read_inode;
4537                 fs->write_inode = pass1_write_inode;
4538                 ctx->stashed_ino = 0;
4539         } else {
4540                 fs->get_blocks = 0;
4541                 fs->check_directory = 0;
4542                 fs->read_inode = 0;
4543                 fs->write_inode = 0;
4544         }
4545 }
4546
4547 void e2fsck_intercept_block_allocations(e2fsck_t ctx)
4548 {
4549         ext2fs_set_alloc_block_callback(ctx->fs, e2fsck_get_alloc_block, 0);
4550         ext2fs_set_block_alloc_stats_callback(ctx->fs,
4551                                                 e2fsck_block_alloc_stats, 0);
4552         ext2fs_set_new_range_callback(ctx->fs, e2fsck_new_range, NULL);
4553         ext2fs_set_block_alloc_stats_range_callback(ctx->fs,
4554                                         e2fsck_block_alloc_stats_range, NULL);
4555 }