Whamcloud - gitweb
e2fsck: merge context flags properly
[tools/e2fsprogs.git] / e2fsck / pass1.c
1 /*
2  * pass1.c -- pass #1 of e2fsck: sequential scan of the inode table
3  *
4  * Copyright (C) 1993, 1994, 1995, 1996, 1997 Theodore Ts'o.
5  *
6  * %Begin-Header%
7  * This file may be redistributed under the terms of the GNU Public
8  * License.
9  * %End-Header%
10  *
11  * Pass 1 of e2fsck iterates over all the inodes in the filesystems,
12  * and applies the following tests to each inode:
13  *
14  *      - The mode field of the inode must be legal.
15  *      - The size and block count fields of the inode are correct.
16  *      - A data block must not be used by another inode
17  *
18  * Pass 1 also collects the following information:
19  *
20  *      - A bitmap of which inodes are in use.          (inode_used_map)
21  *      - A bitmap of which inodes are directories.     (inode_dir_map)
22  *      - A bitmap of which inodes are regular files.   (inode_reg_map)
23  *      - A bitmap of which inodes have bad fields.     (inode_bad_map)
24  *      - A bitmap of which inodes are in bad blocks.   (inode_bb_map)
25  *      - A bitmap of which inodes are imagic inodes.   (inode_imagic_map)
26  *      - A bitmap of which inodes are casefolded.      (inode_casefold_map)
27  *      - A bitmap of which blocks are in use.          (block_found_map)
28  *      - A bitmap of which blocks are in use by two inodes     (block_dup_map)
29  *      - The data blocks of the directory inodes.      (dir_map)
30  *      - Ref counts for ea_inodes.                     (ea_inode_refs)
31  *      - The encryption policy ID of each encrypted inode. (encrypted_files)
32  *
33  * Pass 1 is designed to stash away enough information so that the
34  * other passes should not need to read in the inode information
35  * during the normal course of a filesystem check.  (Although if an
36  * inconsistency is detected, other passes may need to read in an
37  * inode to fix it.)
38  *
39  * Note that pass 1B will be invoked if there are any duplicate blocks
40  * found.
41  */
42
43 #define _GNU_SOURCE 1 /* get strnlen() */
44 #include "config.h"
45 #include <string.h>
46 #include <time.h>
47 #ifdef HAVE_ERRNO_H
48 #include <errno.h>
49 #endif
50 #include <assert.h>
51 #ifdef HAVE_PTHREAD
52 #include <pthread.h>
53 #endif
54
55 #include "e2fsck.h"
56 #include <ext2fs/ext2_ext_attr.h>
57 /* todo remove this finally */
58 #include <ext2fs/ext2fsP.h>
59 #include <e2p/e2p.h>
60
61 #include "problem.h"
62
63 #ifdef NO_INLINE_FUNCS
64 #define _INLINE_
65 #else
66 #define _INLINE_ inline
67 #endif
68
69 #undef DEBUG
70
/*
 * Quota charge attributable to extended attributes.  In this file,
 * check_ea_in_inode() adds to "blocks" the block count reported by
 * check_large_ea_inode() and bumps "inodes" once for every in-inode EA
 * entry whose value lives in a separate inode (e_value_inum != 0).
 */
struct ea_quota {
        blk64_t blocks;         /* blocks charged for EA values */
        __u64 inodes;           /* number of EA value inodes referenced */
};
75
/*
 * Forward declarations of file-local helpers.
 * NOTE(review): most of the definitions lie outside the portion of the
 * file visible here -- presumably further down in pass1.c.
 */
static int process_block(ext2_filsys fs, blk64_t        *blocknr,
                         e2_blkcnt_t blockcnt, blk64_t ref_blk,
                         int ref_offset, void *priv_data);
static int process_bad_block(ext2_filsys fs, blk64_t *block_nr,
                             e2_blkcnt_t blockcnt, blk64_t ref_blk,
                             int ref_offset, void *priv_data);
static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
                         char *block_buf,
                         const struct ea_quota *ea_ibody_quota);
static void mark_table_blocks(e2fsck_t ctx);
static void alloc_bb_map(e2fsck_t ctx);
static void alloc_imagic_map(e2fsck_t ctx);
static void mark_inode_bad(e2fsck_t ctx, ino_t ino);
static void add_casefolded_dir(e2fsck_t ctx, ino_t ino);
static void handle_fs_bad_blocks(e2fsck_t ctx);
static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b);
static errcode_t scan_callback(ext2_filsys fs, ext2_inode_scan scan,
                                  dgrp_t group, void * priv_data);
static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
                                    char *block_buf, int adjust_sign);
/* static char *describe_illegal_block(ext2_filsys fs, blk64_t block); */
97
/*
 * Per-inode bookkeeping used while walking an inode's blocks.
 * NOTE(review): the code that fills in and consumes this structure is
 * outside the visible part of the file; presumably it is handed to
 * process_block()/process_bad_block() through their priv_data
 * argument -- confirm against check_blocks().
 */
struct process_block_struct {
        ext2_ino_t      ino;            /* inode being processed */
        /* one-bit status flags describing the inode / the walk so far */
        unsigned        is_dir:1, is_reg:1, clear:1, suppress:1,
                                fragmented:1, compressed:1, bbcheck:1,
                                inode_modified:1;
        blk64_t         num_blocks;
        blk64_t         max_blocks;
        blk64_t         last_block;
        e2_blkcnt_t     last_init_lblock;
        e2_blkcnt_t     last_db_block;
        int             num_illegal_blocks;
        blk64_t         previous_block;
        struct ext2_inode *inode;       /* in-memory copy of the inode */
        struct problem_context *pctx;   /* context for fix_problem() reports */
        ext2fs_block_bitmap fs_meta_blocks;
        e2fsck_t        ctx;            /* owning e2fsck context */
        blk64_t         next_lblock;
        struct extent_tree_info eti;
};
117
/*
 * One element of the inodes_to_process array handed to
 * process_inodes(): an inode number, the EA quota computed for its
 * in-inode extended attributes, and a large-inode copy of the inode.
 * NOTE(review): how entries are queued is not visible here -- confirm
 * against the pass 1 main loop.
 */
struct process_inode_block {
        ext2_ino_t ino;
        struct ea_quota ea_ibody_quota;
        struct ext2_inode_large inode;
};
123
/*
 * Bundle of the values process_inodes() takes as parameters (context,
 * block buffer, pending-inode array and its count).
 * NOTE(review): presumably passed to scan_callback() via priv_data so
 * it can call process_inodes() -- the callback body is not visible here.
 */
struct scan_callback_struct {
        e2fsck_t                         ctx;
        char                            *block_buf;
        struct process_inode_block      *inodes_to_process;
        int                             *process_inode_count;
};
130
/* Forward declaration; takes the same values scan_callback_struct carries. */
static void process_inodes(e2fsck_t ctx, char *block_buf,
                           struct process_inode_block *inodes_to_process,
                           int *process_inode_count);

/*
 * One slot for each block-size log value from EXT2_MIN_BLOCK_LOG_SIZE
 * through EXT2_MAX_BLOCK_LOG_SIZE inclusive.
 * NOTE(review): presumably the maximum file size for each block size,
 * filled in elsewhere in this file -- confirm.
 */
static __u64 ext2_max_sizes[EXT2_MAX_BLOCK_LOG_SIZE -
                            EXT2_MIN_BLOCK_LOG_SIZE + 1];
137
138 /*
139  * Check to make sure a device inode is real.  Returns 1 if the device
140  * checks out, 0 if not.
141  *
142  * Note: this routine is now also used to check FIFO's and Sockets,
143  * since they have the same requirement; the i_block fields should be
144  * zero.
145  */
146 int e2fsck_pass1_check_device_inode(ext2_filsys fs EXT2FS_ATTR((unused)),
147                                     struct ext2_inode *inode)
148 {
149         int     i;
150
151         /*
152          * If the index or extents flag is set, then this is a bogus
153          * device/fifo/socket
154          */
155         if (inode->i_flags & (EXT2_INDEX_FL | EXT4_EXTENTS_FL))
156                 return 0;
157
158         /*
159          * We should be able to do the test below all the time, but
160          * because the kernel doesn't forcibly clear the device
161          * inode's additional i_block fields, there are some rare
162          * occasions when a legitimate device inode will have non-zero
163          * additional i_block fields.  So for now, we only complain
164          * when the immutable flag is set, which should never happen
165          * for devices.  (And that's when the problem is caused, since
166          * you can't set or clear immutable flags for devices.)  Once
167          * the kernel has been fixed we can change this...
168          */
169         if (inode->i_flags & (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)) {
170                 for (i=4; i < EXT2_N_BLOCKS; i++)
171                         if (inode->i_block[i])
172                                 return 0;
173         }
174         return 1;
175 }
176
177 /*
178  * Check to make sure a symlink inode is real.  Returns 1 if the symlink
179  * checks out, 0 if not.
180  */
181 int e2fsck_pass1_check_symlink(ext2_filsys fs, ext2_ino_t ino,
182                                struct ext2_inode *inode, char *buf)
183 {
184         unsigned int buflen;
185         unsigned int len;
186
187         if ((inode->i_size_high || inode->i_size == 0) ||
188             (inode->i_flags & EXT2_INDEX_FL))
189                 return 0;
190
191         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
192                 size_t inline_size;
193
194                 if (inode->i_flags & EXT4_EXTENTS_FL)
195                         return 0;
196                 if (ext2fs_inline_data_size(fs, ino, &inline_size))
197                         return 0;
198                 if (inode->i_size != inline_size)
199                         return 0;
200
201                 return 1;
202         }
203
204         if (ext2fs_is_fast_symlink(inode)) {
205                 if (inode->i_flags & EXT4_EXTENTS_FL)
206                         return 0;
207                 buf = (char *)inode->i_block;
208                 buflen = sizeof(inode->i_block);
209         } else {
210                 ext2_extent_handle_t    handle;
211                 struct ext2_extent_info info;
212                 struct ext2fs_extent    extent;
213                 blk64_t blk;
214                 int i;
215
216                 if (inode->i_flags & EXT4_EXTENTS_FL) {
217                         if (ext2fs_extent_open2(fs, ino, inode, &handle))
218                                 return 0;
219                         if (ext2fs_extent_get_info(handle, &info) ||
220                             (info.num_entries != 1) ||
221                             (info.max_depth != 0)) {
222                                 ext2fs_extent_free(handle);
223                                 return 0;
224                         }
225                         if (ext2fs_extent_get(handle, EXT2_EXTENT_ROOT,
226                                               &extent) ||
227                             (extent.e_lblk != 0) ||
228                             (extent.e_len != 1)) {
229                                 ext2fs_extent_free(handle);
230                                 return 0;
231                         }
232                         blk = extent.e_pblk;
233                         ext2fs_extent_free(handle);
234                 } else {
235                         blk = inode->i_block[0];
236
237                         for (i = 1; i < EXT2_N_BLOCKS; i++)
238                                 if (inode->i_block[i])
239                                         return 0;
240                 }
241
242                 if (blk < fs->super->s_first_data_block ||
243                     blk >= ext2fs_blocks_count(fs->super))
244                         return 0;
245
246                 if (io_channel_read_blk64(fs->io, blk, 1, buf))
247                         return 0;
248
249                 buflen = fs->blocksize;
250         }
251
252         if (inode->i_flags & EXT4_ENCRYPT_FL)
253                 len = ext2fs_le16_to_cpu(*(__u16 *)buf) + 2;
254         else
255                 len = strnlen(buf, buflen);
256
257         if (len >= buflen)
258                 return 0;
259
260         if (len != inode->i_size)
261                 return 0;
262         return 1;
263 }
264
265 /*
266  * If the extents or inlinedata flags are set on the inode, offer to clear 'em.
267  */
268 #define BAD_SPECIAL_FLAGS (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)
269 static void check_extents_inlinedata(e2fsck_t ctx,
270                                      struct problem_context *pctx)
271 {
272         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
273                 return;
274
275         if (!fix_problem(ctx, PR_1_SPECIAL_EXTENTS_IDATA, pctx))
276                 return;
277
278         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
279         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
280 }
281 #undef BAD_SPECIAL_FLAGS
282
283 /*
284  * If the immutable (or append-only) flag is set on the inode, offer
285  * to clear it.
286  */
287 #define BAD_SPECIAL_FLAGS (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)
288 static void check_immutable(e2fsck_t ctx, struct problem_context *pctx)
289 {
290         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
291                 return;
292
293         if (!fix_problem(ctx, PR_1_SET_IMMUTABLE, pctx))
294                 return;
295
296         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
297         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
298 }
299
300 /*
301  * If device, fifo or socket, check size is zero -- if not offer to
302  * clear it
303  */
304 static void check_size(e2fsck_t ctx, struct problem_context *pctx)
305 {
306         struct ext2_inode *inode = pctx->inode;
307
308         if (EXT2_I_SIZE(inode) == 0)
309                 return;
310
311         if (!fix_problem(ctx, PR_1_SET_NONZSIZE, pctx))
312                 return;
313
314         ext2fs_inode_size_set(ctx->fs, inode, 0);
315         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
316 }
317
318 /*
319  * For a given size, calculate how many blocks would be charged towards quota.
320  */
321 static blk64_t size_to_quota_blocks(ext2_filsys fs, size_t size)
322 {
323         blk64_t clusters;
324
325         clusters = DIV_ROUND_UP(size, fs->blocksize << fs->cluster_ratio_bits);
326         return EXT2FS_C2B(fs, clusters);
327 }
328
329 /*
330  * Check validity of EA inode. Return 0 if EA inode is valid, otherwise return
331  * the problem code.
332  */
333 static problem_t check_large_ea_inode(e2fsck_t ctx,
334                                       struct ext2_ext_attr_entry *entry,
335                                       struct problem_context *pctx,
336                                       blk64_t *quota_blocks)
337 {
338         struct ext2_inode inode;
339         __u32 hash;
340         errcode_t retval;
341
342         /* Check if inode is within valid range */
343         if ((entry->e_value_inum < EXT2_FIRST_INODE(ctx->fs->super)) ||
344             (entry->e_value_inum > ctx->fs->super->s_inodes_count)) {
345                 pctx->num = entry->e_value_inum;
346                 return PR_1_ATTR_VALUE_EA_INODE;
347         }
348
349         e2fsck_read_inode(ctx, entry->e_value_inum, &inode, "pass1");
350
351         retval = ext2fs_ext_attr_hash_entry2(ctx->fs, entry, NULL, &hash);
352         if (retval) {
353                 com_err("check_large_ea_inode", retval,
354                         _("while hashing entry with e_value_inum = %u"),
355                         entry->e_value_inum);
356                 fatal_error(ctx, 0);
357         }
358
359         if (hash == entry->e_hash) {
360                 *quota_blocks = size_to_quota_blocks(ctx->fs,
361                                                      entry->e_value_size);
362         } else {
363                 /* This might be an old Lustre-style ea_inode reference. */
364                 if (inode.i_mtime == pctx->ino &&
365                     inode.i_generation == pctx->inode->i_generation) {
366                         *quota_blocks = 0;
367                 } else {
368                         /* If target inode is also missing EA_INODE flag,
369                          * this is likely to be a bad reference.
370                          */
371                         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
372                                 pctx->num = entry->e_value_inum;
373                                 return PR_1_ATTR_VALUE_EA_INODE;
374                         } else {
375                                 pctx->num = entry->e_hash;
376                                 return PR_1_ATTR_HASH;
377                         }
378                 }
379         }
380
381         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
382                 pctx->num = entry->e_value_inum;
383                 if (fix_problem(ctx, PR_1_ATTR_SET_EA_INODE_FL, pctx)) {
384                         inode.i_flags |= EXT4_EA_INODE_FL;
385                         ext2fs_write_inode(ctx->fs, entry->e_value_inum,
386                                            &inode);
387                 } else {
388                         return PR_1_ATTR_NO_EA_INODE_FL;
389                 }
390         }
391         return 0;
392 }
393
394 static void inc_ea_inode_refs(e2fsck_t ctx, struct problem_context *pctx,
395                               struct ext2_ext_attr_entry *first, void *end)
396 {
397         struct ext2_ext_attr_entry *entry;
398
399         for (entry = first;
400              (void *)entry < end && !EXT2_EXT_IS_LAST_ENTRY(entry);
401              entry = EXT2_EXT_ATTR_NEXT(entry)) {
402                 if (!entry->e_value_inum)
403                         continue;
404                 if (!ctx->ea_inode_refs) {
405                         pctx->errcode = ea_refcount_create(0,
406                                                            &ctx->ea_inode_refs);
407                         if (pctx->errcode) {
408                                 pctx->num = 4;
409                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
410                                 ctx->flags |= E2F_FLAG_ABORT;
411                                 return;
412                         }
413                 }
414                 ea_refcount_increment(ctx->ea_inode_refs, entry->e_value_inum,
415                                       0);
416         }
417 }
418
/*
 * Validate the extended attributes stored in the inode body (the area
 * following the fixed fields and i_extra_isize).
 *
 * Each entry is checked for a name and value that fit in the remaining
 * space, for overlap with previously seen entries/values (tracked with
 * a region map), and for a matching hash.  Entries whose value lives
 * in a separate inode are handed to check_large_ea_inode() and their
 * cost is accumulated in *ea_ibody_quota.
 *
 * If a problem is found and the user accepts the fix, all in-inode EAs
 * are dropped by zeroing the 32-bit header word and the quota is reset
 * to zero.  Otherwise (no problem, or fix declined) the EA-inode
 * reference counts are incremented via inc_ea_inode_refs().
 */
static void check_ea_in_inode(e2fsck_t ctx, struct problem_context *pctx,
                              struct ea_quota *ea_ibody_quota)
{
        struct ext2_super_block *sb = ctx->fs->super;
        struct ext2_inode_large *inode;
        struct ext2_ext_attr_entry *entry;
        char *start, *header, *end;
        unsigned int storage_size, remain;
        problem_t problem = 0;
        region_t region = 0;

        ea_ibody_quota->blocks = 0;
        ea_ibody_quota->inodes = 0;

        inode = (struct ext2_inode_large *) pctx->inode;
        /* bytes available after the fixed fields and the extra fields */
        storage_size = EXT2_INODE_SIZE(ctx->fs->super) - EXT2_GOOD_OLD_INODE_SIZE -
                inode->i_extra_isize;
        header = ((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
                 inode->i_extra_isize;
        end = header + storage_size;
        /* entries begin right after the 32-bit header word */
        start = header + sizeof(__u32);
        entry = (struct ext2_ext_attr_entry *) start;

        /* scan all entry's headers first */

        /* take finish entry 0UL into account */
        remain = storage_size - sizeof(__u32);

        /* region map over [0, storage_size) used to detect overlaps */
        region = region_create(0, storage_size);
        if (!region) {
                fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
                problem = 0;
                ctx->flags |= E2F_FLAG_ABORT;
                return;
        }
        /* reserve the header word itself */
        if (region_allocate(region, 0, sizeof(__u32))) {
                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                goto fix;
        }

        while (remain >= sizeof(struct ext2_ext_attr_entry) &&
               !EXT2_EXT_IS_LAST_ENTRY(entry)) {
                __u32 hash;

                /* reserve the space taken by this entry (header + name) */
                if (region_allocate(region, (char *)entry - (char *)header,
                                    EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
                        problem = PR_1_INODE_EA_ALLOC_COLLISION;
                        goto fix;
                }

                /* header eats this space */
                remain -= sizeof(struct ext2_ext_attr_entry);

                /* is attribute name valid? */
                if (EXT2_EXT_ATTR_SIZE(entry->e_name_len) > remain) {
                        pctx->num = entry->e_name_len;
                        problem = PR_1_ATTR_NAME_LEN;
                        goto fix;
                }

                /* attribute len eats this space */
                remain -= EXT2_EXT_ATTR_SIZE(entry->e_name_len);

                if (entry->e_value_inum == 0) {
                        /* value is stored in the inode body */
                        /* check value size */
                        if (entry->e_value_size > remain) {
                                pctx->num = entry->e_value_size;
                                problem = PR_1_ATTR_VALUE_SIZE;
                                goto fix;
                        }

                        /*
                         * reserve the value's space; e_value_offs is
                         * relative to "start", hence the extra
                         * sizeof(__u32) to make it header-relative
                         */
                        if (entry->e_value_size &&
                            region_allocate(region,
                                            sizeof(__u32) + entry->e_value_offs,
                                            EXT2_EXT_ATTR_SIZE(
                                                entry->e_value_size))) {
                                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                                goto fix;
                        }

                        hash = ext2fs_ext_attr_hash_entry(entry,
                                                          start + entry->e_value_offs);

                        /* e_hash may be 0 in older inode's ea */
                        if (entry->e_hash != 0 && entry->e_hash != hash) {
                                pctx->num = entry->e_hash;
                                problem = PR_1_ATTR_HASH;
                                goto fix;
                        }
                } else {
                        /* value is stored in a separate EA inode */
                        blk64_t quota_blocks;

                        problem = check_large_ea_inode(ctx, entry, pctx,
                                                       &quota_blocks);
                        if (problem != 0)
                                goto fix;

                        ea_ibody_quota->blocks += quota_blocks;
                        ea_ibody_quota->inodes++;
                }

                /* If EA value is stored in external inode then it does not
                 * consume space here */
                if (entry->e_value_inum == 0)
                        remain -= entry->e_value_size;

                entry = EXT2_EXT_ATTR_NEXT(entry);
        }

        /* reserve the 32-bit slot at the position where the scan stopped */
        if (region_allocate(region, (char *)entry - (char *)header,
                            sizeof(__u32))) {
                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                goto fix;
        }
fix:
        if (region)
                region_free(region);
        /*
         * it seems like a corruption. it's very unlikely we could repair
         * EA(s) in automatic fashion -bzzz
         */
        if (problem == 0 || !fix_problem(ctx, problem, pctx)) {
                /* EAs are kept: account for the EA inodes they reference */
                inc_ea_inode_refs(ctx, pctx,
                                  (struct ext2_ext_attr_entry *)start, end);
                return;
        }

        /* simply remove all possible EA(s) */
        *((__u32 *)header) = 0UL;
        e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
                                EXT2_INODE_SIZE(sb), "pass1");
        ea_ibody_quota->blocks = 0;
        ea_ibody_quota->inodes = 0;
}
553
554 static int check_inode_extra_negative_epoch(__u32 xtime, __u32 extra) {
555         return (xtime & (1U << 31)) != 0 &&
556                 (extra & EXT4_EPOCH_MASK) == EXT4_EPOCH_MASK;
557 }
558
/*
 * Apply check_inode_extra_negative_epoch() to the i_<xtime> and
 * i_<xtime>_extra fields of a large inode.  The inode argument is
 * parenthesized so that any pointer expression may be passed.
 */
#define CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, xtime) \
        check_inode_extra_negative_epoch((inode)->i_##xtime, \
                                         (inode)->i_##xtime##_extra)

/* When today's date is earlier than 2242, we assume that atimes,
 * ctimes, crtimes, and mtimes with years in the range 2310..2378 are
 * actually pre-1970 dates mis-encoded.
 *
 * The cutoff is 2 * 2^32 seconds after the epoch.  The expansion is
 * fully parenthesized so the macro behaves as a single value inside
 * any expression (e.g. next to '/', '%' or unary operators).
 */
#define EXT4_EXTRA_NEGATIVE_DATE_CUTOFF (2 * (1LL << 32))
568
569 static void check_inode_extra_space(e2fsck_t ctx, struct problem_context *pctx,
570                                     struct ea_quota *ea_ibody_quota)
571 {
572         struct ext2_super_block *sb = ctx->fs->super;
573         struct ext2_inode_large *inode;
574         __u32 *eamagic;
575         int min, max;
576
577         ea_ibody_quota->blocks = 0;
578         ea_ibody_quota->inodes = 0;
579
580         inode = (struct ext2_inode_large *) pctx->inode;
581         if (EXT2_INODE_SIZE(sb) == EXT2_GOOD_OLD_INODE_SIZE) {
582                 /* this isn't large inode. so, nothing to check */
583                 return;
584         }
585
586 #if 0
587         printf("inode #%u, i_extra_size %d\n", pctx->ino,
588                         inode->i_extra_isize);
589 #endif
590         /* i_extra_isize must cover i_extra_isize + i_checksum_hi at least */
591         min = sizeof(inode->i_extra_isize) + sizeof(inode->i_checksum_hi);
592         max = EXT2_INODE_SIZE(sb) - EXT2_GOOD_OLD_INODE_SIZE;
593         /*
594          * For now we will allow i_extra_isize to be 0, but really
595          * implementations should never allow i_extra_isize to be 0
596          */
597         if (inode->i_extra_isize &&
598             (inode->i_extra_isize < min || inode->i_extra_isize > max ||
599              inode->i_extra_isize & 3)) {
600                 if (!fix_problem(ctx, PR_1_EXTRA_ISIZE, pctx))
601                         return;
602                 if (inode->i_extra_isize < min || inode->i_extra_isize > max)
603                         inode->i_extra_isize = sb->s_want_extra_isize;
604                 else
605                         inode->i_extra_isize = (inode->i_extra_isize + 3) & ~3;
606                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
607                                         EXT2_INODE_SIZE(sb), "pass1");
608         }
609
610         /* check if there is no place for an EA header */
611         if (inode->i_extra_isize >= max - sizeof(__u32))
612                 return;
613
614         eamagic = (__u32 *) (((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
615                         inode->i_extra_isize);
616         if (*eamagic == EXT2_EXT_ATTR_MAGIC) {
617                 /* it seems inode has an extended attribute(s) in body */
618                 check_ea_in_inode(ctx, pctx, ea_ibody_quota);
619         }
620
621         /*
622          * If the inode's extended atime (ctime, crtime, mtime) is stored in
623          * the old, invalid format, repair it.
624          */
625         if (((sizeof(time_t) <= 4) ||
626              (((sizeof(time_t) > 4) &&
627                ctx->now < EXT4_EXTRA_NEGATIVE_DATE_CUTOFF))) &&
628             (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime) ||
629              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime) ||
630              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime) ||
631              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))) {
632
633                 if (!fix_problem(ctx, PR_1_EA_TIME_OUT_OF_RANGE, pctx))
634                         return;
635
636                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime))
637                         inode->i_atime_extra &= ~EXT4_EPOCH_MASK;
638                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime))
639                         inode->i_ctime_extra &= ~EXT4_EPOCH_MASK;
640                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime))
641                         inode->i_crtime_extra &= ~EXT4_EPOCH_MASK;
642                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))
643                         inode->i_mtime_extra &= ~EXT4_EPOCH_MASK;
644                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
645                                         EXT2_INODE_SIZE(sb), "pass1");
646         }
647
648 }
649
650 /*
651  * Check to see if the inode might really be a directory, despite i_mode
652  *
653  * This is a lot of complexity for something for which I'm not really
654  * convinced happens frequently in the wild.  If for any reason this
655  * causes any problems, take this code out.
656  * [tytso:20070331.0827EDT]
657  */
658 static void check_is_really_dir(e2fsck_t ctx, struct problem_context *pctx,
659                                 char *buf)
660 {
661         struct ext2_inode *inode = pctx->inode;
662         struct ext2_dir_entry   *dirent;
663         errcode_t               retval;
664         blk64_t                 blk;
665         unsigned int            i, rec_len, not_device = 0;
666         int                     extent_fs;
667         int                     inlinedata_fs;
668
669         /*
670          * If the mode looks OK, we believe it.  If the first block in
671          * the i_block array is 0, this cannot be a directory. If the
672          * inode is extent-mapped, it is still the case that the latter
673          * cannot be 0 - the magic number in the extent header would make
674          * it nonzero.
675          */
676         if (LINUX_S_ISDIR(inode->i_mode) || LINUX_S_ISREG(inode->i_mode) ||
677             LINUX_S_ISLNK(inode->i_mode) || inode->i_block[0] == 0)
678                 return;
679
680         /* 
681          * Check the block numbers in the i_block array for validity:
682          * zero blocks are skipped (but the first one cannot be zero -
683          * see above), other blocks are checked against the first and
684          * max data blocks (from the superblock) and against the
685          * block bitmap. Any invalid block found means this cannot be
686          * a directory.
687          * 
688          * If there are non-zero blocks past the fourth entry, then
689          * this cannot be a device file: we remember that for the next
690          * check.
691          *
692          * For extent mapped files, we don't do any sanity checking:
693          * just try to get the phys block of logical block 0 and run
694          * with it.
695          *
696          * For inline data files, we just try to get the size of inline
697          * data.  If it's true, we will treat it as a directory.
698          */
699
700         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
701         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
702         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL)) {
703                 size_t size;
704                 __u32 dotdot;
705                 unsigned int rec_len2;
706                 struct ext2_dir_entry de;
707
708                 if (ext2fs_inline_data_size(ctx->fs, pctx->ino, &size))
709                         return;
710                 /*
711                  * If the size isn't a multiple of 4, it's probably not a
712                  * directory??
713                  */
714                 if (size & 3)
715                         return;
716                 /*
717                  * If the first 10 bytes don't look like a directory entry,
718                  * it's probably not a directory.
719                  */
720                 memcpy(&dotdot, inode->i_block, sizeof(dotdot));
721                 memcpy(&de, ((char *)inode->i_block) + EXT4_INLINE_DATA_DOTDOT_SIZE,
722                        EXT2_DIR_REC_LEN(0));
723                 dotdot = ext2fs_le32_to_cpu(dotdot);
724                 de.inode = ext2fs_le32_to_cpu(de.inode);
725                 de.rec_len = ext2fs_le16_to_cpu(de.rec_len);
726                 ext2fs_get_rec_len(ctx->fs, &de, &rec_len2);
727                 if (dotdot >= ctx->fs->super->s_inodes_count ||
728                     (dotdot < EXT2_FIRST_INO(ctx->fs->super) &&
729                      dotdot != EXT2_ROOT_INO) ||
730                     de.inode >= ctx->fs->super->s_inodes_count ||
731                     (de.inode < EXT2_FIRST_INO(ctx->fs->super) &&
732                      de.inode != 0) ||
733                     rec_len2 > EXT4_MIN_INLINE_DATA_SIZE -
734                               EXT4_INLINE_DATA_DOTDOT_SIZE)
735                         return;
736                 /* device files never have a "system.data" entry */
737                 goto isdir;
738         } else if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) {
739                 /* extent mapped */
740                 if  (ext2fs_bmap2(ctx->fs, pctx->ino, inode, 0, 0, 0, 0,
741                                  &blk))
742                         return;
743                 /* device files are never extent mapped */
744                 not_device++;
745         } else {
746                 for (i=0; i < EXT2_N_BLOCKS; i++) {
747                         blk = inode->i_block[i];
748                         if (!blk)
749                                 continue;
750                         if (i >= 4)
751                                 not_device++;
752
753                         if (blk < ctx->fs->super->s_first_data_block ||
754                             blk >= ext2fs_blocks_count(ctx->fs->super) ||
755                             ext2fs_fast_test_block_bitmap2(ctx->block_found_map,
756                                                            blk))
757                                 return; /* Invalid block, can't be dir */
758                 }
759                 blk = inode->i_block[0];
760         }
761
762         /*
763          * If the mode says this is a device file and the i_links_count field
764          * is sane and we have not ruled it out as a device file previously,
765          * we declare it a device file, not a directory.
766          */
767         if ((LINUX_S_ISCHR(inode->i_mode) || LINUX_S_ISBLK(inode->i_mode)) &&
768             (inode->i_links_count == 1) && !not_device)
769                 return;
770
771         /* read the first block */
772         ehandler_operation(_("reading directory block"));
773         retval = ext2fs_read_dir_block4(ctx->fs, blk, buf, 0, pctx->ino);
774         ehandler_operation(0);
775         if (retval)
776                 return;
777
778         dirent = (struct ext2_dir_entry *) buf;
779         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
780         if (retval)
781                 return;
782         if ((ext2fs_dirent_name_len(dirent) != 1) ||
783             (dirent->name[0] != '.') ||
784             (dirent->inode != pctx->ino) ||
785             (rec_len < 12) ||
786             (rec_len % 4) ||
787             (rec_len >= ctx->fs->blocksize - 12))
788                 return;
789
790         dirent = (struct ext2_dir_entry *) (buf + rec_len);
791         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
792         if (retval)
793                 return;
794         if ((ext2fs_dirent_name_len(dirent) != 2) ||
795             (dirent->name[0] != '.') ||
796             (dirent->name[1] != '.') ||
797             (rec_len < 12) ||
798             (rec_len % 4))
799                 return;
800
801 isdir:
802         if (fix_problem(ctx, PR_1_TREAT_AS_DIRECTORY, pctx)) {
803                 inode->i_mode = (inode->i_mode & 07777) | LINUX_S_IFDIR;
804                 e2fsck_write_inode_full(ctx, pctx->ino, inode,
805                                         EXT2_INODE_SIZE(ctx->fs->super),
806                                         "check_is_really_dir");
807         }
808 }
809
810 extern errcode_t e2fsck_setup_icount(e2fsck_t ctx, const char *icount_name,
811                                      int flags, ext2_icount_t hint,
812                                      ext2_icount_t *ret)
813 {
814         unsigned int            threshold;
815         unsigned int            save_type;
816         ext2_ino_t              num_dirs;
817         errcode_t               retval;
818         char                    *tdb_dir;
819         int                     enable;
820
821         *ret = 0;
822
823         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
824                            &tdb_dir);
825         profile_get_uint(ctx->profile, "scratch_files",
826                          "numdirs_threshold", 0, 0, &threshold);
827         profile_get_boolean(ctx->profile, "scratch_files",
828                             "icount", 0, 1, &enable);
829
830         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
831         if (retval)
832                 num_dirs = 1024;        /* Guess */
833
834         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
835             (!threshold || num_dirs > threshold)) {
836                 retval = ext2fs_create_icount_tdb(ctx->fs, tdb_dir,
837                                                   flags, ret);
838                 if (retval == 0)
839                         return 0;
840         }
841         e2fsck_set_bitmap_type(ctx->fs, EXT2FS_BMAP64_RBTREE, icount_name,
842                                &save_type);
843         if (ctx->options & E2F_OPT_ICOUNT_FULLMAP)
844                 flags |= EXT2_ICOUNT_OPT_FULLMAP;
845         retval = ext2fs_create_icount2(ctx->fs, flags, 0, hint, ret);
846         ctx->fs->default_bitmap_type = save_type;
847         return retval;
848 }
849
850 static errcode_t recheck_bad_inode_checksum(ext2_filsys fs, ext2_ino_t ino,
851                                             e2fsck_t ctx,
852                                             struct problem_context *pctx)
853 {
854         errcode_t retval;
855         struct ext2_inode_large inode;
856
857         /*
858          * Reread inode.  If we don't see checksum error, then this inode
859          * has been fixed elsewhere.
860          */
861         ctx->stashed_ino = 0;
862         retval = ext2fs_read_inode_full(fs, ino, (struct ext2_inode *)&inode,
863                                         sizeof(inode));
864         if (retval && retval != EXT2_ET_INODE_CSUM_INVALID)
865                 return retval;
866         if (!retval)
867                 return 0;
868
869         /*
870          * Checksum still doesn't match.  That implies that the inode passes
871          * all the sanity checks, so maybe the checksum is simply corrupt.
872          * See if the user will go for fixing that.
873          */
874         if (!fix_problem(ctx, PR_1_INODE_ONLY_CSUM_INVALID, pctx))
875                 return 0;
876
877         retval = ext2fs_write_inode_full(fs, ino, (struct ext2_inode *)&inode,
878                                          sizeof(inode));
879         return retval;
880 }
881
882 static void reserve_block_for_root_repair(e2fsck_t ctx)
883 {
884         blk64_t         blk = 0;
885         errcode_t       err;
886         ext2_filsys     fs = ctx->fs;
887
888         ctx->root_repair_block = 0;
889         if (ext2fs_test_inode_bitmap2(ctx->inode_used_map, EXT2_ROOT_INO))
890                 return;
891
892         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
893         if (err)
894                 return;
895         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
896         ctx->root_repair_block = blk;
897 }
898
899 static void reserve_block_for_lnf_repair(e2fsck_t ctx)
900 {
901         blk64_t         blk = 0;
902         errcode_t       err;
903         ext2_filsys     fs = ctx->fs;
904         static const char name[] = "lost+found";
905         ext2_ino_t      ino;
906
907         ctx->lnf_repair_block = 0;
908         if (!ext2fs_lookup(fs, EXT2_ROOT_INO, name, sizeof(name)-1, 0, &ino))
909                 return;
910
911         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
912         if (err)
913                 return;
914         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
915         ctx->lnf_repair_block = blk;
916 }
917
918 static errcode_t get_inline_data_ea_size(ext2_filsys fs, ext2_ino_t ino,
919                                          size_t *sz)
920 {
921         void *p;
922         struct ext2_xattr_handle *handle;
923         errcode_t retval;
924
925         retval = ext2fs_xattrs_open(fs, ino, &handle);
926         if (retval)
927                 return retval;
928
929         retval = ext2fs_xattrs_read(handle);
930         if (retval)
931                 goto err;
932
933         retval = ext2fs_xattr_get(handle, "system.data", &p, sz);
934         if (retval)
935                 goto err;
936         ext2fs_free_mem(&p);
937 err:
938         (void) ext2fs_xattrs_close(&handle);
939         return retval;
940 }
941
942 static void finish_processing_inode(e2fsck_t ctx, ext2_ino_t ino,
943                                     struct problem_context *pctx,
944                                     int failed_csum)
945 {
946         if (!failed_csum)
947                 return;
948
949         /*
950          * If the inode failed the checksum and the user didn't
951          * clear the inode, test the checksum again -- if it still
952          * fails, ask the user if the checksum should be corrected.
953          */
954         pctx->errcode = recheck_bad_inode_checksum(ctx->fs, ino, ctx, pctx);
955         if (pctx->errcode)
956                 ctx->flags |= E2F_FLAG_ABORT;
957 }
958 #define FINISH_INODE_LOOP(ctx, ino, pctx, failed_csum) \
959         do { \
960                 finish_processing_inode((ctx), (ino), (pctx), (failed_csum)); \
961                 if ((ctx)->flags & E2F_FLAG_ABORT) \
962                         return; \
963         } while (0)
964
965 static int could_be_block_map(ext2_filsys fs, struct ext2_inode *inode)
966 {
967         __u32 x;
968         int i;
969
970         for (i = 0; i < EXT2_N_BLOCKS; i++) {
971                 x = inode->i_block[i];
972 #ifdef WORDS_BIGENDIAN
973                 x = ext2fs_swab32(x);
974 #endif
975                 if (x >= ext2fs_blocks_count(fs->super))
976                         return 0;
977         }
978
979         return 1;
980 }
981
982 /*
983  * Figure out what to do with an inode that has both extents and inline data
984  * inode flags set.  Returns -1 if we decide to erase the inode, 0 otherwise.
985  */
986 static int fix_inline_data_extents_file(e2fsck_t ctx,
987                                         ext2_ino_t ino,
988                                         struct ext2_inode *inode,
989                                         int inode_size,
990                                         struct problem_context *pctx)
991 {
992         size_t max_inline_ea_size;
993         ext2_filsys fs = ctx->fs;
994         int dirty = 0;
995
996         /* Both feature flags not set?  Just run the regular checks */
997         if (!ext2fs_has_feature_extents(fs->super) &&
998             !ext2fs_has_feature_inline_data(fs->super))
999                 return 0;
1000
1001         /* Clear both flags if it's a special file */
1002         if (LINUX_S_ISCHR(inode->i_mode) ||
1003             LINUX_S_ISBLK(inode->i_mode) ||
1004             LINUX_S_ISFIFO(inode->i_mode) ||
1005             LINUX_S_ISSOCK(inode->i_mode)) {
1006                 check_extents_inlinedata(ctx, pctx);
1007                 return 0;
1008         }
1009
1010         /* If it looks like an extent tree, try to clear inlinedata */
1011         if (ext2fs_extent_header_verify(inode->i_block,
1012                                  sizeof(inode->i_block)) == 0 &&
1013             fix_problem(ctx, PR_1_CLEAR_INLINE_DATA_FOR_EXTENT, pctx)) {
1014                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1015                 dirty = 1;
1016                 goto out;
1017         }
1018
1019         /* If it looks short enough to be inline data, try to clear extents */
1020         if (inode_size > EXT2_GOOD_OLD_INODE_SIZE)
1021                 max_inline_ea_size = inode_size -
1022                                      (EXT2_GOOD_OLD_INODE_SIZE +
1023                                       ((struct ext2_inode_large *)inode)->i_extra_isize);
1024         else
1025                 max_inline_ea_size = 0;
1026         if (EXT2_I_SIZE(inode) <
1027             EXT4_MIN_INLINE_DATA_SIZE + max_inline_ea_size &&
1028             fix_problem(ctx, PR_1_CLEAR_EXTENT_FOR_INLINE_DATA, pctx)) {
1029                 inode->i_flags &= ~EXT4_EXTENTS_FL;
1030                 dirty = 1;
1031                 goto out;
1032         }
1033
1034         /*
1035          * Too big for inline data, but no evidence of extent tree -
1036          * maybe it's a block map file?  If the mappings all look valid?
1037          */
1038         if (could_be_block_map(fs, inode) &&
1039             fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_FLAGS, pctx)) {
1040 #ifdef WORDS_BIGENDIAN
1041                 int i;
1042
1043                 for (i = 0; i < EXT2_N_BLOCKS; i++)
1044                         inode->i_block[i] = ext2fs_swab32(inode->i_block[i]);
1045 #endif
1046
1047                 inode->i_flags &= ~(EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL);
1048                 dirty = 1;
1049                 goto out;
1050         }
1051
1052         /* Oh well, just clear the busted inode. */
1053         if (fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_INODE, pctx)) {
1054                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1055                 return -1;
1056         }
1057
1058 out:
1059         if (dirty)
1060                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1061
1062         return 0;
1063 }
1064
1065 static void pass1_readahead(e2fsck_t ctx, dgrp_t *group, ext2_ino_t *next_ino)
1066 {
1067         ext2_ino_t inodes_in_group = 0, inodes_per_block, inodes_per_buffer;
1068         dgrp_t start = *group, grp;
1069         blk64_t blocks_to_read = 0;
1070         errcode_t err = EXT2_ET_INVALID_ARGUMENT;
1071
1072         if (ctx->readahead_kb == 0)
1073                 goto out;
1074
1075         /* Keep iterating groups until we have enough to readahead */
1076         inodes_per_block = EXT2_INODES_PER_BLOCK(ctx->fs->super);
1077         for (grp = start; grp < ctx->fs->group_desc_count; grp++) {
1078                 if (ext2fs_bg_flags_test(ctx->fs, grp, EXT2_BG_INODE_UNINIT))
1079                         continue;
1080                 inodes_in_group = ctx->fs->super->s_inodes_per_group -
1081                                         ext2fs_bg_itable_unused(ctx->fs, grp);
1082                 blocks_to_read += (inodes_in_group + inodes_per_block - 1) /
1083                                         inodes_per_block;
1084                 if (blocks_to_read * ctx->fs->blocksize >
1085                     ctx->readahead_kb * 1024)
1086                         break;
1087         }
1088
1089         err = e2fsck_readahead(ctx->fs, E2FSCK_READA_ITABLE, start,
1090                                grp - start + 1);
1091         if (err == EAGAIN) {
1092                 ctx->readahead_kb /= 2;
1093                 err = 0;
1094         }
1095
1096 out:
1097         if (err) {
1098                 /* Error; disable itable readahead */
1099                 *group = ctx->fs->group_desc_count;
1100                 *next_ino = ctx->fs->super->s_inodes_count;
1101         } else {
1102                 /*
1103                  * Don't do more readahead until we've reached the first inode
1104                  * of the last inode scan buffer block for the last group.
1105                  */
1106                 *group = grp + 1;
1107                 inodes_per_buffer = (ctx->inode_buffer_blocks ?
1108                                      ctx->inode_buffer_blocks :
1109                                      EXT2_INODE_SCAN_DEFAULT_BUFFER_BLOCKS) *
1110                                     ctx->fs->blocksize /
1111                                     EXT2_INODE_SIZE(ctx->fs->super);
1112                 inodes_in_group--;
1113                 *next_ino = inodes_in_group -
1114                             (inodes_in_group % inodes_per_buffer) + 1 +
1115                             (grp * ctx->fs->super->s_inodes_per_group);
1116         }
1117 }
1118
1119 /*
1120  * Check if the passed ino is one of the used superblock quota inodes.
1121  *
1122  * Before the quota inodes were journaled, older superblock quota inodes
1123  * were just regular files in the filesystem and not reserved inodes.  This
1124  * checks if the passed ino is one of the s_*_quota_inum superblock fields,
1125  * which may not always be the same as the EXT4_*_QUOTA_INO fields.
1126  */
1127 static int quota_inum_is_super(struct ext2_super_block *sb, ext2_ino_t ino)
1128 {
1129         enum quota_type qtype;
1130
1131         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1132                 if (*quota_sb_inump(sb, qtype) == ino)
1133                         return 1;
1134
1135         return 0;
1136 }
1137
1138 /*
1139  * Check if the passed ino is one of the reserved quota inodes.
1140  * This checks if the inode number is one of the reserved EXT4_*_QUOTA_INO
1141  * inodes.  These inodes may or may not be in use by the quota feature.
1142  */
1143 static int quota_inum_is_reserved(ext2_filsys fs, ext2_ino_t ino)
1144 {
1145         enum quota_type qtype;
1146
1147         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1148                 if (quota_type2inum(qtype, fs->super) == ino)
1149                         return 1;
1150
1151         return 0;
1152 }
1153
1154 static int e2fsck_should_abort(e2fsck_t ctx)
1155 {
1156         e2fsck_t global_ctx;
1157
1158         if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1159                 return 1;
1160
1161         if (ctx->global_ctx) {
1162                 global_ctx = ctx->global_ctx;
1163                 if (global_ctx->flags & E2F_FLAG_SIGNAL_MASK)
1164                         return 1;
1165         }
1166         return 0;
1167 }
1168
1169 void e2fsck_pass1_run(e2fsck_t ctx)
1170 {
1171         int     i;
1172         ext2_filsys fs = ctx->fs;
1173         ext2_ino_t      ino = 0;
1174         struct ext2_inode *inode = NULL;
1175         ext2_inode_scan scan = NULL;
1176         char            *block_buf = NULL;
1177 #ifdef RESOURCE_TRACK
1178         struct resource_track   rtrack;
1179 #endif
1180         unsigned char   frag, fsize;
1181         struct          problem_context pctx;
1182         struct          scan_callback_struct scan_struct;
1183         struct ext2_super_block *sb = ctx->fs->super;
1184         const char      *old_op;
1185         const char      *eop_next_inode = _("getting next inode from scan");
1186         int             imagic_fs, extent_fs, inlinedata_fs, casefold_fs;
1187         int             low_dtime_check = 1;
1188         unsigned int    inode_size = EXT2_INODE_SIZE(fs->super);
1189         unsigned int    bufsize;
1190         int             failed_csum = 0;
1191         ext2_ino_t      ino_threshold = 0;
1192         dgrp_t          ra_group = 0;
1193         struct ea_quota ea_ibody_quota;
1194         struct process_inode_block *inodes_to_process;
1195         int             process_inode_count;
1196
1197         init_resource_track(&rtrack, ctx->fs->io);
1198         clear_problem_context(&pctx);
1199
1200         /* If we can do readahead, figure out how many groups to pull in. */
1201         if (!e2fsck_can_readahead(ctx->fs))
1202                 ctx->readahead_kb = 0;
1203         else if (ctx->readahead_kb == ~0ULL)
1204                 ctx->readahead_kb = e2fsck_guess_readahead(ctx->fs);
1205         pass1_readahead(ctx, &ra_group, &ino_threshold);
1206
1207         if (!(ctx->options & E2F_OPT_PREEN))
1208                 fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1209
1210         if (ext2fs_has_feature_dir_index(fs->super) &&
1211             !(ctx->options & E2F_OPT_NO)) {
1212                 if (ext2fs_u32_list_create(&ctx->dirs_to_hash, 50))
1213                         ctx->dirs_to_hash = 0;
1214         }
1215
1216 #ifdef MTRACE
1217         mtrace_print("Pass 1");
1218 #endif
1219
1220         imagic_fs = ext2fs_has_feature_imagic_inodes(sb);
1221         extent_fs = ext2fs_has_feature_extents(sb);
1222         inlinedata_fs = ext2fs_has_feature_inline_data(sb);
1223         casefold_fs = ext2fs_has_feature_casefold(sb);
1224
1225         /*
1226          * Allocate bitmaps structures
1227          */
1228         pctx.errcode = e2fsck_allocate_inode_bitmap(fs, _("in-use inode map"),
1229                                                     EXT2FS_BMAP64_RBTREE,
1230                                                     "inode_used_map",
1231                                                     &ctx->inode_used_map);
1232         if (pctx.errcode) {
1233                 pctx.num = 1;
1234                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1235                 ctx->flags |= E2F_FLAG_ABORT;
1236                 return;
1237         }
1238         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1239                         _("directory inode map"),
1240                         ctx->global_ctx ? EXT2FS_BMAP64_RBTREE :
1241                         EXT2FS_BMAP64_AUTODIR,
1242                         "inode_dir_map", &ctx->inode_dir_map);
1243         if (pctx.errcode) {
1244                 pctx.num = 2;
1245                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1246                 ctx->flags |= E2F_FLAG_ABORT;
1247                 return;
1248         }
1249         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1250                         _("regular file inode map"), EXT2FS_BMAP64_RBTREE,
1251                         "inode_reg_map", &ctx->inode_reg_map);
1252         if (pctx.errcode) {
1253                 pctx.num = 6;
1254                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1255                 ctx->flags |= E2F_FLAG_ABORT;
1256                 return;
1257         }
1258         pctx.errcode = e2fsck_allocate_subcluster_bitmap(fs,
1259                         _("in-use block map"), EXT2FS_BMAP64_RBTREE,
1260                         "block_found_map", &ctx->block_found_map);
1261         if (pctx.errcode) {
1262                 pctx.num = 1;
1263                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1264                 ctx->flags |= E2F_FLAG_ABORT;
1265                 return;
1266         }
1267         pctx.errcode = e2fsck_allocate_block_bitmap(fs,
1268                         _("metadata block map"), EXT2FS_BMAP64_RBTREE,
1269                         "block_metadata_map", &ctx->block_metadata_map);
1270         if (pctx.errcode) {
1271                 pctx.num = 1;
1272                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1273                 ctx->flags |= E2F_FLAG_ABORT;
1274                 return;
1275         }
1276         if (casefold_fs) {
1277                 pctx.errcode =
1278                         e2fsck_allocate_inode_bitmap(fs,
1279                                                      _("inode casefold map"),
1280                                                      EXT2FS_BMAP64_RBTREE,
1281                                                      "inode_casefold_map",
1282                                                      &ctx->inode_casefold_map);
1283                 if (pctx.errcode) {
1284                         pctx.num = 1;
1285                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1286                         ctx->flags |= E2F_FLAG_ABORT;
1287                         return;
1288                 }
1289         }
1290         pctx.errcode = e2fsck_setup_icount(ctx, "inode_link_info", 0, NULL,
1291                                            &ctx->inode_link_info);
1292         if (pctx.errcode) {
1293                 fix_problem(ctx, PR_1_ALLOCATE_ICOUNT, &pctx);
1294                 ctx->flags |= E2F_FLAG_ABORT;
1295                 return;
1296         }
1297         bufsize = inode_size;
1298         if (bufsize < sizeof(struct ext2_inode_large))
1299                 bufsize = sizeof(struct ext2_inode_large);
1300         inode = (struct ext2_inode *)
1301                 e2fsck_allocate_memory(ctx, bufsize, "scratch inode");
1302
1303         inodes_to_process = (struct process_inode_block *)
1304                 e2fsck_allocate_memory(ctx,
1305                                        (ctx->process_inode_size *
1306                                         sizeof(struct process_inode_block)),
1307                                        "array of inodes to process");
1308         process_inode_count = 0;
1309
1310         pctx.errcode = ext2fs_init_dblist(fs, 0);
1311         if (pctx.errcode) {
1312                 fix_problem(ctx, PR_1_ALLOCATE_DBCOUNT, &pctx);
1313                 ctx->flags |= E2F_FLAG_ABORT;
1314                 goto endit;
1315         }
1316
1317         /*
1318          * If the last orphan field is set, clear it, since the pass1
1319          * processing will automatically find and clear the orphans.
1320          * In the future, we may want to try using the last_orphan
1321          * linked list ourselves, but for now, we clear it so that the
1322          * ext3 mount code won't get confused.
1323          */
1324         if (!(ctx->options & E2F_OPT_READONLY)) {
1325                 if (fs->super->s_last_orphan) {
1326                         fs->super->s_last_orphan = 0;
1327                         ext2fs_mark_super_dirty(fs);
1328                 }
1329         }
1330
1331         mark_table_blocks(ctx);
1332         pctx.errcode = ext2fs_convert_subcluster_bitmap(fs,
1333                                                 &ctx->block_found_map);
1334         if (pctx.errcode) {
1335                 fix_problem(ctx, PR_1_CONVERT_SUBCLUSTER, &pctx);
1336                 ctx->flags |= E2F_FLAG_ABORT;
1337                 goto endit;
1338         }
1339         block_buf = (char *) e2fsck_allocate_memory(ctx, fs->blocksize * 3,
1340                                                     "block interate buffer");
1341         if (EXT2_INODE_SIZE(fs->super) == EXT2_GOOD_OLD_INODE_SIZE)
1342                 e2fsck_use_inode_shortcuts(ctx, 1);
1343         e2fsck_intercept_block_allocations(ctx);
1344         old_op = ehandler_operation(_("opening inode scan"));
1345         pctx.errcode = ext2fs_open_inode_scan(fs, ctx->inode_buffer_blocks,
1346                                               &scan);
1347         ehandler_operation(old_op);
1348         if (pctx.errcode) {
1349                 fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1350                 ctx->flags |= E2F_FLAG_ABORT;
1351                 goto endit;
1352         }
1353         ext2fs_inode_scan_flags(scan, EXT2_SF_SKIP_MISSING_ITABLE |
1354                                       EXT2_SF_WARN_GARBAGE_INODES, 0);
1355         ctx->stashed_inode = inode;
1356         scan_struct.ctx = ctx;
1357         scan_struct.block_buf = block_buf;
1358         scan_struct.inodes_to_process = inodes_to_process;
1359         scan_struct.process_inode_count = &process_inode_count;
1360         ext2fs_set_inode_callback(scan, scan_callback, &scan_struct);
1361         if (ctx->progress && ((ctx->progress)(ctx, 1, 0,
1362                                               ctx->fs->group_desc_count)))
1363                 goto endit;
1364         if ((fs->super->s_wtime &&
1365              fs->super->s_wtime < fs->super->s_inodes_count) ||
1366             (fs->super->s_mtime &&
1367              fs->super->s_mtime < fs->super->s_inodes_count) ||
1368             (fs->super->s_mkfs_time &&
1369              fs->super->s_mkfs_time < fs->super->s_inodes_count))
1370                 low_dtime_check = 0;
1371
1372         if (ext2fs_has_feature_mmp(fs->super) &&
1373             fs->super->s_mmp_block > fs->super->s_first_data_block &&
1374             fs->super->s_mmp_block < ext2fs_blocks_count(fs->super))
1375                 ext2fs_mark_block_bitmap2(ctx->block_found_map,
1376                                           fs->super->s_mmp_block);
1377
1378         /* Set up ctx->lost_and_found if possible */
1379         (void) e2fsck_get_lost_and_found(ctx, 0);
1380
1381 #ifdef HAVE_PTHREAD
1382         if (ctx->global_ctx) {
1383                 if (ctx->options & E2F_OPT_DEBUG &&
1384                     ctx->options & E2F_OPT_MULTITHREAD)
1385                         fprintf(stderr, "thread %d jumping to group %d\n",
1386                                         ctx->thread_info.et_thread_index,
1387                                         ctx->thread_info.et_group_start);
1388                 pctx.errcode = ext2fs_inode_scan_goto_blockgroup(scan,
1389                                         ctx->thread_info.et_group_start);
1390                 if (pctx.errcode) {
1391                         fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1392                         ctx->flags |= E2F_FLAG_ABORT;
1393                         goto endit;
1394                 }
1395         }
1396 #endif
1397
1398         while (1) {
1399                 if (ino % (fs->super->s_inodes_per_group * 4) == 1) {
1400                         if (e2fsck_mmp_update(fs))
1401                                 fatal_error(ctx, 0);
1402                 }
1403                 old_op = ehandler_operation(eop_next_inode);
1404                 pctx.errcode = ext2fs_get_next_inode_full(scan, &ino,
1405                                                           inode, inode_size);
1406                 if (ino > ino_threshold)
1407                         pass1_readahead(ctx, &ra_group, &ino_threshold);
1408                 ehandler_operation(old_op);
1409                 if (e2fsck_should_abort(ctx))
1410                         goto endit;
1411                 if (pctx.errcode == EXT2_ET_BAD_BLOCK_IN_INODE_TABLE) {
1412                         /*
1413                          * If badblocks says badblocks is bad, offer to clear
1414                          * the list, update the in-core bb list, and restart
1415                          * the inode scan.
1416                          */
1417                         if (ino == EXT2_BAD_INO &&
1418                             fix_problem(ctx, PR_1_BADBLOCKS_IN_BADBLOCKS,
1419                                         &pctx)) {
1420                                 errcode_t err;
1421
1422                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1423                                 ext2fs_badblocks_list_free(ctx->fs->badblocks);
1424                                 ctx->fs->badblocks = NULL;
1425                                 err = ext2fs_read_bb_inode(ctx->fs,
1426                                                         &ctx->fs->badblocks);
1427                                 if (err) {
1428                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1429                                                     &pctx);
1430                                         ctx->flags |= E2F_FLAG_ABORT;
1431                                 } else
1432                                         ctx->flags |= E2F_FLAG_RESTART;
1433                                 goto endit;
1434                         }
1435                         if (!ctx->inode_bb_map)
1436                                 alloc_bb_map(ctx);
1437                         ext2fs_mark_inode_bitmap2(ctx->inode_bb_map, ino);
1438                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1439                         continue;
1440                 }
1441                 if (pctx.errcode == EXT2_ET_SCAN_FINISHED)
1442                         break;
1443                 if (pctx.errcode &&
1444                     pctx.errcode != EXT2_ET_INODE_CSUM_INVALID &&
1445                     pctx.errcode != EXT2_ET_INODE_IS_GARBAGE) {
1446                         fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1447                         ctx->flags |= E2F_FLAG_ABORT;
1448                         goto endit;
1449                 }
1450                 if (!ino)
1451                         break;
1452 #ifdef HAVE_PTHREAD
1453                 if (ctx->global_ctx)
1454                         ctx->thread_info.et_inode_number++;
1455 #endif
1456                 pctx.ino = ino;
1457                 pctx.inode = inode;
1458                 ctx->stashed_ino = ino;
1459
1460                 /* Clear trashed inode? */
1461                 if (pctx.errcode == EXT2_ET_INODE_IS_GARBAGE &&
1462                     inode->i_links_count > 0 &&
1463                     fix_problem(ctx, PR_1_INODE_IS_GARBAGE, &pctx)) {
1464                         pctx.errcode = 0;
1465                         e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1466                 }
1467                 failed_csum = pctx.errcode != 0;
1468
1469                 /*
1470                  * Check for inodes which might have been part of the
1471                  * orphan linked list.  They should have been
1472                  * dealt with by now, unless the list had somehow been
1473                  * corrupted.
1474                  *
1475                  * FIXME: In the future, inodes which are still in use
1476                  * (and which are therefore pending truncation) should
1477                  * be handled specially.  Right now we just clear the
1478                  * dtime field, and the normal e2fsck handling of
1479                  * inodes where i_size and the inode blocks are
1480                  * inconsistent is to fix i_size, instead of releasing
1481                  * the extra blocks.  This won't catch the inode that
1482                  * was at the end of the orphan list, but it's better
1483                  * than nothing.  The right answer is that there
1484                  * shouldn't be any bugs in the orphan list handling.  :-)
1485                  */
1486                 if (inode->i_dtime && low_dtime_check &&
1487                     inode->i_dtime < ctx->fs->super->s_inodes_count) {
1488                         if (fix_problem(ctx, PR_1_LOW_DTIME, &pctx)) {
1489                                 inode->i_dtime = inode->i_links_count ?
1490                                         0 : ctx->now;
1491                                 e2fsck_write_inode(ctx, ino, inode,
1492                                                    "pass1");
1493                                 failed_csum = 0;
1494                         }
1495                 }
1496
1497                 if (inode->i_links_count) {
1498                         pctx.errcode = ext2fs_icount_store(ctx->inode_link_info,
1499                                            ino, inode->i_links_count);
1500                         if (pctx.errcode) {
1501                                 pctx.num = inode->i_links_count;
1502                                 fix_problem(ctx, PR_1_ICOUNT_STORE, &pctx);
1503                                 ctx->flags |= E2F_FLAG_ABORT;
1504                                 goto endit;
1505                         }
1506                 } else if ((ino >= EXT2_FIRST_INODE(fs->super)) &&
1507                            !quota_inum_is_reserved(fs, ino)) {
1508                         if (!inode->i_dtime && inode->i_mode) {
1509                                 if (fix_problem(ctx,
1510                                             PR_1_ZERO_DTIME, &pctx)) {
1511                                         inode->i_dtime = ctx->now;
1512                                         e2fsck_write_inode(ctx, ino, inode,
1513                                                            "pass1");
1514                                         failed_csum = 0;
1515                                 }
1516                         }
1517                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1518                         continue;
1519                 }
1520
1521                 if ((inode->i_flags & EXT4_CASEFOLD_FL) &&
1522                     ((!LINUX_S_ISDIR(inode->i_mode) &&
1523                       fix_problem(ctx, PR_1_CASEFOLD_NONDIR, &pctx)) ||
1524                      (!casefold_fs &&
1525                       fix_problem(ctx, PR_1_CASEFOLD_FEATURE, &pctx)))) {
1526                         inode->i_flags &= ~EXT4_CASEFOLD_FL;
1527                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1528                 }
1529
1530                 /* Conflicting inlinedata/extents inode flags? */
1531                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) &&
1532                     (inode->i_flags & EXT4_EXTENTS_FL)) {
1533                         int res = fix_inline_data_extents_file(ctx, ino, inode,
1534                                                                inode_size,
1535                                                                &pctx);
1536                         if (res < 0) {
1537                                 /* skip FINISH_INODE_LOOP */
1538                                 continue;
1539                         }
1540                 }
1541
1542                 /* Test for incorrect inline_data flags settings. */
1543                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && !inlinedata_fs &&
1544                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1545                         size_t size = 0;
1546
1547                         pctx.errcode = get_inline_data_ea_size(fs, ino, &size);
1548                         if (!pctx.errcode &&
1549                             fix_problem(ctx, PR_1_INLINE_DATA_FEATURE, &pctx)) {
1550                                 ext2fs_set_feature_inline_data(sb);
1551                                 ext2fs_mark_super_dirty(fs);
1552                                 inlinedata_fs = 1;
1553                         } else if (fix_problem(ctx, PR_1_INLINE_DATA_SET, &pctx)) {
1554                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1555                                 /* skip FINISH_INODE_LOOP */
1556                                 continue;
1557                         }
1558                 }
1559
1560                 /* Test for inline data flag but no attr */
1561                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && inlinedata_fs &&
1562                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1563                         size_t size = 0;
1564                         errcode_t err;
1565                         int flags;
1566
1567                         flags = fs->flags;
1568                         if (failed_csum)
1569                                 fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
1570                         err = get_inline_data_ea_size(fs, ino, &size);
1571                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
1572                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
1573
1574                         switch (err) {
1575                         case 0:
1576                                 /* Everything is awesome... */
1577                                 break;
1578                         case EXT2_ET_BAD_EA_BLOCK_NUM:
1579                         case EXT2_ET_BAD_EA_HASH:
1580                         case EXT2_ET_BAD_EA_HEADER:
1581                         case EXT2_ET_EA_BAD_NAME_LEN:
1582                         case EXT2_ET_EA_BAD_VALUE_SIZE:
1583                         case EXT2_ET_EA_KEY_NOT_FOUND:
1584                         case EXT2_ET_EA_NO_SPACE:
1585                         case EXT2_ET_MISSING_EA_FEATURE:
1586                         case EXT2_ET_INLINE_DATA_CANT_ITERATE:
1587                         case EXT2_ET_INLINE_DATA_NO_BLOCK:
1588                         case EXT2_ET_INLINE_DATA_NO_SPACE:
1589                         case EXT2_ET_NO_INLINE_DATA:
1590                         case EXT2_ET_EXT_ATTR_CSUM_INVALID:
1591                         case EXT2_ET_EA_BAD_VALUE_OFFSET:
1592                         case EXT2_ET_EA_INODE_CORRUPTED:
1593                                 /* broken EA or no system.data EA; truncate */
1594                                 if (fix_problem(ctx, PR_1_INLINE_DATA_NO_ATTR,
1595                                                 &pctx)) {
1596                                         err = ext2fs_inode_size_set(fs, inode, 0);
1597                                         if (err) {
1598                                                 pctx.errcode = err;
1599                                                 ctx->flags |= E2F_FLAG_ABORT;
1600                                                 goto endit;
1601                                         }
1602                                         inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1603                                         memset(&inode->i_block, 0,
1604                                                sizeof(inode->i_block));
1605                                         e2fsck_write_inode(ctx, ino, inode,
1606                                                            "pass1");
1607                                         failed_csum = 0;
1608                                 }
1609                                 break;
1610                         default:
1611                                 /* Some other kind of non-xattr error? */
1612                                 pctx.errcode = err;
1613                                 ctx->flags |= E2F_FLAG_ABORT;
1614                                 goto endit;
1615                         }
1616                 }
1617
1618                 /*
1619                  * Test for incorrect extent flag settings.
1620                  *
1621                  * On big-endian machines we must be careful:
1622                  * When the inode is read, the i_block array is not swapped
1623                  * if the extent flag is set.  Therefore if we are testing
1624                  * for or fixing a wrongly-set flag, we must potentially
1625                  * (un)swap before testing, or after fixing.
1626                  */
1627
1628                 /*
1629                  * In this case the extents flag was set when read, so
1630                  * extent_header_verify is ok.  If the inode is cleared,
1631                  * no need to swap... so no extra swapping here.
1632                  */
1633                 if ((inode->i_flags & EXT4_EXTENTS_FL) && !extent_fs &&
1634                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1635                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO))) {
1636                         if ((ext2fs_extent_header_verify(inode->i_block,
1637                                                  sizeof(inode->i_block)) == 0) &&
1638                             fix_problem(ctx, PR_1_EXTENT_FEATURE, &pctx)) {
1639                                 ext2fs_set_feature_extents(sb);
1640                                 ext2fs_mark_super_dirty(fs);
1641                                 extent_fs = 1;
1642                         } else if (fix_problem(ctx, PR_1_EXTENTS_SET, &pctx)) {
1643                         clear_inode:
1644                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1645                                 if (ino == EXT2_BAD_INO)
1646                                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map,
1647                                                                  ino);
1648                                 /* skip FINISH_INODE_LOOP */
1649                                 continue;
1650                         }
1651                 }
1652
1653                 /*
1654                  * For big-endian machines:
1655                  * If the inode didn't have the extents flag set when it
1656                  * was read, then the i_blocks array was swapped.  To test
1657                  * as an extents header, we must swap it back first.
1658                  * IF we then set the extents flag, the entire i_block
1659                  * array must be un/re-swapped to make it proper extents data.
1660                  */
1661                 if (extent_fs && !(inode->i_flags & EXT4_EXTENTS_FL) &&
1662                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1663                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO)) &&
1664                     (LINUX_S_ISREG(inode->i_mode) ||
1665                      LINUX_S_ISDIR(inode->i_mode))) {
1666                         void *ehp;
1667 #ifdef WORDS_BIGENDIAN
1668                         __u32 tmp_block[EXT2_N_BLOCKS];
1669
1670                         for (i = 0; i < EXT2_N_BLOCKS; i++)
1671                                 tmp_block[i] = ext2fs_swab32(inode->i_block[i]);
1672                         ehp = tmp_block;
1673 #else
1674                         ehp = inode->i_block;
1675 #endif
1676                         if ((ext2fs_extent_header_verify(ehp,
1677                                          sizeof(inode->i_block)) == 0) &&
1678                             (fix_problem(ctx, PR_1_UNSET_EXTENT_FL, &pctx))) {
1679                                 inode->i_flags |= EXT4_EXTENTS_FL;
1680 #ifdef WORDS_BIGENDIAN
1681                                 memcpy(inode->i_block, tmp_block,
1682                                        sizeof(inode->i_block));
1683 #endif
1684                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1685                                 failed_csum = 0;
1686                         }
1687                 }
1688
1689                 if (ino == EXT2_BAD_INO) {
1690                         struct process_block_struct pb;
1691
1692                         if ((failed_csum || inode->i_mode || inode->i_uid ||
1693                              inode->i_gid || inode->i_links_count ||
1694                              (inode->i_flags & EXT4_INLINE_DATA_FL) ||
1695                              inode->i_file_acl) &&
1696                             fix_problem(ctx, PR_1_INVALID_BAD_INODE, &pctx)) {
1697                                 memset(inode, 0, sizeof(struct ext2_inode));
1698                                 e2fsck_write_inode(ctx, ino, inode,
1699                                                    "clear bad inode");
1700                                 failed_csum = 0;
1701                         }
1702
1703                         pctx.errcode = ext2fs_copy_bitmap(ctx->block_found_map,
1704                                                           &pb.fs_meta_blocks);
1705                         if (pctx.errcode) {
1706                                 pctx.num = 4;
1707                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1708                                 ctx->flags |= E2F_FLAG_ABORT;
1709                                 goto endit;
1710                         }
1711                         pb.ino = EXT2_BAD_INO;
1712                         pb.num_blocks = pb.last_block = 0;
1713                         pb.last_db_block = -1;
1714                         pb.num_illegal_blocks = 0;
1715                         pb.suppress = 0; pb.clear = 0; pb.is_dir = 0;
1716                         pb.is_reg = 0; pb.fragmented = 0; pb.bbcheck = 0;
1717                         pb.inode = inode;
1718                         pb.pctx = &pctx;
1719                         pb.ctx = ctx;
1720                         pctx.errcode = ext2fs_block_iterate3(fs, ino, 0,
1721                                      block_buf, process_bad_block, &pb);
1722                         ext2fs_free_block_bitmap(pb.fs_meta_blocks);
1723                         if (pctx.errcode) {
1724                                 fix_problem(ctx, PR_1_BLOCK_ITERATE, &pctx);
1725                                 ctx->flags |= E2F_FLAG_ABORT;
1726                                 goto endit;
1727                         }
1728                         if (pb.bbcheck)
1729                                 if (!fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK_PROMPT, &pctx)) {
1730                                 ctx->flags |= E2F_FLAG_ABORT;
1731                                 goto endit;
1732                         }
1733                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1734                         clear_problem_context(&pctx);
1735                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1736                         continue;
1737                 } else if (ino == EXT2_ROOT_INO) {
1738                         /*
1739                          * Make sure the root inode is a directory; if
1740                          * not, offer to clear it.  It will be
1741                          * regenerated in pass #3.
1742                          */
1743                         if (!LINUX_S_ISDIR(inode->i_mode)) {
1744                                 if (fix_problem(ctx, PR_1_ROOT_NO_DIR, &pctx))
1745                                         goto clear_inode;
1746                         }
1747                         /*
1748                          * If dtime is set, offer to clear it.  mke2fs
1749                          * version 0.2b created filesystems with the
1750                          * dtime field set for the root and lost+found
1751                          * directories.  We won't worry about
1752                          * /lost+found, since that can be regenerated
1753                          * easily.  But we will fix the root directory
1754                          * as a special case.
1755                          */
1756                         if (inode->i_dtime && inode->i_links_count) {
1757                                 if (fix_problem(ctx, PR_1_ROOT_DTIME, &pctx)) {
1758                                         inode->i_dtime = 0;
1759                                         e2fsck_write_inode(ctx, ino, inode,
1760                                                            "pass1");
1761                                         failed_csum = 0;
1762                                 }
1763                         }
1764                 } else if (ino == EXT2_JOURNAL_INO) {
1765                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1766                         if (fs->super->s_journal_inum == EXT2_JOURNAL_INO) {
1767                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1768                                     fix_problem(ctx, PR_1_JOURNAL_BAD_MODE,
1769                                                 &pctx)) {
1770                                         inode->i_mode = LINUX_S_IFREG;
1771                                         e2fsck_write_inode(ctx, ino, inode,
1772                                                            "pass1");
1773                                         failed_csum = 0;
1774                                 }
1775                                 check_blocks(ctx, &pctx, block_buf, NULL);
1776                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1777                                 continue;
1778                         }
1779                         if ((inode->i_links_count ||
1780                              inode->i_blocks || inode->i_block[0]) &&
1781                             fix_problem(ctx, PR_1_JOURNAL_INODE_NOT_CLEAR,
1782                                         &pctx)) {
1783                                 memset(inode, 0, inode_size);
1784                                 ext2fs_icount_store(ctx->inode_link_info,
1785                                                     ino, 0);
1786                                 e2fsck_write_inode_full(ctx, ino, inode,
1787                                                         inode_size, "pass1");
1788                                 failed_csum = 0;
1789                         }
1790                 } else if (quota_inum_is_reserved(fs, ino)) {
1791                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1792                         if (ext2fs_has_feature_quota(fs->super) &&
1793                             quota_inum_is_super(fs->super, ino)) {
1794                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1795                                     fix_problem(ctx, PR_1_QUOTA_BAD_MODE,
1796                                                         &pctx)) {
1797                                         inode->i_mode = LINUX_S_IFREG;
1798                                         e2fsck_write_inode(ctx, ino, inode,
1799                                                         "pass1");
1800                                         failed_csum = 0;
1801                                 }
1802                                 check_blocks(ctx, &pctx, block_buf, NULL);
1803                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1804                                 continue;
1805                         }
1806                         if ((inode->i_links_count ||
1807                              inode->i_blocks || inode->i_block[0]) &&
1808                             fix_problem(ctx, PR_1_QUOTA_INODE_NOT_CLEAR,
1809                                         &pctx)) {
1810                                 memset(inode, 0, inode_size);
1811                                 ext2fs_icount_store(ctx->inode_link_info,
1812                                                     ino, 0);
1813                                 e2fsck_write_inode_full(ctx, ino, inode,
1814                                                         inode_size, "pass1");
1815                                 failed_csum = 0;
1816                         }
1817                 } else if (ino < EXT2_FIRST_INODE(fs->super)) {
1818                         problem_t problem = 0;
1819
1820                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1821                         if (ino == EXT2_BOOT_LOADER_INO) {
1822                                 if (LINUX_S_ISDIR(inode->i_mode))
1823                                         problem = PR_1_RESERVED_BAD_MODE;
1824                         } else if (ino == EXT2_RESIZE_INO) {
1825                                 if (inode->i_mode &&
1826                                     !LINUX_S_ISREG(inode->i_mode))
1827                                         problem = PR_1_RESERVED_BAD_MODE;
1828                         } else {
1829                                 if (inode->i_mode != 0)
1830                                         problem = PR_1_RESERVED_BAD_MODE;
1831                         }
1832                         if (problem) {
1833                                 if (fix_problem(ctx, problem, &pctx)) {
1834                                         inode->i_mode = 0;
1835                                         e2fsck_write_inode(ctx, ino, inode,
1836                                                            "pass1");
1837                                         failed_csum = 0;
1838                                 }
1839                         }
1840                         check_blocks(ctx, &pctx, block_buf, NULL);
1841                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1842                         continue;
1843                 }
1844
1845                 if (!inode->i_links_count) {
1846                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1847                         continue;
1848                 }
1849                 /*
1850                  * n.b.  0.3c ext2fs code didn't clear i_links_count for
1851                  * deleted files.  Oops.
1852                  *
1853                  * Since all new ext2 implementations get this right,
1854                  * we now assume that the case of non-zero
1855                  * i_links_count and non-zero dtime means that we
1856                  * should keep the file, not delete it.
1857                  *
1858                  */
1859                 if (inode->i_dtime) {
1860                         if (fix_problem(ctx, PR_1_SET_DTIME, &pctx)) {
1861                                 inode->i_dtime = 0;
1862                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1863                                 failed_csum = 0;
1864                         }
1865                 }
1866
1867                 ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1868                 switch (fs->super->s_creator_os) {
1869                     case EXT2_OS_HURD:
1870                         frag = inode->osd2.hurd2.h_i_frag;
1871                         fsize = inode->osd2.hurd2.h_i_fsize;
1872                         break;
1873                     default:
1874                         frag = fsize = 0;
1875                 }
1876
1877                 if (inode->i_faddr || frag || fsize ||
1878                     (!ext2fs_has_feature_largedir(fs->super) &&
1879                     (LINUX_S_ISDIR(inode->i_mode) && inode->i_size_high)))
1880                         mark_inode_bad(ctx, ino);
1881                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1882                     !ext2fs_has_feature_64bit(fs->super) &&
1883                     inode->osd2.linux2.l_i_file_acl_high != 0)
1884                         mark_inode_bad(ctx, ino);
1885                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1886                     !ext2fs_has_feature_huge_file(fs->super) &&
1887                     (inode->osd2.linux2.l_i_blocks_hi != 0))
1888                         mark_inode_bad(ctx, ino);
1889                 if (inode->i_flags & EXT2_IMAGIC_FL) {
1890                         if (imagic_fs) {
1891                                 if (!ctx->inode_imagic_map)
1892                                         alloc_imagic_map(ctx);
1893                                 ext2fs_mark_inode_bitmap2(ctx->inode_imagic_map,
1894                                                          ino);
1895                         } else {
1896                                 if (fix_problem(ctx, PR_1_SET_IMAGIC, &pctx)) {
1897                                         inode->i_flags &= ~EXT2_IMAGIC_FL;
1898                                         e2fsck_write_inode(ctx, ino,
1899                                                            inode, "pass1");
1900                                         failed_csum = 0;
1901                                 }
1902                         }
1903                 }
1904
1905                 check_inode_extra_space(ctx, &pctx, &ea_ibody_quota);
1906                 check_is_really_dir(ctx, &pctx, block_buf);
1907
1908                 /*
1909                  * ext2fs_inode_has_valid_blocks2 does not actually look
1910                  * at i_block[] values, so not endian-sensitive here.
1911                  */
1912                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL) &&
1913                     LINUX_S_ISLNK(inode->i_mode) &&
1914                     !ext2fs_inode_has_valid_blocks2(fs, inode) &&
1915                     fix_problem(ctx, PR_1_FAST_SYMLINK_EXTENT_FL, &pctx)) {
1916                         inode->i_flags &= ~EXT4_EXTENTS_FL;
1917                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1918                         failed_csum = 0;
1919                 }
1920
1921                 if ((inode->i_flags & EXT4_ENCRYPT_FL) &&
1922                     add_encrypted_file(ctx, &pctx) < 0)
1923                         goto clear_inode;
1924
1925                 if (casefold_fs && inode->i_flags & EXT4_CASEFOLD_FL)
1926                         ext2fs_mark_inode_bitmap2(ctx->inode_casefold_map, ino);
1927
1928                 if (LINUX_S_ISDIR(inode->i_mode)) {
1929                         ext2fs_mark_inode_bitmap2(ctx->inode_dir_map, ino);
1930                         e2fsck_add_dir_info(ctx, ino, 0);
1931                         ctx->fs_directory_count++;
1932                         if (inode->i_flags & EXT4_CASEFOLD_FL)
1933                                 add_casefolded_dir(ctx, ino);
1934                 } else if (LINUX_S_ISREG (inode->i_mode)) {
1935                         ext2fs_mark_inode_bitmap2(ctx->inode_reg_map, ino);
1936                         ctx->fs_regular_count++;
1937                 } else if (LINUX_S_ISCHR (inode->i_mode) &&
1938                            e2fsck_pass1_check_device_inode(fs, inode)) {
1939                         check_extents_inlinedata(ctx, &pctx);
1940                         check_immutable(ctx, &pctx);
1941                         check_size(ctx, &pctx);
1942                         ctx->fs_chardev_count++;
1943                 } else if (LINUX_S_ISBLK (inode->i_mode) &&
1944                            e2fsck_pass1_check_device_inode(fs, inode)) {
1945                         check_extents_inlinedata(ctx, &pctx);
1946                         check_immutable(ctx, &pctx);
1947                         check_size(ctx, &pctx);
1948                         ctx->fs_blockdev_count++;
1949                 } else if (LINUX_S_ISLNK (inode->i_mode) &&
1950                            e2fsck_pass1_check_symlink(fs, ino, inode,
1951                                                       block_buf)) {
1952                         check_immutable(ctx, &pctx);
1953                         ctx->fs_symlinks_count++;
1954                         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
1955                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1956                                 continue;
1957                         } else if (ext2fs_is_fast_symlink(inode)) {
1958                                 ctx->fs_fast_symlinks_count++;
1959                                 check_blocks(ctx, &pctx, block_buf,
1960                                              &ea_ibody_quota);
1961                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1962                                 continue;
1963                         }
1964                 }
1965                 else if (LINUX_S_ISFIFO (inode->i_mode) &&
1966                          e2fsck_pass1_check_device_inode(fs, inode)) {
1967                         check_extents_inlinedata(ctx, &pctx);
1968                         check_immutable(ctx, &pctx);
1969                         check_size(ctx, &pctx);
1970                         ctx->fs_fifo_count++;
1971                 } else if ((LINUX_S_ISSOCK (inode->i_mode)) &&
1972                            e2fsck_pass1_check_device_inode(fs, inode)) {
1973                         check_extents_inlinedata(ctx, &pctx);
1974                         check_immutable(ctx, &pctx);
1975                         check_size(ctx, &pctx);
1976                         ctx->fs_sockets_count++;
1977                 } else
1978                         mark_inode_bad(ctx, ino);
1979                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1980                     !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
1981                         if (inode->i_block[EXT2_IND_BLOCK])
1982                                 ctx->fs_ind_count++;
1983                         if (inode->i_block[EXT2_DIND_BLOCK])
1984                                 ctx->fs_dind_count++;
1985                         if (inode->i_block[EXT2_TIND_BLOCK])
1986                                 ctx->fs_tind_count++;
1987                 }
1988                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1989                     !(inode->i_flags & EXT4_INLINE_DATA_FL) &&
1990                     (inode->i_block[EXT2_IND_BLOCK] ||
1991                      inode->i_block[EXT2_DIND_BLOCK] ||
1992                      inode->i_block[EXT2_TIND_BLOCK] ||
1993                      ext2fs_file_acl_block(fs, inode))) {
1994                         struct process_inode_block *itp;
1995
1996                         itp = &inodes_to_process[process_inode_count];
1997                         itp->ino = ino;
1998                         itp->ea_ibody_quota = ea_ibody_quota;
1999                         if (inode_size < sizeof(struct ext2_inode_large))
2000                                 memcpy(&itp->inode, inode, inode_size);
2001                         else
2002                                 memcpy(&itp->inode, inode, sizeof(itp->inode));
2003                         process_inode_count++;
2004                 } else
2005                         check_blocks(ctx, &pctx, block_buf, &ea_ibody_quota);
2006
2007                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2008
2009                 if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
2010                         goto endit;
2011
2012                 if (process_inode_count >= ctx->process_inode_size) {
2013                         process_inodes(ctx, block_buf, inodes_to_process,
2014                                        &process_inode_count);
2015
2016                         if (e2fsck_should_abort(ctx))
2017                                 goto endit;
2018                 }
2019         }
2020         process_inodes(ctx, block_buf, inodes_to_process,
2021                        &process_inode_count);
2022         ext2fs_close_inode_scan(scan);
2023         scan = NULL;
2024
2025         reserve_block_for_root_repair(ctx);
2026         reserve_block_for_lnf_repair(ctx);
2027
2028         /*
2029          * If any extended attribute blocks' reference counts need to
2030          * be adjusted, either up (ctx->refcount_extra), or down
2031          * (ctx->refcount), then fix them.
2032          */
2033         if (ctx->refcount) {
2034                 adjust_extattr_refcount(ctx, ctx->refcount, block_buf, -1);
2035                 ea_refcount_free(ctx->refcount);
2036                 ctx->refcount = 0;
2037         }
2038         if (ctx->refcount_extra) {
2039                 adjust_extattr_refcount(ctx, ctx->refcount_extra,
2040                                         block_buf, +1);
2041                 ea_refcount_free(ctx->refcount_extra);
2042                 ctx->refcount_extra = 0;
2043         }
2044
2045         if (ctx->ea_block_quota_blocks) {
2046                 ea_refcount_free(ctx->ea_block_quota_blocks);
2047                 ctx->ea_block_quota_blocks = 0;
2048         }
2049
2050         if (ctx->ea_block_quota_inodes) {
2051                 ea_refcount_free(ctx->ea_block_quota_inodes);
2052                 ctx->ea_block_quota_inodes = 0;
2053         }
2054
2055         if (ctx->invalid_bitmaps)
2056                 handle_fs_bad_blocks(ctx);
2057
2058         /* We don't need the block_ea_map any more */
2059         if (ctx->block_ea_map) {
2060                 ext2fs_free_block_bitmap(ctx->block_ea_map);
2061                 ctx->block_ea_map = 0;
2062         }
2063
2064         /* We don't need the encryption policy => ID map any more */
2065         destroy_encryption_policy_map(ctx);
2066
2067         if (ctx->flags & E2F_FLAG_RESIZE_INODE) {
2068                 clear_problem_context(&pctx);
2069                 pctx.errcode = ext2fs_create_resize_inode(fs);
2070                 if (pctx.errcode) {
2071                         if (!fix_problem(ctx, PR_1_RESIZE_INODE_CREATE,
2072                                          &pctx)) {
2073                                 ctx->flags |= E2F_FLAG_ABORT;
2074                                 goto endit;
2075                         }
2076                         pctx.errcode = 0;
2077                 }
2078                 if (!pctx.errcode) {
2079                         e2fsck_read_inode(ctx, EXT2_RESIZE_INO, inode,
2080                                           "recreate inode");
2081                         inode->i_mtime = ctx->now;
2082                         e2fsck_write_inode(ctx, EXT2_RESIZE_INO, inode,
2083                                            "recreate inode");
2084                 }
2085                 ctx->flags &= ~E2F_FLAG_RESIZE_INODE;
2086         }
2087
2088         if (ctx->flags & E2F_FLAG_RESTART) {
2089                 /*
2090                  * Only the master copy of the superblock and block
2091                  * group descriptors are going to be written during a
2092                  * restart, so set the superblock to be used to be the
2093                  * master superblock.
2094                  */
2095                 ctx->use_superblock = 0;
2096                 goto endit;
2097         }
2098
2099         if (ctx->large_dirs && !ext2fs_has_feature_largedir(ctx->fs->super)) {
2100                 ext2_filsys fs = ctx->fs;
2101
2102                 if (fix_problem(ctx, PR_2_FEATURE_LARGE_DIRS, &pctx)) {
2103                         ext2fs_set_feature_largedir(fs->super);
2104                         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
2105                         ext2fs_mark_super_dirty(fs);
2106                 }
2107                 if (fs->super->s_rev_level == EXT2_GOOD_OLD_REV &&
2108                     fix_problem(ctx, PR_1_FS_REV_LEVEL, &pctx)) {
2109                         ext2fs_update_dynamic_rev(fs);
2110                         ext2fs_mark_super_dirty(fs);
2111                 }
2112         }
2113
2114         if (ctx->block_dup_map) {
2115                 if (ctx->options & E2F_OPT_PREEN) {
2116                         clear_problem_context(&pctx);
2117                         fix_problem(ctx, PR_1_DUP_BLOCKS_PREENSTOP, &pctx);
2118                 }
2119                 e2fsck_pass1_dupblocks(ctx, block_buf);
2120         }
2121         ctx->flags |= E2F_FLAG_ALLOC_OK;
2122 endit:
2123         e2fsck_use_inode_shortcuts(ctx, 0);
2124         ext2fs_free_mem(&inodes_to_process);
2125         inodes_to_process = 0;
2126
2127         if (scan)
2128                 ext2fs_close_inode_scan(scan);
2129         if (block_buf)
2130                 ext2fs_free_mem(&block_buf);
2131         if (inode)
2132                 ext2fs_free_mem(&inode);
2133
2134         /*
2135          * The l+f inode may have been cleared, so zap it now and
2136          * later passes will recalculate it if necessary
2137          */
2138         ctx->lost_and_found = 0;
2139
2140         if ((ctx->flags & E2F_FLAG_SIGNAL_MASK) == 0)
2141                 print_resource_track(ctx, _("Pass 1"), &rtrack, ctx->fs->io);
2142         else
2143                 ctx->invalid_bitmaps++;
2144 }
2145
2146 static void init_ext2_max_sizes()
2147 {
2148         int     i;
2149         __u64   max_sizes;
2150
2151         /*
2152          * Init ext2_max_sizes which will be immutable and shared between
2153          * threads
2154          */
2155 #define EXT2_BPP(bits) (1ULL << ((bits) - 2))
2156
2157         for (i = EXT2_MIN_BLOCK_LOG_SIZE; i <= EXT2_MAX_BLOCK_LOG_SIZE; i++) {
2158                 max_sizes = EXT2_NDIR_BLOCKS + EXT2_BPP(i);
2159                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i);
2160                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i) * EXT2_BPP(i);
2161                 max_sizes = (max_sizes * (1UL << i));
2162                 ext2_max_sizes[i - EXT2_MIN_BLOCK_LOG_SIZE] = max_sizes;
2163         }
2164 #undef EXT2_BPP
2165 }
2166
2167 #ifdef HAVE_PTHREAD
2168 static errcode_t e2fsck_pass1_copy_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2169                                           ext2fs_generic_bitmap *dest)
2170 {
2171         errcode_t ret;
2172
2173         ret = ext2fs_copy_bitmap(*src, dest);
2174         if (ret)
2175                 return ret;
2176
2177         (*dest)->fs = fs;
2178
2179         return 0;
2180 }
2181
2182 static void e2fsck_pass1_free_bitmap(ext2fs_generic_bitmap *bitmap)
2183 {
2184         if (*bitmap) {
2185                 ext2fs_free_generic_bmap(*bitmap);
2186                 *bitmap = NULL;
2187         }
2188
2189 }
2190
2191 static errcode_t e2fsck_pass1_merge_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2192                                           ext2fs_generic_bitmap *dest)
2193 {
2194         errcode_t ret = 0;
2195
2196         if (*src) {
2197                 if (*dest == NULL) {
2198                         *dest = *src;
2199                         *src = NULL;
2200                 } else {
2201                         ret = ext2fs_merge_bitmap(*src, *dest, NULL, NULL);
2202                         if (ret)
2203                                 return ret;
2204                 }
2205                 (*dest)->fs = fs;
2206         }
2207
2208         return 0;
2209 }
2210
2211 static errcode_t e2fsck_pass1_copy_fs(ext2_filsys dest, e2fsck_t src_context,
2212                                       ext2_filsys src)
2213 {
2214         errcode_t       retval;
2215
2216         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2217         dest->inode_map = NULL;
2218         dest->block_map = NULL;
2219         dest->badblocks = NULL;
2220         if (dest->dblist)
2221                 dest->dblist->fs = dest;
2222         if (src->block_map) {
2223                 retval = e2fsck_pass1_copy_bitmap(dest, &src->block_map,
2224                                                   &dest->block_map);
2225                 if (retval)
2226                         return retval;
2227         }
2228         if (src->inode_map) {
2229                 retval = e2fsck_pass1_copy_bitmap(dest, &src->inode_map,
2230                                                   &dest->inode_map);
2231                 if (retval)
2232                         return retval;
2233         }
2234
2235         if (src->badblocks) {
2236                 retval = ext2fs_badblocks_copy(src->badblocks,
2237                                                &dest->badblocks);
2238                 if (retval)
2239                         return retval;
2240         }
2241
2242         /* disable it for now */
2243         src_context->openfs_flags &= ~EXT2_FLAG_EXCLUSIVE;
2244         retval = ext2fs_open_channel(dest, src_context->io_options,
2245                                      src_context->io_manager,
2246                                      src_context->openfs_flags,
2247                                      src->io->block_size);
2248         if (retval)
2249                 return retval;
2250
2251         /* Block size might not be default */
2252         io_channel_set_blksize(dest->io, src->io->block_size);
2253         ehandler_init(dest->io);
2254
2255         assert(dest->io->magic == src->io->magic);
2256         assert(dest->io->manager == src->io->manager);
2257         assert(strcmp(dest->io->name, src->io->name) == 0);
2258         assert(dest->io->block_size == src->io->block_size);
2259         assert(dest->io->read_error == src->io->read_error);
2260         assert(dest->io->write_error == src->io->write_error);
2261         assert(dest->io->refcount == src->io->refcount);
2262         assert(dest->io->flags == src->io->flags);
2263         assert(dest->io->app_data == dest);
2264         assert(src->io->app_data == src);
2265         assert(dest->io->align == src->io->align);
2266
2267         /* The data should be written to disk immediately */
2268         dest->io->flags |= CHANNEL_FLAGS_WRITETHROUGH;
2269         /* icache will be rebuilt if needed, so do not copy from @src */
2270         src->icache = NULL;
2271         return 0;
2272 }
2273
2274 static int e2fsck_pass1_merge_fs(ext2_filsys dest, ext2_filsys src)
2275 {
2276         struct ext2_inode_cache *icache = dest->icache;
2277         errcode_t retval = 0;
2278         io_channel dest_io;
2279         io_channel dest_image_io;
2280         ext2fs_inode_bitmap inode_map;
2281         ext2fs_block_bitmap block_map;
2282         ext2_badblocks_list badblocks;
2283         ext2_dblist dblist;
2284         int flags;
2285
2286         dest_io = dest->io;
2287         dest_image_io = dest->image_io;
2288         inode_map = dest->inode_map;
2289         block_map = dest->block_map;
2290         badblocks = dest->badblocks;
2291         dblist = dest->dblist;
2292         flags = dest->flags;
2293
2294         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2295         dest->io = dest_io;
2296         dest->image_io = dest_image_io;
2297         dest->icache = icache;
2298         dest->inode_map = inode_map;
2299         dest->block_map = block_map;
2300         dest->badblocks = badblocks;
2301         dest->dblist = dblist;
2302         if (dest->dblist)
2303                 dest->dblist->fs = dest;
2304         dest->flags = src->flags | flags;
2305         if (!(src->flags & EXT2_FLAG_VALID) || !(flags & EXT2_FLAG_VALID))
2306                 ext2fs_unmark_valid(dest);
2307
2308         if (src->icache) {
2309                 ext2fs_free_inode_cache(src->icache);
2310                 src->icache = NULL;
2311         }
2312
2313         retval = e2fsck_pass1_merge_bitmap(dest, &src->inode_map,
2314                                            &dest->inode_map);
2315         if (retval)
2316                 goto out;
2317
2318         retval = e2fsck_pass1_merge_bitmap(dest, &src->block_map,
2319                                           &dest->block_map);
2320         if (retval)
2321                 goto out;
2322
2323         if (src->dblist) {
2324                 if (dest->dblist) {
2325                         retval = ext2fs_merge_dblist(src->dblist,
2326                                                      dest->dblist);
2327                         if (retval)
2328                                 goto out;
2329                 } else {
2330                         dest->dblist = src->dblist;
2331                         dest->dblist->fs = dest;
2332                         src->dblist = NULL;
2333                 }
2334         }
2335
2336         if (src->badblocks) {
2337                 if (dest->badblocks == NULL)
2338                         retval = ext2fs_badblocks_copy(src->badblocks,
2339                                                        &dest->badblocks);
2340                 else
2341                         retval = ext2fs_badblocks_merge(src->badblocks,
2342                                                         dest->badblocks);
2343         }
2344 out:
2345         io_channel_close(src->io);
2346         if (src->inode_map)
2347                 ext2fs_free_generic_bmap(src->inode_map);
2348         if (src->block_map)
2349                 ext2fs_free_generic_bmap(src->block_map);
2350         if (src->badblocks)
2351                 ext2fs_badblocks_list_free(src->badblocks);
2352         if (src->dblist)
2353                 ext2fs_free_dblist(src->dblist);
2354
2355         return retval;
2356 }
2357
2358 static errcode_t e2fsck_pass1_thread_prepare(e2fsck_t global_ctx, e2fsck_t *thread_ctx,
2359                                              int thread_index, int num_threads)
2360 {
2361         errcode_t               retval;
2362         e2fsck_t                thread_context;
2363         ext2_filsys             thread_fs;
2364         ext2_filsys             global_fs = global_ctx->fs;
2365         struct e2fsck_thread    *tinfo;
2366         dgrp_t                  average_group;
2367
2368         assert(global_ctx->inode_used_map == NULL);
2369         assert(global_ctx->inode_dir_map == NULL);
2370         assert(global_ctx->inode_bb_map == NULL);
2371         assert(global_ctx->inode_imagic_map == NULL);
2372         assert(global_ctx->inode_reg_map == NULL);
2373         assert(global_ctx->inodes_to_rebuild == NULL);
2374
2375         assert(global_ctx->block_found_map == NULL);
2376         assert(global_ctx->block_dup_map == NULL);
2377         assert(global_ctx->block_ea_map == NULL);
2378         assert(global_ctx->block_metadata_map == NULL);
2379         assert(global_ctx->fs->dblist == NULL);
2380
2381         retval = ext2fs_get_mem(sizeof(struct e2fsck_struct), &thread_context);
2382         if (retval) {
2383                 com_err(global_ctx->program_name, retval, "while allocating memory");
2384                 return retval;
2385         }
2386         memcpy(thread_context, global_ctx, sizeof(struct e2fsck_struct));
2387         thread_context->global_ctx = global_ctx;
2388
2389         retval = ext2fs_get_mem(sizeof(struct struct_ext2_filsys), &thread_fs);
2390         if (retval) {
2391                 com_err(global_ctx->program_name, retval, "while allocating memory");
2392                 goto out_context;
2393         }
2394
2395         io_channel_flush_cleanup(global_fs->io);
2396         retval = e2fsck_pass1_copy_fs(thread_fs, global_ctx, global_fs);
2397         if (retval) {
2398                 com_err(global_ctx->program_name, retval, "while copying fs");
2399                 goto out_fs;
2400         }
2401         thread_fs->priv_data = thread_context;
2402
2403         thread_context->thread_info.et_thread_index = thread_index;
2404         set_up_logging(thread_context);
2405
2406         /*
2407          * Distribute work to multiple threads:
2408          * Each thread work on fs->group_desc_count / nthread groups.
2409          */
2410         tinfo = &thread_context->thread_info;
2411         average_group = thread_fs->group_desc_count / num_threads;
2412         if (average_group == 0)
2413                 average_group = 1;
2414         tinfo->et_group_start = average_group * thread_index;
2415         if (thread_index == num_threads - 1)
2416                 tinfo->et_group_end = thread_fs->group_desc_count;
2417         else
2418                 tinfo->et_group_end = average_group * (thread_index + 1);
2419         tinfo->et_group_next = tinfo->et_group_start;
2420         tinfo->et_inode_number = 0;
2421         tinfo->et_log_buf[0] = '\0';
2422         tinfo->et_log_length = 0;
2423         if (thread_context->options & E2F_OPT_MULTITHREAD)
2424                 log_out(thread_context, _("Scan group range [%d, %d)\n"),
2425                         tinfo->et_group_start, tinfo->et_group_end);
2426         thread_context->fs = thread_fs;
2427         *thread_ctx = thread_context;
2428         return 0;
2429 out_fs:
2430         ext2fs_free_mem(&thread_fs);
2431 out_context:
2432         ext2fs_free_mem(&thread_context);
2433         return retval;
2434 }
2435
2436 static void e2fsck_pass1_merge_dir_info(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2437 {
2438         if (thread_ctx->dir_info == NULL)
2439                 return;
2440
2441         if (global_ctx->dir_info == NULL) {
2442                 global_ctx->dir_info = thread_ctx->dir_info;
2443                 thread_ctx->dir_info = NULL;
2444                 return;
2445         }
2446
2447         e2fsck_merge_dir_info(global_ctx, thread_ctx->dir_info,
2448                               global_ctx->dir_info);
2449 }
2450
2451 static void e2fsck_pass1_merge_dx_dir(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2452 {
2453         if (thread_ctx->dx_dir_info == NULL)
2454                 return;
2455
2456         if (global_ctx->dx_dir_info == NULL) {
2457                 global_ctx->dx_dir_info = thread_ctx->dx_dir_info;
2458                 global_ctx->dx_dir_info_size = thread_ctx->dx_dir_info_size;
2459                 global_ctx->dx_dir_info_count = thread_ctx->dx_dir_info_count;
2460                 thread_ctx->dx_dir_info = NULL;
2461                 return;
2462         }
2463
2464         e2fsck_merge_dx_dir(global_ctx, thread_ctx);
2465 }
2466
2467 static inline errcode_t
2468 e2fsck_pass1_merge_icount(ext2_icount_t *dest_icount,
2469                           ext2_icount_t *src_icount)
2470 {
2471         if (*src_icount) {
2472                 if (*dest_icount == NULL) {
2473                         *dest_icount = *src_icount;
2474                         *src_icount = NULL;
2475                 } else {
2476                         errcode_t ret;
2477
2478                         ret = ext2fs_icount_merge(*src_icount,
2479                                                   *dest_icount);
2480                         if (ret)
2481                                 return ret;
2482                 }
2483         }
2484
2485         return 0;
2486 }
2487
2488 static errcode_t e2fsck_pass1_merge_icounts(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2489 {
2490         errcode_t ret;
2491
2492         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_count,
2493                                         &thread_ctx->inode_count);
2494         if (ret)
2495                 return ret;
2496         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_link_info,
2497                                         &thread_ctx->inode_link_info);
2498
2499         return ret;
2500 }
2501
2502 static errcode_t e2fsck_pass1_merge_dirs_to_hash(e2fsck_t global_ctx,
2503                                                  e2fsck_t thread_ctx)
2504 {
2505         errcode_t retval = 0;
2506
2507         if (!thread_ctx->dirs_to_hash)
2508                 return 0;
2509
2510         if (!global_ctx->dirs_to_hash)
2511                 retval = ext2fs_badblocks_copy(thread_ctx->dirs_to_hash,
2512                                                &global_ctx->dirs_to_hash);
2513         else
2514                 retval = ext2fs_badblocks_merge(thread_ctx->dirs_to_hash,
2515                                                 global_ctx->dirs_to_hash);
2516
2517         return retval;
2518 }
2519
2520
2521 static int e2fsck_pass1_thread_join_one(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2522 {
2523         errcode_t        retval;
2524         int              flags = global_ctx->flags;
2525         ext2_filsys      thread_fs = thread_ctx->fs;
2526         ext2_filsys      global_fs = global_ctx->fs;
2527         FILE            *global_logf = global_ctx->logf;
2528         FILE            *global_problem_logf = global_ctx->problem_logf;
2529         ext2fs_inode_bitmap inode_bad_map = global_ctx->inode_bad_map;
2530         struct dir_info_db *dir_info = global_ctx->dir_info;
2531         struct dx_dir_info *dx_dir_info = global_ctx->dx_dir_info;
2532         ext2fs_inode_bitmap inode_used_map = global_ctx->inode_used_map;
2533         ext2fs_inode_bitmap inode_dir_map = global_ctx->inode_dir_map;
2534         ext2fs_inode_bitmap inode_bb_map = global_ctx->inode_bb_map;
2535         ext2fs_inode_bitmap inode_imagic_map = global_ctx->inode_imagic_map;
2536         ext2fs_inode_bitmap inode_reg_map = global_ctx->inode_reg_map;
2537         ext2fs_block_bitmap block_found_map = global_ctx->block_found_map;
2538         ext2fs_block_bitmap block_dup_map = global_ctx->block_dup_map;
2539         ext2fs_block_bitmap block_ea_map = global_ctx->block_ea_map;
2540         ext2fs_block_bitmap block_metadata_map = global_ctx->block_metadata_map;
2541         ext2fs_block_bitmap inodes_to_rebuild = global_ctx->inodes_to_rebuild;
2542         ext2_icount_t inode_count = global_ctx->inode_count;
2543         ext2_icount_t inode_link_info = global_ctx->inode_link_info;
2544         __u32 fs_directory_count = global_ctx->fs_directory_count;
2545         __u32 fs_regular_count = global_ctx->fs_regular_count;
2546         __u32 fs_blockdev_count = global_ctx->fs_blockdev_count;
2547         __u32 fs_chardev_count = global_ctx->fs_chardev_count;
2548         __u32 fs_links_count = global_ctx->fs_links_count;
2549         __u32 fs_symlinks_count = global_ctx->fs_symlinks_count;
2550         __u32 fs_fast_symlinks_count = global_ctx->fs_fast_symlinks_count;
2551         __u32 fs_fifo_count = global_ctx->fs_fifo_count;
2552         __u32 fs_total_count = global_ctx->fs_total_count;
2553         __u32 fs_badblocks_count = global_ctx->fs_badblocks_count;
2554         __u32 fs_sockets_count = global_ctx->fs_sockets_count;
2555         __u32 fs_ind_count = global_ctx->fs_ind_count;
2556         __u32 fs_dind_count = global_ctx->fs_dind_count;
2557         __u32 fs_tind_count = global_ctx->fs_tind_count;
2558         __u32 fs_fragmented = global_ctx->fs_fragmented;
2559         __u32 fs_fragmented_dir = global_ctx->fs_fragmented_dir;
2560         __u32 large_files = global_ctx->large_files;
2561         ext2_ino_t dx_dir_info_size = global_ctx->dx_dir_info_size;
2562         ext2_ino_t dx_dir_info_count = global_ctx->dx_dir_info_count;
2563         ext2_u32_list dirs_to_hash = global_ctx->dirs_to_hash;
2564
2565 #ifdef HAVE_SETJMP_H
2566         jmp_buf          old_jmp;
2567
2568         memcpy(old_jmp, global_ctx->abort_loc, sizeof(jmp_buf));
2569 #endif
2570         memcpy(global_ctx, thread_ctx, sizeof(struct e2fsck_struct));
2571 #ifdef HAVE_SETJMP_H
2572         memcpy(global_ctx->abort_loc, old_jmp, sizeof(jmp_buf));
2573 #endif
2574
2575         global_ctx->inode_used_map = inode_used_map;
2576         global_ctx->inode_bad_map = inode_bad_map;
2577         global_ctx->inode_dir_map = inode_dir_map;
2578         global_ctx->inode_bb_map = inode_bb_map;
2579         global_ctx->inode_imagic_map = inode_imagic_map;
2580         global_ctx->inodes_to_rebuild = inodes_to_rebuild;
2581         global_ctx->inode_reg_map = inode_reg_map;
2582         global_ctx->block_found_map = block_found_map;
2583         global_ctx->block_dup_map = block_dup_map;
2584         global_ctx->block_ea_map = block_ea_map;
2585         global_ctx->block_metadata_map = block_metadata_map;
2586         global_ctx->dir_info = dir_info;
2587         e2fsck_pass1_merge_dir_info(global_ctx, thread_ctx);
2588         global_ctx->dx_dir_info = dx_dir_info;
2589         global_ctx->dx_dir_info_count = dx_dir_info_count;
2590         global_ctx->dx_dir_info_size = dx_dir_info_size;
2591         e2fsck_pass1_merge_dx_dir(global_ctx, thread_ctx);
2592         global_ctx->inode_count = inode_count;
2593         global_ctx->inode_link_info = inode_link_info;
2594         global_ctx->fs_directory_count += fs_directory_count;
2595         global_ctx->fs_regular_count += fs_regular_count;
2596         global_ctx->fs_blockdev_count += fs_blockdev_count;
2597         global_ctx->fs_chardev_count += fs_chardev_count;
2598         global_ctx->fs_links_count += fs_links_count;
2599         global_ctx->fs_symlinks_count += fs_symlinks_count;
2600         global_ctx->fs_fast_symlinks_count += fs_fast_symlinks_count;
2601         global_ctx->fs_fifo_count += fs_fifo_count;
2602         global_ctx->fs_total_count += fs_total_count;
2603         global_ctx->fs_badblocks_count += fs_badblocks_count;
2604         global_ctx->fs_sockets_count += fs_sockets_count;
2605         global_ctx->fs_ind_count += fs_ind_count;
2606         global_ctx->fs_dind_count += fs_dind_count;
2607         global_ctx->fs_tind_count += fs_tind_count;
2608         global_ctx->fs_fragmented += fs_fragmented;
2609         global_ctx->fs_fragmented_dir += fs_fragmented_dir;
2610         global_ctx->large_files += large_files;
2611
2612         global_ctx->flags |= flags;
2613
2614         retval = e2fsck_pass1_merge_fs(global_fs, thread_fs);
2615         if (retval) {
2616                 com_err(global_ctx->program_name, 0, _("while merging fs\n"));
2617                 return retval;
2618         }
2619         global_fs->priv_data = global_ctx;
2620         global_ctx->fs = global_fs;
2621         global_ctx->logf = global_logf;
2622         global_ctx->problem_logf = global_problem_logf;
2623         global_ctx->global_ctx = NULL;
2624         retval = e2fsck_pass1_merge_icounts(global_ctx, thread_ctx);
2625         if (retval) {
2626                 com_err(global_ctx->program_name, 0,
2627                         _("while merging icounts\n"));
2628                 return retval;
2629         }
2630
2631         global_ctx->dirs_to_hash = dirs_to_hash;
2632         retval = e2fsck_pass1_merge_dirs_to_hash(global_ctx, thread_ctx);
2633         if (retval) {
2634                 com_err(global_ctx->program_name, 0,
2635                         _("while merging dirs to hash\n"));
2636                 return retval;
2637         }
2638
2639         retval = e2fsck_pass1_merge_bitmap(global_fs,
2640                                 &thread_ctx->inode_used_map,
2641                                 &global_ctx->inode_used_map);
2642         if (retval)
2643                 return retval;
2644
2645         retval = e2fsck_pass1_merge_bitmap(global_fs,
2646                                 &thread_ctx->inode_bad_map,
2647                                 &global_ctx->inode_bad_map);
2648         if (retval)
2649                 return retval;
2650         retval = e2fsck_pass1_merge_bitmap(global_fs,
2651                                         &thread_ctx->inode_dir_map,
2652                                         &global_ctx->inode_dir_map);
2653         if (retval)
2654                 return retval;
2655         retval = e2fsck_pass1_merge_bitmap(global_fs,
2656                                 &thread_ctx->inode_bb_map,
2657                                 &global_ctx->inode_bb_map);
2658         if (retval)
2659                 return retval;
2660         retval = e2fsck_pass1_merge_bitmap(global_fs,
2661                                 &thread_ctx->inode_imagic_map,
2662                                 &global_ctx->inode_imagic_map);
2663         if (retval)
2664                 return retval;
2665         retval = e2fsck_pass1_merge_bitmap(global_fs,
2666                                 &thread_ctx->inode_reg_map,
2667                                 &global_ctx->inode_reg_map);
2668         if (retval)
2669                 return retval;
2670         retval = e2fsck_pass1_merge_bitmap(global_fs,
2671                                 &thread_ctx->inodes_to_rebuild,
2672                                 &global_ctx->inodes_to_rebuild);
2673         if (retval)
2674                 return retval;
2675         retval = e2fsck_pass1_merge_bitmap(global_fs,
2676                                 &thread_ctx->block_found_map,
2677                                 &global_ctx->block_found_map);
2678         if (retval)
2679                 return retval;
2680         retval = e2fsck_pass1_merge_bitmap(global_fs,
2681                                 &thread_ctx->block_dup_map,
2682                                 &global_ctx->block_dup_map);
2683         if (retval)
2684                 return retval;
2685         retval = e2fsck_pass1_merge_bitmap(global_fs,
2686                                 &thread_ctx->block_ea_map,
2687                                 &global_ctx->block_ea_map);
2688         if (retval)
2689                 return retval;
2690         retval = e2fsck_pass1_merge_bitmap(global_fs,
2691                                 &thread_ctx->block_metadata_map,
2692                                 &global_ctx->block_metadata_map);
2693         if (retval)
2694                 return retval;
2695
2696         return 0;
2697 }
2698
2699 static int e2fsck_pass1_thread_join(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2700 {
2701         errcode_t       retval;
2702
2703         retval = e2fsck_pass1_thread_join_one(global_ctx, thread_ctx);
2704         ext2fs_free_mem(&thread_ctx->fs);
2705         if (thread_ctx->logf)
2706                 fclose(thread_ctx->logf);
2707         if (thread_ctx->problem_logf) {
2708                 fputs("</problem_log>\n", thread_ctx->problem_logf);
2709                 fclose(thread_ctx->problem_logf);
2710         }
2711         e2fsck_pass1_free_bitmap(&thread_ctx->inode_used_map);
2712         e2fsck_pass1_free_bitmap(&thread_ctx->inode_bad_map);
2713         e2fsck_pass1_free_bitmap(&thread_ctx->inode_dir_map);
2714         e2fsck_pass1_free_bitmap(&thread_ctx->inode_bb_map);
2715         e2fsck_pass1_free_bitmap(&thread_ctx->inode_imagic_map);
2716         e2fsck_pass1_free_bitmap(&thread_ctx->inode_reg_map);
2717         e2fsck_pass1_free_bitmap(&thread_ctx->inodes_to_rebuild);
2718         e2fsck_pass1_free_bitmap(&thread_ctx->block_found_map);
2719         e2fsck_pass1_free_bitmap(&thread_ctx->block_dup_map);
2720         e2fsck_pass1_free_bitmap(&thread_ctx->block_ea_map);
2721         e2fsck_pass1_free_bitmap(&thread_ctx->block_metadata_map);
2722         e2fsck_free_dir_info(thread_ctx);
2723         ext2fs_free_icount(thread_ctx->inode_count);
2724         ext2fs_free_icount(thread_ctx->inode_link_info);
2725         if (thread_ctx->dirs_to_hash)
2726                 ext2fs_badblocks_list_free(thread_ctx->dirs_to_hash);
2727         ext2fs_free_mem(&thread_ctx);
2728
2729         return retval;
2730 }
2731
2732 static int e2fsck_pass1_threads_join(struct e2fsck_thread_info *infos,
2733                                       int num_threads, e2fsck_t global_ctx)
2734 {
2735         errcode_t                        rc;
2736         errcode_t                        ret = 0;
2737         int                              i;
2738         struct e2fsck_thread_info       *pinfo;
2739
2740         for (i = 0; i < num_threads; i++) {
2741                 pinfo = &infos[i];
2742
2743                 if (!pinfo->eti_started)
2744                         continue;
2745
2746                 rc = pthread_join(pinfo->eti_thread_id, NULL);
2747                 if (rc) {
2748                         com_err(global_ctx->program_name, rc,
2749                                 _("while joining thread\n"));
2750                         if (ret == 0)
2751                                 ret = rc;
2752                 }
2753                 rc = e2fsck_pass1_thread_join(global_ctx, infos[i].eti_thread_ctx);
2754                 if (rc) {
2755                         com_err(global_ctx->program_name, rc,
2756                                 _("while joining pass1 thread\n"));
2757                         if (ret == 0)
2758                                 ret = rc;
2759                 }
2760         }
2761         free(infos);
2762
2763         return ret;
2764 }
2765
2766 static void *e2fsck_pass1_thread(void *arg)
2767 {
2768         struct e2fsck_thread_info       *info = arg;
2769         e2fsck_t                         thread_ctx = info->eti_thread_ctx;
2770 #ifdef DEBUG_THREADS
2771         struct e2fsck_thread_debug      *thread_debug = info->eti_debug;
2772 #endif
2773
2774 #ifdef DEBUG_THREADS
2775         pthread_mutex_lock(&thread_debug->etd_mutex);
2776         while (info->eti_thread_index > thread_debug->etd_finished_threads) {
2777                 pthread_cond_wait(&thread_debug->etd_cond,
2778                                   &thread_debug->etd_mutex);
2779         }
2780         pthread_mutex_unlock(&thread_debug->etd_mutex);
2781 #endif
2782
2783 #ifdef HAVE_SETJMP_H
2784         /*
2785          * When fatal_error() happens, jump to here. The thread
2786          * context's flags will be saved, but its abort_loc will
2787          * be overwritten by original jump buffer for the later
2788          * tests.
2789          */
2790         if (setjmp(thread_ctx->abort_loc)) {
2791                 thread_ctx->flags &= ~E2F_FLAG_SETJMP_OK;
2792                 goto out;
2793         }
2794         thread_ctx->flags |= E2F_FLAG_SETJMP_OK;
2795 #endif
2796
2797         e2fsck_pass1_run(thread_ctx);
2798
2799 out:
2800         if (thread_ctx->options & E2F_OPT_MULTITHREAD)
2801                 log_out(thread_ctx,
2802                         _("Scanned group range [%lu, %lu), inodes %lu\n"),
2803                         thread_ctx->thread_info.et_group_start,
2804                         thread_ctx->thread_info.et_group_end,
2805                         thread_ctx->thread_info.et_inode_number);
2806
2807 #ifdef DEBUG_THREADS
2808         pthread_mutex_lock(&thread_debug->etd_mutex);
2809         thread_debug->etd_finished_threads++;
2810         pthread_cond_broadcast(&thread_debug->etd_cond);
2811         pthread_mutex_unlock(&thread_debug->etd_mutex);
2812 #endif
2813
2814         return NULL;
2815 }
2816
2817 static int e2fsck_pass1_threads_start(struct e2fsck_thread_info **pinfo,
2818                                       int num_threads, e2fsck_t global_ctx)
2819 {
2820         struct e2fsck_thread_info       *infos;
2821         pthread_attr_t                   attr;
2822         errcode_t                        retval;
2823         errcode_t                        ret;
2824         struct e2fsck_thread_info       *tmp_pinfo;
2825         int                              i;
2826         e2fsck_t                         thread_ctx;
2827 #ifdef DEBUG_THREADS
2828         struct e2fsck_thread_debug       thread_debug =
2829                 {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER, 0};
2830
2831         thread_debug.etd_finished_threads = 0;
2832 #endif
2833
2834         retval = pthread_attr_init(&attr);
2835         if (retval) {
2836                 com_err(global_ctx->program_name, retval,
2837                         _("while setting pthread attribute\n"));
2838                 return retval;
2839         }
2840
2841         infos = calloc(num_threads, sizeof(struct e2fsck_thread_info));
2842         if (infos == NULL) {
2843                 retval = -ENOMEM;
2844                 com_err(global_ctx->program_name, retval,
2845                         _("while allocating memory for threads\n"));
2846                 pthread_attr_destroy(&attr);
2847                 return retval;
2848         }
2849
2850         for (i = 0; i < num_threads; i++) {
2851                 tmp_pinfo = &infos[i];
2852                 tmp_pinfo->eti_thread_index = i;
2853 #ifdef DEBUG_THREADS
2854                 tmp_pinfo->eti_debug = &thread_debug;
2855 #endif
2856                 retval = e2fsck_pass1_thread_prepare(global_ctx, &thread_ctx,
2857                                                      i, num_threads);
2858                 if (retval) {
2859                         com_err(global_ctx->program_name, retval,
2860                                 _("while preparing pass1 thread\n"));
2861                         break;
2862                 }
2863                 tmp_pinfo->eti_thread_ctx = thread_ctx;
2864
2865                 retval = pthread_create(&tmp_pinfo->eti_thread_id, &attr,
2866                                         &e2fsck_pass1_thread, tmp_pinfo);
2867                 if (retval) {
2868                         com_err(global_ctx->program_name, retval,
2869                                 _("while creating thread\n"));
2870                         e2fsck_pass1_thread_join(global_ctx, thread_ctx);
2871                         break;
2872                 }
2873
2874                 tmp_pinfo->eti_started = 1;
2875         }
2876
2877         /* destroy the thread attribute object, since it is no longer needed */
2878         ret = pthread_attr_destroy(&attr);
2879         if (ret) {
2880                 com_err(global_ctx->program_name, ret,
2881                         _("while destroying thread attribute\n"));
2882                 if (retval == 0)
2883                         retval = ret;
2884         }
2885
2886         if (retval) {
2887                 e2fsck_pass1_threads_join(infos, num_threads, global_ctx);
2888                 return retval;
2889         }
2890         *pinfo = infos;
2891         return 0;
2892 }
2893
2894 static void e2fsck_pass1_multithread(e2fsck_t global_ctx)
2895 {
2896         struct e2fsck_thread_info       *infos = NULL;
2897         int                              num_threads = 1;
2898         errcode_t                        retval;
2899
2900         retval = e2fsck_pass1_threads_start(&infos, num_threads, global_ctx);
2901         if (retval) {
2902                 com_err(global_ctx->program_name, retval,
2903                         _("while starting pass1 threads\n"));
2904                 goto out_abort;
2905         }
2906
2907         retval = e2fsck_pass1_threads_join(infos, num_threads, global_ctx);
2908         if (retval) {
2909                 com_err(global_ctx->program_name, retval,
2910                         _("while joining pass1 threads\n"));
2911                 goto out_abort;
2912         }
2913         return;
2914 out_abort:
2915         global_ctx->flags |= E2F_FLAG_ABORT;
2916         return;
2917 }
2918 #endif
2919
2920 /* TODO: tdb needs to be handled properly for multiple threads*/
2921 static int multiple_threads_supported(e2fsck_t ctx)
2922 {
2923 #ifdef  CONFIG_TDB
2924         unsigned int            threshold;
2925         ext2_ino_t              num_dirs;
2926         errcode_t               retval;
2927         char                    *tdb_dir;
2928         int                     enable;
2929
2930         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
2931                            &tdb_dir);
2932         profile_get_uint(ctx->profile, "scratch_files",
2933                          "numdirs_threshold", 0, 0, &threshold);
2934         profile_get_boolean(ctx->profile, "scratch_files",
2935                             "icount", 0, 1, &enable);
2936
2937         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
2938         if (retval)
2939                 num_dirs = 1024;        /* Guess */
2940
2941         /* tdb is unsupported now */
2942         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
2943             (!threshold || num_dirs > threshold))
2944                 return 0;
2945  #endif
2946         return 1;
2947 }
2948
2949 void e2fsck_pass1(e2fsck_t ctx)
2950 {
2951
2952         init_ext2_max_sizes();
2953 #ifdef HAVE_PTHREAD
2954         if (multiple_threads_supported(ctx)) {
2955                 e2fsck_pass1_multithread(ctx);
2956                 return;
2957         }
2958         fprintf(stderr, "Fall through single thread for pass1 "
2959                         "because tdb could not handle properly\n");
2960 #endif
2961         e2fsck_pass1_run(ctx);
2962 }
2963
2964 #undef FINISH_INODE_LOOP
2965
2966 /*
2967  * When the inode_scan routines call this callback at the end of the
2968  * glock group, call process_inodes.
2969  */
2970 static errcode_t scan_callback(ext2_filsys fs,
2971                                ext2_inode_scan scan EXT2FS_ATTR((unused)),
2972                                dgrp_t group, void * priv_data)
2973 {
2974         struct scan_callback_struct *scan_struct;
2975         e2fsck_t ctx;
2976         struct e2fsck_thread *tinfo;
2977
2978         scan_struct = (struct scan_callback_struct *) priv_data;
2979         ctx = scan_struct->ctx;
2980
2981         process_inodes((e2fsck_t) fs->priv_data, scan_struct->block_buf,
2982                        scan_struct->inodes_to_process,
2983                        scan_struct->process_inode_count);
2984
2985         if (ctx->progress)
2986                 if ((ctx->progress)(ctx, 1, group+1,
2987                                     ctx->fs->group_desc_count))
2988                         return EXT2_ET_CANCEL_REQUESTED;
2989
2990 #ifdef HAVE_PTHREAD
2991         if (ctx->global_ctx) {
2992                 tinfo = &ctx->thread_info;
2993                 tinfo->et_group_next++;
2994                 if (ctx->options & E2F_OPT_DEBUG &&
2995                     ctx->options & E2F_OPT_MULTITHREAD)
2996                         log_out(ctx, _("group %d finished\n"),
2997                                 tinfo->et_group_next);
2998                 if (tinfo->et_group_next >= tinfo->et_group_end)
2999                         return EXT2_ET_SCAN_FINISHED;
3000         }
3001 #endif
3002
3003         return 0;
3004 }
3005
3006 /*
3007  * Process the inodes in the "inodes to process" list.
3008  */
3009 static void process_inodes(e2fsck_t ctx, char *block_buf,
3010                            struct process_inode_block *inodes_to_process,
3011                            int *process_inode_count)
3012 {
3013         int                     i;
3014         struct ext2_inode       *old_stashed_inode;
3015         ext2_ino_t              old_stashed_ino;
3016         const char              *old_operation;
3017         char                    buf[80];
3018         struct problem_context  pctx;
3019
3020 #if 0
3021         printf("begin process_inodes: ");
3022 #endif
3023         if (*process_inode_count == 0)
3024                 return;
3025         old_operation = ehandler_operation(0);
3026         old_stashed_inode = ctx->stashed_inode;
3027         old_stashed_ino = ctx->stashed_ino;
3028         qsort(inodes_to_process, *process_inode_count,
3029                       sizeof(struct process_inode_block), process_inode_cmp);
3030         clear_problem_context(&pctx);
3031         for (i=0; i < *process_inode_count; i++) {
3032                 pctx.inode = ctx->stashed_inode =
3033                         (struct ext2_inode *) &inodes_to_process[i].inode;
3034                 pctx.ino = ctx->stashed_ino = inodes_to_process[i].ino;
3035
3036 #if 0
3037                 printf("%u ", pctx.ino);
3038 #endif
3039                 sprintf(buf, _("reading indirect blocks of inode %u"),
3040                         pctx.ino);
3041                 ehandler_operation(buf);
3042                 check_blocks(ctx, &pctx, block_buf,
3043                              &inodes_to_process[i].ea_ibody_quota);
3044                 if (e2fsck_should_abort(ctx))
3045                         break;
3046         }
3047         ctx->stashed_inode = old_stashed_inode;
3048         ctx->stashed_ino = old_stashed_ino;
3049         *process_inode_count = 0;
3050 #if 0
3051         printf("end process inodes\n");
3052 #endif
3053         ehandler_operation(old_operation);
3054 }
3055
3056 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b)
3057 {
3058         const struct process_inode_block *ib_a =
3059                 (const struct process_inode_block *) a;
3060         const struct process_inode_block *ib_b =
3061                 (const struct process_inode_block *) b;
3062         int     ret;
3063
3064         ret = (ib_a->inode.i_block[EXT2_IND_BLOCK] -
3065                ib_b->inode.i_block[EXT2_IND_BLOCK]);
3066         if (ret == 0)
3067                 /*
3068                  * We only call process_inodes() for non-extent
3069                  * inodes, so it's OK to pass NULL to
3070                  * ext2fs_file_acl_block() here.
3071                  */
3072                 ret = ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_a->inode)) -
3073                         ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_b->inode));
3074         if (ret == 0)
3075                 ret = ib_a->ino - ib_b->ino;
3076         return ret;
3077 }
3078
3079 /*
3080  * Mark an inode as being bad in some what
3081  */
3082 static void mark_inode_bad(e2fsck_t ctx, ino_t ino)
3083 {
3084         struct          problem_context pctx;
3085
3086         if (!ctx->inode_bad_map) {
3087                 clear_problem_context(&pctx);
3088
3089                 pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3090                                 _("bad inode map"), EXT2FS_BMAP64_RBTREE,
3091                                 "inode_bad_map", &ctx->inode_bad_map);
3092                 if (pctx.errcode) {
3093                         pctx.num = 3;
3094                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3095                         /* Should never get here */
3096                         ctx->flags |= E2F_FLAG_ABORT;
3097                         return;
3098                 }
3099         }
3100         ext2fs_mark_inode_bitmap2(ctx->inode_bad_map, ino);
3101 }
3102
3103 static void add_casefolded_dir(e2fsck_t ctx, ino_t ino)
3104 {
3105         struct          problem_context pctx;
3106
3107         if (!ctx->casefolded_dirs) {
3108                 pctx.errcode = ext2fs_u32_list_create(&ctx->casefolded_dirs, 0);
3109                 if (pctx.errcode)
3110                         goto error;
3111         }
3112         pctx.errcode = ext2fs_u32_list_add(ctx->casefolded_dirs, ino);
3113         if (pctx.errcode == 0)
3114                 return;
3115 error:
3116         fix_problem(ctx, PR_1_ALLOCATE_CASEFOLDED_DIRLIST, &pctx);
3117         /* Should never get here */
3118         ctx->flags |= E2F_FLAG_ABORT;
3119 }
3120
3121 /*
3122  * This procedure will allocate the inode "bb" (badblock) map table
3123  */
3124 static void alloc_bb_map(e2fsck_t ctx)
3125 {
3126         struct          problem_context pctx;
3127
3128         clear_problem_context(&pctx);
3129         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3130                         _("inode in bad block map"), EXT2FS_BMAP64_RBTREE,
3131                         "inode_bb_map", &ctx->inode_bb_map);
3132         if (pctx.errcode) {
3133                 pctx.num = 4;
3134                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3135                 /* Should never get here */
3136                 ctx->flags |= E2F_FLAG_ABORT;
3137                 return;
3138         }
3139 }
3140
3141 /*
3142  * This procedure will allocate the inode imagic table
3143  */
3144 static void alloc_imagic_map(e2fsck_t ctx)
3145 {
3146         struct          problem_context pctx;
3147
3148         clear_problem_context(&pctx);
3149         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3150                         _("imagic inode map"), EXT2FS_BMAP64_RBTREE,
3151                         "inode_imagic_map", &ctx->inode_imagic_map);
3152         if (pctx.errcode) {
3153                 pctx.num = 5;
3154                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3155                 /* Should never get here */
3156                 ctx->flags |= E2F_FLAG_ABORT;
3157                 return;
3158         }
3159 }
3160
3161 /*
3162  * Marks a block as in use, setting the dup_map if it's been set
3163  * already.  Called by process_block and process_bad_block.
3164  *
3165  * WARNING: Assumes checks have already been done to make sure block
3166  * is valid.  This is true in both process_block and process_bad_block.
3167  */
3168 static _INLINE_ void mark_block_used(e2fsck_t ctx, blk64_t block)
3169 {
3170         struct          problem_context pctx;
3171
3172         clear_problem_context(&pctx);
3173
3174         if (ext2fs_fast_test_block_bitmap2(ctx->block_found_map, block)) {
3175                 if (ext2fs_has_feature_shared_blocks(ctx->fs->super) &&
3176                     !(ctx->options & E2F_OPT_UNSHARE_BLOCKS)) {
3177                         return;
3178                 }
3179                 if (!ctx->block_dup_map) {
3180                         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
3181                                         _("multiply claimed block map"),
3182                                         EXT2FS_BMAP64_RBTREE, "block_dup_map",
3183                                         &ctx->block_dup_map);
3184                         if (pctx.errcode) {
3185                                 pctx.num = 3;
3186                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR,
3187                                             &pctx);
3188                                 /* Should never get here */
3189                                 ctx->flags |= E2F_FLAG_ABORT;
3190                                 return;
3191                         }
3192                 }
3193                 ext2fs_fast_mark_block_bitmap2(ctx->block_dup_map, block);
3194         } else {
3195                 ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, block);
3196         }
3197 }
3198
3199 /*
3200  * When cluster size is greater than one block, it is caller's responsibility
3201  * to make sure block parameter starts at a cluster boundary.
3202  */
3203 static _INLINE_ void mark_blocks_used(e2fsck_t ctx, blk64_t block,
3204                                       unsigned int num)
3205 {
3206         if (ext2fs_test_block_bitmap_range2(ctx->block_found_map, block, num))
3207                 ext2fs_mark_block_bitmap_range2(ctx->block_found_map, block, num);
3208         else {
3209                 unsigned int i;
3210
3211                 for (i = 0; i < num; i += EXT2FS_CLUSTER_RATIO(ctx->fs))
3212                         mark_block_used(ctx, block + i);
3213         }
3214 }
3215
3216 /*
3217  * Adjust the extended attribute block's reference counts at the end
3218  * of pass 1, either by subtracting out references for EA blocks that
3219  * are still referenced in ctx->refcount, or by adding references for
3220  * EA blocks that had extra references as accounted for in
3221  * ctx->refcount_extra.
3222  */
3223 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
3224                                     char *block_buf, int adjust_sign)
3225 {
3226         struct ext2_ext_attr_header     *header;
3227         struct problem_context          pctx;
3228         ext2_filsys                     fs = ctx->fs;
3229         blk64_t                         blk;
3230         __u32                           should_be;
3231         ea_value_t                      count;
3232
3233         clear_problem_context(&pctx);
3234
3235         ea_refcount_intr_begin(refcount);
3236         while (1) {
3237                 if ((blk = ea_refcount_intr_next(refcount, &count)) == 0)
3238                         break;
3239                 pctx.blk = blk;
3240                 pctx.errcode = ext2fs_read_ext_attr3(fs, blk, block_buf,
3241                                                      pctx.ino);
3242                 if (pctx.errcode) {
3243                         fix_problem(ctx, PR_1_EXTATTR_READ_ABORT, &pctx);
3244                         return;
3245                 }
3246                 header = (struct ext2_ext_attr_header *) block_buf;
3247                 pctx.blkcount = header->h_refcount;
3248                 should_be = header->h_refcount + adjust_sign * (int)count;
3249                 pctx.num = should_be;
3250                 if (fix_problem(ctx, PR_1_EXTATTR_REFCOUNT, &pctx)) {
3251                         header->h_refcount = should_be;
3252                         pctx.errcode = ext2fs_write_ext_attr3(fs, blk,
3253                                                              block_buf,
3254                                                              pctx.ino);
3255                         if (pctx.errcode) {
3256                                 fix_problem(ctx, PR_1_EXTATTR_WRITE_ABORT,
3257                                             &pctx);
3258                                 continue;
3259                         }
3260                 }
3261         }
3262 }
3263
3264 /*
3265  * Handle processing the extended attribute blocks
3266  */
3267 static int check_ext_attr(e2fsck_t ctx, struct problem_context *pctx,
3268                            char *block_buf, struct ea_quota *ea_block_quota)
3269 {
3270         ext2_filsys fs = ctx->fs;
3271         ext2_ino_t      ino = pctx->ino;
3272         struct ext2_inode *inode = pctx->inode;
3273         blk64_t         blk;
3274         char *          end;
3275         struct ext2_ext_attr_header *header;
3276         struct ext2_ext_attr_entry *first, *entry;
3277         blk64_t         quota_blocks = EXT2FS_C2B(fs, 1);
3278         __u64           quota_inodes = 0;
3279         region_t        region = 0;
3280         int             failed_csum = 0;
3281
3282         ea_block_quota->blocks = 0;
3283         ea_block_quota->inodes = 0;
3284
3285         blk = ext2fs_file_acl_block(fs, inode);
3286         if (blk == 0)
3287                 return 0;
3288
3289         /*
3290          * If the Extended attribute flag isn't set, then a non-zero
3291          * file acl means that the inode is corrupted.
3292          *
3293          * Or if the extended attribute block is an invalid block,
3294          * then the inode is also corrupted.
3295          */
3296         if (!ext2fs_has_feature_xattr(fs->super) ||
3297             (blk < fs->super->s_first_data_block) ||
3298             (blk >= ext2fs_blocks_count(fs->super))) {
3299                 mark_inode_bad(ctx, ino);
3300                 return 0;
3301         }
3302
3303         /* If ea bitmap hasn't been allocated, create it */
3304         if (!ctx->block_ea_map) {
3305                 pctx->errcode = e2fsck_allocate_block_bitmap(fs,
3306                                         _("ext attr block map"),
3307                                         EXT2FS_BMAP64_RBTREE, "block_ea_map",
3308                                         &ctx->block_ea_map);
3309                 if (pctx->errcode) {
3310                         pctx->num = 2;
3311                         fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, pctx);
3312                         ctx->flags |= E2F_FLAG_ABORT;
3313                         return 0;
3314                 }
3315         }
3316
3317         /* Create the EA refcount structure if necessary */
3318         if (!ctx->refcount) {
3319                 pctx->errcode = ea_refcount_create(0, &ctx->refcount);
3320                 if (pctx->errcode) {
3321                         pctx->num = 1;
3322                         fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3323                         ctx->flags |= E2F_FLAG_ABORT;
3324                         return 0;
3325                 }
3326         }
3327
3328 #if 0
3329         /* Debugging text */
3330         printf("Inode %u has EA block %u\n", ino, blk);
3331 #endif
3332
3333         /* Have we seen this EA block before? */
3334         if (ext2fs_fast_test_block_bitmap2(ctx->block_ea_map, blk)) {
3335                 ea_block_quota->blocks = EXT2FS_C2B(fs, 1);
3336                 ea_block_quota->inodes = 0;
3337
3338                 if (ctx->ea_block_quota_blocks) {
3339                         ea_refcount_fetch(ctx->ea_block_quota_blocks, blk,
3340                                           &quota_blocks);
3341                         if (quota_blocks)
3342                                 ea_block_quota->blocks = quota_blocks;
3343                 }
3344
3345                 if (ctx->ea_block_quota_inodes)
3346                         ea_refcount_fetch(ctx->ea_block_quota_inodes, blk,
3347                                           &ea_block_quota->inodes);
3348
3349                 if (ea_refcount_decrement(ctx->refcount, blk, 0) == 0)
3350                         return 1;
3351                 /* Ooops, this EA was referenced more than it stated */
3352                 if (!ctx->refcount_extra) {
3353                         pctx->errcode = ea_refcount_create(0,
3354                                            &ctx->refcount_extra);
3355                         if (pctx->errcode) {
3356                                 pctx->num = 2;
3357                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3358                                 ctx->flags |= E2F_FLAG_ABORT;
3359                                 return 0;
3360                         }
3361                 }
3362                 ea_refcount_increment(ctx->refcount_extra, blk, 0);
3363                 return 1;
3364         }
3365
3366         /*
3367          * OK, we haven't seen this EA block yet.  So we need to
3368          * validate it
3369          */
3370         pctx->blk = blk;
3371         pctx->errcode = ext2fs_read_ext_attr3(fs, blk, block_buf, pctx->ino);
3372         if (pctx->errcode == EXT2_ET_EXT_ATTR_CSUM_INVALID) {
3373                 pctx->errcode = 0;
3374                 failed_csum = 1;
3375         } else if (pctx->errcode == EXT2_ET_BAD_EA_HEADER)
3376                 pctx->errcode = 0;
3377
3378         if (pctx->errcode &&
3379             fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx)) {
3380                 pctx->errcode = 0;
3381                 goto clear_extattr;
3382         }
3383         header = (struct ext2_ext_attr_header *) block_buf;
3384         pctx->blk = ext2fs_file_acl_block(fs, inode);
3385         if (((ctx->ext_attr_ver == 1) &&
3386              (header->h_magic != EXT2_EXT_ATTR_MAGIC_v1)) ||
3387             ((ctx->ext_attr_ver == 2) &&
3388              (header->h_magic != EXT2_EXT_ATTR_MAGIC))) {
3389                 if (fix_problem(ctx, PR_1_BAD_EA_BLOCK, pctx))
3390                         goto clear_extattr;
3391         }
3392
3393         if (header->h_blocks != 1) {
3394                 if (fix_problem(ctx, PR_1_EA_MULTI_BLOCK, pctx))
3395                         goto clear_extattr;
3396         }
3397
3398         if (pctx->errcode && fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx))
3399                 goto clear_extattr;
3400
3401         region = region_create(0, fs->blocksize);
3402         if (!region) {
3403                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
3404                 ctx->flags |= E2F_FLAG_ABORT;
3405                 return 0;
3406         }
3407         if (region_allocate(region, 0, sizeof(struct ext2_ext_attr_header))) {
3408                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3409                         goto clear_extattr;
3410         }
3411
3412         first = (struct ext2_ext_attr_entry *)(header+1);
3413         end = block_buf + fs->blocksize;
3414         entry = first;
3415         while ((char *)entry < end && *(__u32 *)entry) {
3416                 __u32 hash;
3417
3418                 if (region_allocate(region, (char *)entry - (char *)header,
3419                                    EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
3420                         if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3421                                 goto clear_extattr;
3422                         break;
3423                 }
3424                 if ((ctx->ext_attr_ver == 1 &&
3425                      (entry->e_name_len == 0 || entry->e_name_index != 0)) ||
3426                     (ctx->ext_attr_ver == 2 &&
3427                      entry->e_name_index == 0)) {
3428                         if (fix_problem(ctx, PR_1_EA_BAD_NAME, pctx))
3429                                 goto clear_extattr;
3430                         break;
3431                 }
3432                 if (entry->e_value_inum == 0) {
3433                         if (entry->e_value_offs + entry->e_value_size >
3434                             fs->blocksize) {
3435                                 if (fix_problem(ctx, PR_1_EA_BAD_VALUE, pctx))
3436                                         goto clear_extattr;
3437                                 break;
3438                         }
3439                         if (entry->e_value_size &&
3440                             region_allocate(region, entry->e_value_offs,
3441                                             EXT2_EXT_ATTR_SIZE(entry->e_value_size))) {
3442                                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION,
3443                                                 pctx))
3444                                         goto clear_extattr;
3445                         }
3446
3447                         hash = ext2fs_ext_attr_hash_entry(entry, block_buf +
3448                                                           entry->e_value_offs);
3449
3450                         if (entry->e_hash != hash) {
3451                                 pctx->num = entry->e_hash;
3452                                 if (fix_problem(ctx, PR_1_ATTR_HASH, pctx))
3453                                         goto clear_extattr;
3454                                 entry->e_hash = hash;
3455                         }
3456                 } else {
3457                         problem_t problem;
3458                         blk64_t entry_quota_blocks;
3459
3460                         problem = check_large_ea_inode(ctx, entry, pctx,
3461                                                        &entry_quota_blocks);
3462                         if (problem && fix_problem(ctx, problem, pctx))
3463                                 goto clear_extattr;
3464
3465                         quota_blocks += entry_quota_blocks;
3466                         quota_inodes++;
3467                 }
3468
3469                 entry = EXT2_EXT_ATTR_NEXT(entry);
3470         }
3471         if (region_allocate(region, (char *)entry - (char *)header, 4)) {
3472                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3473                         goto clear_extattr;
3474         }
3475         region_free(region);
3476
3477         /*
3478          * We only get here if there was no other errors that were fixed.
3479          * If there was a checksum fail, ask to correct it.
3480          */
3481         if (failed_csum &&
3482             fix_problem(ctx, PR_1_EA_BLOCK_ONLY_CSUM_INVALID, pctx)) {
3483                 pctx->errcode = ext2fs_write_ext_attr3(fs, blk, block_buf,
3484                                                        pctx->ino);
3485                 if (pctx->errcode)
3486                         return 0;
3487         }
3488
3489         if (quota_blocks != EXT2FS_C2B(fs, 1U)) {
3490                 if (!ctx->ea_block_quota_blocks) {
3491                         pctx->errcode = ea_refcount_create(0,
3492                                                 &ctx->ea_block_quota_blocks);
3493                         if (pctx->errcode) {
3494                                 pctx->num = 3;
3495                                 goto refcount_fail;
3496                         }
3497                 }
3498                 ea_refcount_store(ctx->ea_block_quota_blocks, blk,
3499                                   quota_blocks);
3500         }
3501
3502         if (quota_inodes) {
3503                 if (!ctx->ea_block_quota_inodes) {
3504                         pctx->errcode = ea_refcount_create(0,
3505                                                 &ctx->ea_block_quota_inodes);
3506                         if (pctx->errcode) {
3507                                 pctx->num = 4;
3508 refcount_fail:
3509                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3510                                 ctx->flags |= E2F_FLAG_ABORT;
3511                                 return 0;
3512                         }
3513                 }
3514
3515                 ea_refcount_store(ctx->ea_block_quota_inodes, blk,
3516                                   quota_inodes);
3517         }
3518         ea_block_quota->blocks = quota_blocks;
3519         ea_block_quota->inodes = quota_inodes;
3520
3521         inc_ea_inode_refs(ctx, pctx, first, end);
3522         ea_refcount_store(ctx->refcount, blk, header->h_refcount - 1);
3523         mark_block_used(ctx, blk);
3524         ext2fs_fast_mark_block_bitmap2(ctx->block_ea_map, blk);
3525         return 1;
3526
3527 clear_extattr:
3528         if (region)
3529                 region_free(region);
3530         ext2fs_file_acl_block_set(fs, inode, 0);
3531         e2fsck_write_inode(ctx, ino, inode, "check_ext_attr");
3532         return 0;
3533 }
3534
3535 /* Returns 1 if bad htree, 0 if OK */
3536 static int handle_htree(e2fsck_t ctx, struct problem_context *pctx,
3537                         ext2_ino_t ino, struct ext2_inode *inode,
3538                         char *block_buf)
3539 {
3540         struct ext2_dx_root_info        *root;
3541         ext2_filsys                     fs = ctx->fs;
3542         errcode_t                       retval;
3543         blk64_t                         blk;
3544
3545         if ((!LINUX_S_ISDIR(inode->i_mode) &&
3546              fix_problem(ctx, PR_1_HTREE_NODIR, pctx)) ||
3547             (!ext2fs_has_feature_dir_index(fs->super) &&
3548              fix_problem(ctx, PR_1_HTREE_SET, pctx)))
3549                 return 1;
3550
3551         pctx->errcode = ext2fs_bmap2(fs, ino, inode, 0, 0, 0, 0, &blk);
3552
3553         if ((pctx->errcode) ||
3554             (blk == 0) ||
3555             (blk < fs->super->s_first_data_block) ||
3556             (blk >= ext2fs_blocks_count(fs->super))) {
3557                 if (fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3558                         return 1;
3559                 else
3560                         return 0;
3561         }
3562
3563         retval = io_channel_read_blk64(fs->io, blk, 1, block_buf);
3564         if (retval && fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3565                 return 1;
3566
3567         /* XXX should check that beginning matches a directory */
3568         root = (struct ext2_dx_root_info *) (block_buf + 24);
3569
3570         if ((root->reserved_zero || root->info_length < 8) &&
3571             fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3572                 return 1;
3573
3574         pctx->num = root->hash_version;
3575         if ((root->hash_version != EXT2_HASH_LEGACY) &&
3576             (root->hash_version != EXT2_HASH_HALF_MD4) &&
3577             (root->hash_version != EXT2_HASH_TEA) &&
3578             (root->hash_version != EXT2_HASH_SIPHASH) &&
3579             fix_problem(ctx, PR_1_HTREE_HASHV, pctx))
3580                 return 1;
3581
3582         if (ext4_hash_in_dirent(inode)) {
3583                 if (root->hash_version != EXT2_HASH_SIPHASH &&
3584                     fix_problem(ctx, PR_1_HTREE_NEEDS_SIPHASH, pctx))
3585                         return 1;
3586         } else {
3587                 if (root->hash_version == EXT2_HASH_SIPHASH &&
3588                    fix_problem(ctx, PR_1_HTREE_CANNOT_SIPHASH, pctx))
3589                         return 1;
3590         }
3591
3592         if ((root->unused_flags & EXT2_HASH_FLAG_INCOMPAT) &&
3593             fix_problem(ctx, PR_1_HTREE_INCOMPAT, pctx))
3594                 return 1;
3595
3596         pctx->num = root->indirect_levels;
3597         /* if htree level is clearly too high, consider it to be broken */
3598         if (root->indirect_levels > EXT4_HTREE_LEVEL &&
3599             fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
3600                 return 1;
3601
3602         /* if level is only maybe too high, LARGE_DIR feature could be unset */
3603         if (root->indirect_levels > ext2_dir_htree_level(fs) &&
3604             !ext2fs_has_feature_largedir(fs->super)) {
3605                 int blockbits = EXT2_BLOCK_SIZE_BITS(fs->super) + 10;
3606                 int idx_pb = 1 << (blockbits - 3);
3607
3608                 /* compare inode size/blocks vs. max-sized 2-level htree */
3609                 if (EXT2_I_SIZE(pctx->inode) <
3610                     (idx_pb - 1) * (idx_pb - 2) << blockbits &&
3611                     pctx->inode->i_blocks <
3612                     (idx_pb - 1) * (idx_pb - 2) << (blockbits - 9) &&
3613                     fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
3614                         return 1;
3615         }
3616
3617         if (root->indirect_levels > EXT4_HTREE_LEVEL_COMPAT ||
3618             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
3619                 ctx->large_dirs++;
3620
3621         return 0;
3622 }
3623
3624 void e2fsck_clear_inode(e2fsck_t ctx, ext2_ino_t ino,
3625                         struct ext2_inode *inode, int restart_flag,
3626                         const char *source)
3627 {
3628         inode->i_flags = 0;
3629         inode->i_links_count = 0;
3630         ext2fs_icount_store(ctx->inode_link_info, ino, 0);
3631         inode->i_dtime = ctx->now;
3632
3633         /*
3634          * If a special inode has such rotten block mappings that we
3635          * want to clear the whole inode, be sure to actually zap
3636          * the block maps because i_links_count isn't checked for
3637          * special inodes, and we'll end up right back here the next
3638          * time we run fsck.
3639          */
3640         if (ino < EXT2_FIRST_INODE(ctx->fs->super))
3641                 memset(inode->i_block, 0, sizeof(inode->i_block));
3642
3643         ext2fs_unmark_inode_bitmap2(ctx->inode_dir_map, ino);
3644         ext2fs_unmark_inode_bitmap2(ctx->inode_used_map, ino);
3645         if (ctx->inode_reg_map)
3646                 ext2fs_unmark_inode_bitmap2(ctx->inode_reg_map, ino);
3647         if (ctx->inode_bad_map)
3648                 ext2fs_unmark_inode_bitmap2(ctx->inode_bad_map, ino);
3649
3650         /*
3651          * If the inode was partially accounted for before processing
3652          * was aborted, we need to restart the pass 1 scan.
3653          */
3654         ctx->flags |= restart_flag;
3655
3656         if (ino == EXT2_BAD_INO)
3657                 memset(inode, 0, sizeof(struct ext2_inode));
3658
3659         e2fsck_write_inode(ctx, ino, inode, source);
3660 }
3661
3662 /*
3663  * Use the multiple-blocks reclamation code to fix alignment problems in
3664  * a bigalloc filesystem.  We want a logical cluster to map to *only* one
3665  * physical cluster, and we want the block offsets within that cluster to
3666  * line up.
3667  */
3668 static int has_unaligned_cluster_map(e2fsck_t ctx,
3669                                      blk64_t last_pblk, blk64_t last_lblk,
3670                                      blk64_t pblk, blk64_t lblk)
3671 {
3672         blk64_t cluster_mask;
3673
3674         if (!ctx->fs->cluster_ratio_bits)
3675                 return 0;
3676         cluster_mask = EXT2FS_CLUSTER_MASK(ctx->fs);
3677
3678         /*
3679          * If the block in the logical cluster doesn't align with the block in
3680          * the physical cluster...
3681          */
3682         if ((lblk & cluster_mask) != (pblk & cluster_mask))
3683                 return 1;
3684
3685         /*
3686          * If we cross a physical cluster boundary within a logical cluster...
3687          */
3688         if (last_pblk && (lblk & cluster_mask) != 0 &&
3689             EXT2FS_B2C(ctx->fs, lblk) == EXT2FS_B2C(ctx->fs, last_lblk) &&
3690             EXT2FS_B2C(ctx->fs, pblk) != EXT2FS_B2C(ctx->fs, last_pblk))
3691                 return 1;
3692
3693         return 0;
3694 }
3695
3696 static void scan_extent_node(e2fsck_t ctx, struct problem_context *pctx,
3697                              struct process_block_struct *pb,
3698                              blk64_t start_block, blk64_t end_block,
3699                              blk64_t eof_block,
3700                              ext2_extent_handle_t ehandle,
3701                              int try_repairs)
3702 {
3703         struct ext2fs_extent    extent;
3704         blk64_t                 blk, last_lblk;
3705         unsigned int            i, n;
3706         int                     is_dir, is_leaf;
3707         problem_t               problem;
3708         struct ext2_extent_info info;
3709         int                     failed_csum = 0;
3710
3711         if (pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID)
3712                 failed_csum = 1;
3713
3714         pctx->errcode = ext2fs_extent_get_info(ehandle, &info);
3715         if (pctx->errcode)
3716                 return;
3717         if (!(ctx->options & E2F_OPT_FIXES_ONLY) &&
3718             !pb->eti.force_rebuild) {
3719                 struct extent_tree_level *etl;
3720
3721                 etl = pb->eti.ext_info + info.curr_level;
3722                 etl->num_extents += info.num_entries;
3723                 etl->max_extents += info.max_entries;
3724                 /*
3725                  * Implementation wart: Splitting extent blocks when appending
3726                  * will leave the old block with one free entry.  Therefore
3727                  * unless the node is totally full, pretend that a non-root
3728                  * extent block can hold one fewer entry than it actually does,
3729                  * so that we don't repeatedly rebuild the extent tree.
3730                  */
3731                 if (info.curr_level && info.num_entries < info.max_entries)
3732                         etl->max_extents--;
3733         }
3734
3735         pctx->errcode = ext2fs_extent_get(ehandle, EXT2_EXTENT_FIRST_SIB,
3736                                           &extent);
3737         while ((pctx->errcode == 0 ||
3738                 pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID) &&
3739                info.num_entries-- > 0) {
3740                 is_leaf = extent.e_flags & EXT2_EXTENT_FLAGS_LEAF;
3741                 is_dir = LINUX_S_ISDIR(pctx->inode->i_mode);
3742                 last_lblk = extent.e_lblk + extent.e_len - 1;
3743
3744                 problem = 0;
3745                 pctx->blk = extent.e_pblk;
3746                 pctx->blk2 = extent.e_lblk;
3747                 pctx->num = extent.e_len;
3748                 pctx->blkcount = extent.e_lblk + extent.e_len;
3749
3750                 if (extent.e_pblk == 0 ||
3751                     extent.e_pblk < ctx->fs->super->s_first_data_block ||
3752                     extent.e_pblk >= ext2fs_blocks_count(ctx->fs->super))
3753                         problem = PR_1_EXTENT_BAD_START_BLK;
3754                 else if (extent.e_lblk < start_block)
3755                         problem = PR_1_OUT_OF_ORDER_EXTENTS;
3756                 else if ((end_block && last_lblk > end_block) &&
3757                          !(last_lblk > eof_block &&
3758                            ((extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) ||
3759                             (pctx->inode->i_flags & EXT4_VERITY_FL))))
3760                         problem = PR_1_EXTENT_END_OUT_OF_BOUNDS;
3761                 else if (is_leaf && extent.e_len == 0)
3762                         problem = PR_1_EXTENT_LENGTH_ZERO;
3763                 else if (is_leaf &&
3764                          (extent.e_pblk + extent.e_len) >
3765                          ext2fs_blocks_count(ctx->fs->super))
3766                         problem = PR_1_EXTENT_ENDS_BEYOND;
3767                 else if (is_leaf && is_dir && !pctx->inode->i_size_high &&
3768                          !ext2fs_has_feature_largedir(ctx->fs->super) &&
3769                          ((extent.e_lblk + extent.e_len) >
3770                           (1U << (21 - ctx->fs->super->s_log_block_size))))
3771                         problem = PR_1_TOOBIG_DIR;
3772
3773                 if (is_leaf && problem == 0 && extent.e_len > 0) {
3774 #if 0
3775                         printf("extent_region(ino=%u, expect=%llu, "
3776                                "lblk=%llu, len=%u)\n", pb->ino,
3777                                (unsigned long long) pb->next_lblock,
3778                                (unsigned long long) extent.e_lblk,
3779                                extent.e_len);
3780 #endif
3781                         if (extent.e_lblk < pb->next_lblock)
3782                                 problem = PR_1_EXTENT_COLLISION;
3783                         else if (extent.e_lblk + extent.e_len > pb->next_lblock)
3784                                 pb->next_lblock = extent.e_lblk + extent.e_len;
3785                 }
3786
3787                 /*
3788                  * Uninitialized blocks in a directory?  Clear the flag and
3789                  * we'll interpret the blocks later.
3790                  */
3791                 if (try_repairs && is_dir && problem == 0 &&
3792                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3793                     fix_problem(ctx, PR_1_UNINIT_DBLOCK, pctx)) {
3794                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3795                         pb->inode_modified = 1;
3796                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3797                                                               &extent);
3798                         if (pctx->errcode)
3799                                 return;
3800                         failed_csum = 0;
3801                 }
3802 #ifdef CONFIG_DEVELOPER_FEATURES
3803                 if (try_repairs && !is_dir && problem == 0 &&
3804                     (ctx->options & E2F_OPT_CLEAR_UNINIT) &&
3805                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3806                     fix_problem(ctx, PR_1_CLEAR_UNINIT_EXTENT, pctx)) {
3807                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3808                         pb->inode_modified = 1;
3809                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3810                                                               &extent);
3811                         if (pctx->errcode)
3812                                 return;
3813                         failed_csum = 0;
3814                 }
3815 #endif
3816                 if (try_repairs && problem) {
3817 report_problem:
3818                         if (fix_problem(ctx, problem, pctx)) {
3819                                 if (ctx->invalid_bitmaps) {
3820                                         /*
3821                                          * If fsck knows the bitmaps are bad,
3822                                          * skip to the next extent and
3823                                          * try to clear this extent again
3824                                          * after fixing the bitmaps, by
3825                                          * restarting fsck.
3826                                          */
3827                                         pctx->errcode = ext2fs_extent_get(
3828                                                           ehandle,
3829                                                           EXT2_EXTENT_NEXT_SIB,
3830                                                           &extent);
3831                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3832                                         if (pctx->errcode ==
3833                                                     EXT2_ET_NO_CURRENT_NODE) {
3834                                                 pctx->errcode = 0;
3835                                                 break;
3836                                         }
3837                                         continue;
3838                                 }
3839                                 e2fsck_read_bitmaps(ctx);
3840                                 pb->inode_modified = 1;
3841                                 pctx->errcode =
3842                                         ext2fs_extent_delete(ehandle, 0);
3843                                 if (pctx->errcode) {
3844                                         pctx->str = "ext2fs_extent_delete";
3845                                         return;
3846                                 }
3847                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
3848                                 if (pctx->errcode &&
3849                                     pctx->errcode != EXT2_ET_NO_CURRENT_NODE) {
3850                                         pctx->str = "ext2fs_extent_fix_parents";
3851                                         return;
3852                                 }
3853                                 pctx->errcode = ext2fs_extent_get(ehandle,
3854                                                                   EXT2_EXTENT_CURRENT,
3855                                                                   &extent);
3856                                 if (pctx->errcode == EXT2_ET_NO_CURRENT_NODE) {
3857                                         pctx->errcode = 0;
3858                                         break;
3859                                 }
3860                                 failed_csum = 0;
3861                                 continue;
3862                         }
3863                         goto next;
3864                 }
3865
3866                 if (!is_leaf) {
3867                         blk64_t lblk = extent.e_lblk;
3868                         int next_try_repairs = 1;
3869
3870                         blk = extent.e_pblk;
3871
3872                         /*
3873                          * If this lower extent block collides with critical
3874                          * metadata, don't try to repair the damage.  Pass 1b
3875                          * will reallocate the block; then we can try again.
3876                          */
3877                         if (pb->ino != EXT2_RESIZE_INO &&
3878                             extent.e_pblk < ctx->fs->super->s_blocks_count &&
3879                             ext2fs_test_block_bitmap2(ctx->block_metadata_map,
3880                                                       extent.e_pblk)) {
3881                                 next_try_repairs = 0;
3882                                 pctx->blk = blk;
3883                                 fix_problem(ctx,
3884                                             PR_1_CRITICAL_METADATA_COLLISION,
3885                                             pctx);
3886                                 if ((ctx->options & E2F_OPT_NO) == 0)
3887                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3888                         }
3889                         pctx->errcode = ext2fs_extent_get(ehandle,
3890                                                   EXT2_EXTENT_DOWN, &extent);
3891                         if (pctx->errcode &&
3892                             pctx->errcode != EXT2_ET_EXTENT_CSUM_INVALID) {
3893                                 pctx->str = "EXT2_EXTENT_DOWN";
3894                                 problem = PR_1_EXTENT_HEADER_INVALID;
3895                                 if (!next_try_repairs)
3896                                         return;
3897                                 if (pctx->errcode == EXT2_ET_EXTENT_HEADER_BAD)
3898                                         goto report_problem;
3899                                 return;
3900                         }
3901                         /* The next extent should match this index's logical start */
3902                         if (extent.e_lblk != lblk) {
3903                                 struct ext2_extent_info e_info;
3904
3905                                 pctx->errcode = ext2fs_extent_get_info(ehandle,
3906                                                                        &e_info);
3907                                 if (pctx->errcode) {
3908                                         pctx->str = "ext2fs_extent_get_info";
3909                                         return;
3910                                 }
3911                                 pctx->blk = lblk;
3912                                 pctx->blk2 = extent.e_lblk;
3913                                 pctx->num = e_info.curr_level - 1;
3914                                 problem = PR_1_EXTENT_INDEX_START_INVALID;
3915                                 if (fix_problem(ctx, problem, pctx)) {
3916                                         pb->inode_modified = 1;
3917                                         pctx->errcode =
3918                                                 ext2fs_extent_fix_parents(ehandle);
3919                                         if (pctx->errcode) {
3920                                                 pctx->str = "ext2fs_extent_fix_parents";
3921                                                 return;
3922                                         }
3923                                 }
3924                         }
3925                         scan_extent_node(ctx, pctx, pb, extent.e_lblk,
3926                                          last_lblk, eof_block, ehandle,
3927                                          next_try_repairs);
3928                         if (pctx->errcode)
3929                                 return;
3930                         pctx->errcode = ext2fs_extent_get(ehandle,
3931                                                   EXT2_EXTENT_UP, &extent);
3932                         if (pctx->errcode) {
3933                                 pctx->str = "EXT2_EXTENT_UP";
3934                                 return;
3935                         }
3936                         mark_block_used(ctx, blk);
3937                         pb->num_blocks++;
3938                         goto next;
3939                 }
3940
3941                 if ((pb->previous_block != 0) &&
3942                     (pb->previous_block+1 != extent.e_pblk)) {
3943                         if (ctx->options & E2F_OPT_FRAGCHECK) {
3944                                 char type = '?';
3945
3946                                 if (pb->is_dir)
3947                                         type = 'd';
3948                                 else if (pb->is_reg)
3949                                         type = 'f';
3950
3951                                 printf(("%6lu(%c): expecting %6lu "
3952                                         "actual extent "
3953                                         "phys %6lu log %lu len %lu\n"),
3954                                        (unsigned long) pctx->ino, type,
3955                                        (unsigned long) pb->previous_block+1,
3956                                        (unsigned long) extent.e_pblk,
3957                                        (unsigned long) extent.e_lblk,
3958                                        (unsigned long) extent.e_len);
3959                         }
3960                         pb->fragmented = 1;
3961                 }
3962                 /*
3963                  * If we notice a gap in the logical block mappings of an
3964                  * extent-mapped directory, offer to close the hole by
3965                  * moving the logical block down, otherwise we'll go mad in
3966                  * pass 3 allocating empty directory blocks to fill the hole.
3967                  */
3968                 if (try_repairs && is_dir &&
3969                     pb->last_block + 1 < extent.e_lblk) {
3970                         blk64_t new_lblk;
3971
3972                         new_lblk = pb->last_block + 1;
3973                         if (EXT2FS_CLUSTER_RATIO(ctx->fs) > 1)
3974                                 new_lblk = ((new_lblk +
3975                                              EXT2FS_CLUSTER_RATIO(ctx->fs) - 1) &
3976                                             ~EXT2FS_CLUSTER_MASK(ctx->fs)) |
3977                                            (extent.e_pblk &
3978                                             EXT2FS_CLUSTER_MASK(ctx->fs));
3979                         pctx->blk = extent.e_lblk;
3980                         pctx->blk2 = new_lblk;
3981                         if (fix_problem(ctx, PR_1_COLLAPSE_DBLOCK, pctx)) {
3982                                 extent.e_lblk = new_lblk;
3983                                 pb->inode_modified = 1;
3984                                 pctx->errcode = ext2fs_extent_replace(ehandle,
3985                                                                 0, &extent);
3986                                 if (pctx->errcode) {
3987                                         pctx->errcode = 0;
3988                                         goto alloc_later;
3989                                 }
3990                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
3991                                 if (pctx->errcode)
3992                                         goto failed_add_dir_block;
3993                                 pctx->errcode = ext2fs_extent_goto(ehandle,
3994                                                                 extent.e_lblk);
3995                                 if (pctx->errcode)
3996                                         goto failed_add_dir_block;
3997                                 last_lblk = extent.e_lblk + extent.e_len - 1;
3998                                 failed_csum = 0;
3999                         }
4000                 }
4001 alloc_later:
4002                 if (is_dir) {
4003                         while (++pb->last_db_block <
4004                                (e2_blkcnt_t) extent.e_lblk) {
4005                                 pctx->errcode = ext2fs_add_dir_block2(
4006                                                         ctx->fs->dblist,
4007                                                         pb->ino, 0,
4008                                                         pb->last_db_block);
4009                                 if (pctx->errcode) {
4010                                         pctx->blk = 0;
4011                                         pctx->num = pb->last_db_block;
4012                                         goto failed_add_dir_block;
4013                                 }
4014                         }
4015
4016                         for (i = 0; i < extent.e_len; i++) {
4017                                 pctx->errcode = ext2fs_add_dir_block2(
4018                                                         ctx->fs->dblist,
4019                                                         pctx->ino,
4020                                                         extent.e_pblk + i,
4021                                                         extent.e_lblk + i);
4022                                 if (pctx->errcode) {
4023                                         pctx->blk = extent.e_pblk + i;
4024                                         pctx->num = extent.e_lblk + i;
4025                                 failed_add_dir_block:
4026                                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4027                                         /* Should never get here */
4028                                         ctx->flags |= E2F_FLAG_ABORT;
4029                                         return;
4030                                 }
4031                         }
4032                         if (extent.e_len > 0)
4033                                 pb->last_db_block = extent.e_lblk + extent.e_len - 1;
4034                 }
4035                 if (has_unaligned_cluster_map(ctx, pb->previous_block,
4036                                               pb->last_block,
4037                                               extent.e_pblk,
4038                                               extent.e_lblk)) {
4039                         for (i = 0; i < extent.e_len; i++) {
4040                                 pctx->blk = extent.e_lblk + i;
4041                                 pctx->blk2 = extent.e_pblk + i;
4042                                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4043                                 mark_block_used(ctx, extent.e_pblk + i);
4044                                 mark_block_used(ctx, extent.e_pblk + i);
4045                         }
4046                 }
4047
4048                 /*
4049                  * Check whether first cluster got marked in previous iteration.
4050                  */
4051                 if (ctx->fs->cluster_ratio_bits &&
4052                     pb->previous_block &&
4053                     (EXT2FS_B2C(ctx->fs, extent.e_pblk) ==
4054                      EXT2FS_B2C(ctx->fs, pb->previous_block)))
4055                         /* Set blk to the beginning of next cluster. */
4056                         blk = EXT2FS_C2B(
4057                                 ctx->fs,
4058                                 EXT2FS_B2C(ctx->fs, extent.e_pblk) + 1);
4059                 else
4060                         /* Set blk to the beginning of current cluster. */
4061                         blk = EXT2FS_C2B(ctx->fs,
4062                                          EXT2FS_B2C(ctx->fs, extent.e_pblk));
4063
4064                 if (blk < extent.e_pblk + extent.e_len) {
4065                         mark_blocks_used(ctx, blk,
4066                                          extent.e_pblk + extent.e_len - blk);
4067                         n = DIV_ROUND_UP(extent.e_pblk + extent.e_len - blk,
4068                                          EXT2FS_CLUSTER_RATIO(ctx->fs));
4069                         pb->num_blocks += n;
4070                 }
4071                 pb->last_block = extent.e_lblk + extent.e_len - 1;
4072                 pb->previous_block = extent.e_pblk + extent.e_len - 1;
4073                 start_block = pb->last_block = last_lblk;
4074                 if (is_leaf && !is_dir &&
4075                     !(extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT))
4076                         pb->last_init_lblock = last_lblk;
4077         next:
4078                 pctx->errcode = ext2fs_extent_get(ehandle,
4079                                                   EXT2_EXTENT_NEXT_SIB,
4080                                                   &extent);
4081         }
4082
4083         /* Failed csum but passes checks?  Ask to fix checksum. */
4084         if (failed_csum &&
4085             fix_problem(ctx, PR_1_EXTENT_ONLY_CSUM_INVALID, pctx)) {
4086                 pb->inode_modified = 1;
4087                 pctx->errcode = ext2fs_extent_replace(ehandle, 0, &extent);
4088                 if (pctx->errcode)
4089                         return;
4090         }
4091
4092         if (pctx->errcode == EXT2_ET_EXTENT_NO_NEXT)
4093                 pctx->errcode = 0;
4094 }
4095
4096 static void check_blocks_extents(e2fsck_t ctx, struct problem_context *pctx,
4097                                  struct process_block_struct *pb)
4098 {
4099         struct ext2_extent_info info;
4100         struct ext2_inode       *inode = pctx->inode;
4101         ext2_extent_handle_t    ehandle;
4102         ext2_filsys             fs = ctx->fs;
4103         ext2_ino_t              ino = pctx->ino;
4104         errcode_t               retval;
4105         blk64_t                 eof_lblk;
4106         struct ext3_extent_header       *eh;
4107
4108         /* Check for a proper extent header... */
4109         eh = (struct ext3_extent_header *) &inode->i_block[0];
4110         retval = ext2fs_extent_header_verify(eh, sizeof(inode->i_block));
4111         if (retval) {
4112                 if (fix_problem(ctx, PR_1_MISSING_EXTENT_HEADER, pctx))
4113                         e2fsck_clear_inode(ctx, ino, inode, 0,
4114                                            "check_blocks_extents");
4115                 pctx->errcode = 0;
4116                 return;
4117         }
4118
4119         /* ...since this function doesn't fail if i_block is zeroed. */
4120         pctx->errcode = ext2fs_extent_open2(fs, ino, inode, &ehandle);
4121         if (pctx->errcode) {
4122                 if (fix_problem(ctx, PR_1_READ_EXTENT, pctx))
4123                         e2fsck_clear_inode(ctx, ino, inode, 0,
4124                                            "check_blocks_extents");
4125                 pctx->errcode = 0;
4126                 return;
4127         }
4128
4129         retval = ext2fs_extent_get_info(ehandle, &info);
4130         if (retval == 0) {
4131                 int max_depth = info.max_depth;
4132
4133                 if (max_depth >= MAX_EXTENT_DEPTH_COUNT)
4134                         max_depth = MAX_EXTENT_DEPTH_COUNT-1;
4135                 ctx->extent_depth_count[max_depth]++;
4136         }
4137
4138         /* Check maximum extent depth */
4139         pctx->blk = info.max_depth;
4140         pctx->blk2 = ext2fs_max_extent_depth(ehandle);
4141         if (pctx->blk2 < pctx->blk &&
4142             fix_problem(ctx, PR_1_EXTENT_BAD_MAX_DEPTH, pctx))
4143                 pb->eti.force_rebuild = 1;
4144
4145         /* Can we collect extent tree level stats? */
4146         pctx->blk = MAX_EXTENT_DEPTH_COUNT;
4147         if (pctx->blk2 > pctx->blk)
4148                 fix_problem(ctx, PR_1E_MAX_EXTENT_TREE_DEPTH, pctx);
4149         memset(pb->eti.ext_info, 0, sizeof(pb->eti.ext_info));
4150         pb->eti.ino = pb->ino;
4151
4152         pb->next_lblock = 0;
4153
4154         eof_lblk = ((EXT2_I_SIZE(inode) + fs->blocksize - 1) >>
4155                 EXT2_BLOCK_SIZE_BITS(fs->super)) - 1;
4156         scan_extent_node(ctx, pctx, pb, 0, 0, eof_lblk, ehandle, 1);
4157         if (pctx->errcode &&
4158             fix_problem(ctx, PR_1_EXTENT_ITERATE_FAILURE, pctx)) {
4159                 pb->num_blocks = 0;
4160                 inode->i_blocks = 0;
4161                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4162                                    "check_blocks_extents");
4163                 pctx->errcode = 0;
4164         }
4165         ext2fs_extent_free(ehandle);
4166
4167         /* Rebuild unless it's a dir and we're rehashing it */
4168         if (LINUX_S_ISDIR(inode->i_mode) &&
4169             e2fsck_dir_will_be_rehashed(ctx, ino))
4170                 return;
4171
4172         if (ctx->options & E2F_OPT_CONVERT_BMAP)
4173                 e2fsck_rebuild_extents_later(ctx, ino);
4174         else
4175                 e2fsck_should_rebuild_extents(ctx, pctx, &pb->eti, &info);
4176 }
4177
4178 /*
4179  * In fact we don't need to check blocks for an inode with inline data
4180  * because this inode doesn't have any blocks.  In this function all
4181  * we need to do is add this inode into dblist when it is a directory.
4182  */
4183 static void check_blocks_inline_data(e2fsck_t ctx, struct problem_context *pctx,
4184                                      struct process_block_struct *pb)
4185 {
4186         int     flags;
4187         size_t  inline_data_size = 0;
4188
4189         if (!pb->is_dir) {
4190                 pctx->errcode = 0;
4191                 return;
4192         }
4193
4194         /* Process the dirents in i_block[] as the "first" block. */
4195         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 0);
4196         if (pctx->errcode)
4197                 goto err;
4198
4199         /* Process the dirents in the EA as a "second" block. */
4200         flags = ctx->fs->flags;
4201         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4202         pctx->errcode = ext2fs_inline_data_size(ctx->fs, pb->ino,
4203                                                 &inline_data_size);
4204         ctx->fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4205                          (ctx->fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4206         if (pctx->errcode) {
4207                 pctx->errcode = 0;
4208                 return;
4209         }
4210
4211         if (inline_data_size <= EXT4_MIN_INLINE_DATA_SIZE)
4212                 return;
4213
4214         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 1);
4215         if (pctx->errcode)
4216                 goto err;
4217
4218         return;
4219 err:
4220         pctx->blk = 0;
4221         pctx->num = 0;
4222         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4223         ctx->flags |= E2F_FLAG_ABORT;
4224 }
4225
4226 /*
4227  * This subroutine is called on each inode to account for all of the
4228  * blocks used by that inode.
      *
      * ctx            - e2fsck context.
      * pctx           - problem context; pctx->ino and pctx->inode identify the
      *                  inode being checked.  pctx->errcode is cleared on entry.
      * block_buf      - scratch buffer handed on to check_ext_attr(),
      *                  ext2fs_block_iterate3() and handle_htree().
      * ea_ibody_quota - may be NULL; when present its block count seeds the
      *                  inode's block total and its inode count is added to
      *                  the quota inode count.
      *
      * After the blocks have been walked (inline data, extents, or block map),
      * the function checks the htree flag, zero-length directories, quota
      * accounting, i_size and i_blocks, and queues extent rebuilds / directory
      * rehashes.  The inode is written back at "out" if it was modified here.
4229  */
4230 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
4231                          char *block_buf, const struct ea_quota *ea_ibody_quota)
4232 {
4233         ext2_filsys fs = ctx->fs;
4234         struct process_block_struct pb;
4235         ext2_ino_t      ino = pctx->ino;
4236         struct ext2_inode *inode = pctx->inode;
4237         unsigned        bad_size = 0;
4238         int             dirty_inode = 0;
4239         int             extent_fs;
4240         int             inlinedata_fs;
4241         __u64           size;
4242         struct ea_quota ea_block_quota;
4243
             /* Seed the per-inode accounting state handed to the block walkers. */
4244         pb.ino = ino;
4245         pb.num_blocks = EXT2FS_B2C(ctx->fs,
4246                                    ea_ibody_quota ? ea_ibody_quota->blocks : 0);
4247         pb.last_block = ~0;
4248         pb.last_init_lblock = -1;
4249         pb.last_db_block = -1;
4250         pb.num_illegal_blocks = 0;
4251         pb.suppress = 0; pb.clear = 0;
4252         pb.fragmented = 0;
4253         pb.compressed = 0;
4254         pb.previous_block = 0;
4255         pb.is_dir = LINUX_S_ISDIR(inode->i_mode);
4256         pb.is_reg = LINUX_S_ISREG(inode->i_mode);
4257         pb.max_blocks = 1U << (31 - fs->super->s_log_block_size);
4258         pb.inode = inode;
4259         pb.pctx = pctx;
4260         pb.ctx = ctx;
4261         pb.inode_modified = 0;
4262         pb.eti.force_rebuild = 0;
4263         pctx->ino = ino;
4264         pctx->errcode = 0;
4265
4266         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
4267         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
4268
             /* Add the clusters reported for the EA block, unless we must abort. */
4269         if (check_ext_attr(ctx, pctx, block_buf, &ea_block_quota)) {
4270                 if (e2fsck_should_abort(ctx))
4271                         goto out;
4272                 pb.num_blocks += EXT2FS_B2C(ctx->fs, ea_block_quota.blocks);
4273         }
4274
             /* Dispatch on how the inode stores data: inline, extents, or block map. */
4275         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL))
4276                 check_blocks_inline_data(ctx, pctx, &pb);
4277         else if (ext2fs_inode_has_valid_blocks2(fs, inode)) {
4278                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL))
4279                         check_blocks_extents(ctx, pctx, &pb);
4280                 else {
4281                         int flags;
4282                         /*
4283                          * If we've modified the inode, write it out before
4284                          * iterate() tries to use it.
4285                          */
                             /*
                              * NOTE(review): within this function dirty_inode is
                              * only incremented further down, so it still looks
                              * to be 0 whenever this point is reached -- confirm
                              * before relying on this write.
                              */
4286                         if (dirty_inode) {
4287                                 e2fsck_write_inode(ctx, ino, inode,
4288                                                    "check_blocks");
4289                                 dirty_inode = 0;
4290                         }
4291                         flags = fs->flags;
4292                         fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4293                         pctx->errcode = ext2fs_block_iterate3(fs, ino,
4294                                                 pb.is_dir ? BLOCK_FLAG_HOLE : 0,
4295                                                 block_buf, process_block, &pb);
4296                         /*
4297                          * We do not have uninitialized extents in non extent
4298                          * files.
4299                          */
4300                         pb.last_init_lblock = pb.last_block;
4301                         /*
4302                          * If iterate() changed a block mapping, we have to
4303                          * re-read the inode.  If we decide to clear the
4304                          * inode after clearing some stuff, we'll re-write the
4305                          * bad mappings into the inode!
4306                          */
4307                         if (pb.inode_modified)
4308                                 e2fsck_read_inode(ctx, ino, inode,
4309                                                   "check_blocks");
                             /*
                              * Restore only the IGNORE_CSUM_ERRORS bit to its
                              * saved state; every other flag bit keeps whatever
                              * value it has now.
                              */
4310                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4311                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4312
4313                         if (ctx->options & E2F_OPT_CONVERT_BMAP) {
4314 #ifdef DEBUG
4315                                 printf("bmap rebuild ino=%d\n", ino);
4316 #endif
4317                                 if (!LINUX_S_ISDIR(inode->i_mode) ||
4318                                     !e2fsck_dir_will_be_rehashed(ctx, ino))
4319                                         e2fsck_rebuild_extents_later(ctx, ino);
4320                         }
4321                 }
4322         }
4323         end_problem_latch(ctx, PR_LATCH_BLOCK);
4324         end_problem_latch(ctx, PR_LATCH_TOOBIG);
4325         if (e2fsck_should_abort(ctx))
4326                 goto out;
4327         if (pctx->errcode)
4328                 fix_problem(ctx, PR_1_BLOCK_ITERATE, pctx);
4329
4330         if (pb.fragmented && pb.num_blocks < fs->super->s_blocks_per_group) {
4331                 if (LINUX_S_ISDIR(inode->i_mode))
4332                         ctx->fs_fragmented_dir++;
4333                 else
4334                         ctx->fs_fragmented++;
4335         }
4336
             /*
              * pb.clear is a request from the block walker to drop the inode
              * (e.g. process_block() sets it when PR_1_TOO_MANY_BAD_BLOCKS is
              * accepted).
              */
4337         if (pb.clear) {
4338                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4339                                    "check_blocks");
4340                 return;
4341         }
4342
             /* A non-zero handle_htree() result means the index flag is dropped. */
4343         if (inode->i_flags & EXT2_INDEX_FL) {
4344                 if (handle_htree(ctx, pctx, ino, inode, block_buf)) {
4345                         inode->i_flags &= ~EXT2_INDEX_FL;
4346                         dirty_inode++;
4347                 } else {
4348                         e2fsck_add_dx_dir(ctx, ino, inode, pb.last_block+1);
4349                 }
4350         }
4351
4352         if (!pb.num_blocks && pb.is_dir &&
4353             !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
4354                 if (fix_problem(ctx, PR_1_ZERO_LENGTH_DIR, pctx)) {
4355                         e2fsck_clear_inode(ctx, ino, inode, 0, "check_blocks");
4356                         ctx->fs_directory_count--;
4357                         return;
4358                 }
4359         }
4360
             /*
              * Quota accounting: skipped for the project quota inode, for
              * inodes below the first regular inode other than the root, and
              * for EA inodes.  pb.num_blocks is still a cluster count here.
              */
4361         if (ino != quota_type2inum(PRJQUOTA, fs->super) &&
4362             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INODE(ctx->fs->super)) &&
4363             !(inode->i_flags & EXT4_EA_INODE_FL)) {
4364                 quota_data_add(ctx->qctx, (struct ext2_inode_large *) inode,
4365                                ino,
4366                                pb.num_blocks * EXT2_CLUSTER_SIZE(fs->super));
4367                 quota_data_inodes(ctx->qctx, (struct ext2_inode_large *) inode,
4368                                   ino, (ea_ibody_quota ?
4369                                         ea_ibody_quota->inodes : 0) +
4370                                                 ea_block_quota.inodes + 1);
4371         }
4372
             /*
              * Scale pb.num_blocks so it can be compared with
              * ext2fs_inode_i_blocks() below: multiply by blocksize/512 unless
              * the inode carries EXT4_HUGE_FILE_FL on a huge_file filesystem,
              * then by the cluster ratio.
              */
4373         if (!ext2fs_has_feature_huge_file(fs->super) ||
4374             !(inode->i_flags & EXT4_HUGE_FILE_FL))
4375                 pb.num_blocks *= (fs->blocksize / 512);
4376         pb.num_blocks *= EXT2FS_CLUSTER_RATIO(fs);
4377 #if 0
4378         printf("inode %u, i_size = %u, last_block = %llu, i_blocks=%llu, num_blocks = %llu\n",
4379                ino, inode->i_size, (unsigned long long) pb.last_block,
4380                (unsigned long long) ext2fs_inode_i_blocks(fs, inode),
4381                (unsigned long long) pb.num_blocks);
4382 #endif
             /*
              * i_size sanity checks.  bad_size records which test failed and is
              * reported through pctx->group:
              *   1 - directory i_size covers more blocks than last_block + 1
              *   2 - directory has more than s_prealloc_dir_blocks blocks
              *       beyond i_size
              *   3 - non-directory i_size is below last_init_lblock * blocksize
              *       (not applied to verity inodes)
              *   4 - size exceeds the limit for a block-mapped file
              *   5 - directory i_size is not a multiple of the block size
              *   6 - size exceeds the limit for an extent-mapped file
              *   7 - inline-data directory: ext2fs_inline_data_size() failed or
              *       disagrees with i_size
              */
4383         size = EXT2_I_SIZE(inode);
4384         if (pb.is_dir) {
4385                 unsigned nblock = size >> EXT2_BLOCK_SIZE_BITS(fs->super);
4386                 if (inode->i_flags & EXT4_INLINE_DATA_FL) {
4387                         int flags;
4388                         size_t sz = 0;
4389                         errcode_t err;
4390
4391                         flags = ctx->fs->flags;
4392                         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4393                         err = ext2fs_inline_data_size(ctx->fs, pctx->ino,
4394                                                       &sz);
4395                         ctx->fs->flags = (flags &
4396                                           EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4397                                          (ctx->fs->flags &
4398                                           ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4399                         if (err || sz != size) {
4400                                 bad_size = 7;
4401                                 pctx->num = sz;
4402                         }
4403                 } else if (size & (fs->blocksize - 1))
4404                         bad_size = 5;
4405                 else if (nblock > (pb.last_block + 1))
4406                         bad_size = 1;
4407                 else if (nblock < (pb.last_block + 1)) {
4408                         if (((pb.last_block + 1) - nblock) >
4409                             fs->super->s_prealloc_dir_blocks)
4410                                 bad_size = 2;
4411                 }
4412         } else {
4413                 if ((pb.last_init_lblock >= 0) &&
4414                     /* Do not allow initialized allocated blocks past i_size*/
4415                     (size < (__u64)pb.last_init_lblock * fs->blocksize) &&
4416                     !(inode->i_flags & EXT4_VERITY_FL))
4417                         bad_size = 3;
4418                 else if (!(extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4419                          size > ext2_max_sizes[fs->super->s_log_block_size])
4420                         /* too big for a direct/indirect-mapped file */
4421                         bad_size = 4;
4422                 else if ((extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4423                          size >
4424                          ((1ULL << (32 + EXT2_BLOCK_SIZE_BITS(fs->super))) - 1))
4425                         /* too big for an extent-based file - 32bit ee_block */
4426                         bad_size = 6;
4427         }
4428         /* i_size for symlinks is checked elsewhere */
4429         if (bad_size && !LINUX_S_ISLNK(inode->i_mode)) {
4430                 /* Did inline_data set pctx->num earlier? */
4431                 if (bad_size != 7)
4432                         pctx->num = (pb.last_block + 1) * fs->blocksize;
4433                 pctx->group = bad_size;
4434                 if (fix_problem(ctx, PR_1_BAD_I_SIZE, pctx)) {
4435                         ext2fs_inode_size_set(fs, inode, pctx->num);
                             /*
                              * An inline-data inode whose size became 0 loses
                              * both its i_block[] contents and the inline flag.
                              */
4436                         if (EXT2_I_SIZE(inode) == 0 &&
4437                             (inode->i_flags & EXT4_INLINE_DATA_FL)) {
4438                                 memset(inode->i_block, 0,
4439                                        sizeof(inode->i_block));
4440                                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
4441                         }
4442                         dirty_inode++;
4443                 }
4444                 pctx->num = 0;
4445         }
4446         if (LINUX_S_ISREG(inode->i_mode) &&
4447             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
4448                 ctx->large_files++;
             /*
              * i_blocks check (not done for Hurd-created filesystems): the
              * computed total must match, and a huge-file inode must not have
              * l_i_blocks_hi set.
              */
4449         if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
4450             ((pb.num_blocks != ext2fs_inode_i_blocks(fs, inode)) ||
4451              (ext2fs_has_feature_huge_file(fs->super) &&
4452               (inode->i_flags & EXT4_HUGE_FILE_FL) &&
4453               (inode->osd2.linux2.l_i_blocks_hi != 0)))) {
4454                 pctx->num = pb.num_blocks;
4455                 if (fix_problem(ctx, PR_1_BAD_I_BLOCKS, pctx)) {
4456                         inode->i_blocks = pb.num_blocks;
4457                         inode->osd2.linux2.l_i_blocks_hi = pb.num_blocks >> 32;
4458                         dirty_inode++;
4459                 }
4460                 pctx->num = 0;
4461         }
4462
4463         /*
4464          * The kernel gets mad if we ask it to allocate bigalloc clusters to
4465          * a block mapped file, so rebuild it as an extent file.  We can skip
4466          * symlinks because they're never rewritten.
4467          */
4468         if (ext2fs_has_feature_bigalloc(fs->super) &&
4469             (LINUX_S_ISREG(inode->i_mode) || LINUX_S_ISDIR(inode->i_mode)) &&
4470             ext2fs_inode_data_blocks2(fs, inode) > 0 &&
4471             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INO(fs->super)) &&
4472             !(inode->i_flags & (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)) &&
4473             fix_problem(ctx, PR_1_NO_BIGALLOC_BLOCKMAP_FILES, pctx)) {
4474                 pctx->errcode = e2fsck_rebuild_extents_later(ctx, ino);
4475                 if (pctx->errcode)
4476                         goto out;
4477         }
4478
             /*
              * When ctx->dirs_to_hash is set, queue un-indexed directories of
              * at least three blocks for rehashing; lost+found is excluded.
              */
4479         if (ctx->dirs_to_hash && pb.is_dir &&
4480             !(ctx->lost_and_found && ctx->lost_and_found == ino) &&
4481             !(inode->i_flags & EXT2_INDEX_FL) &&
4482             ((inode->i_size / fs->blocksize) >= 3))
4483                 e2fsck_rehash_dir_later(ctx, ino);
4484
4485 out:
             /* Flush the in-memory inode if anything above modified it. */
4486         if (dirty_inode)
4487                 e2fsck_write_inode(ctx, ino, inode, "check_blocks");
4488 }
4489
#if 0
/*
 * Helper function called by process block when an illegal block is
 * found.  It returns a description about why the block is illegal.
 *
 * This code is currently compiled out.  The returned string lives in a
 * static buffer, so it is overwritten by the next call.
 *
 * 64-bit block numbers are printed with %llu and an explicit cast, the
 * same convention used by the other debug output in this file.
 */
static char *describe_illegal_block(ext2_filsys fs, blk64_t block)
{
	blk64_t	super;
	int	i;
	static char	problem[80];

	super = fs->super->s_first_data_block;
	strcpy(problem, "PROGRAMMING ERROR: Unknown reason for illegal block");
	if (block < super) {
		snprintf(problem, sizeof(problem), "< FIRSTBLOCK (%llu)",
			 (unsigned long long) super);
		return problem;
	} else if (block >= ext2fs_blocks_count(fs->super)) {
		snprintf(problem, sizeof(problem), "> BLOCKS (%llu)",
			 (unsigned long long) ext2fs_blocks_count(fs->super));
		return problem;
	}
	/* Walk the groups; "super" tracks the first block of group i. */
	for (i = 0; i < fs->group_desc_count; i++) {
		if (block == super) {
			snprintf(problem, sizeof(problem),
				 "is the superblock in group %d", i);
			break;
		}
		if (block > super &&
		    block <= (super + fs->desc_blocks)) {
			snprintf(problem, sizeof(problem),
				 "is in the group descriptors "
				 "of group %d", i);
			break;
		}
		if (block == ext2fs_block_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the block bitmap of group %d", i);
			break;
		}
		if (block == ext2fs_inode_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the inode bitmap of group %d", i);
			break;
		}
		if (block >= ext2fs_inode_table_loc(fs, i) &&
		    (block < ext2fs_inode_table_loc(fs, i)
		     + fs->inode_blocks_per_group)) {
			snprintf(problem, sizeof(problem),
				 "is in the inode table of group %d", i);
			break;
		}
		super += fs->super->s_blocks_per_group;
	}
	return problem;
}
#endif
4541
4542 /*
4543  * This is a helper function for check_blocks().
4544  */
4545 static int process_block(ext2_filsys fs,
4546                   blk64_t       *block_nr,
4547                   e2_blkcnt_t blockcnt,
4548                   blk64_t ref_block EXT2FS_ATTR((unused)),
4549                   int ref_offset EXT2FS_ATTR((unused)),
4550                   void *priv_data)
4551 {
4552         struct process_block_struct *p;
4553         struct problem_context *pctx;
4554         blk64_t blk = *block_nr;
4555         int     ret_code = 0;
4556         problem_t       problem = 0;
4557         e2fsck_t        ctx;
4558
4559         p = (struct process_block_struct *) priv_data;
4560         pctx = p->pctx;
4561         ctx = p->ctx;
4562
4563         /*
4564          * For a directory, add logical block zero for processing even if it's
4565          * not mapped or we'll be perennially stuck with broken "." and ".."
4566          * entries.
4567          */
4568         if (p->is_dir && blockcnt == 0 && blk == 0) {
4569                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino, 0, 0);
4570                 if (pctx->errcode) {
4571                         pctx->blk = blk;
4572                         pctx->num = blockcnt;
4573                         goto failed_add_dir_block;
4574                 }
4575                 p->last_db_block++;
4576         }
4577
4578         if (blk == 0)
4579                 return 0;
4580
4581 #if 0
4582         printf("Process_block, inode %lu, block %u, #%d\n", p->ino, blk,
4583                blockcnt);
4584 #endif
4585
4586         /*
4587          * Simplistic fragmentation check.  We merely require that the
4588          * file be contiguous.  (Which can never be true for really
4589          * big files that are greater than a block group.)
4590          */
4591         if (p->previous_block && p->ino != EXT2_RESIZE_INO) {
4592                 if (p->previous_block+1 != blk) {
4593                         if (ctx->options & E2F_OPT_FRAGCHECK) {
4594                                 char type = '?';
4595
4596                                 if (p->is_dir)
4597                                         type = 'd';
4598                                 else if (p->is_reg)
4599                                         type = 'f';
4600
4601                                 printf(_("%6lu(%c): expecting %6lu "
4602                                          "got phys %6lu (blkcnt %lld)\n"),
4603                                        (unsigned long) pctx->ino, type,
4604                                        (unsigned long) p->previous_block+1,
4605                                        (unsigned long) blk,
4606                                        (long long) blockcnt);
4607                         }
4608                         p->fragmented = 1;
4609                 }
4610         }
4611
4612         if (p->is_dir && !ext2fs_has_feature_largedir(fs->super) &&
4613             !pctx->inode->i_size_high &&
4614             blockcnt > (1 << (21 - fs->super->s_log_block_size)))
4615                 problem = PR_1_TOOBIG_DIR;
4616         if (p->is_dir && p->num_blocks + 1 >= p->max_blocks)
4617                 problem = PR_1_TOOBIG_DIR;
4618         if (p->is_reg && p->num_blocks + 1 >= p->max_blocks)
4619                 problem = PR_1_TOOBIG_REG;
4620         if (!p->is_dir && !p->is_reg && blockcnt > 0)
4621                 problem = PR_1_TOOBIG_SYMLINK;
4622
4623         if (blk < fs->super->s_first_data_block ||
4624             blk >= ext2fs_blocks_count(fs->super))
4625                 problem = PR_1_ILLEGAL_BLOCK_NUM;
4626
4627         /*
4628          * If this IND/DIND/TIND block is squatting atop some critical metadata
4629          * (group descriptors, superblock, bitmap, inode table), any write to
4630          * "fix" mapping problems will destroy the metadata.  We'll let pass 1b
4631          * fix that and restart fsck.
4632          */
4633         if (blockcnt < 0 &&
4634             p->ino != EXT2_RESIZE_INO &&
4635             blk < ctx->fs->super->s_blocks_count &&
4636             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk)) {
4637                 pctx->blk = blk;
4638                 fix_problem(ctx, PR_1_CRITICAL_METADATA_COLLISION, pctx);
4639                 if ((ctx->options & E2F_OPT_NO) == 0)
4640                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4641         }
4642
4643         if (problem) {
4644                 p->num_illegal_blocks++;
4645                 /*
4646                  * A bit of subterfuge here -- we're trying to fix a block
4647                  * mapping, but the IND/DIND/TIND block could have collided
4648                  * with some critical metadata.  So, fix the in-core mapping so
4649                  * iterate won't go insane, but return 0 instead of
4650                  * BLOCK_CHANGED so that it won't write the remapping out to
4651                  * our multiply linked block.
4652                  *
4653                  * Even if we previously determined that an *IND block
4654                  * conflicts with critical metadata, we must still try to
4655                  * iterate the *IND block as if it is an *IND block to find and
4656                  * mark the blocks it points to.  Better to be overly cautious
4657                  * with the used_blocks map so that we don't move the *IND
4658                  * block to a block that's really in use!
4659                  */
4660                 if (p->ino != EXT2_RESIZE_INO &&
4661                     ref_block != 0 &&
4662                     ext2fs_test_block_bitmap2(ctx->block_metadata_map,
4663                                               ref_block)) {
4664                         *block_nr = 0;
4665                         return 0;
4666                 }
4667                 if (!p->suppress && (p->num_illegal_blocks % 12) == 0) {
4668                         if (fix_problem(ctx, PR_1_TOO_MANY_BAD_BLOCKS, pctx)) {
4669                                 p->clear = 1;
4670                                 return BLOCK_ABORT;
4671                         }
4672                         if (fix_problem(ctx, PR_1_SUPPRESS_MESSAGES, pctx)) {
4673                                 p->suppress = 1;
4674                                 set_latch_flags(PR_LATCH_BLOCK,
4675                                                 PRL_SUPPRESS, 0);
4676                         }
4677                 }
4678                 pctx->blk = blk;
4679                 pctx->blkcount = blockcnt;
4680                 if (fix_problem(ctx, problem, pctx)) {
4681                         blk = *block_nr = 0;
4682                         ret_code = BLOCK_CHANGED;
4683                         p->inode_modified = 1;
4684                         /*
4685                          * If the directory block is too big and is beyond the
4686                          * end of the FS, don't bother trying to add it for
4687                          * processing -- the kernel would never have created a
4688                          * directory this large, and we risk an ENOMEM abort.
4689                          * In any case, the toobig handler for extent-based
4690                          * directories also doesn't feed toobig blocks to
4691                          * pass 2.
4692                          */
4693                         if (problem == PR_1_TOOBIG_DIR)
4694                                 return ret_code;
4695                         goto mark_dir;
4696                 } else
4697                         return 0;
4698         }
4699
4700         if (p->ino == EXT2_RESIZE_INO) {
4701                 /*
4702                  * The resize inode has already be sanity checked
4703                  * during pass #0 (the superblock checks).  All we
4704                  * have to do is mark the double indirect block as
4705                  * being in use; all of the other blocks are handled
4706                  * by mark_table_blocks()).
4707                  */
4708                 if (blockcnt == BLOCK_COUNT_DIND)
4709                         mark_block_used(ctx, blk);
4710                 p->num_blocks++;
4711         } else if (!(ctx->fs->cluster_ratio_bits &&
4712                      p->previous_block &&
4713                      (EXT2FS_B2C(ctx->fs, blk) ==
4714                       EXT2FS_B2C(ctx->fs, p->previous_block)) &&
4715                      (blk & EXT2FS_CLUSTER_MASK(ctx->fs)) ==
4716                      ((unsigned) blockcnt & EXT2FS_CLUSTER_MASK(ctx->fs)))) {
4717                 mark_block_used(ctx, blk);
4718                 p->num_blocks++;
4719         } else if (has_unaligned_cluster_map(ctx, p->previous_block,
4720                                              p->last_block, blk, blockcnt)) {
4721                 pctx->blk = blockcnt;
4722                 pctx->blk2 = blk;
4723                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4724                 mark_block_used(ctx, blk);
4725                 mark_block_used(ctx, blk);
4726         }
4727         if (blockcnt >= 0)
4728                 p->last_block = blockcnt;
4729         p->previous_block = blk;
4730 mark_dir:
4731         if (p->is_dir && (blockcnt >= 0)) {
4732                 while (++p->last_db_block < blockcnt) {
4733                         pctx->errcode = ext2fs_add_dir_block2(fs->dblist,
4734                                                               p->ino, 0,
4735                                                               p->last_db_block);
4736                         if (pctx->errcode) {
4737                                 pctx->blk = 0;
4738                                 pctx->num = p->last_db_block;
4739                                 goto failed_add_dir_block;
4740                         }
4741                 }
4742                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino,
4743                                                       blk, blockcnt);
4744                 if (pctx->errcode) {
4745                         pctx->blk = blk;
4746                         pctx->num = blockcnt;
4747                 failed_add_dir_block:
4748                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4749                         /* Should never get here */
4750                         ctx->flags |= E2F_FLAG_ABORT;
4751                         return BLOCK_ABORT;
4752                 }
4753         }
4754         return ret_code;
4755 }
4756
4757 static int process_bad_block(ext2_filsys fs,
4758                       blk64_t *block_nr,
4759                       e2_blkcnt_t blockcnt,
4760                       blk64_t ref_block EXT2FS_ATTR((unused)),
4761                       int ref_offset EXT2FS_ATTR((unused)),
4762                       void *priv_data)
4763 {
4764         struct process_block_struct *p;
4765         blk64_t         blk = *block_nr;
4766         blk64_t         first_block;
4767         dgrp_t          i;
4768         struct problem_context *pctx;
4769         e2fsck_t        ctx;
4770
4771         if (!blk)
4772                 return 0;
4773
4774         p = (struct process_block_struct *) priv_data;
4775         ctx = p->ctx;
4776         pctx = p->pctx;
4777
4778         pctx->ino = EXT2_BAD_INO;
4779         pctx->blk = blk;
4780         pctx->blkcount = blockcnt;
4781
4782         if ((blk < fs->super->s_first_data_block) ||
4783             (blk >= ext2fs_blocks_count(fs->super))) {
4784                 if (fix_problem(ctx, PR_1_BB_ILLEGAL_BLOCK_NUM, pctx)) {
4785                         *block_nr = 0;
4786                         return BLOCK_CHANGED;
4787                 } else
4788                         return 0;
4789         }
4790
4791         if (blockcnt < 0) {
4792                 if (ext2fs_test_block_bitmap2(p->fs_meta_blocks, blk)) {
4793                         p->bbcheck = 1;
4794                         if (fix_problem(ctx, PR_1_BB_FS_BLOCK, pctx)) {
4795                                 *block_nr = 0;
4796                                 return BLOCK_CHANGED;
4797                         }
4798                 } else if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4799                                                     blk)) {
4800                         p->bbcheck = 1;
4801                         if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK,
4802                                         pctx)) {
4803                                 *block_nr = 0;
4804                                 return BLOCK_CHANGED;
4805                         }
4806                         if (e2fsck_should_abort(ctx))
4807                                 return BLOCK_ABORT;
4808                 } else
4809                         mark_block_used(ctx, blk);
4810                 return 0;
4811         }
4812 #if 0
4813         printf ("DEBUG: Marking %u as bad.\n", blk);
4814 #endif
4815         ctx->fs_badblocks_count++;
4816         /*
4817          * If the block is not used, then mark it as used and return.
4818          * If it is already marked as found, this must mean that
4819          * there's an overlap between the filesystem table blocks
4820          * (bitmaps and inode table) and the bad block list.
4821          */
4822         if (!ext2fs_test_block_bitmap2(ctx->block_found_map, blk)) {
4823                 ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
4824                 return 0;
4825         }
4826         /*
4827          * Try to find the where the filesystem block was used...
4828          */
4829         first_block = fs->super->s_first_data_block;
4830
4831         for (i = 0; i < fs->group_desc_count; i++ ) {
4832                 pctx->group = i;
4833                 pctx->blk = blk;
4834                 if (!ext2fs_bg_has_super(fs, i))
4835                         goto skip_super;
4836                 if (blk == first_block) {
4837                         if (i == 0) {
4838                                 if (fix_problem(ctx,
4839                                                 PR_1_BAD_PRIMARY_SUPERBLOCK,
4840                                                 pctx)) {
4841                                         *block_nr = 0;
4842                                         return BLOCK_CHANGED;
4843                                 }
4844                                 return 0;
4845                         }
4846                         fix_problem(ctx, PR_1_BAD_SUPERBLOCK, pctx);
4847                         return 0;
4848                 }
4849                 if ((blk > first_block) &&
4850                     (blk <= first_block + fs->desc_blocks)) {
4851                         if (i == 0) {
4852                                 pctx->blk = *block_nr;
4853                                 if (fix_problem(ctx,
4854                         PR_1_BAD_PRIMARY_GROUP_DESCRIPTOR, pctx)) {
4855                                         *block_nr = 0;
4856                                         return BLOCK_CHANGED;
4857                                 }
4858                                 return 0;
4859                         }
4860                         fix_problem(ctx, PR_1_BAD_GROUP_DESCRIPTORS, pctx);
4861                         return 0;
4862                 }
4863         skip_super:
4864                 if (blk == ext2fs_block_bitmap_loc(fs, i)) {
4865                         if (fix_problem(ctx, PR_1_BB_BAD_BLOCK, pctx)) {
4866                                 ctx->invalid_block_bitmap_flag[i]++;
4867                                 ctx->invalid_bitmaps++;
4868                         }
4869                         return 0;
4870                 }
4871                 if (blk == ext2fs_inode_bitmap_loc(fs, i)) {
4872                         if (fix_problem(ctx, PR_1_IB_BAD_BLOCK, pctx)) {
4873                                 ctx->invalid_inode_bitmap_flag[i]++;
4874                                 ctx->invalid_bitmaps++;
4875                         }
4876                         return 0;
4877                 }
4878                 if ((blk >= ext2fs_inode_table_loc(fs, i)) &&
4879                     (blk < (ext2fs_inode_table_loc(fs, i) +
4880                             fs->inode_blocks_per_group))) {
4881                         /*
4882                          * If there are bad blocks in the inode table,
4883                          * the inode scan code will try to do
4884                          * something reasonable automatically.
4885                          */
4886                         return 0;
4887                 }
4888                 first_block += fs->super->s_blocks_per_group;
4889         }
4890         /*
4891          * If we've gotten to this point, then the only
4892          * possibility is that the bad block inode meta data
4893          * is using a bad block.
4894          */
4895         if ((blk == p->inode->i_block[EXT2_IND_BLOCK]) ||
4896             (blk == p->inode->i_block[EXT2_DIND_BLOCK]) ||
4897             (blk == p->inode->i_block[EXT2_TIND_BLOCK])) {
4898                 p->bbcheck = 1;
4899                 if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK, pctx)) {
4900                         *block_nr = 0;
4901                         return BLOCK_CHANGED;
4902                 }
4903                 if (e2fsck_should_abort(ctx))
4904                         return BLOCK_ABORT;
4905                 return 0;
4906         }
4907
4908         pctx->group = -1;
4909
4910         /* Warn user that the block wasn't claimed */
4911         fix_problem(ctx, PR_1_PROGERR_CLAIMED_BLOCK, pctx);
4912
4913         return 0;
4914 }
4915
4916 static void new_table_block(e2fsck_t ctx, blk64_t first_block, dgrp_t group,
4917                             const char *name, int num, blk64_t *new_block)
4918 {
4919         ext2_filsys fs = ctx->fs;
4920         dgrp_t          last_grp;
4921         blk64_t         old_block = *new_block;
4922         blk64_t         last_block;
4923         dgrp_t          flexbg;
4924         unsigned        flexbg_size;
4925         int             i, is_flexbg;
4926         char            *buf;
4927         struct problem_context  pctx;
4928
4929         clear_problem_context(&pctx);
4930
4931         pctx.group = group;
4932         pctx.blk = old_block;
4933         pctx.str = name;
4934
4935         /*
4936          * For flex_bg filesystems, first try to allocate the metadata
4937          * within the flex_bg, and if that fails then try finding the
4938          * space anywhere in the filesystem.
4939          */
4940         is_flexbg = ext2fs_has_feature_flex_bg(fs->super);
4941         if (is_flexbg) {
4942                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
4943                 flexbg = group / flexbg_size;
4944                 first_block = ext2fs_group_first_block2(fs,
4945                                                         flexbg_size * flexbg);
4946                 last_grp = group | (flexbg_size - 1);
4947                 if (last_grp >= fs->group_desc_count)
4948                         last_grp = fs->group_desc_count - 1;
4949                 last_block = ext2fs_group_last_block2(fs, last_grp);
4950         } else
4951                 last_block = ext2fs_group_last_block2(fs, group);
4952         pctx.errcode = ext2fs_get_free_blocks2(fs, first_block, last_block,
4953                                                num, ctx->block_found_map,
4954                                                new_block);
4955         if (is_flexbg && (pctx.errcode == EXT2_ET_BLOCK_ALLOC_FAIL))
4956                 pctx.errcode = ext2fs_get_free_blocks2(fs,
4957                                 fs->super->s_first_data_block,
4958                                 ext2fs_blocks_count(fs->super),
4959                                 num, ctx->block_found_map, new_block);
4960         if (pctx.errcode) {
4961                 pctx.num = num;
4962                 fix_problem(ctx, PR_1_RELOC_BLOCK_ALLOCATE, &pctx);
4963                 ext2fs_unmark_valid(fs);
4964                 ctx->flags |= E2F_FLAG_ABORT;
4965                 return;
4966         }
4967         pctx.errcode = ext2fs_get_mem(fs->blocksize, &buf);
4968         if (pctx.errcode) {
4969                 fix_problem(ctx, PR_1_RELOC_MEMORY_ALLOCATE, &pctx);
4970                 ext2fs_unmark_valid(fs);
4971                 ctx->flags |= E2F_FLAG_ABORT;
4972                 return;
4973         }
4974         ext2fs_mark_super_dirty(fs);
4975         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
4976         pctx.blk2 = *new_block;
4977         fix_problem(ctx, (old_block ? PR_1_RELOC_FROM_TO :
4978                           PR_1_RELOC_TO), &pctx);
4979         pctx.blk2 = 0;
4980         for (i = 0; i < num; i++) {
4981                 pctx.blk = i;
4982                 ext2fs_mark_block_bitmap2(ctx->block_found_map, (*new_block)+i);
4983                 if (old_block) {
4984                         pctx.errcode = io_channel_read_blk64(fs->io,
4985                                    old_block + i, 1, buf);
4986                         if (pctx.errcode)
4987                                 fix_problem(ctx, PR_1_RELOC_READ_ERR, &pctx);
4988                         pctx.blk = (*new_block) + i;
4989                         pctx.errcode = io_channel_write_blk64(fs->io, pctx.blk,
4990                                                               1, buf);
4991                 } else {
4992                         pctx.blk = (*new_block) + i;
4993                         pctx.errcode = ext2fs_zero_blocks2(fs, pctx.blk, 1,
4994                                                            NULL, NULL);
4995                 }
4996
4997                 if (pctx.errcode)
4998                         fix_problem(ctx, PR_1_RELOC_WRITE_ERR, &pctx);
4999         }
5000         ext2fs_free_mem(&buf);
5001 }
5002
5003 /*
5004  * This routine gets called at the end of pass 1 if bad blocks are
5005  * detected in the superblock, group descriptors, inode_bitmaps, or
5006  * block bitmaps.  At this point, all of the blocks have been mapped
5007  * out, so we can try to allocate new block(s) to replace the bad
5008  * blocks.
5009  */
5010 static void handle_fs_bad_blocks(e2fsck_t ctx)
5011 {
5012         ext2_filsys fs = ctx->fs;
5013         dgrp_t          i;
5014         blk64_t         first_block;
5015         blk64_t         new_blk;
5016
5017         for (i = 0; i < fs->group_desc_count; i++) {
5018                 first_block = ext2fs_group_first_block2(fs, i);
5019
5020                 if (ctx->invalid_block_bitmap_flag[i]) {
5021                         new_blk = ext2fs_block_bitmap_loc(fs, i);
5022                         new_table_block(ctx, first_block, i, _("block bitmap"),
5023                                         1, &new_blk);
5024                         ext2fs_block_bitmap_loc_set(fs, i, new_blk);
5025                 }
5026                 if (ctx->invalid_inode_bitmap_flag[i]) {
5027                         new_blk = ext2fs_inode_bitmap_loc(fs, i);
5028                         new_table_block(ctx, first_block, i, _("inode bitmap"),
5029                                         1, &new_blk);
5030                         ext2fs_inode_bitmap_loc_set(fs, i, new_blk);
5031                 }
5032                 if (ctx->invalid_inode_table_flag[i]) {
5033                         new_blk = ext2fs_inode_table_loc(fs, i);
5034                         new_table_block(ctx, first_block, i, _("inode table"),
5035                                         fs->inode_blocks_per_group,
5036                                         &new_blk);
5037                         ext2fs_inode_table_loc_set(fs, i, new_blk);
5038                         ctx->flags |= E2F_FLAG_RESTART;
5039                 }
5040         }
5041         ctx->invalid_bitmaps = 0;
5042 }
5043
5044 /*
5045  * This routine marks all blocks which are used by the superblock,
5046  * group descriptors, inode bitmaps, and block bitmaps.
5047  */
5048 static void mark_table_blocks(e2fsck_t ctx)
5049 {
5050         ext2_filsys fs = ctx->fs;
5051         blk64_t b;
5052         dgrp_t  i;
5053         unsigned int    j;
5054         struct problem_context pctx;
5055
5056         clear_problem_context(&pctx);
5057
5058         for (i = 0; i < fs->group_desc_count; i++) {
5059                 pctx.group = i;
5060
5061                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_found_map);
5062                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_metadata_map);
5063
5064                 /*
5065                  * Mark the blocks used for the inode table
5066                  */
5067                 if (ext2fs_inode_table_loc(fs, i)) {
5068                         for (j = 0, b = ext2fs_inode_table_loc(fs, i);
5069                              j < fs->inode_blocks_per_group;
5070                              j++, b++) {
5071                                 if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5072                                                              b)) {
5073                                         pctx.blk = b;
5074                                         if (!ctx->invalid_inode_table_flag[i] &&
5075                                             fix_problem(ctx,
5076                                                 PR_1_ITABLE_CONFLICT, &pctx)) {
5077                                                 ctx->invalid_inode_table_flag[i]++;
5078                                                 ctx->invalid_bitmaps++;
5079                                         }
5080                                 } else {
5081                                     ext2fs_mark_block_bitmap2(
5082                                                 ctx->block_found_map, b);
5083                                     ext2fs_mark_block_bitmap2(
5084                                                 ctx->block_metadata_map, b);
5085                                 }
5086                         }
5087                 }
5088
5089                 /*
5090                  * Mark block used for the block bitmap
5091                  */
5092                 if (ext2fs_block_bitmap_loc(fs, i)) {
5093                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5094                                      ext2fs_block_bitmap_loc(fs, i))) {
5095                                 pctx.blk = ext2fs_block_bitmap_loc(fs, i);
5096                                 if (fix_problem(ctx, PR_1_BB_CONFLICT, &pctx)) {
5097                                         ctx->invalid_block_bitmap_flag[i]++;
5098                                         ctx->invalid_bitmaps++;
5099                                 }
5100                         } else {
5101                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5102                                      ext2fs_block_bitmap_loc(fs, i));
5103                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5104                                      ext2fs_block_bitmap_loc(fs, i));
5105                         }
5106                 }
5107                 /*
5108                  * Mark block used for the inode bitmap
5109                  */
5110                 if (ext2fs_inode_bitmap_loc(fs, i)) {
5111                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5112                                      ext2fs_inode_bitmap_loc(fs, i))) {
5113                                 pctx.blk = ext2fs_inode_bitmap_loc(fs, i);
5114                                 if (fix_problem(ctx, PR_1_IB_CONFLICT, &pctx)) {
5115                                         ctx->invalid_inode_bitmap_flag[i]++;
5116                                         ctx->invalid_bitmaps++;
5117                                 }
5118                         } else {
5119                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5120                                      ext2fs_inode_bitmap_loc(fs, i));
5121                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5122                                      ext2fs_inode_bitmap_loc(fs, i));
5123                         }
5124                 }
5125         }
5126 }
5127
/*
 * These subroutines short-circuit ext2fs_get_blocks and
 * ext2fs_check_directory; we use them since we already have the inode
 * structure, so there's no point in letting the ext2fs library read
 * the inode again.
 */
5134 static errcode_t pass1_get_blocks(ext2_filsys fs, ext2_ino_t ino,
5135                                   blk_t *blocks)
5136 {
5137         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5138         int     i;
5139
5140         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5141                 return EXT2_ET_CALLBACK_NOTHANDLED;
5142
5143         for (i=0; i < EXT2_N_BLOCKS; i++)
5144                 blocks[i] = ctx->stashed_inode->i_block[i];
5145         return 0;
5146 }
5147
5148 static errcode_t pass1_read_inode(ext2_filsys fs, ext2_ino_t ino,
5149                                   struct ext2_inode *inode)
5150 {
5151         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5152
5153         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5154                 return EXT2_ET_CALLBACK_NOTHANDLED;
5155         *inode = *ctx->stashed_inode;
5156         return 0;
5157 }
5158
5159 static errcode_t pass1_write_inode(ext2_filsys fs, ext2_ino_t ino,
5160                             struct ext2_inode *inode)
5161 {
5162         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5163
5164         if ((ino == ctx->stashed_ino) && ctx->stashed_inode &&
5165                 (inode != ctx->stashed_inode))
5166                 *ctx->stashed_inode = *inode;
5167         return EXT2_ET_CALLBACK_NOTHANDLED;
5168 }
5169
5170 static errcode_t pass1_check_directory(ext2_filsys fs, ext2_ino_t ino)
5171 {
5172         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5173
5174         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5175                 return EXT2_ET_CALLBACK_NOTHANDLED;
5176
5177         if (!LINUX_S_ISDIR(ctx->stashed_inode->i_mode))
5178                 return EXT2_ET_NO_DIRECTORY;
5179         return 0;
5180 }
5181
5182 static errcode_t e2fsck_get_alloc_block(ext2_filsys fs, blk64_t goal,
5183                                         blk64_t *ret)
5184 {
5185         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5186         errcode_t       retval;
5187         blk64_t         new_block;
5188
5189         if (ctx->block_found_map) {
5190                 retval = ext2fs_new_block2(fs, goal, ctx->block_found_map,
5191                                            &new_block);
5192                 if (retval)
5193                         return retval;
5194                 if (fs->block_map) {
5195                         ext2fs_mark_block_bitmap2(fs->block_map, new_block);
5196                         ext2fs_mark_bb_dirty(fs);
5197                 }
5198         } else {
5199                 if (!fs->block_map) {
5200                         retval = ext2fs_read_block_bitmap(fs);
5201                         if (retval)
5202                                 return retval;
5203                 }
5204
5205                 retval = ext2fs_new_block2(fs, goal, fs->block_map, &new_block);
5206                 if (retval)
5207                         return retval;
5208         }
5209
5210         *ret = new_block;
5211         return (0);
5212 }
5213
5214 static errcode_t e2fsck_new_range(ext2_filsys fs, int flags, blk64_t goal,
5215                                   blk64_t len, blk64_t *pblk, blk64_t *plen)
5216 {
5217         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5218         errcode_t       retval;
5219
5220         if (ctx->block_found_map)
5221                 return ext2fs_new_range(fs, flags, goal, len,
5222                                         ctx->block_found_map, pblk, plen);
5223
5224         if (!fs->block_map) {
5225                 retval = ext2fs_read_block_bitmap(fs);
5226                 if (retval)
5227                         return retval;
5228         }
5229
5230         return ext2fs_new_range(fs, flags, goal, len, fs->block_map,
5231                                 pblk, plen);
5232 }
5233
5234 static void e2fsck_block_alloc_stats(ext2_filsys fs, blk64_t blk, int inuse)
5235 {
5236         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5237
5238         /* Never free a critical metadata block */
5239         if (ctx->block_found_map &&
5240             ctx->block_metadata_map &&
5241             inuse < 0 &&
5242             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk))
5243                 return;
5244
5245         if (ctx->block_found_map) {
5246                 if (inuse > 0)
5247                         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5248                 else
5249                         ext2fs_unmark_block_bitmap2(ctx->block_found_map, blk);
5250         }
5251 }
5252
5253 static void e2fsck_block_alloc_stats_range(ext2_filsys fs, blk64_t blk,
5254                                            blk_t num, int inuse)
5255 {
5256         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5257
5258         /* Never free a critical metadata block */
5259         if (ctx->block_found_map &&
5260             ctx->block_metadata_map &&
5261             inuse < 0 &&
5262             ext2fs_test_block_bitmap_range2(ctx->block_metadata_map, blk, num))
5263                 return;
5264
5265         if (ctx->block_found_map) {
5266                 if (inuse > 0)
5267                         ext2fs_mark_block_bitmap_range2(ctx->block_found_map,
5268                                                         blk, num);
5269                 else
5270                         ext2fs_unmark_block_bitmap_range2(ctx->block_found_map,
5271                                                         blk, num);
5272         }
5273 }
5274
5275 void e2fsck_use_inode_shortcuts(e2fsck_t ctx, int use_shortcuts)
5276 {
5277         ext2_filsys fs = ctx->fs;
5278
5279         if (use_shortcuts) {
5280                 fs->get_blocks = pass1_get_blocks;
5281                 fs->check_directory = pass1_check_directory;
5282                 fs->read_inode = pass1_read_inode;
5283                 fs->write_inode = pass1_write_inode;
5284                 ctx->stashed_ino = 0;
5285         } else {
5286                 fs->get_blocks = 0;
5287                 fs->check_directory = 0;
5288                 fs->read_inode = 0;
5289                 fs->write_inode = 0;
5290         }
5291 }
5292
5293 void e2fsck_intercept_block_allocations(e2fsck_t ctx)
5294 {
5295         ext2fs_set_alloc_block_callback(ctx->fs, e2fsck_get_alloc_block, 0);
5296         ext2fs_set_block_alloc_stats_callback(ctx->fs,
5297                                                 e2fsck_block_alloc_stats, 0);
5298         ext2fs_set_new_range_callback(ctx->fs, e2fsck_new_range, NULL);
5299         ext2fs_set_block_alloc_stats_range_callback(ctx->fs,
5300                                         e2fsck_block_alloc_stats_range, NULL);
5301 }