Whamcloud - gitweb
LU-14953 e2fsck: pfsck progress report
[tools/e2fsprogs.git] / e2fsck / pass1.c
1 /*
2  * pass1.c -- pass #1 of e2fsck: sequential scan of the inode table
3  *
4  * Copyright (C) 1993, 1994, 1995, 1996, 1997 Theodore Ts'o.
5  *
6  * %Begin-Header%
7  * This file may be redistributed under the terms of the GNU Public
8  * License.
9  * %End-Header%
10  *
11  * Pass 1 of e2fsck iterates over all the inodes in the filesystems,
12  * and applies the following tests to each inode:
13  *
14  *      - The mode field of the inode must be legal.
15  *      - The size and block count fields of the inode are correct.
16  *      - A data block must not be used by another inode
17  *
18  * Pass 1 also collects the following information:
19  *
20  *      - A bitmap of which inodes are in use.          (inode_used_map)
21  *      - A bitmap of which inodes are directories.     (inode_dir_map)
22  *      - A bitmap of which inodes are regular files.   (inode_reg_map)
23  *      - A bitmap of which inodes have bad fields.     (inode_bad_map)
24  *      - A bitmap of which inodes are in bad blocks.   (inode_bb_map)
25  *      - A bitmap of which inodes are imagic inodes.   (inode_imagic_map)
26  *      - A bitmap of which inodes are casefolded.      (inode_casefold_map)
27  *      - A bitmap of which blocks are in use.          (block_found_map)
28  *      - A bitmap of which blocks are in use by two inodes     (block_dup_map)
29  *      - The data blocks of the directory inodes.      (dir_map)
30  *      - Ref counts for ea_inodes.                     (ea_inode_refs)
31  *      - The encryption policy ID of each encrypted inode. (encrypted_files)
32  *
33  * Pass 1 is designed to stash away enough information so that the
34  * other passes should not need to read in the inode information
35  * during the normal course of a filesystem check.  (Although if an
36  * inconsistency is detected, other passes may need to read in an
37  * inode to fix it.)
38  *
39  * Note that pass 1B will be invoked if there are any duplicate blocks
40  * found.
41  */
42
43 #define _GNU_SOURCE 1 /* get strnlen() */
44 #include "config.h"
45 #include <string.h>
46 #include <time.h>
47 #ifdef HAVE_ERRNO_H
48 #include <errno.h>
49 #endif
50 #include <assert.h>
51 #ifdef HAVE_PTHREAD
52 #include <pthread.h>
53 #endif
54
55 #include "e2fsck.h"
56 #include <ext2fs/ext2_ext_attr.h>
57 /* todo remove this finally */
58 #include <ext2fs/ext2fsP.h>
59 #include <e2p/e2p.h>
60
61 #include "problem.h"
62
63 #ifdef NO_INLINE_FUNCS
64 #define _INLINE_
65 #else
66 #define _INLINE_ inline
67 #endif
68
69 #undef DEBUG
70
71 struct ea_quota {
72         blk64_t blocks;
73         __u64 inodes;
74 };
75
76 static int process_block(ext2_filsys fs, blk64_t        *blocknr,
77                          e2_blkcnt_t blockcnt, blk64_t ref_blk,
78                          int ref_offset, void *priv_data);
79 static int process_bad_block(ext2_filsys fs, blk64_t *block_nr,
80                              e2_blkcnt_t blockcnt, blk64_t ref_blk,
81                              int ref_offset, void *priv_data);
82 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
83                          char *block_buf,
84                          const struct ea_quota *ea_ibody_quota);
85 static void mark_table_blocks(e2fsck_t ctx);
86 static void alloc_bb_map(e2fsck_t ctx);
87 static void alloc_imagic_map(e2fsck_t ctx);
88 static void mark_inode_bad(e2fsck_t ctx, ext2_ino_t ino);
89 static void add_casefolded_dir(e2fsck_t ctx, ext2_ino_t ino);
90 static void handle_fs_bad_blocks(e2fsck_t ctx);
91 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b);
92 static errcode_t scan_callback(ext2_filsys fs, ext2_inode_scan scan,
93                                   dgrp_t group, void * priv_data);
94 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
95                                     char *block_buf, int adjust_sign);
96 /* static char *describe_illegal_block(ext2_filsys fs, blk64_t block); */
97
98 struct process_block_struct {
99         ext2_ino_t      ino;
100         unsigned        is_dir:1, is_reg:1, clear:1, suppress:1,
101                                 fragmented:1, compressed:1, bbcheck:1,
102                                 inode_modified:1;
103         blk64_t         num_blocks;
104         blk64_t         max_blocks;
105         blk64_t         last_block;
106         e2_blkcnt_t     last_init_lblock;
107         e2_blkcnt_t     last_db_block;
108         int             num_illegal_blocks;
109         blk64_t         previous_block;
110         struct ext2_inode *inode;
111         struct problem_context *pctx;
112         ext2fs_block_bitmap fs_meta_blocks;
113         e2fsck_t        ctx;
114         blk64_t         next_lblock;
115         struct extent_tree_info eti;
116 };
117
118 struct process_inode_block {
119         ext2_ino_t ino;
120         struct ea_quota ea_ibody_quota;
121         struct ext2_inode_large inode;
122 };
123
124 struct scan_callback_struct {
125         e2fsck_t                         ctx;
126         char                            *block_buf;
127         struct process_inode_block      *inodes_to_process;
128         int                             *process_inode_count;
129 };
130
131 static void process_inodes(e2fsck_t ctx, char *block_buf,
132                            struct process_inode_block *inodes_to_process,
133                            int *process_inode_count);
134
135 static __u64 ext2_max_sizes[EXT2_MAX_BLOCK_LOG_SIZE -
136                             EXT2_MIN_BLOCK_LOG_SIZE + 1];
137
138 /*
139  * Check to make sure a device inode is real.  Returns 1 if the device
140  * checks out, 0 if not.
141  *
142  * Note: this routine is now also used to check FIFO's and Sockets,
143  * since they have the same requirement; the i_block fields should be
144  * zero.
145  */
146 int e2fsck_pass1_check_device_inode(ext2_filsys fs EXT2FS_ATTR((unused)),
147                                     struct ext2_inode *inode)
148 {
149         int     i;
150
151         /*
152          * If the index or extents flag is set, then this is a bogus
153          * device/fifo/socket
154          */
155         if (inode->i_flags & (EXT2_INDEX_FL | EXT4_EXTENTS_FL))
156                 return 0;
157
158         /*
159          * We should be able to do the test below all the time, but
160          * because the kernel doesn't forcibly clear the device
161          * inode's additional i_block fields, there are some rare
162          * occasions when a legitimate device inode will have non-zero
163          * additional i_block fields.  So for now, we only complain
164          * when the immutable flag is set, which should never happen
165          * for devices.  (And that's when the problem is caused, since
166          * you can't set or clear immutable flags for devices.)  Once
167          * the kernel has been fixed we can change this...
168          */
169         if (inode->i_flags & (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)) {
170                 for (i=4; i < EXT2_N_BLOCKS; i++)
171                         if (inode->i_block[i])
172                                 return 0;
173         }
174         return 1;
175 }
176
177 /*
178  * Check to make sure a symlink inode is real.  Returns 1 if the symlink
179  * checks out, 0 if not.
180  */
181 int e2fsck_pass1_check_symlink(ext2_filsys fs, ext2_ino_t ino,
182                                struct ext2_inode *inode, char *buf)
183 {
184         unsigned int buflen;
185         unsigned int len;
186
187         if ((inode->i_size_high || inode->i_size == 0) ||
188             (inode->i_flags & EXT2_INDEX_FL))
189                 return 0;
190
191         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
192                 size_t inline_size;
193
194                 if (inode->i_flags & EXT4_EXTENTS_FL)
195                         return 0;
196                 if (ext2fs_inline_data_size(fs, ino, &inline_size))
197                         return 0;
198                 if (inode->i_size != inline_size)
199                         return 0;
200
201                 return 1;
202         }
203
204         if (ext2fs_is_fast_symlink(inode)) {
205                 if (inode->i_flags & EXT4_EXTENTS_FL)
206                         return 0;
207                 buf = (char *)inode->i_block;
208                 buflen = sizeof(inode->i_block);
209         } else {
210                 ext2_extent_handle_t    handle;
211                 struct ext2_extent_info info;
212                 struct ext2fs_extent    extent;
213                 blk64_t blk;
214                 int i;
215
216                 if (inode->i_flags & EXT4_EXTENTS_FL) {
217                         if (ext2fs_extent_open2(fs, ino, inode, &handle))
218                                 return 0;
219                         if (ext2fs_extent_get_info(handle, &info) ||
220                             (info.num_entries != 1) ||
221                             (info.max_depth != 0)) {
222                                 ext2fs_extent_free(handle);
223                                 return 0;
224                         }
225                         if (ext2fs_extent_get(handle, EXT2_EXTENT_ROOT,
226                                               &extent) ||
227                             (extent.e_lblk != 0) ||
228                             (extent.e_len != 1)) {
229                                 ext2fs_extent_free(handle);
230                                 return 0;
231                         }
232                         blk = extent.e_pblk;
233                         ext2fs_extent_free(handle);
234                 } else {
235                         blk = inode->i_block[0];
236
237                         for (i = 1; i < EXT2_N_BLOCKS; i++)
238                                 if (inode->i_block[i])
239                                         return 0;
240                 }
241
242                 if (blk < fs->super->s_first_data_block ||
243                     blk >= ext2fs_blocks_count(fs->super))
244                         return 0;
245
246                 if (io_channel_read_blk64(fs->io, blk, 1, buf))
247                         return 0;
248
249                 buflen = fs->blocksize;
250         }
251
252         if (inode->i_flags & EXT4_ENCRYPT_FL)
253                 len = ext2fs_le16_to_cpu(*(__u16 *)buf) + 2;
254         else
255                 len = strnlen(buf, buflen);
256
257         if (len >= buflen)
258                 return 0;
259
260         if (len != inode->i_size)
261                 return 0;
262         return 1;
263 }
264
265 /*
266  * If the extents or inlinedata flags are set on the inode, offer to clear 'em.
267  */
268 #define BAD_SPECIAL_FLAGS (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)
269 static void check_extents_inlinedata(e2fsck_t ctx,
270                                      struct problem_context *pctx)
271 {
272         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
273                 return;
274
275         if (!fix_problem(ctx, PR_1_SPECIAL_EXTENTS_IDATA, pctx))
276                 return;
277
278         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
279         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
280 }
281 #undef BAD_SPECIAL_FLAGS
282
283 /*
284  * If the immutable (or append-only) flag is set on the inode, offer
285  * to clear it.
286  */
287 #define BAD_SPECIAL_FLAGS (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)
288 static void check_immutable(e2fsck_t ctx, struct problem_context *pctx)
289 {
290         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
291                 return;
292
293         if (!fix_problem(ctx, PR_1_SET_IMMUTABLE, pctx))
294                 return;
295
296         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
297         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
298 }
299
300 /*
301  * If device, fifo or socket, check size is zero -- if not offer to
302  * clear it
303  */
304 static void check_size(e2fsck_t ctx, struct problem_context *pctx)
305 {
306         struct ext2_inode *inode = pctx->inode;
307
308         if (EXT2_I_SIZE(inode) == 0)
309                 return;
310
311         if (!fix_problem(ctx, PR_1_SET_NONZSIZE, pctx))
312                 return;
313
314         ext2fs_inode_size_set(ctx->fs, inode, 0);
315         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
316 }
317
318 /*
319  * For a given size, calculate how many blocks would be charged towards quota.
320  */
321 static blk64_t size_to_quota_blocks(ext2_filsys fs, size_t size)
322 {
323         blk64_t clusters;
324
325         clusters = DIV_ROUND_UP(size, fs->blocksize << fs->cluster_ratio_bits);
326         return EXT2FS_C2B(fs, clusters);
327 }
328
329 /*
330  * Check validity of EA inode. Return 0 if EA inode is valid, otherwise return
331  * the problem code.
332  */
333 static problem_t check_large_ea_inode(e2fsck_t ctx,
334                                       struct ext2_ext_attr_entry *entry,
335                                       struct problem_context *pctx,
336                                       blk64_t *quota_blocks)
337 {
338         struct ext2_inode inode;
339         __u32 hash, signed_hash;
340         errcode_t retval;
341
342         /* Check if inode is within valid range */
343         if ((entry->e_value_inum < EXT2_FIRST_INODE(ctx->fs->super)) ||
344             (entry->e_value_inum > ctx->fs->super->s_inodes_count)) {
345                 pctx->num = entry->e_value_inum;
346                 return PR_1_ATTR_VALUE_EA_INODE;
347         }
348
349         e2fsck_read_inode(ctx, entry->e_value_inum, &inode, "pass1");
350
351         retval = ext2fs_ext_attr_hash_entry3(ctx->fs, entry, NULL, &hash,
352                                              &signed_hash);
353         if (retval) {
354                 com_err("check_large_ea_inode", retval,
355                         _("while hashing entry with e_value_inum = %u"),
356                         entry->e_value_inum);
357                 fatal_error(ctx, 0);
358         }
359
360         if ((hash == entry->e_hash) || (signed_hash == entry->e_hash)) {
361                 *quota_blocks = size_to_quota_blocks(ctx->fs,
362                                                      entry->e_value_size);
363         } else {
364                 /* This might be an old Lustre-style ea_inode reference. */
365                 if (inode.i_mtime == pctx->ino &&
366                     inode.i_generation == pctx->inode->i_generation) {
367                         *quota_blocks = 0;
368                 } else {
369                         /* If target inode is also missing EA_INODE flag,
370                          * this is likely to be a bad reference.
371                          */
372                         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
373                                 pctx->num = entry->e_value_inum;
374                                 return PR_1_ATTR_VALUE_EA_INODE;
375                         } else {
376                                 pctx->num = entry->e_hash;
377                                 return PR_1_ATTR_HASH;
378                         }
379                 }
380         }
381
382         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
383                 pctx->num = entry->e_value_inum;
384                 if (fix_problem(ctx, PR_1_ATTR_SET_EA_INODE_FL, pctx)) {
385                         inode.i_flags |= EXT4_EA_INODE_FL;
386                         e2fsck_pass1_fix_lock(ctx);
387                         ext2fs_write_inode(ctx->fs, entry->e_value_inum,
388                                            &inode);
389                         e2fsck_pass1_fix_unlock(ctx);
390                 } else {
391                         return PR_1_ATTR_NO_EA_INODE_FL;
392                 }
393         }
394         return 0;
395 }
396
397 static void inc_ea_inode_refs(e2fsck_t ctx, struct problem_context *pctx,
398                               struct ext2_ext_attr_entry *first, void *end)
399 {
400         struct ext2_ext_attr_entry *entry = first;
401         struct ext2_ext_attr_entry *np = EXT2_EXT_ATTR_NEXT(entry);
402
403         while ((void *) entry < end && (void *) np < end &&
404                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
405                 if (!entry->e_value_inum)
406                         goto next;
407                 if (!ctx->ea_inode_refs) {
408                         pctx->errcode = ea_refcount_create(0,
409                                                            &ctx->ea_inode_refs);
410                         if (pctx->errcode) {
411                                 pctx->num = 4;
412                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
413                                 ctx->flags |= E2F_FLAG_ABORT;
414                                 return;
415                         }
416                 }
417                 ea_refcount_increment(ctx->ea_inode_refs, entry->e_value_inum,
418                                       0);
419         next:
420                 entry = np;
421                 np = EXT2_EXT_ATTR_NEXT(entry);
422         }
423 }
424
425 static void check_ea_in_inode(e2fsck_t ctx, struct problem_context *pctx,
426                               struct ea_quota *ea_ibody_quota)
427 {
428         struct ext2_super_block *sb = ctx->fs->super;
429         struct ext2_inode_large *inode;
430         struct ext2_ext_attr_entry *entry;
431         char *start, *header, *end;
432         unsigned int storage_size, remain;
433         problem_t problem = 0;
434         region_t region = 0;
435
436         ea_ibody_quota->blocks = 0;
437         ea_ibody_quota->inodes = 0;
438
439         inode = (struct ext2_inode_large *) pctx->inode;
440         storage_size = EXT2_INODE_SIZE(ctx->fs->super) - EXT2_GOOD_OLD_INODE_SIZE -
441                 inode->i_extra_isize;
442         header = ((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
443                  inode->i_extra_isize;
444         end = header + storage_size;
445         start = header + sizeof(__u32);
446         entry = (struct ext2_ext_attr_entry *) start;
447
448         /* scan all entry's headers first */
449
450         /* take finish entry 0UL into account */
451         remain = storage_size - sizeof(__u32);
452
453         region = region_create(0, storage_size);
454         if (!region) {
455                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
456                 problem = 0;
457                 ctx->flags |= E2F_FLAG_ABORT;
458                 return;
459         }
460         if (region_allocate(region, 0, sizeof(__u32))) {
461                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
462                 goto fix;
463         }
464
465         while (remain >= sizeof(struct ext2_ext_attr_entry) &&
466                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
467                 __u32 hash;
468
469                 if (region_allocate(region, (char *)entry - (char *)header,
470                                     EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
471                         problem = PR_1_INODE_EA_ALLOC_COLLISION;
472                         goto fix;
473                 }
474
475                 /* header eats this space */
476                 remain -= sizeof(struct ext2_ext_attr_entry);
477
478                 /* is attribute name valid? */
479                 if (EXT2_EXT_ATTR_SIZE(entry->e_name_len) > remain) {
480                         pctx->num = entry->e_name_len;
481                         problem = PR_1_ATTR_NAME_LEN;
482                         goto fix;
483                 }
484
485                 /* attribute len eats this space */
486                 remain -= EXT2_EXT_ATTR_SIZE(entry->e_name_len);
487
488                 if (entry->e_value_inum == 0) {
489                         /* check value size */
490                         if (entry->e_value_size > remain) {
491                                 pctx->num = entry->e_value_size;
492                                 problem = PR_1_ATTR_VALUE_SIZE;
493                                 goto fix;
494                         }
495
496                         if (entry->e_value_size &&
497                             region_allocate(region,
498                                             sizeof(__u32) + entry->e_value_offs,
499                                             EXT2_EXT_ATTR_SIZE(
500                                                 entry->e_value_size))) {
501                                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
502                                 goto fix;
503                         }
504
505                         hash = ext2fs_ext_attr_hash_entry(entry,
506                                                 start + entry->e_value_offs);
507                         if (entry->e_hash != 0 && entry->e_hash != hash)
508                                 hash = ext2fs_ext_attr_hash_entry_signed(entry,
509                                                 start + entry->e_value_offs);
510
511                         /* e_hash may be 0 in older inode's ea */
512                         if (entry->e_hash != 0 && entry->e_hash != hash) {
513                                 pctx->num = entry->e_hash;
514                                 problem = PR_1_ATTR_HASH;
515                                 goto fix;
516                         }
517                 } else {
518                         blk64_t quota_blocks;
519
520                         problem = check_large_ea_inode(ctx, entry, pctx,
521                                                        &quota_blocks);
522                         if (problem != 0)
523                                 goto fix;
524
525                         ea_ibody_quota->blocks += quota_blocks;
526                         ea_ibody_quota->inodes++;
527                 }
528
529                 /* If EA value is stored in external inode then it does not
530                  * consume space here */
531                 if (entry->e_value_inum == 0)
532                         remain -= entry->e_value_size;
533
534                 entry = EXT2_EXT_ATTR_NEXT(entry);
535         }
536
537         if (region_allocate(region, (char *)entry - (char *)header,
538                             sizeof(__u32))) {
539                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
540                 goto fix;
541         }
542 fix:
543         if (region)
544                 region_free(region);
545         /*
546          * it seems like a corruption. it's very unlikely we could repair
547          * EA(s) in automatic fashion -bzzz
548          */
549         if (problem == 0 || !fix_problem(ctx, problem, pctx)) {
550                 inc_ea_inode_refs(ctx, pctx,
551                                   (struct ext2_ext_attr_entry *)start, end);
552                 return;
553         }
554
555         /* simply remove all possible EA(s) */
556         *((__u32 *)header) = 0UL;
557         e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
558                                 EXT2_INODE_SIZE(sb), "pass1");
559         ea_ibody_quota->blocks = 0;
560         ea_ibody_quota->inodes = 0;
561 }
562
563 static int check_inode_extra_negative_epoch(__u32 xtime, __u32 extra) {
564         return (xtime & (1U << 31)) != 0 &&
565                 (extra & EXT4_EPOCH_MASK) == EXT4_EPOCH_MASK;
566 }
567
568 #define CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, xtime) \
569         check_inode_extra_negative_epoch(inode->i_##xtime, \
570                                          inode->i_##xtime##_extra)
571
572 /* When today's date is earlier than 2242, we assume that atimes,
573  * ctimes, crtimes, and mtimes with years in the range 2310..2378 are
574  * actually pre-1970 dates mis-encoded.
575  */
576 #define EXT4_EXTRA_NEGATIVE_DATE_CUTOFF 2 * (1LL << 32)
577
578 static void check_inode_extra_space(e2fsck_t ctx, struct problem_context *pctx,
579                                     struct ea_quota *ea_ibody_quota)
580 {
581         struct ext2_super_block *sb = ctx->fs->super;
582         struct ext2_inode_large *inode;
583         __u32 *eamagic;
584         int min, max;
585
586         ea_ibody_quota->blocks = 0;
587         ea_ibody_quota->inodes = 0;
588
589         inode = (struct ext2_inode_large *) pctx->inode;
590         if (EXT2_INODE_SIZE(sb) == EXT2_GOOD_OLD_INODE_SIZE) {
591                 /* this isn't large inode. so, nothing to check */
592                 return;
593         }
594
595 #if 0
596         printf("inode #%u, i_extra_size %d\n", pctx->ino,
597                         inode->i_extra_isize);
598 #endif
599         /* i_extra_isize must cover i_extra_isize + i_checksum_hi at least */
600         min = sizeof(inode->i_extra_isize) + sizeof(inode->i_checksum_hi);
601         max = EXT2_INODE_SIZE(sb) - EXT2_GOOD_OLD_INODE_SIZE;
602         /*
603          * For now we will allow i_extra_isize to be 0, but really
604          * implementations should never allow i_extra_isize to be 0
605          */
606         if (inode->i_extra_isize &&
607             (inode->i_extra_isize < min || inode->i_extra_isize > max ||
608              inode->i_extra_isize & 3)) {
609                 if (!fix_problem(ctx, PR_1_EXTRA_ISIZE, pctx))
610                         return;
611                 if (inode->i_extra_isize < min || inode->i_extra_isize > max)
612                         inode->i_extra_isize = sb->s_want_extra_isize;
613                 else
614                         inode->i_extra_isize = (inode->i_extra_isize + 3) & ~3;
615                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
616                                         EXT2_INODE_SIZE(sb), "pass1");
617         }
618
619         /* check if there is no place for an EA header */
620         if (inode->i_extra_isize >= max - sizeof(__u32))
621                 return;
622
623         eamagic = (__u32 *) (((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
624                         inode->i_extra_isize);
625         if (*eamagic == EXT2_EXT_ATTR_MAGIC) {
626                 /* it seems inode has an extended attribute(s) in body */
627                 check_ea_in_inode(ctx, pctx, ea_ibody_quota);
628         }
629
630         /*
631          * If the inode's extended atime (ctime, crtime, mtime) is stored in
632          * the old, invalid format, repair it.
633          */
634         if (((sizeof(time_t) <= 4) ||
635              (((sizeof(time_t) > 4) &&
636                ctx->now < EXT4_EXTRA_NEGATIVE_DATE_CUTOFF))) &&
637             (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime) ||
638              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime) ||
639              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime) ||
640              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))) {
641
642                 if (!fix_problem(ctx, PR_1_EA_TIME_OUT_OF_RANGE, pctx))
643                         return;
644
645                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime))
646                         inode->i_atime_extra &= ~EXT4_EPOCH_MASK;
647                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime))
648                         inode->i_ctime_extra &= ~EXT4_EPOCH_MASK;
649                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime))
650                         inode->i_crtime_extra &= ~EXT4_EPOCH_MASK;
651                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))
652                         inode->i_mtime_extra &= ~EXT4_EPOCH_MASK;
653                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
654                                         EXT2_INODE_SIZE(sb), "pass1");
655         }
656
657 }
658
659 static _INLINE_ int is_blocks_used(e2fsck_t ctx, blk64_t block,
660                                    unsigned int num)
661 {
662         int retval;
663
664         /* used to avoid duplicate output from below */
665         retval = ext2fs_test_block_bitmap_range2_valid(ctx->block_found_map,
666                                                        block, num);
667         if (!retval)
668                 return 0;
669
670         retval = ext2fs_test_block_bitmap_range2(ctx->block_found_map, block, num);
671         if (retval) {
672                 e2fsck_pass1_block_map_r_lock(ctx);
673                 if (ctx->global_ctx)
674                         retval = ext2fs_test_block_bitmap_range2(
675                                         ctx->global_ctx->block_found_map, block, num);
676                 e2fsck_pass1_block_map_r_unlock(ctx);
677                 if (retval)
678                         return 0;
679         }
680
681         return 1;
682 }
683
684 /*
685  * Check to see if the inode might really be a directory, despite i_mode
686  *
687  * This is a lot of complexity for something for which I'm not really
688  * convinced happens frequently in the wild.  If for any reason this
689  * causes any problems, take this code out.
690  * [tytso:20070331.0827EDT]
691  */
692 static void check_is_really_dir(e2fsck_t ctx, struct problem_context *pctx,
693                                 char *buf)
694 {
695         struct ext2_inode *inode = pctx->inode;
696         struct ext2_dir_entry   *dirent;
697         errcode_t               retval;
698         blk64_t                 blk;
699         unsigned int            i, rec_len, not_device = 0;
700         int                     extent_fs;
701         int                     inlinedata_fs;
702
703         /*
704          * If the mode looks OK, we believe it.  If the first block in
705          * the i_block array is 0, this cannot be a directory. If the
706          * inode is extent-mapped, it is still the case that the latter
707          * cannot be 0 - the magic number in the extent header would make
708          * it nonzero.
709          */
710         if (LINUX_S_ISDIR(inode->i_mode) || LINUX_S_ISREG(inode->i_mode) ||
711             LINUX_S_ISLNK(inode->i_mode) || inode->i_block[0] == 0)
712                 return;
713
714         /*
715          * Check the block numbers in the i_block array for validity:
716          * zero blocks are skipped (but the first one cannot be zero -
717          * see above), other blocks are checked against the first and
718          * max data blocks (from the superblock) and against the
719          * block bitmap. Any invalid block found means this cannot be
720          * a directory.
721          *
722          * If there are non-zero blocks past the fourth entry, then
723          * this cannot be a device file: we remember that for the next
724          * check.
725          *
726          * For extent mapped files, we don't do any sanity checking:
727          * just try to get the phys block of logical block 0 and run
728          * with it.
729          *
730          * For inline data files, we just try to get the size of inline
731          * data.  If it's true, we will treat it as a directory.
732          */
733
734         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
735         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
736         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL)) {
737                 size_t size;
738                 __u32 dotdot;
739                 unsigned int rec_len2;
740                 struct ext2_dir_entry de;
741
742                 if (ext2fs_inline_data_size(ctx->fs, pctx->ino, &size))
743                         return;
744                 /*
745                  * If the size isn't a multiple of 4, it's probably not a
746                  * directory??
747                  */
748                 if (size & 3)
749                         return;
750                 /*
751                  * If the first 10 bytes don't look like a directory entry,
752                  * it's probably not a directory.
753                  */
754                 memcpy(&dotdot, inode->i_block, sizeof(dotdot));
755                 memcpy(&de, ((char *)inode->i_block) + EXT4_INLINE_DATA_DOTDOT_SIZE,
756                        EXT2_DIR_REC_LEN(0));
757                 dotdot = ext2fs_le32_to_cpu(dotdot);
758                 de.inode = ext2fs_le32_to_cpu(de.inode);
759                 de.rec_len = ext2fs_le16_to_cpu(de.rec_len);
760                 ext2fs_get_rec_len(ctx->fs, &de, &rec_len2);
761                 if (dotdot >= ctx->fs->super->s_inodes_count ||
762                     (dotdot < EXT2_FIRST_INO(ctx->fs->super) &&
763                      dotdot != EXT2_ROOT_INO) ||
764                     de.inode >= ctx->fs->super->s_inodes_count ||
765                     (de.inode < EXT2_FIRST_INO(ctx->fs->super) &&
766                      de.inode != 0) ||
767                     rec_len2 > EXT4_MIN_INLINE_DATA_SIZE -
768                               EXT4_INLINE_DATA_DOTDOT_SIZE)
769                         return;
770                 /* device files never have a "system.data" entry */
771                 goto isdir;
772         } else if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) {
773                 /* extent mapped */
774                 if  (ext2fs_bmap2(ctx->fs, pctx->ino, inode, 0, 0, 0, 0,
775                                  &blk))
776                         return;
777                 /* device files are never extent mapped */
778                 not_device++;
779         } else {
780                 for (i=0; i < EXT2_N_BLOCKS; i++) {
781                         blk = inode->i_block[i];
782                         if (!blk)
783                                 continue;
784                         if (i >= 4)
785                                 not_device++;
786
787                         if (blk < ctx->fs->super->s_first_data_block ||
788                             blk >= ext2fs_blocks_count(ctx->fs->super) ||
789                             is_blocks_used(ctx, blk, 1))
790                                 return; /* Invalid block, can't be dir */
791                 }
792                 blk = inode->i_block[0];
793         }
794
795         /*
796          * If the mode says this is a device file and the i_links_count field
797          * is sane and we have not ruled it out as a device file previously,
798          * we declare it a device file, not a directory.
799          */
800         if ((LINUX_S_ISCHR(inode->i_mode) || LINUX_S_ISBLK(inode->i_mode)) &&
801             (inode->i_links_count == 1) && !not_device)
802                 return;
803
804         /* read the first block */
805         ehandler_operation(_("reading directory block"));
806         retval = ext2fs_read_dir_block4(ctx->fs, blk, buf, 0, pctx->ino);
807         ehandler_operation(0);
808         if (retval)
809                 return;
810
811         dirent = (struct ext2_dir_entry *) buf;
812         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
813         if (retval)
814                 return;
815         if ((ext2fs_dirent_name_len(dirent) != 1) ||
816             (dirent->name[0] != '.') ||
817             (dirent->inode != pctx->ino) ||
818             (rec_len < 12) ||
819             (rec_len % 4) ||
820             (rec_len >= ctx->fs->blocksize - 12))
821                 return;
822
823         dirent = (struct ext2_dir_entry *) (buf + rec_len);
824         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
825         if (retval)
826                 return;
827         if ((ext2fs_dirent_name_len(dirent) != 2) ||
828             (dirent->name[0] != '.') ||
829             (dirent->name[1] != '.') ||
830             (rec_len < 12) ||
831             (rec_len % 4))
832                 return;
833
834 isdir:
835         if (fix_problem(ctx, PR_1_TREAT_AS_DIRECTORY, pctx)) {
836                 inode->i_mode = (inode->i_mode & 07777) | LINUX_S_IFDIR;
837                 e2fsck_write_inode_full(ctx, pctx->ino, inode,
838                                         EXT2_INODE_SIZE(ctx->fs->super),
839                                         "check_is_really_dir");
840         }
841 }
842
843 extern errcode_t e2fsck_setup_icount(e2fsck_t ctx, const char *icount_name,
844                                      int flags, ext2_icount_t hint,
845                                      ext2_icount_t *ret)
846 {
847         unsigned int            threshold;
848         unsigned int            save_type;
849         ext2_ino_t              num_dirs;
850         errcode_t               retval;
851         char                    *tdb_dir;
852         int                     enable;
853
854         *ret = 0;
855
856         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
857                            &tdb_dir);
858         profile_get_uint(ctx->profile, "scratch_files",
859                          "numdirs_threshold", 0, 0, &threshold);
860         profile_get_boolean(ctx->profile, "scratch_files",
861                             "icount", 0, 1, &enable);
862
863         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
864         if (retval)
865                 num_dirs = 1024;        /* Guess */
866
867         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
868             (!threshold || num_dirs > threshold)) {
869                 retval = ext2fs_create_icount_tdb(ctx->fs, tdb_dir,
870                                                   flags, ret);
871                 if (retval == 0)
872                         return 0;
873         }
874         e2fsck_set_bitmap_type(ctx->fs, EXT2FS_BMAP64_RBTREE, icount_name,
875                                &save_type);
876         if (ctx->options & E2F_OPT_ICOUNT_FULLMAP)
877                 flags |= EXT2_ICOUNT_OPT_FULLMAP;
878         retval = ext2fs_create_icount2(ctx->fs, flags, 0, hint, ret);
879         ctx->fs->default_bitmap_type = save_type;
880         return retval;
881 }
882
883 static errcode_t recheck_bad_inode_checksum(ext2_filsys fs, ext2_ino_t ino,
884                                             e2fsck_t ctx,
885                                             struct problem_context *pctx)
886 {
887         errcode_t retval;
888         struct ext2_inode_large inode;
889
890         /*
891          * Reread inode.  If we don't see checksum error, then this inode
892          * has been fixed elsewhere.
893          */
894         ctx->stashed_ino = 0;
895         retval = ext2fs_read_inode_full(fs, ino, (struct ext2_inode *)&inode,
896                                         sizeof(inode));
897         if (retval && retval != EXT2_ET_INODE_CSUM_INVALID)
898                 return retval;
899         if (!retval)
900                 return 0;
901
902         /*
903          * Checksum still doesn't match.  That implies that the inode passes
904          * all the sanity checks, so maybe the checksum is simply corrupt.
905          * See if the user will go for fixing that.
906          */
907         if (!fix_problem(ctx, PR_1_INODE_ONLY_CSUM_INVALID, pctx))
908                 return 0;
909
910
911         e2fsck_pass1_fix_lock(ctx);
912         retval = ext2fs_write_inode_full(fs, ino, (struct ext2_inode *)&inode,
913                                          sizeof(inode));
914         e2fsck_pass1_fix_unlock(ctx);
915         return retval;
916 }
917
918 static void reserve_block_for_root_repair(e2fsck_t ctx)
919 {
920         blk64_t         blk = 0;
921         errcode_t       err;
922         ext2_filsys     fs = ctx->fs;
923
924         ctx->root_repair_block = 0;
925         if (ext2fs_test_inode_bitmap2(ctx->inode_used_map, EXT2_ROOT_INO))
926                 return;
927
928         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
929         if (err)
930                 return;
931         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
932         ctx->root_repair_block = blk;
933 }
934
935 static void reserve_block_for_lnf_repair(e2fsck_t ctx)
936 {
937         blk64_t         blk = 0;
938         errcode_t       err;
939         ext2_filsys     fs = ctx->fs;
940         static const char name[] = "lost+found";
941         ext2_ino_t      ino;
942
943         ctx->lnf_repair_block = 0;
944         if (!ext2fs_lookup(fs, EXT2_ROOT_INO, name, sizeof(name)-1, 0, &ino))
945                 return;
946
947         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
948         if (err)
949                 return;
950         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
951         ctx->lnf_repair_block = blk;
952         return;
953 }
954
955 static errcode_t get_inline_data_ea_size(ext2_filsys fs, ext2_ino_t ino,
956                                          struct ext2_inode *inode,
957                                          size_t *sz)
958 {
959         void *p;
960         struct ext2_xattr_handle *handle;
961         errcode_t retval;
962
963         retval = ext2fs_xattrs_open(fs, ino, &handle);
964         if (retval)
965                 return retval;
966
967         retval = ext2fs_xattrs_read_inode(handle,
968                                           (struct ext2_inode_large *)inode);
969         if (retval)
970                 goto err;
971
972         retval = ext2fs_xattr_get(handle, "system.data", &p, sz);
973         if (retval)
974                 goto err;
975         ext2fs_free_mem(&p);
976 err:
977         (void) ext2fs_xattrs_close(&handle);
978         return retval;
979 }
980
981 static void finish_processing_inode(e2fsck_t ctx, ext2_ino_t ino,
982                                     struct problem_context *pctx,
983                                     int failed_csum)
984 {
985         if (!failed_csum)
986                 return;
987
988         /*
989          * If the inode failed the checksum and the user didn't
990          * clear the inode, test the checksum again -- if it still
991          * fails, ask the user if the checksum should be corrected.
992          */
993         pctx->errcode = recheck_bad_inode_checksum(ctx->fs, ino, ctx, pctx);
994         if (pctx->errcode)
995                 ctx->flags |= E2F_FLAG_ABORT;
996 }
/*
 * Run finish_processing_inode() and, if E2F_FLAG_ABORT is set on the
 * context afterwards, call e2fsck_pass1_check_unlock() and RETURN FROM THE
 * ENCLOSING FUNCTION.  Because of that hidden `return;` the macro can only
 * be used inside functions returning void.
 */
#define FINISH_INODE_LOOP(ctx, ino, pctx, failed_csum)			\
	do {								\
		finish_processing_inode((ctx), (ino), (pctx),		\
					(failed_csum));			\
		if (((ctx)->flags & E2F_FLAG_ABORT) != 0) {		\
			e2fsck_pass1_check_unlock(ctx);			\
			return;						\
		}							\
	} while (0)
1005
1006 static int could_be_block_map(ext2_filsys fs, struct ext2_inode *inode)
1007 {
1008         __u32 x;
1009         int i;
1010
1011         for (i = 0; i < EXT2_N_BLOCKS; i++) {
1012                 x = inode->i_block[i];
1013 #ifdef WORDS_BIGENDIAN
1014                 x = ext2fs_swab32(x);
1015 #endif
1016                 if (x >= ext2fs_blocks_count(fs->super))
1017                         return 0;
1018         }
1019
1020         return 1;
1021 }
1022
1023 /*
1024  * Figure out what to do with an inode that has both extents and inline data
1025  * inode flags set.  Returns -1 if we decide to erase the inode, 0 otherwise.
1026  */
1027 static int fix_inline_data_extents_file(e2fsck_t ctx,
1028                                         ext2_ino_t ino,
1029                                         struct ext2_inode *inode,
1030                                         int inode_size,
1031                                         struct problem_context *pctx)
1032 {
1033         size_t max_inline_ea_size;
1034         ext2_filsys fs = ctx->fs;
1035         int dirty = 0;
1036
1037         /* Both feature flags not set?  Just run the regular checks */
1038         if (!ext2fs_has_feature_extents(fs->super) &&
1039             !ext2fs_has_feature_inline_data(fs->super))
1040                 return 0;
1041
1042         /* Clear both flags if it's a special file */
1043         if (LINUX_S_ISCHR(inode->i_mode) ||
1044             LINUX_S_ISBLK(inode->i_mode) ||
1045             LINUX_S_ISFIFO(inode->i_mode) ||
1046             LINUX_S_ISSOCK(inode->i_mode)) {
1047                 check_extents_inlinedata(ctx, pctx);
1048                 return 0;
1049         }
1050
1051         /* If it looks like an extent tree, try to clear inlinedata */
1052         if (ext2fs_extent_header_verify(inode->i_block,
1053                                  sizeof(inode->i_block)) == 0 &&
1054             fix_problem(ctx, PR_1_CLEAR_INLINE_DATA_FOR_EXTENT, pctx)) {
1055                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1056                 dirty = 1;
1057                 goto out;
1058         }
1059
1060         /* If it looks short enough to be inline data, try to clear extents */
1061         if (inode_size > EXT2_GOOD_OLD_INODE_SIZE)
1062                 max_inline_ea_size = inode_size -
1063                                      (EXT2_GOOD_OLD_INODE_SIZE +
1064                                       ((struct ext2_inode_large *)inode)->i_extra_isize);
1065         else
1066                 max_inline_ea_size = 0;
1067         if (EXT2_I_SIZE(inode) <
1068             EXT4_MIN_INLINE_DATA_SIZE + max_inline_ea_size &&
1069             fix_problem(ctx, PR_1_CLEAR_EXTENT_FOR_INLINE_DATA, pctx)) {
1070                 inode->i_flags &= ~EXT4_EXTENTS_FL;
1071                 dirty = 1;
1072                 goto out;
1073         }
1074
1075         /*
1076          * Too big for inline data, but no evidence of extent tree -
1077          * maybe it's a block map file?  If the mappings all look valid?
1078          */
1079         if (could_be_block_map(fs, inode) &&
1080             fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_FLAGS, pctx)) {
1081 #ifdef WORDS_BIGENDIAN
1082                 int i;
1083
1084                 for (i = 0; i < EXT2_N_BLOCKS; i++)
1085                         inode->i_block[i] = ext2fs_swab32(inode->i_block[i]);
1086 #endif
1087
1088                 inode->i_flags &= ~(EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL);
1089                 dirty = 1;
1090                 goto out;
1091         }
1092
1093         /* Oh well, just clear the busted inode. */
1094         if (fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_INODE, pctx)) {
1095                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1096                 return -1;
1097         }
1098
1099 out:
1100         if (dirty)
1101                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1102
1103         return 0;
1104 }
1105
1106 static void pass1_readahead(e2fsck_t ctx, dgrp_t *group, ext2_ino_t *next_ino)
1107 {
1108         ext2_ino_t inodes_in_group = 0, inodes_per_block, inodes_per_buffer;
1109         dgrp_t start = *group, grp, grp_end = ctx->fs->group_desc_count;
1110         blk64_t blocks_to_read = 0;
1111         errcode_t err = EXT2_ET_INVALID_ARGUMENT;
1112
1113 #ifdef HAVE_PTHREAD
1114         if (ctx->fs->fs_num_threads > 1)
1115                 grp_end = ctx->thread_info.et_group_end;
1116 #endif
1117         if (ctx->readahead_kb == 0)
1118                 goto out;
1119
1120         /* Keep iterating groups until we have enough to readahead */
1121         inodes_per_block = EXT2_INODES_PER_BLOCK(ctx->fs->super);
1122         for (grp = start; grp < grp_end; grp++) {
1123                 if (ext2fs_bg_flags_test(ctx->fs, grp, EXT2_BG_INODE_UNINIT))
1124                         continue;
1125                 inodes_in_group = ctx->fs->super->s_inodes_per_group -
1126                                         ext2fs_bg_itable_unused(ctx->fs, grp);
1127                 blocks_to_read += (inodes_in_group + inodes_per_block - 1) /
1128                                         inodes_per_block;
1129                 if (blocks_to_read * ctx->fs->blocksize >
1130                     ctx->readahead_kb * 1024)
1131                         break;
1132         }
1133
1134         err = e2fsck_readahead(ctx->fs, E2FSCK_READA_ITABLE, start,
1135                                grp - start + 1);
1136         if (err == EAGAIN) {
1137                 ctx->readahead_kb /= 2;
1138                 err = 0;
1139         }
1140
1141 out:
1142         if (err) {
1143                 /* Error; disable itable readahead */
1144                 *group = ctx->fs->group_desc_count;
1145                 *next_ino = ctx->fs->super->s_inodes_count;
1146         } else {
1147                 /*
1148                  * Don't do more readahead until we've reached the first inode
1149                  * of the last inode scan buffer block for the last group.
1150                  */
1151                 *group = grp + 1;
1152                 inodes_per_buffer = (ctx->inode_buffer_blocks ?
1153                                      ctx->inode_buffer_blocks :
1154                                      EXT2_INODE_SCAN_DEFAULT_BUFFER_BLOCKS) *
1155                                     ctx->fs->blocksize /
1156                                     EXT2_INODE_SIZE(ctx->fs->super);
1157                 inodes_in_group--;
1158                 *next_ino = inodes_in_group -
1159                             (inodes_in_group % inodes_per_buffer) + 1 +
1160                             (grp * ctx->fs->super->s_inodes_per_group);
1161         }
1162 }
1163
1164 /*
1165  * Check if the passed ino is one of the used superblock quota inodes.
1166  *
1167  * Before the quota inodes were journaled, older superblock quota inodes
1168  * were just regular files in the filesystem and not reserved inodes.  This
1169  * checks if the passed ino is one of the s_*_quota_inum superblock fields,
1170  * which may not always be the same as the EXT4_*_QUOTA_INO fields.
1171  */
1172 static int quota_inum_is_super(struct ext2_super_block *sb, ext2_ino_t ino)
1173 {
1174         enum quota_type qtype;
1175
1176         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1177                 if (*quota_sb_inump(sb, qtype) == ino)
1178                         return 1;
1179
1180         return 0;
1181 }
1182
1183 /*
1184  * Check if the passed ino is one of the reserved quota inodes.
1185  * This checks if the inode number is one of the reserved EXT4_*_QUOTA_INO
1186  * inodes.  These inodes may or may not be in use by the quota feature.
1187  */
1188 static int quota_inum_is_reserved(ext2_filsys fs, ext2_ino_t ino)
1189 {
1190         enum quota_type qtype;
1191
1192         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1193                 if (quota_type2inum(qtype, fs->super) == ino)
1194                         return 1;
1195
1196         return 0;
1197 }
1198
1199 static int e2fsck_should_abort(e2fsck_t ctx)
1200 {
1201         e2fsck_t global_ctx;
1202
1203         if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1204                 return 1;
1205
1206         if (ctx->global_ctx) {
1207                 global_ctx = ctx->global_ctx;
1208                 if (global_ctx->flags & E2F_FLAG_SIGNAL_MASK)
1209                         return 1;
1210         }
1211         return 0;
1212 }
1213
1214 static void init_ext2_max_sizes()
1215 {
1216         int     i;
1217         __u64   max_sizes;
1218
1219         /*
1220          * Init ext2_max_sizes which will be immutable and shared between
1221          * threads
1222          */
1223 #define EXT2_BPP(bits) (1ULL << ((bits) - 2))
1224
1225         for (i = EXT2_MIN_BLOCK_LOG_SIZE; i <= EXT2_MAX_BLOCK_LOG_SIZE; i++) {
1226                 max_sizes = EXT2_NDIR_BLOCKS + EXT2_BPP(i);
1227                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i);
1228                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i) * EXT2_BPP(i);
1229                 max_sizes = (max_sizes * (1UL << i));
1230                 ext2_max_sizes[i - EXT2_MIN_BLOCK_LOG_SIZE] = max_sizes;
1231         }
1232 #undef EXT2_BPP
1233 }
1234
1235 #ifdef HAVE_PTHREAD
1236 /* TODO: tdb needs to be handled properly for multiple threads*/
1237 static int multiple_threads_supported(e2fsck_t ctx)
1238 {
1239 #ifdef  CONFIG_TDB
1240         unsigned int            threshold;
1241         ext2_ino_t              num_dirs;
1242         errcode_t               retval;
1243         char                    *tdb_dir;
1244         int                     enable;
1245
1246         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
1247                            &tdb_dir);
1248         profile_get_uint(ctx->profile, "scratch_files",
1249                          "numdirs_threshold", 0, 0, &threshold);
1250         profile_get_boolean(ctx->profile, "scratch_files",
1251                             "icount", 0, 1, &enable);
1252
1253         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
1254         if (retval)
1255                 num_dirs = 1024;        /* Guess */
1256
1257         /* tdb is unsupported now */
1258         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
1259             (!threshold || num_dirs > threshold))
1260                 return 0;
1261 #endif
1262         return 1;
1263 }
1264
1265 /**
1266  * Even though we could specify number of threads,
1267  * but it might be more than the whole filesystem
1268  * block groups, correct it here.
1269  */
1270 static void e2fsck_pass1_set_thread_num(e2fsck_t ctx)
1271 {
1272         unsigned flexbg_size = 1;
1273         ext2_filsys fs = ctx->fs;
1274         int num_threads = ctx->pfs_num_threads;
1275         int max_threads;
1276
1277         if (num_threads < 1) {
1278                 num_threads = 1;
1279                 goto out;
1280         }
1281
1282         if (!multiple_threads_supported(ctx)) {
1283                 num_threads = 1;
1284                 fprintf(stderr, "Fall through single thread for pass1 "
1285                         "because tdb could not handle properly\n");
1286                 goto out;
1287         }
1288
1289         if (ext2fs_has_feature_flex_bg(fs->super))
1290                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
1291         max_threads = fs->group_desc_count / flexbg_size;
1292         if (max_threads == 0)
1293                 max_threads = 1;
1294         if (max_threads > E2FSCK_MAX_THREADS)
1295                 max_threads = E2FSCK_MAX_THREADS;
1296
1297         if (num_threads > max_threads) {
1298                 fprintf(stderr, "Use max possible thread num: %d instead\n",
1299                                 max_threads);
1300                 num_threads = max_threads;
1301         }
1302 out:
1303         ctx->pfs_num_threads = num_threads;
1304         ctx->fs->fs_num_threads = num_threads;
1305 }
1306 #endif
1307
1308 /*
1309  * We need call mark_table_blocks() before multiple
1310  * thread start, since all known system blocks should be
1311  * marked and checked later.
1312  */
1313 static errcode_t e2fsck_pass1_prepare(e2fsck_t ctx)
1314 {
1315         struct problem_context pctx;
1316         ext2_filsys fs = ctx->fs;
1317         unsigned long long readahead_kb;
1318
1319         init_ext2_max_sizes();
1320 #ifdef HAVE_PTHREAD
1321         e2fsck_pass1_set_thread_num(ctx);
1322 #endif
1323         /* If we can do readahead, figure out how many groups to pull in. */
1324         if (!e2fsck_can_readahead(ctx->fs))
1325                 ctx->readahead_kb = 0;
1326         else if (ctx->readahead_kb == ~0ULL)
1327                 ctx->readahead_kb = e2fsck_guess_readahead(ctx->fs);
1328
1329 #ifdef HAVE_PTHREAD
1330         /* don't use more than 1/10 of memory for threads checking */
1331         readahead_kb = get_memory_size() / (10 * ctx->pfs_num_threads);
1332         /* maybe better disable RA if this is too small? */
1333         if (ctx->readahead_kb > readahead_kb)
1334                 ctx->readahead_kb = readahead_kb;
1335 #endif
1336         clear_problem_context(&pctx);
1337         if (!(ctx->options & E2F_OPT_PREEN))
1338                 fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1339
1340         pctx.errcode = e2fsck_allocate_subcluster_bitmap(ctx->fs,
1341                         _("in-use block map"), EXT2FS_BMAP64_RBTREE,
1342                         "block_found_map", &ctx->block_found_map);
1343         if (pctx.errcode) {
1344                 pctx.num = 1;
1345                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1346                 ctx->flags |= E2F_FLAG_ABORT;
1347                 return pctx.errcode;
1348         }
1349         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
1350                         _("metadata block map"), EXT2FS_BMAP64_RBTREE,
1351                         "block_metadata_map", &ctx->block_metadata_map);
1352         if (pctx.errcode) {
1353                 pctx.num = 1;
1354                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1355                 ctx->flags |= E2F_FLAG_ABORT;
1356                 return pctx.errcode;
1357         }
1358
1359         mark_table_blocks(ctx);
1360         pctx.errcode = ext2fs_convert_subcluster_bitmap(ctx->fs,
1361                                                 &ctx->block_found_map);
1362         if (pctx.errcode) {
1363                 fix_problem(ctx, PR_1_CONVERT_SUBCLUSTER, &pctx);
1364                 ctx->flags |= E2F_FLAG_ABORT;
1365                 return pctx.errcode;
1366         }
1367
1368         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
1369                         _("multiply claimed block map"),
1370                         EXT2FS_BMAP64_RBTREE, "block_dup_map",
1371                         &ctx->block_dup_map);
1372         if (pctx.errcode) {
1373                 pctx.num = 3;
1374                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR,
1375                             &pctx);
1376                 /* Should never get here */
1377                 ctx->flags |= E2F_FLAG_ABORT;
1378                 return pctx.errcode;
1379         }
1380
1381         if (ext2fs_has_feature_mmp(fs->super) &&
1382             fs->super->s_mmp_block > fs->super->s_first_data_block &&
1383             fs->super->s_mmp_block < ext2fs_blocks_count(fs->super))
1384                 ext2fs_mark_block_bitmap2(ctx->block_found_map,
1385                                           fs->super->s_mmp_block);
1386 #ifdef  HAVE_PTHREAD
1387         pthread_rwlock_init(&ctx->fs_fix_rwlock, NULL);
1388         pthread_rwlock_init(&ctx->fs_block_map_rwlock, NULL);
1389         if (ctx->pfs_num_threads > 1)
1390                 ctx->fs_need_locking = 1;
1391 #endif
1392
1393         return 0;
1394 }
1395
1396 static void e2fsck_pass1_post(e2fsck_t ctx)
1397 {
1398         struct problem_context pctx;
1399         ext2_filsys fs = ctx->fs;
1400         char *block_buf;
1401
1402         if (e2fsck_should_abort(ctx))
1403                 return;
1404
1405         block_buf = (char *)e2fsck_allocate_memory(ctx, ctx->fs->blocksize * 3,
1406                                               "block interate buffer");
1407         reserve_block_for_root_repair(ctx);
1408         reserve_block_for_lnf_repair(ctx);
1409
1410         /*
1411          * If any extended attribute blocks' reference counts need to
1412          * be adjusted, either up (ctx->refcount_extra), or down
1413          * (ctx->refcount), then fix them.
1414          */
1415         if (ctx->refcount) {
1416                 adjust_extattr_refcount(ctx, ctx->refcount, block_buf, -1);
1417                 ea_refcount_free(ctx->refcount);
1418                 ctx->refcount = 0;
1419         }
1420         if (ctx->refcount_extra) {
1421                 adjust_extattr_refcount(ctx, ctx->refcount_extra,
1422                                         block_buf, +1);
1423                 ea_refcount_free(ctx->refcount_extra);
1424                 ctx->refcount_extra = 0;
1425         }
1426
1427         if (ctx->invalid_bitmaps)
1428                 handle_fs_bad_blocks(ctx);
1429
1430         /* We don't need the block_ea_map any more */
1431         if (ctx->block_ea_map) {
1432                 ext2fs_free_block_bitmap(ctx->block_ea_map);
1433                 ctx->block_ea_map = 0;
1434         }
1435
1436         if (ctx->flags & E2F_FLAG_RESIZE_INODE) {
1437                 struct ext2_inode *inode;
1438                 int inode_size = EXT2_INODE_SIZE(fs->super);
1439                 inode = e2fsck_allocate_memory(ctx, inode_size,
1440                                                "scratch inode");
1441
1442                 clear_problem_context(&pctx);
1443                 pctx.errcode = ext2fs_create_resize_inode(fs);
1444                 if (pctx.errcode) {
1445                         if (!fix_problem(ctx, PR_1_RESIZE_INODE_CREATE,
1446                                          &pctx)) {
1447                                 ctx->flags |= E2F_FLAG_ABORT;
1448                                 ext2fs_free_mem(&inode);
1449                                 ext2fs_free_mem(&block_buf);
1450                                 return;
1451                         }
1452                         pctx.errcode = 0;
1453                 }
1454                 if (!pctx.errcode) {
1455                         e2fsck_read_inode(ctx, EXT2_RESIZE_INO, inode,
1456                                           "recreate inode");
1457                         inode->i_mtime = ctx->now;
1458                         e2fsck_write_inode(ctx, EXT2_RESIZE_INO, inode,
1459                                            "recreate inode");
1460                 }
1461                 ctx->flags &= ~E2F_FLAG_RESIZE_INODE;
1462                 ext2fs_free_mem(&inode);
1463         }
1464
1465         if (ctx->flags & E2F_FLAG_RESTART) {
1466                 ext2fs_free_mem(&block_buf);
1467                 return;
1468         }
1469
1470         if (ctx->block_dup_map) {
1471                 if (!(ctx->flags & E2F_FLAG_DUP_BLOCK)) {
1472                         ext2fs_free_mem(&block_buf);
1473                         return;
1474                 }
1475                 if (ctx->options & E2F_OPT_PREEN) {
1476                         clear_problem_context(&pctx);
1477                         fix_problem(ctx, PR_1_DUP_BLOCKS_PREENSTOP, &pctx);
1478                 }
1479                 e2fsck_pass1_dupblocks(ctx, block_buf);
1480                 ext2fs_free_mem(&block_buf);
1481                 ctx->flags &= ~E2F_FLAG_DUP_BLOCK;
1482         }
1483
1484         ctx->flags |= E2F_FLAG_ALLOC_OK;
1485 }
1486
1487
1488 void e2fsck_pass1_run(e2fsck_t ctx)
1489 {
1490         int     i;
1491         ext2_filsys fs = ctx->fs;
1492         ext2_ino_t      ino = 0;
1493         struct ext2_inode *inode = NULL;
1494         ext2_inode_scan scan = NULL;
1495         char            *block_buf = NULL;
1496 #ifdef RESOURCE_TRACK
1497         struct resource_track   rtrack;
1498 #endif
1499         unsigned char   frag, fsize;
1500         struct          problem_context pctx;
1501         struct          scan_callback_struct scan_struct;
1502         struct ext2_super_block *sb = ctx->fs->super;
1503         const char      *old_op;
1504         const char      *eop_next_inode = _("getting next inode from scan");
1505         int             imagic_fs, extent_fs, inlinedata_fs, casefold_fs;
1506         int             low_dtime_check = 1;
1507         unsigned int    inode_size = EXT2_INODE_SIZE(fs->super);
1508         unsigned int    bufsize;
1509         int             failed_csum = 0;
1510         ext2_ino_t      ino_threshold = 0;
1511         dgrp_t          ra_group = 0;
1512         struct ea_quota ea_ibody_quota;
1513         struct process_inode_block *inodes_to_process;
1514         int             process_inode_count, check_mmp;
1515         e2fsck_t        global_ctx = ctx->global_ctx ? ctx->global_ctx : ctx;
1516
1517         init_resource_track(&rtrack, ctx->fs->io);
1518         clear_problem_context(&pctx);
1519
1520         pass1_readahead(ctx, &ra_group, &ino_threshold);
1521         if (ext2fs_has_feature_dir_index(fs->super) &&
1522             !(ctx->options & E2F_OPT_NO)) {
1523                 if (ext2fs_u32_list_create(&ctx->dirs_to_hash, 50))
1524                         ctx->dirs_to_hash = 0;
1525         }
1526
1527 #ifdef MTRACE
1528         mtrace_print("Pass 1");
1529 #endif
1530
1531         imagic_fs = ext2fs_has_feature_imagic_inodes(sb);
1532         extent_fs = ext2fs_has_feature_extents(sb);
1533         inlinedata_fs = ext2fs_has_feature_inline_data(sb);
1534         casefold_fs = ext2fs_has_feature_casefold(sb);
1535
1536         /*
1537          * Allocate bitmaps structures
1538          */
1539         pctx.errcode = e2fsck_allocate_inode_bitmap(fs, _("in-use inode map"),
1540                                                     EXT2FS_BMAP64_RBTREE,
1541                                                     "inode_used_map",
1542                                                     &ctx->inode_used_map);
1543         if (pctx.errcode) {
1544                 pctx.num = 1;
1545                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1546                 ctx->flags |= E2F_FLAG_ABORT;
1547                 return;
1548         }
1549         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1550                         _("directory inode map"),
1551                         ctx->global_ctx ? EXT2FS_BMAP64_RBTREE :
1552                         EXT2FS_BMAP64_AUTODIR,
1553                         "inode_dir_map", &ctx->inode_dir_map);
1554         if (pctx.errcode) {
1555                 pctx.num = 2;
1556                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1557                 ctx->flags |= E2F_FLAG_ABORT;
1558                 return;
1559         }
1560         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1561                         _("regular file inode map"), EXT2FS_BMAP64_RBTREE,
1562                         "inode_reg_map", &ctx->inode_reg_map);
1563         if (pctx.errcode) {
1564                 pctx.num = 6;
1565                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1566                 ctx->flags |= E2F_FLAG_ABORT;
1567                 return;
1568         }
1569         if (casefold_fs) {
1570                 pctx.errcode =
1571                         e2fsck_allocate_inode_bitmap(fs,
1572                                                      _("inode casefold map"),
1573                                                      EXT2FS_BMAP64_RBTREE,
1574                                                      "inode_casefold_map",
1575                                                      &ctx->inode_casefold_map);
1576                 if (pctx.errcode) {
1577                         pctx.num = 1;
1578                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1579                         ctx->flags |= E2F_FLAG_ABORT;
1580                         return;
1581                 }
1582         }
1583         pctx.errcode = e2fsck_setup_icount(ctx, "inode_link_info", 0, NULL,
1584                                            &ctx->inode_link_info);
1585         if (pctx.errcode) {
1586                 fix_problem(ctx, PR_1_ALLOCATE_ICOUNT, &pctx);
1587                 ctx->flags |= E2F_FLAG_ABORT;
1588                 return;
1589         }
1590         bufsize = inode_size;
1591         if (bufsize < sizeof(struct ext2_inode_large))
1592                 bufsize = sizeof(struct ext2_inode_large);
1593         inode = (struct ext2_inode *)
1594                 e2fsck_allocate_memory(ctx, bufsize, "scratch inode");
1595
1596         inodes_to_process = (struct process_inode_block *)
1597                 e2fsck_allocate_memory(ctx,
1598                                        (ctx->process_inode_size *
1599                                         sizeof(struct process_inode_block)),
1600                                        "array of inodes to process");
1601         process_inode_count = 0;
1602
1603         pctx.errcode = ext2fs_init_dblist(fs, 0);
1604         if (pctx.errcode) {
1605                 fix_problem(ctx, PR_1_ALLOCATE_DBCOUNT, &pctx);
1606                 ctx->flags |= E2F_FLAG_ABORT;
1607                 goto endit;
1608         }
1609
1610         /*
1611          * If the last orphan field is set, clear it, since the pass1
1612          * processing will automatically find and clear the orphans.
1613          * In the future, we may want to try using the last_orphan
1614          * linked list ourselves, but for now, we clear it so that the
1615          * ext3 mount code won't get confused.
1616          */
1617         if (!(ctx->options & E2F_OPT_READONLY)) {
1618                 if (fs->super->s_last_orphan) {
1619                         fs->super->s_last_orphan = 0;
1620                         ext2fs_mark_super_dirty(fs);
1621                 }
1622         }
1623
1624         block_buf = (char *) e2fsck_allocate_memory(ctx, fs->blocksize * 3,
1625                                                     "block iterate buffer");
1626         if (EXT2_INODE_SIZE(fs->super) == EXT2_GOOD_OLD_INODE_SIZE)
1627                 e2fsck_use_inode_shortcuts(ctx, 1);
1628         e2fsck_intercept_block_allocations(ctx);
1629         old_op = ehandler_operation(_("opening inode scan"));
1630         pctx.errcode = ext2fs_open_inode_scan(fs, ctx->inode_buffer_blocks,
1631                                               &scan);
1632         ehandler_operation(old_op);
1633         if (pctx.errcode) {
1634                 fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1635                 ctx->flags |= E2F_FLAG_ABORT;
1636                 goto endit;
1637         }
1638         ext2fs_inode_scan_flags(scan, EXT2_SF_SKIP_MISSING_ITABLE |
1639                                       EXT2_SF_WARN_GARBAGE_INODES, 0);
1640         ctx->stashed_inode = inode;
1641         scan_struct.ctx = ctx;
1642         scan_struct.block_buf = block_buf;
1643         scan_struct.inodes_to_process = inodes_to_process;
1644         scan_struct.process_inode_count = &process_inode_count;
1645         ext2fs_set_inode_callback(scan, scan_callback, &scan_struct);
1646         if (ctx->progress && ((ctx->progress)(ctx, 1, 0,
1647                                               ctx->fs->group_desc_count)))
1648                 goto endit;
1649         if ((fs->super->s_wtime &&
1650              fs->super->s_wtime < fs->super->s_inodes_count) ||
1651             (fs->super->s_mtime &&
1652              fs->super->s_mtime < fs->super->s_inodes_count) ||
1653             (fs->super->s_mkfs_time &&
1654              fs->super->s_mkfs_time < fs->super->s_inodes_count))
1655                 low_dtime_check = 0;
1656
1657         /* Set up ctx->lost_and_found if possible */
1658         (void) e2fsck_get_lost_and_found(ctx, 0);
1659
1660 #ifdef HAVE_PTHREAD
1661         if (ctx->global_ctx) {
1662                 if (ctx->options & E2F_OPT_DEBUG &&
1663                     ctx->options & E2F_OPT_MULTITHREAD)
1664                         fprintf(stderr, "thread %d jumping to group %u\n",
1665                                         ctx->thread_info.et_thread_index,
1666                                         ctx->thread_info.et_group_start);
1667                 pctx.errcode = ext2fs_inode_scan_goto_blockgroup(scan,
1668                                         ctx->thread_info.et_group_start);
1669                 if (pctx.errcode) {
1670                         fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1671                         ctx->flags |= E2F_FLAG_ABORT;
1672                         goto endit;
1673                 }
1674         }
1675 #endif
1676
1677         while (1) {
1678                 check_mmp = 0;
1679                 e2fsck_pass1_check_lock(ctx);
1680 #ifdef  HAVE_PTHREAD
1681                 if (!global_ctx->mmp_update_thread) {
1682                         e2fsck_pass1_block_map_w_lock(ctx);
1683                         if (!global_ctx->mmp_update_thread) {
1684                                 global_ctx->mmp_update_thread =
1685                                         ctx->thread_info.et_thread_index + 1;
1686                                 check_mmp = 1;
1687                         }
1688                         e2fsck_pass1_block_map_w_unlock(ctx);
1689                 }
1690
1691                 /* only one active thread could update mmp block. */
1692                 e2fsck_pass1_block_map_r_lock(ctx);
1693                 if (global_ctx->mmp_update_thread ==
1694                     ctx->thread_info.et_thread_index + 1)
1695                         check_mmp = 1;
1696                 e2fsck_pass1_block_map_r_unlock(ctx);
1697 #else
1698                 check_mmp = 1;
1699 #endif
1700
1701                 if (check_mmp && (ino % (fs->super->s_inodes_per_group * 4) == 1)) {
1702                         if (e2fsck_mmp_update(fs))
1703                                 fatal_error(ctx, 0);
1704                 }
1705                 old_op = ehandler_operation(eop_next_inode);
1706                 pctx.errcode = ext2fs_get_next_inode_full(scan, &ino,
1707                                                           inode, inode_size);
1708                 if (ino > ino_threshold)
1709                         pass1_readahead(ctx, &ra_group, &ino_threshold);
1710                 ehandler_operation(old_op);
1711                 if (e2fsck_should_abort(ctx)) {
1712                         e2fsck_pass1_check_unlock(ctx);
1713                         goto endit;
1714                 }
1715                 if (pctx.errcode == EXT2_ET_BAD_BLOCK_IN_INODE_TABLE) {
1716                         /*
1717                          * If badblocks says badblocks is bad, offer to clear
1718                          * the list, update the in-core bb list, and restart
1719                          * the inode scan.
1720                          */
1721                         if (ino == EXT2_BAD_INO &&
1722                             fix_problem(ctx, PR_1_BADBLOCKS_IN_BADBLOCKS,
1723                                         &pctx)) {
1724                                 errcode_t err;
1725
1726                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1727                                 ext2fs_badblocks_list_free(ctx->fs->badblocks);
1728                                 ctx->fs->badblocks = NULL;
1729                                 err = ext2fs_read_bb_inode(ctx->fs,
1730                                                         &ctx->fs->badblocks);
1731                                 if (err) {
1732                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1733                                                     &pctx);
1734                                         ctx->flags |= E2F_FLAG_ABORT;
1735                                         e2fsck_pass1_check_unlock(ctx);
1736                                         goto endit;
1737                                 } else
1738                                         ctx->flags |= E2F_FLAG_RESTART;
1739                                 err = ext2fs_inode_scan_goto_blockgroup(scan,
1740                                                                         0);
1741                                 if (err) {
1742                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1743                                                     &pctx);
1744                                         ctx->flags |= E2F_FLAG_ABORT;
1745                                         e2fsck_pass1_check_unlock(ctx);
1746                                         goto endit;
1747                                 }
1748                                 e2fsck_pass1_check_unlock(ctx);
1749                                 continue;
1750                         }
1751                         if (!ctx->inode_bb_map)
1752                                 alloc_bb_map(ctx);
1753                         ext2fs_mark_inode_bitmap2(ctx->inode_bb_map, ino);
1754                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1755                         e2fsck_pass1_check_unlock(ctx);
1756                         continue;
1757                 }
1758                 if (pctx.errcode == EXT2_ET_SCAN_FINISHED) {
1759                         e2fsck_pass1_check_unlock(ctx);
1760                         break;
1761                 }
1762                 if (pctx.errcode &&
1763                     pctx.errcode != EXT2_ET_INODE_CSUM_INVALID &&
1764                     pctx.errcode != EXT2_ET_INODE_IS_GARBAGE) {
1765                         fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1766                         ctx->flags |= E2F_FLAG_ABORT;
1767                         e2fsck_pass1_check_unlock(ctx);
1768                         goto endit;
1769                 }
1770                 if (!ino) {
1771                         e2fsck_pass1_check_unlock(ctx);
1772                         break;
1773                 }
1774 #ifdef HAVE_PTHREAD
1775                 if (ctx->global_ctx)
1776                         ctx->thread_info.et_inode_number++;
1777 #endif
1778                 pctx.ino = ino;
1779                 pctx.inode = inode;
1780                 ctx->stashed_ino = ino;
1781
1782                 /* Clear trashed inode? */
1783                 if (pctx.errcode == EXT2_ET_INODE_IS_GARBAGE &&
1784                     inode->i_links_count > 0 &&
1785                     fix_problem(ctx, PR_1_INODE_IS_GARBAGE, &pctx)) {
1786                         pctx.errcode = 0;
1787                         e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1788                 }
1789                 failed_csum = pctx.errcode != 0;
1790
1791                 /*
1792                  * Check for inodes which might have been part of the
1793                  * orphan inode linked list.  They should have gotten
1794                  * dealt with by now, unless the list had somehow been
1795                  * corrupted.
1796                  *
1797                  * FIXME: In the future, inodes which are still in use
1798                  * (and which are therefore pending truncation) should
1799                  * be handled specially.  Right now we just clear the
1800                  * dtime field, and the normal e2fsck handling of
1801                  * inodes where i_size and the inode blocks are
1802                  * inconsistent is to fix i_size, instead of releasing
1803                  * the extra blocks.  This won't catch the inode that
1804                  * was at the end of the orphan list, but it's better
1805                  * than nothing.  The right answer is that there
1806                  * shouldn't be any bugs in the orphan list handling.  :-)
1807                  */
1808                 if (inode->i_dtime && low_dtime_check &&
1809                     inode->i_dtime < ctx->fs->super->s_inodes_count) {
1810                         if (fix_problem(ctx, PR_1_LOW_DTIME, &pctx)) {
1811                                 inode->i_dtime = inode->i_links_count ?
1812                                         0 : ctx->now;
1813                                 e2fsck_write_inode(ctx, ino, inode,
1814                                                    "pass1");
1815                                 failed_csum = 0;
1816                         }
1817                 }
1818
1819                 if (inode->i_links_count) {
1820                         pctx.errcode = ext2fs_icount_store(ctx->inode_link_info,
1821                                            ino, inode->i_links_count);
1822                         if (pctx.errcode) {
1823                                 pctx.num = inode->i_links_count;
1824                                 fix_problem(ctx, PR_1_ICOUNT_STORE, &pctx);
1825                                 ctx->flags |= E2F_FLAG_ABORT;
1826                                 e2fsck_pass1_check_unlock(ctx);
1827                                 goto endit;
1828                         }
1829                 } else if ((ino >= EXT2_FIRST_INODE(fs->super)) &&
1830                            !quota_inum_is_reserved(fs, ino)) {
1831                         if (!inode->i_dtime && inode->i_mode) {
1832                                 if (fix_problem(ctx,
1833                                             PR_1_ZERO_DTIME, &pctx)) {
1834                                         inode->i_dtime = ctx->now;
1835                                         e2fsck_write_inode(ctx, ino, inode,
1836                                                            "pass1");
1837                                         failed_csum = 0;
1838                                 }
1839                         }
1840                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1841                         e2fsck_pass1_check_unlock(ctx);
1842                         continue;
1843                 }
1844
1845                 if ((inode->i_flags & EXT4_CASEFOLD_FL) &&
1846                     ((!LINUX_S_ISDIR(inode->i_mode) &&
1847                       fix_problem(ctx, PR_1_CASEFOLD_NONDIR, &pctx)) ||
1848                      (!casefold_fs &&
1849                       fix_problem(ctx, PR_1_CASEFOLD_FEATURE, &pctx)))) {
1850                         inode->i_flags &= ~EXT4_CASEFOLD_FL;
1851                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1852                 }
1853
1854                 /* Conflicting inlinedata/extents inode flags? */
1855                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) &&
1856                     (inode->i_flags & EXT4_EXTENTS_FL)) {
1857                         int res = fix_inline_data_extents_file(ctx, ino, inode,
1858                                                                inode_size,
1859                                                                &pctx);
1860                         if (res < 0) {
1861                                 /* skip FINISH_INODE_LOOP */
1862                                 e2fsck_pass1_check_unlock(ctx);
1863                                 continue;
1864                         }
1865                 }
1866
1867                 /* Test for incorrect inline_data flags settings. */
1868                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && !inlinedata_fs &&
1869                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1870                         size_t size = 0;
1871
1872                         pctx.errcode = get_inline_data_ea_size(fs, ino, inode,
1873                                                                &size);
1874                         if (!pctx.errcode &&
1875                             fix_problem(ctx, PR_1_INLINE_DATA_FEATURE, &pctx)) {
1876                                 e2fsck_pass1_fix_lock(ctx);
1877                                 ext2fs_set_feature_inline_data(sb);
1878                                 ext2fs_mark_super_dirty(fs);
1879                                 e2fsck_pass1_fix_unlock(ctx);
1880                                 inlinedata_fs = 1;
1881                         } else if (fix_problem(ctx, PR_1_INLINE_DATA_SET, &pctx)) {
1882                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1883                                 /* skip FINISH_INODE_LOOP */
1884                                 e2fsck_pass1_check_unlock(ctx);
1885                                 continue;
1886                         }
1887                 }
1888
1889                 /* Test for inline data flag but no attr */
1890                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && inlinedata_fs &&
1891                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1892                         size_t size = 0;
1893                         errcode_t err;
1894                         int flags;
1895
1896                         flags = fs->flags;
1897                         if (failed_csum)
1898                                 fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
1899                         err = get_inline_data_ea_size(fs, ino, inode, &size);
1900                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
1901                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
1902
1903                         switch (err) {
1904                         case 0:
1905                                 /* Everything is awesome... */
1906                                 break;
1907                         case EXT2_ET_BAD_EA_BLOCK_NUM:
1908                         case EXT2_ET_BAD_EA_HASH:
1909                         case EXT2_ET_BAD_EA_HEADER:
1910                         case EXT2_ET_EA_BAD_NAME_LEN:
1911                         case EXT2_ET_EA_BAD_VALUE_SIZE:
1912                         case EXT2_ET_EA_KEY_NOT_FOUND:
1913                         case EXT2_ET_EA_NO_SPACE:
1914                         case EXT2_ET_MISSING_EA_FEATURE:
1915                         case EXT2_ET_INLINE_DATA_CANT_ITERATE:
1916                         case EXT2_ET_INLINE_DATA_NO_BLOCK:
1917                         case EXT2_ET_INLINE_DATA_NO_SPACE:
1918                         case EXT2_ET_NO_INLINE_DATA:
1919                         case EXT2_ET_EXT_ATTR_CSUM_INVALID:
1920                         case EXT2_ET_EA_BAD_VALUE_OFFSET:
1921                         case EXT2_ET_EA_INODE_CORRUPTED:
1922                                 /* broken EA or no system.data EA; truncate */
1923                                 if (fix_problem(ctx, PR_1_INLINE_DATA_NO_ATTR,
1924                                                 &pctx)) {
1925                                         err = ext2fs_inode_size_set(fs, inode, 0);
1926                                         if (err) {
1927                                                 pctx.errcode = err;
1928                                                 ctx->flags |= E2F_FLAG_ABORT;
1929                                                 e2fsck_pass1_check_unlock(ctx);
1930                                                 goto endit;
1931                                         }
1932                                         inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1933                                         memset(&inode->i_block, 0,
1934                                                sizeof(inode->i_block));
1935                                         e2fsck_write_inode(ctx, ino, inode,
1936                                                            "pass1");
1937                                         failed_csum = 0;
1938                                 }
1939                                 break;
1940                         default:
1941                                 /* Some other kind of non-xattr error? */
1942                                 pctx.errcode = err;
1943                                 ctx->flags |= E2F_FLAG_ABORT;
1944                                 e2fsck_pass1_check_unlock(ctx);
1945                                 goto endit;
1946                         }
1947                 }
1948
1949                 /*
1950                  * Test for incorrect extent flag settings.
1951                  *
1952                  * On big-endian machines we must be careful:
1953                  * When the inode is read, the i_block array is not swapped
1954                  * if the extent flag is set.  Therefore if we are testing
1955                  * for or fixing a wrongly-set flag, we must potentially
1956                  * (un)swap before testing, or after fixing.
1957                  */
1958
1959                 /*
1960                  * In this case the extents flag was set when read, so
1961                  * extent_header_verify is ok.  If the inode is cleared,
1962                  * no need to swap... so no extra swapping here.
1963                  */
1964                 if ((inode->i_flags & EXT4_EXTENTS_FL) && !extent_fs &&
1965                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1966                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO))) {
1967                         if ((ext2fs_extent_header_verify(inode->i_block,
1968                                                  sizeof(inode->i_block)) == 0) &&
1969                             fix_problem(ctx, PR_1_EXTENT_FEATURE, &pctx)) {
1970                                 e2fsck_pass1_fix_lock(ctx);
1971                                 ext2fs_set_feature_extents(sb);
1972                                 ext2fs_mark_super_dirty(fs);
1973                                 extent_fs = 1;
1974                                 e2fsck_pass1_fix_unlock(ctx);
1975                         } else if (fix_problem(ctx, PR_1_EXTENTS_SET, &pctx)) {
1976                         clear_inode:
1977                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1978                                 if (ino == EXT2_BAD_INO)
1979                                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map,
1980                                                                  ino);
1981                                 /* skip FINISH_INODE_LOOP */
1982                                 e2fsck_pass1_check_unlock(ctx);
1983                                 continue;
1984                         }
1985                 }
1986
1987                 /*
1988                  * For big-endian machines:
1989                  * If the inode didn't have the extents flag set when it
1990                  * was read, then the i_block array was swapped.  To test
1991                  * as an extents header, we must swap it back first.
1992                  * If we then set the extents flag, the entire i_block
1993                  * array must be un/re-swapped to make it proper extents data.
1994                  */
1995                 if (extent_fs && !(inode->i_flags & EXT4_EXTENTS_FL) &&
1996                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1997                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO)) &&
1998                     (LINUX_S_ISREG(inode->i_mode) ||
1999                      LINUX_S_ISDIR(inode->i_mode))) {
2000                         void *ehp;
2001 #ifdef WORDS_BIGENDIAN
2002                         __u32 tmp_block[EXT2_N_BLOCKS];
2003
2004                         for (i = 0; i < EXT2_N_BLOCKS; i++)
2005                                 tmp_block[i] = ext2fs_swab32(inode->i_block[i]);
2006                         ehp = tmp_block;
2007 #else
2008                         ehp = inode->i_block;
2009 #endif
2010                         if ((ext2fs_extent_header_verify(ehp,
2011                                          sizeof(inode->i_block)) == 0) &&
2012                             (fix_problem(ctx, PR_1_UNSET_EXTENT_FL, &pctx))) {
2013                                 inode->i_flags |= EXT4_EXTENTS_FL;
2014 #ifdef WORDS_BIGENDIAN
2015                                 memcpy(inode->i_block, tmp_block,
2016                                        sizeof(inode->i_block));
2017 #endif
2018                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
2019                                 failed_csum = 0;
2020                         }
2021                 }
2022
2023                 if (ino == EXT2_BAD_INO) {
2024                         struct process_block_struct pb;
2025
2026                         if ((failed_csum || inode->i_mode || inode->i_uid ||
2027                              inode->i_gid || inode->i_links_count ||
2028                              (inode->i_flags & EXT4_INLINE_DATA_FL) ||
2029                              inode->i_file_acl) &&
2030                             fix_problem(ctx, PR_1_INVALID_BAD_INODE, &pctx)) {
2031                                 memset(inode, 0, sizeof(struct ext2_inode));
2032                                 e2fsck_write_inode(ctx, ino, inode,
2033                                                    "clear bad inode");
2034                                 failed_csum = 0;
2035                         }
2036
2037                         e2fsck_pass1_block_map_r_lock(ctx);
2038                         pctx.errcode = ext2fs_copy_bitmap(ctx->global_ctx ?
2039                                         ctx->global_ctx->block_found_map :
2040                                         ctx->block_found_map, &pb.fs_meta_blocks);
2041                         e2fsck_pass1_block_map_r_unlock(ctx);
2042                         if (pctx.errcode) {
2043                                 pctx.num = 4;
2044                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
2045                                 ctx->flags |= E2F_FLAG_ABORT;
2046                                 e2fsck_pass1_check_unlock(ctx);
2047                                 goto endit;
2048                         }
2049                         pb.ino = EXT2_BAD_INO;
2050                         pb.num_blocks = pb.last_block = 0;
2051                         pb.last_db_block = -1;
2052                         pb.num_illegal_blocks = 0;
2053                         pb.suppress = 0; pb.clear = 0; pb.is_dir = 0;
2054                         pb.is_reg = 0; pb.fragmented = 0; pb.bbcheck = 0;
2055                         pb.inode = inode;
2056                         pb.pctx = &pctx;
2057                         pb.ctx = ctx;
2058                         pctx.errcode = ext2fs_block_iterate3(fs, ino, 0,
2059                                      block_buf, process_bad_block, &pb);
2060                         ext2fs_free_block_bitmap(pb.fs_meta_blocks);
2061                         if (pctx.errcode) {
2062                                 fix_problem(ctx, PR_1_BLOCK_ITERATE, &pctx);
2063                                 ctx->flags |= E2F_FLAG_ABORT;
2064                                 e2fsck_pass1_check_unlock(ctx);
2065                                 goto endit;
2066                         }
2067                         if (pb.bbcheck)
2068                                 if (!fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK_PROMPT, &pctx)) {
2069                                 ctx->flags |= E2F_FLAG_ABORT;
2070                                 e2fsck_pass1_check_unlock(ctx);
2071                                 goto endit;
2072                         }
2073                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2074                         clear_problem_context(&pctx);
2075                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2076                         e2fsck_pass1_check_unlock(ctx);
2077                         continue;
2078                 } else if (ino == EXT2_ROOT_INO) {
2079                         /*
2080                          * Make sure the root inode is a directory; if
2081                          * not, offer to clear it.  It will be
2082                          * regenerated in pass #3.
2083                          */
2084                         if (!LINUX_S_ISDIR(inode->i_mode)) {
2085                                 if (fix_problem(ctx, PR_1_ROOT_NO_DIR, &pctx))
2086                                         goto clear_inode;
2087                         }
2088                         /*
2089                          * If dtime is set, offer to clear it.  mke2fs
2090                          * version 0.2b created filesystems with the
2091                          * dtime field set for the root and lost+found
2092                          * directories.  We won't worry about
2093                          * /lost+found, since that can be regenerated
2094                          * easily.  But we will fix the root directory
2095                          * as a special case.
2096                          */
2097                         if (inode->i_dtime && inode->i_links_count) {
2098                                 if (fix_problem(ctx, PR_1_ROOT_DTIME, &pctx)) {
2099                                         inode->i_dtime = 0;
2100                                         e2fsck_write_inode(ctx, ino, inode,
2101                                                            "pass1");
2102                                         failed_csum = 0;
2103                                 }
2104                         }
2105                 } else if (ino == EXT2_JOURNAL_INO) {
2106                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2107                         if (fs->super->s_journal_inum == EXT2_JOURNAL_INO) {
2108                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2109                                     fix_problem(ctx, PR_1_JOURNAL_BAD_MODE,
2110                                                 &pctx)) {
2111                                         inode->i_mode = LINUX_S_IFREG;
2112                                         e2fsck_write_inode(ctx, ino, inode,
2113                                                            "pass1");
2114                                         failed_csum = 0;
2115                                 }
2116                                 check_blocks(ctx, &pctx, block_buf, NULL);
2117                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2118                                 e2fsck_pass1_check_unlock(ctx);
2119                                 continue;
2120                         }
2121                         if ((inode->i_links_count ||
2122                              inode->i_blocks || inode->i_block[0]) &&
2123                             fix_problem(ctx, PR_1_JOURNAL_INODE_NOT_CLEAR,
2124                                         &pctx)) {
2125                                 memset(inode, 0, inode_size);
2126                                 ext2fs_icount_store(ctx->inode_link_info,
2127                                                     ino, 0);
2128                                 e2fsck_write_inode_full(ctx, ino, inode,
2129                                                         inode_size, "pass1");
2130                                 failed_csum = 0;
2131                         }
2132                 } else if (quota_inum_is_reserved(fs, ino)) {
2133                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2134                         if (ext2fs_has_feature_quota(fs->super) &&
2135                             quota_inum_is_super(fs->super, ino)) {
2136                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2137                                     fix_problem(ctx, PR_1_QUOTA_BAD_MODE,
2138                                                         &pctx)) {
2139                                         inode->i_mode = LINUX_S_IFREG;
2140                                         e2fsck_write_inode(ctx, ino, inode,
2141                                                         "pass1");
2142                                         failed_csum = 0;
2143                                 }
2144                                 check_blocks(ctx, &pctx, block_buf, NULL);
2145                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2146                                 e2fsck_pass1_check_unlock(ctx);
2147                                 continue;
2148                         }
2149                         if ((inode->i_links_count ||
2150                              inode->i_blocks || inode->i_block[0]) &&
2151                             fix_problem(ctx, PR_1_QUOTA_INODE_NOT_CLEAR,
2152                                         &pctx)) {
2153                                 memset(inode, 0, inode_size);
2154                                 ext2fs_icount_store(ctx->inode_link_info,
2155                                                     ino, 0);
2156                                 e2fsck_write_inode_full(ctx, ino, inode,
2157                                                         inode_size, "pass1");
2158                                 failed_csum = 0;
2159                         }
2160                 } else if (ino == fs->super->s_orphan_file_inum) {
2161                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2162                         if (ext2fs_has_feature_orphan_file(fs->super)) {
2163                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2164                                     fix_problem(ctx, PR_1_ORPHAN_FILE_BAD_MODE,
2165                                                 &pctx)) {
2166                                         inode->i_mode = LINUX_S_IFREG;
2167                                         e2fsck_write_inode(ctx, ino, inode,
2168                                                            "pass1");
2169                                         failed_csum = 0;
2170                                 }
2171                                 check_blocks(ctx, &pctx, block_buf, NULL);
2172                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2173                                 continue;
2174                         }
2175                         if ((inode->i_links_count ||
2176                              inode->i_blocks || inode->i_block[0]) &&
2177                             fix_problem(ctx, PR_1_ORPHAN_FILE_NOT_CLEAR,
2178                                         &pctx)) {
2179                                 memset(inode, 0, inode_size);
2180                                 ext2fs_icount_store(ctx->inode_link_info, ino,
2181                                                     0);
2182                                 e2fsck_write_inode_full(ctx, ino, inode,
2183                                                         inode_size, "pass1");
2184                                 failed_csum = 0;
2185                         }
2186                 } else if (ino < EXT2_FIRST_INODE(fs->super)) {
2187                         problem_t problem = 0;
2188
2189                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2190                         if (ino == EXT2_BOOT_LOADER_INO) {
2191                                 if (LINUX_S_ISDIR(inode->i_mode))
2192                                         problem = PR_1_RESERVED_BAD_MODE;
2193                         } else if (ino == EXT2_RESIZE_INO) {
2194                                 if (inode->i_mode &&
2195                                     !LINUX_S_ISREG(inode->i_mode))
2196                                         problem = PR_1_RESERVED_BAD_MODE;
2197                         } else {
2198                                 if (inode->i_mode != 0)
2199                                         problem = PR_1_RESERVED_BAD_MODE;
2200                         }
2201                         if (problem) {
2202                                 if (fix_problem(ctx, problem, &pctx)) {
2203                                         inode->i_mode = 0;
2204                                         e2fsck_write_inode(ctx, ino, inode,
2205                                                            "pass1");
2206                                         failed_csum = 0;
2207                                 }
2208                         }
2209                         check_blocks(ctx, &pctx, block_buf, NULL);
2210                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2211                         e2fsck_pass1_check_unlock(ctx);
2212                         continue;
2213                 }
2214
2215                 if (!inode->i_links_count) {
2216                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2217                         e2fsck_pass1_check_unlock(ctx);
2218                         continue;
2219                 }
2220                 /*
2221                  * n.b.  0.3c ext2fs code didn't clear i_links_count for
2222                  * deleted files.  Oops.
2223                  *
2224                  * Since all new ext2 implementations get this right,
2225                  * we now assume that the case of non-zero
2226                  * i_links_count and non-zero dtime means that we
2227                  * should keep the file, not delete it.
2228                  *
2229                  */
2230                 if (inode->i_dtime) {
2231                         if (fix_problem(ctx, PR_1_SET_DTIME, &pctx)) {
2232                                 inode->i_dtime = 0;
2233                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
2234                                 failed_csum = 0;
2235                         }
2236                 }
2237
2238                 ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2239                 switch (fs->super->s_creator_os) {
2240                     case EXT2_OS_HURD:
2241                         frag = inode->osd2.hurd2.h_i_frag;
2242                         fsize = inode->osd2.hurd2.h_i_fsize;
2243                         break;
2244                     default:
2245                         frag = fsize = 0;
2246                 }
2247
2248                 if (inode->i_faddr || frag || fsize ||
2249                     (!ext2fs_has_feature_largedir(fs->super) &&
2250                     (LINUX_S_ISDIR(inode->i_mode) && inode->i_size_high)))
2251                         mark_inode_bad(ctx, ino);
2252                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
2253                     !ext2fs_has_feature_64bit(fs->super) &&
2254                     inode->osd2.linux2.l_i_file_acl_high != 0)
2255                         mark_inode_bad(ctx, ino);
2256                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
2257                     !ext2fs_has_feature_huge_file(fs->super) &&
2258                     (inode->osd2.linux2.l_i_blocks_hi != 0))
2259                         mark_inode_bad(ctx, ino);
2260                 if (inode->i_flags & EXT2_IMAGIC_FL) {
2261                         if (imagic_fs) {
2262                                 if (!ctx->inode_imagic_map)
2263                                         alloc_imagic_map(ctx);
2264                                 ext2fs_mark_inode_bitmap2(ctx->inode_imagic_map,
2265                                                          ino);
2266                         } else {
2267                                 if (fix_problem(ctx, PR_1_SET_IMAGIC, &pctx)) {
2268                                         inode->i_flags &= ~EXT2_IMAGIC_FL;
2269                                         e2fsck_write_inode(ctx, ino,
2270                                                            inode, "pass1");
2271                                         failed_csum = 0;
2272                                 }
2273                         }
2274                 }
2275
2276                 check_inode_extra_space(ctx, &pctx, &ea_ibody_quota);
2277                 check_is_really_dir(ctx, &pctx, block_buf);
2278
2279                 /*
2280                  * ext2fs_inode_has_valid_blocks2 does not actually look
2281                  * at i_block[] values, so not endian-sensitive here.
2282                  */
2283                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL) &&
2284                     LINUX_S_ISLNK(inode->i_mode) &&
2285                     !ext2fs_inode_has_valid_blocks2(fs, inode) &&
2286                     fix_problem(ctx, PR_1_FAST_SYMLINK_EXTENT_FL, &pctx)) {
2287                         inode->i_flags &= ~EXT4_EXTENTS_FL;
2288                         e2fsck_write_inode(ctx, ino, inode, "pass1");
2289                         failed_csum = 0;
2290                 }
2291
2292                 if ((inode->i_flags & EXT4_ENCRYPT_FL) &&
2293                     add_encrypted_file(ctx, &pctx) < 0)
2294                         goto clear_inode;
2295
2296                 if (casefold_fs && inode->i_flags & EXT4_CASEFOLD_FL)
2297                         ext2fs_mark_inode_bitmap2(ctx->inode_casefold_map, ino);
2298
2299                 if (LINUX_S_ISDIR(inode->i_mode)) {
2300                         ext2fs_mark_inode_bitmap2(ctx->inode_dir_map, ino);
2301                         e2fsck_add_dir_info(ctx, ino, 0);
2302                         ctx->fs_directory_count++;
2303                         if (inode->i_flags & EXT4_CASEFOLD_FL)
2304                                 add_casefolded_dir(ctx, ino);
2305                 } else if (LINUX_S_ISREG (inode->i_mode)) {
2306                         ext2fs_mark_inode_bitmap2(ctx->inode_reg_map, ino);
2307                         ctx->fs_regular_count++;
2308                 } else if (LINUX_S_ISCHR (inode->i_mode) &&
2309                            e2fsck_pass1_check_device_inode(fs, inode)) {
2310                         check_extents_inlinedata(ctx, &pctx);
2311                         check_immutable(ctx, &pctx);
2312                         check_size(ctx, &pctx);
2313                         ctx->fs_chardev_count++;
2314                 } else if (LINUX_S_ISBLK (inode->i_mode) &&
2315                            e2fsck_pass1_check_device_inode(fs, inode)) {
2316                         check_extents_inlinedata(ctx, &pctx);
2317                         check_immutable(ctx, &pctx);
2318                         check_size(ctx, &pctx);
2319                         ctx->fs_blockdev_count++;
2320                 } else if (LINUX_S_ISLNK (inode->i_mode) &&
2321                            e2fsck_pass1_check_symlink(fs, ino, inode,
2322                                                       block_buf)) {
2323                         check_immutable(ctx, &pctx);
2324                         ctx->fs_symlinks_count++;
2325                         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
2326                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2327                                 e2fsck_pass1_check_unlock(ctx);
2328                                 continue;
2329                         } else if (ext2fs_is_fast_symlink(inode)) {
2330                                 ctx->fs_fast_symlinks_count++;
2331                                 check_blocks(ctx, &pctx, block_buf,
2332                                              &ea_ibody_quota);
2333                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2334                                 e2fsck_pass1_check_unlock(ctx);
2335                                 continue;
2336                         }
2337                 }
2338                 else if (LINUX_S_ISFIFO (inode->i_mode) &&
2339                          e2fsck_pass1_check_device_inode(fs, inode)) {
2340                         check_extents_inlinedata(ctx, &pctx);
2341                         check_immutable(ctx, &pctx);
2342                         check_size(ctx, &pctx);
2343                         ctx->fs_fifo_count++;
2344                 } else if ((LINUX_S_ISSOCK (inode->i_mode)) &&
2345                            e2fsck_pass1_check_device_inode(fs, inode)) {
2346                         check_extents_inlinedata(ctx, &pctx);
2347                         check_immutable(ctx, &pctx);
2348                         check_size(ctx, &pctx);
2349                         ctx->fs_sockets_count++;
2350                 } else
2351                         mark_inode_bad(ctx, ino);
2352                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
2353                     !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
2354                         if (inode->i_block[EXT2_IND_BLOCK])
2355                                 ctx->fs_ind_count++;
2356                         if (inode->i_block[EXT2_DIND_BLOCK])
2357                                 ctx->fs_dind_count++;
2358                         if (inode->i_block[EXT2_TIND_BLOCK])
2359                                 ctx->fs_tind_count++;
2360                 }
2361                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
2362                     !(inode->i_flags & EXT4_INLINE_DATA_FL) &&
2363                     (inode->i_block[EXT2_IND_BLOCK] ||
2364                      inode->i_block[EXT2_DIND_BLOCK] ||
2365                      inode->i_block[EXT2_TIND_BLOCK] ||
2366                      ext2fs_file_acl_block(fs, inode))) {
2367                         struct process_inode_block *itp;
2368
2369                         itp = &inodes_to_process[process_inode_count];
2370                         itp->ino = ino;
2371                         itp->ea_ibody_quota = ea_ibody_quota;
2372                         if (inode_size < sizeof(struct ext2_inode_large))
2373                                 memcpy(&itp->inode, inode, inode_size);
2374                         else
2375                                 memcpy(&itp->inode, inode, sizeof(itp->inode));
2376                         process_inode_count++;
2377                 } else
2378                         check_blocks(ctx, &pctx, block_buf, &ea_ibody_quota);
2379
2380                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2381
2382                 if (e2fsck_should_abort(ctx)) {
2383                         e2fsck_pass1_check_unlock(ctx);
2384                         goto endit;
2385                 }
2386
2387                 if (process_inode_count >= ctx->process_inode_size) {
2388                         process_inodes(ctx, block_buf, inodes_to_process,
2389                                        &process_inode_count);
2390
2391                         if (e2fsck_should_abort(ctx)) {
2392                                 e2fsck_pass1_check_unlock(ctx);
2393                                 goto endit;
2394                         }
2395                 }
2396                 e2fsck_pass1_check_unlock(ctx);
2397         }
2398         process_inodes(ctx, block_buf, inodes_to_process,
2399                        &process_inode_count);
2400         ext2fs_close_inode_scan(scan);
2401         scan = NULL;
2402
2403         if (ctx->ea_block_quota_blocks) {
2404                 ea_refcount_free(ctx->ea_block_quota_blocks);
2405                 ctx->ea_block_quota_blocks = 0;
2406         }
2407
2408         if (ctx->ea_block_quota_inodes) {
2409                 ea_refcount_free(ctx->ea_block_quota_inodes);
2410                 ctx->ea_block_quota_inodes = 0;
2411         }
2412
2413         /* We don't need the encryption policy => ID map any more */
2414         destroy_encryption_policy_map(ctx);
2415
2416         if (ctx->flags & E2F_FLAG_RESTART) {
2417                 /*
2418                  * Only the master copy of the superblock and block
2419                  * group descriptors are going to be written during a
2420                  * restart, so set the superblock to be used to be the
2421                  * master superblock.
2422                  */
2423                 ctx->use_superblock = 0;
2424                 goto endit;
2425         }
2426
2427         if (ctx->large_dirs && !ext2fs_has_feature_largedir(fs->super)) {
2428                 if (fix_problem(ctx, PR_2_FEATURE_LARGE_DIRS, &pctx)) {
2429                         ext2fs_set_feature_largedir(fs->super);
2430                         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
2431                         ext2fs_mark_super_dirty(fs);
2432                 }
2433                 if (fs->super->s_rev_level == EXT2_GOOD_OLD_REV &&
2434                     fix_problem(ctx, PR_1_FS_REV_LEVEL, &pctx)) {
2435                         ext2fs_update_dynamic_rev(fs);
2436                         ext2fs_mark_super_dirty(fs);
2437                 }
2438         }
2439
2440         ctx->flags |= E2F_FLAG_ALLOC_OK;
2441         ext2fs_free_mem(&inodes_to_process);
2442 endit:
2443         e2fsck_use_inode_shortcuts(ctx, 0);
2444         ext2fs_free_mem(&inodes_to_process);
2445         inodes_to_process = 0;
2446
2447         if (scan)
2448                 ext2fs_close_inode_scan(scan);
2449         if (block_buf)
2450                 ext2fs_free_mem(&block_buf);
2451         if (inode)
2452                 ext2fs_free_mem(&inode);
2453
2454         /*
2455          * The l+f inode may have been cleared, so zap it now and
2456          * later passes will recalculate it if necessary
2457          */
2458         ctx->lost_and_found = 0;
2459
2460         if ((ctx->flags & E2F_FLAG_SIGNAL_MASK) == 0)
2461                 print_resource_track(ctx, _("Pass 1"), &rtrack, ctx->fs->io);
2462         else
2463                 ctx->invalid_bitmaps++;
2464 #ifdef  HAVE_PTHREAD
2465         /* reset update_thread after this thread exit */
2466         e2fsck_pass1_block_map_w_lock(ctx);
2467         if (check_mmp)
2468                 global_ctx->mmp_update_thread = 0;
2469         e2fsck_pass1_block_map_w_unlock(ctx);
2470 #endif
2471 }
2472
2473 #ifdef HAVE_PTHREAD
2474 static errcode_t e2fsck_pass1_copy_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2475                                           ext2fs_generic_bitmap *dest)
2476 {
2477         errcode_t ret;
2478
2479         ret = ext2fs_copy_bitmap(*src, dest);
2480         if (ret)
2481                 return ret;
2482
2483         (*dest)->fs = fs;
2484
2485         return 0;
2486 }
2487
2488 static void e2fsck_pass1_free_bitmap(ext2fs_generic_bitmap *bitmap)
2489 {
2490         if (*bitmap) {
2491                 ext2fs_free_generic_bmap(*bitmap);
2492                 *bitmap = NULL;
2493         }
2494
2495 }
2496
2497 static errcode_t e2fsck_pass1_merge_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2498                                           ext2fs_generic_bitmap *dest)
2499 {
2500         errcode_t ret = 0;
2501
2502         if (*src) {
2503                 if (*dest == NULL) {
2504                         *dest = *src;
2505                         *src = NULL;
2506                 } else {
2507                         ret = ext2fs_merge_bitmap(*src, *dest, NULL, NULL);
2508                         if (ret)
2509                                 return ret;
2510                 }
2511                 (*dest)->fs = fs;
2512         }
2513
2514         return 0;
2515 }
2516
2517 static errcode_t e2fsck_pass1_copy_fs(ext2_filsys dest, e2fsck_t src_context,
2518                                       ext2_filsys src)
2519 {
2520         errcode_t       retval;
2521
2522         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2523         dest->inode_map = NULL;
2524         dest->block_map = NULL;
2525         dest->badblocks = NULL;
2526         if (dest->dblist)
2527                 dest->dblist->fs = dest;
2528         if (src->block_map) {
2529                 retval = e2fsck_pass1_copy_bitmap(dest, &src->block_map,
2530                                                   &dest->block_map);
2531                 if (retval)
2532                         return retval;
2533         }
2534         if (src->inode_map) {
2535                 retval = e2fsck_pass1_copy_bitmap(dest, &src->inode_map,
2536                                                   &dest->inode_map);
2537                 if (retval)
2538                         return retval;
2539         }
2540
2541         if (src->badblocks) {
2542                 retval = ext2fs_badblocks_copy(src->badblocks,
2543                                                &dest->badblocks);
2544                 if (retval)
2545                         return retval;
2546         }
2547
2548         /* disable it for now */
2549         src_context->openfs_flags &= ~EXT2_FLAG_EXCLUSIVE;
2550         retval = ext2fs_open_channel(dest, src_context->io_options,
2551                                      src_context->io_manager,
2552                                      src_context->openfs_flags,
2553                                      src->io->block_size);
2554         if (retval)
2555                 return retval;
2556
2557         /* Block size might not be default */
2558         io_channel_set_blksize(dest->io, src->io->block_size);
2559         ehandler_init(dest->io);
2560
2561         assert(dest->io->magic == src->io->magic);
2562         assert(dest->io->manager == src->io->manager);
2563         assert(strcmp(dest->io->name, src->io->name) == 0);
2564         assert(dest->io->block_size == src->io->block_size);
2565         assert(dest->io->read_error == src->io->read_error);
2566         assert(dest->io->write_error == src->io->write_error);
2567         assert(dest->io->refcount == src->io->refcount);
2568         assert(dest->io->flags == src->io->flags);
2569         assert(dest->io->app_data == dest);
2570         assert(src->io->app_data == src);
2571         assert(dest->io->align == src->io->align);
2572
2573         /* The data should be written to disk immediately */
2574         dest->io->flags |= CHANNEL_FLAGS_WRITETHROUGH;
2575         /* icache will be rebuilt if needed, so do not copy from @src */
2576         src->icache = NULL;
2577         return 0;
2578 }
2579
2580 static int e2fsck_pass1_merge_fs(ext2_filsys dest, ext2_filsys src)
2581 {
2582         struct ext2_inode_cache *icache = dest->icache;
2583         errcode_t retval = 0;
2584         io_channel dest_io;
2585         io_channel dest_image_io;
2586         ext2fs_inode_bitmap inode_map;
2587         ext2fs_block_bitmap block_map;
2588         ext2_badblocks_list badblocks;
2589         ext2_dblist dblist;
2590         int flags;
2591         e2fsck_t dest_ctx = dest->priv_data;
2592
2593         dest_io = dest->io;
2594         dest_image_io = dest->image_io;
2595         inode_map = dest->inode_map;
2596         block_map = dest->block_map;
2597         badblocks = dest->badblocks;
2598         dblist = dest->dblist;
2599         flags = dest->flags;
2600
2601         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2602         dest->io = dest_io;
2603         dest->image_io = dest_image_io;
2604         dest->icache = icache;
2605         dest->inode_map = inode_map;
2606         dest->block_map = block_map;
2607         dest->badblocks = badblocks;
2608         dest->dblist = dblist;
2609         dest->priv_data = dest_ctx;
2610         if (dest->dblist)
2611                 dest->dblist->fs = dest;
2612         dest->flags = src->flags | flags;
2613         if (!(src->flags & EXT2_FLAG_VALID) || !(flags & EXT2_FLAG_VALID))
2614                 ext2fs_unmark_valid(dest);
2615
2616         if (src->icache) {
2617                 ext2fs_free_inode_cache(src->icache);
2618                 src->icache = NULL;
2619         }
2620
2621         retval = e2fsck_pass1_merge_bitmap(dest, &src->inode_map,
2622                                            &dest->inode_map);
2623         if (retval)
2624                 goto out;
2625
2626         retval = e2fsck_pass1_merge_bitmap(dest, &src->block_map,
2627                                           &dest->block_map);
2628         if (retval)
2629                 goto out;
2630
2631         if (src->dblist) {
2632                 if (dest->dblist) {
2633                         retval = ext2fs_merge_dblist(src->dblist,
2634                                                      dest->dblist);
2635                         if (retval)
2636                                 goto out;
2637                 } else {
2638                         dest->dblist = src->dblist;
2639                         dest->dblist->fs = dest;
2640                         src->dblist = NULL;
2641                 }
2642         }
2643
2644         if (src->badblocks) {
2645                 if (dest->badblocks == NULL)
2646                         retval = ext2fs_badblocks_copy(src->badblocks,
2647                                                        &dest->badblocks);
2648                 else
2649                         retval = ext2fs_badblocks_merge(src->badblocks,
2650                                                         dest->badblocks);
2651         }
2652 out:
2653         io_channel_close(src->io);
2654         if (src->inode_map)
2655                 ext2fs_free_generic_bmap(src->inode_map);
2656         if (src->block_map)
2657                 ext2fs_free_generic_bmap(src->block_map);
2658         if (src->badblocks)
2659                 ext2fs_badblocks_list_free(src->badblocks);
2660         if (src->dblist)
2661                 ext2fs_free_dblist(src->dblist);
2662
2663         return retval;
2664 }
2665
2666 static void e2fsck_pass1_copy_invalid_bitmaps(e2fsck_t global_ctx,
2667                                               e2fsck_t thread_ctx)
2668 {
2669         dgrp_t i, j;
2670         dgrp_t grp_start = thread_ctx->thread_info.et_group_start;
2671         dgrp_t grp_end = thread_ctx->thread_info.et_group_end;
2672         dgrp_t total = grp_end - grp_start;
2673
2674         thread_ctx->invalid_inode_bitmap_flag =
2675                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2676                                                 "invalid_inode_bitmap");
2677         thread_ctx->invalid_block_bitmap_flag =
2678                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2679                                                "invalid_block_bitmap");
2680         thread_ctx->invalid_inode_table_flag =
2681                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2682                                                "invalid_inode_table");
2683
2684         memcpy(thread_ctx->invalid_block_bitmap_flag,
2685                &global_ctx->invalid_block_bitmap_flag[grp_start],
2686                total * sizeof(int));
2687         memcpy(thread_ctx->invalid_inode_bitmap_flag,
2688                &global_ctx->invalid_inode_bitmap_flag[grp_start],
2689                total * sizeof(int));
2690         memcpy(thread_ctx->invalid_inode_table_flag,
2691                &global_ctx->invalid_inode_table_flag[grp_start],
2692                total * sizeof(int));
2693
2694         thread_ctx->invalid_bitmaps = 0;
2695         for (i = grp_start, j = 0; i < grp_end; i++, j++) {
2696                 if (thread_ctx->invalid_block_bitmap_flag[j])
2697                         thread_ctx->invalid_bitmaps++;
2698                 if (thread_ctx->invalid_inode_bitmap_flag[j])
2699                         thread_ctx->invalid_bitmaps++;
2700                 if (thread_ctx->invalid_inode_table_flag[j])
2701                         thread_ctx->invalid_bitmaps++;
2702         }
2703 }
2704
2705 static void e2fsck_pass1_merge_invalid_bitmaps(e2fsck_t global_ctx,
2706                                                e2fsck_t thread_ctx)
2707 {
2708         dgrp_t grp_start = thread_ctx->thread_info.et_group_start;
2709         dgrp_t grp_end = thread_ctx->thread_info.et_group_end;
2710         dgrp_t total = grp_end - grp_start;
2711
2712         memcpy(&global_ctx->invalid_block_bitmap_flag[grp_start],
2713                thread_ctx->invalid_block_bitmap_flag, total * sizeof(int));
2714         memcpy(&global_ctx->invalid_inode_bitmap_flag[grp_start],
2715                thread_ctx->invalid_inode_bitmap_flag, total * sizeof(int));
2716         memcpy(&global_ctx->invalid_inode_table_flag[grp_start],
2717                thread_ctx->invalid_inode_table_flag, total * sizeof(int));
2718         global_ctx->invalid_bitmaps += thread_ctx->invalid_bitmaps;
2719 }
2720
2721 static errcode_t e2fsck_pass1_thread_prepare(e2fsck_t global_ctx, e2fsck_t *thread_ctx,
2722                                              int thread_index, int num_threads,
2723                                              dgrp_t average_group)
2724 {
2725         errcode_t               retval;
2726         e2fsck_t                thread_context;
2727         ext2_filsys             thread_fs;
2728         ext2_filsys             global_fs = global_ctx->fs;
2729         struct e2fsck_thread    *tinfo;
2730
2731         assert(global_ctx->inode_used_map == NULL);
2732         assert(global_ctx->inode_dir_map == NULL);
2733         assert(global_ctx->inode_bb_map == NULL);
2734         assert(global_ctx->inode_imagic_map == NULL);
2735         assert(global_ctx->inode_reg_map == NULL);
2736         assert(global_ctx->inodes_to_rebuild == NULL);
2737
2738         assert(global_ctx->block_found_map != NULL);
2739         assert(global_ctx->block_metadata_map != NULL);
2740         assert(global_ctx->block_dup_map != NULL);
2741         assert(global_ctx->block_ea_map == NULL);
2742         assert(global_ctx->fs->dblist == NULL);
2743
2744         retval = ext2fs_get_mem(sizeof(struct e2fsck_struct), &thread_context);
2745         if (retval) {
2746                 com_err(global_ctx->program_name, retval, "while allocating memory");
2747                 return retval;
2748         }
2749         memcpy(thread_context, global_ctx, sizeof(struct e2fsck_struct));
2750         thread_context->block_dup_map = NULL;
2751         thread_context->casefolded_dirs = NULL;
2752
2753         retval = e2fsck_allocate_block_bitmap(global_ctx->fs,
2754                                 _("in-use block map"), EXT2FS_BMAP64_RBTREE,
2755                                 "block_found_map", &thread_context->block_found_map);
2756         if (retval)
2757                 goto out_context;
2758
2759         thread_context->global_ctx = global_ctx;
2760         retval = ext2fs_get_mem(sizeof(struct struct_ext2_filsys), &thread_fs);
2761         if (retval) {
2762                 com_err(global_ctx->program_name, retval, "while allocating memory");
2763                 goto out_context;
2764         }
2765
2766         io_channel_flush_cleanup(global_fs->io);
2767         retval = e2fsck_pass1_copy_fs(thread_fs, global_ctx, global_fs);
2768         if (retval) {
2769                 com_err(global_ctx->program_name, retval, "while copying fs");
2770                 goto out_fs;
2771         }
2772         thread_fs->priv_data = thread_context;
2773
2774         thread_context->thread_info.et_thread_index = thread_index;
2775         set_up_logging(thread_context);
2776
2777         tinfo = &thread_context->thread_info;
2778         tinfo->et_group_start = average_group * thread_index;
2779         if (thread_index == global_fs->fs_num_threads - 1)
2780                 tinfo->et_group_end = thread_fs->group_desc_count;
2781         else
2782                 tinfo->et_group_end = average_group * (thread_index + 1);
2783         tinfo->et_group_next = tinfo->et_group_start;
2784         tinfo->et_inode_number = 0;
2785         tinfo->et_log_buf[0] = '\0';
2786         tinfo->et_log_length = 0;
2787         if (thread_context->options & E2F_OPT_MULTITHREAD)
2788                 log_out(thread_context, _("Scan group range [%d, %d)\n"),
2789                         tinfo->et_group_start, tinfo->et_group_end);
2790         thread_context->fs = thread_fs;
2791         retval = quota_init_context(&thread_context->qctx, thread_fs, 0);
2792         if (retval) {
2793                 com_err(global_ctx->program_name, retval,
2794                         "while init quota context");
2795                 goto out_fs;
2796         }
2797         *thread_ctx = thread_context;
2798         e2fsck_pass1_copy_invalid_bitmaps(global_ctx, thread_context);
2799         return 0;
2800 out_fs:
2801         ext2fs_free_mem(&thread_fs);
2802 out_context:
2803         if (thread_context->block_found_map)
2804                 ext2fs_free_mem(&thread_context->block_found_map);
2805         ext2fs_free_mem(&thread_context);
2806         return retval;
2807 }
2808
2809 static void e2fsck_pass1_merge_dir_info(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2810 {
2811         if (thread_ctx->dir_info == NULL)
2812                 return;
2813
2814         if (global_ctx->dir_info == NULL) {
2815                 global_ctx->dir_info = thread_ctx->dir_info;
2816                 thread_ctx->dir_info = NULL;
2817                 return;
2818         }
2819
2820         e2fsck_merge_dir_info(global_ctx, thread_ctx->dir_info,
2821                               global_ctx->dir_info);
2822 }
2823
2824 static void e2fsck_pass1_merge_dx_dir(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2825 {
2826         if (thread_ctx->dx_dir_info == NULL)
2827                 return;
2828
2829         if (global_ctx->dx_dir_info == NULL) {
2830                 global_ctx->dx_dir_info = thread_ctx->dx_dir_info;
2831                 global_ctx->dx_dir_info_size = thread_ctx->dx_dir_info_size;
2832                 global_ctx->dx_dir_info_count = thread_ctx->dx_dir_info_count;
2833                 thread_ctx->dx_dir_info = NULL;
2834                 return;
2835         }
2836
2837         e2fsck_merge_dx_dir(global_ctx, thread_ctx);
2838 }
2839
2840 static inline errcode_t
2841 e2fsck_pass1_merge_icount(ext2_icount_t *dest_icount,
2842                           ext2_icount_t *src_icount)
2843 {
2844         if (*src_icount) {
2845                 if (*dest_icount == NULL) {
2846                         *dest_icount = *src_icount;
2847                         *src_icount = NULL;
2848                 } else {
2849                         errcode_t ret;
2850
2851                         ret = ext2fs_icount_merge(*src_icount,
2852                                                   *dest_icount);
2853                         if (ret)
2854                                 return ret;
2855                 }
2856         }
2857
2858         return 0;
2859 }
2860
2861 static errcode_t e2fsck_pass1_merge_icounts(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2862 {
2863         errcode_t ret;
2864
2865         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_count,
2866                                         &thread_ctx->inode_count);
2867         if (ret)
2868                 return ret;
2869         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_link_info,
2870                                         &thread_ctx->inode_link_info);
2871
2872         return ret;
2873 }
2874
2875 static errcode_t e2fsck_pass1_merge_dirs_to_hash(e2fsck_t global_ctx,
2876                                                  e2fsck_t thread_ctx)
2877 {
2878         errcode_t retval = 0;
2879
2880         if (!thread_ctx->dirs_to_hash)
2881                 return 0;
2882
2883         if (!global_ctx->dirs_to_hash)
2884                 retval = ext2fs_badblocks_copy(thread_ctx->dirs_to_hash,
2885                                                &global_ctx->dirs_to_hash);
2886         else
2887                 retval = ext2fs_badblocks_merge(thread_ctx->dirs_to_hash,
2888                                                 global_ctx->dirs_to_hash);
2889
2890         return retval;
2891 }
2892
2893 static errcode_t e2fsck_pass1_merge_ea_inode_refs(e2fsck_t global_ctx,
2894                                                   e2fsck_t thread_ctx)
2895 {
2896         ea_value_t count;
2897         blk64_t blk;
2898         errcode_t retval;
2899
2900         if (!thread_ctx->ea_inode_refs)
2901                 return 0;
2902
2903         if (!global_ctx->ea_inode_refs) {
2904                 global_ctx->ea_inode_refs = thread_ctx->ea_inode_refs;
2905                 thread_ctx->ea_inode_refs = NULL;
2906                 return 0;
2907         }
2908
2909         ea_refcount_intr_begin(thread_ctx->ea_inode_refs);
2910         while (1) {
2911                 if ((blk = ea_refcount_intr_next(thread_ctx->ea_inode_refs,
2912                                                  &count)) == 0)
2913                         break;
2914                 if (!global_ctx->block_ea_map ||
2915                     !ext2fs_fast_test_block_bitmap2(global_ctx->block_ea_map,
2916                                                     blk)) {
2917                         retval = ea_refcount_store(global_ctx->ea_inode_refs,
2918                                                    blk, count);
2919                         if (retval)
2920                                 return retval;
2921                 }
2922         }
2923
2924         return retval;
2925 }
2926
2927 static ea_value_t ea_refcount_usage(e2fsck_t ctx, blk64_t blk,
2928                                     ea_value_t *orig)
2929 {
2930         ea_value_t count_cur;
2931         ea_value_t count_extra = 0;
2932         ea_value_t count_orig;
2933
2934         ea_refcount_fetch(ctx->refcount_orig, blk, &count_orig);
2935         ea_refcount_fetch(ctx->refcount, blk, &count_cur);
2936         /* most of time this is not needed */
2937         if (ctx->refcount_extra && count_cur == 0)
2938                 ea_refcount_fetch(ctx->refcount_extra, blk, &count_extra);
2939
2940         if (!count_orig)
2941                 count_orig = *orig;
2942         else if (orig)
2943                 *orig = count_orig;
2944
2945         return count_orig + count_extra - count_cur;
2946 }
2947
2948 static errcode_t e2fsck_pass1_merge_ea_refcount(e2fsck_t global_ctx,
2949                                                 e2fsck_t thread_ctx)
2950 {
2951         ea_value_t count;
2952         blk64_t blk;
2953         errcode_t retval = 0;
2954
2955         if (!thread_ctx->refcount)
2956                 return 0;
2957
2958         if (!global_ctx->refcount) {
2959                 global_ctx->refcount = thread_ctx->refcount;
2960                 thread_ctx->refcount = NULL;
2961                 global_ctx->refcount_extra = thread_ctx->refcount;
2962                 thread_ctx->refcount_extra = NULL;
2963                 return 0;
2964         }
2965
2966         ea_refcount_intr_begin(thread_ctx->refcount);
2967         while (1) {
2968                 if ((blk = ea_refcount_intr_next(thread_ctx->refcount,
2969                                                  &count)) == 0)
2970                         break;
2971                 /**
2972                  * this EA has never seen before, so just store its
2973                  * refcount and refcount_extra into global_ctx if needed.
2974                  */
2975                 if (!global_ctx->block_ea_map ||
2976                     !ext2fs_fast_test_block_bitmap2(global_ctx->block_ea_map,
2977                                                     blk)) {
2978                         ea_value_t extra;
2979
2980                         retval = ea_refcount_store(global_ctx->refcount,
2981                                                    blk, count);
2982                         if (retval)
2983                                 return retval;
2984
2985                         if (count > 0 || !thread_ctx->refcount_extra)
2986                                 continue;
2987                         ea_refcount_fetch(thread_ctx->refcount_extra, blk,
2988                                           &extra);
2989                         if (extra == 0)
2990                                 continue;
2991
2992                         if (!global_ctx->refcount_extra) {
2993                                 retval = ea_refcount_create(0,
2994                                                 &global_ctx->refcount_extra);
2995                                 if (retval)
2996                                         return retval;
2997                         }
2998                         retval = ea_refcount_store(global_ctx->refcount_extra,
2999                                                    blk, extra);
3000                         if (retval)
3001                                 return retval;
3002                 } else {
3003                         ea_value_t orig;
3004                         ea_value_t thread_usage;
3005                         ea_value_t global_usage;
3006                         ea_value_t new;
3007
3008                         thread_usage = ea_refcount_usage(thread_ctx,
3009                                                          blk, &orig);
3010                         global_usage = ea_refcount_usage(global_ctx,
3011                                                          blk, &orig);
3012                         if (thread_usage + global_usage <= orig) {
3013                                 new = orig - thread_usage - global_usage;
3014                                 retval = ea_refcount_store(global_ctx->refcount,
3015                                                            blk, new);
3016                                 if (retval)
3017                                         return retval;
3018                                 continue;
3019                         }
3020                         /* update it is as zero */
3021                         retval = ea_refcount_store(global_ctx->refcount,
3022                                                    blk, 0);
3023                         if (retval)
3024                                 return retval;
3025                         /* Ooops, this EA was referenced more than it stated */
3026                         if (!global_ctx->refcount_extra) {
3027                                 retval = ea_refcount_create(0,
3028                                                 &global_ctx->refcount_extra);
3029                                 if (retval)
3030                                         return retval;
3031                         }
3032                         new = global_usage + thread_usage - orig;
3033                         retval = ea_refcount_store(global_ctx->refcount_extra,
3034                                                    blk, new);
3035                         if (retval)
3036                                 return retval;
3037                 }
3038         }
3039
3040         return retval;
3041 }
3042
3043 static errcode_t e2fsck_pass1_merge_casefolded_dirs(e2fsck_t global_ctx,
3044                                                    e2fsck_t thread_ctx)
3045 {
3046         errcode_t retval = 0;
3047
3048         if (!thread_ctx->casefolded_dirs)
3049                 return 0;
3050
3051         if (!global_ctx->casefolded_dirs)
3052                 retval = ext2fs_badblocks_copy(thread_ctx->casefolded_dirs,
3053                                                &global_ctx->casefolded_dirs);
3054         else
3055                 retval = ext2fs_badblocks_merge(thread_ctx->casefolded_dirs,
3056                                                 global_ctx->casefolded_dirs);
3057
3058         return retval;
3059 }
3060
3061 static errcode_t e2fsck_pass1_merge_context(e2fsck_t global_ctx,
3062                                             e2fsck_t thread_ctx)
3063 {
3064         ext2_filsys global_fs = global_ctx->fs;
3065         errcode_t retval;
3066         int i;
3067
3068         global_ctx->fs_directory_count += thread_ctx->fs_directory_count;
3069         global_ctx->fs_regular_count += thread_ctx->fs_regular_count;
3070         global_ctx->fs_blockdev_count += thread_ctx->fs_blockdev_count;
3071         global_ctx->fs_chardev_count += thread_ctx->fs_chardev_count;
3072         global_ctx->fs_links_count += thread_ctx->fs_links_count;
3073         global_ctx->fs_symlinks_count += thread_ctx->fs_symlinks_count;
3074         global_ctx->fs_fast_symlinks_count += thread_ctx->fs_fast_symlinks_count;
3075         global_ctx->fs_fifo_count += thread_ctx->fs_fifo_count;
3076         global_ctx->fs_total_count += thread_ctx->fs_total_count;
3077         global_ctx->fs_badblocks_count += thread_ctx->fs_badblocks_count;
3078         global_ctx->fs_sockets_count += thread_ctx->fs_sockets_count;
3079         global_ctx->fs_ind_count += thread_ctx->fs_ind_count;
3080         global_ctx->fs_dind_count += thread_ctx->fs_dind_count;
3081         global_ctx->fs_tind_count += thread_ctx->fs_tind_count;
3082         global_ctx->fs_fragmented += thread_ctx->fs_fragmented;
3083         global_ctx->fs_fragmented_dir += thread_ctx->fs_fragmented_dir;
3084         global_ctx->large_files += thread_ctx->large_files;
3085         /* threads might enable E2F_OPT_YES */
3086         global_ctx->options |= thread_ctx->options;
3087         global_ctx->flags |= thread_ctx->flags;
3088         /*
3089          * The l+f inode may have been cleared, so zap it now and
3090          * later passes will recalculate it if necessary
3091          */
3092         global_ctx->lost_and_found = 0;
3093         /* merge extent depth count */
3094         for (i = 0; i < MAX_EXTENT_DEPTH_COUNT; i++)
3095                 global_ctx->extent_depth_count[i] +=
3096                         thread_ctx->extent_depth_count[i];
3097
3098         e2fsck_pass1_merge_dir_info(global_ctx, thread_ctx);
3099         e2fsck_pass1_merge_dx_dir(global_ctx, thread_ctx);
3100
3101         retval = e2fsck_pass1_merge_fs(global_ctx->fs, thread_ctx->fs);
3102         if (retval) {
3103                 com_err(global_ctx->program_name, 0, _("while merging fs\n"));
3104                 return retval;
3105         }
3106         retval = e2fsck_pass1_merge_icounts(global_ctx, thread_ctx);
3107         if (retval) {
3108                 com_err(global_ctx->program_name, 0,
3109                         _("while merging icounts\n"));
3110                 return retval;
3111         }
3112
3113         retval = e2fsck_pass1_merge_dirs_to_hash(global_ctx, thread_ctx);
3114         if (retval) {
3115                 com_err(global_ctx->program_name, 0,
3116                         _("while merging dirs to hash\n"));
3117                 return retval;
3118         }
3119
3120         e2fsck_pass1_merge_ea_inode_refs(global_ctx, thread_ctx);
3121         e2fsck_pass1_merge_ea_refcount(global_ctx, thread_ctx);
3122         retval = quota_merge_and_update_usage(global_ctx->qctx,
3123                                               thread_ctx->qctx);
3124         if (retval)
3125                 return retval;
3126
3127         retval = e2fsck_pass1_merge_casefolded_dirs(global_ctx, thread_ctx);
3128         if (retval) {
3129                 com_err(global_ctx->program_name, 0,
3130                         _("while merging casefolded dirs\n"));
3131                 return retval;
3132         }
3133
3134         e2fsck_pass1_merge_invalid_bitmaps(global_ctx, thread_ctx);
3135
3136         retval = e2fsck_pass1_merge_bitmap(global_fs,
3137                                 &thread_ctx->inode_used_map,
3138                                 &global_ctx->inode_used_map);
3139         if (retval)
3140                 return retval;
3141
3142         retval = e2fsck_pass1_merge_bitmap(global_fs,
3143                                 &thread_ctx->inode_bad_map,
3144                                 &global_ctx->inode_bad_map);
3145         if (retval)
3146                 return retval;
3147         retval = e2fsck_pass1_merge_bitmap(global_fs,
3148                                         &thread_ctx->inode_dir_map,
3149                                         &global_ctx->inode_dir_map);
3150         if (retval)
3151                 return retval;
3152         retval = e2fsck_pass1_merge_bitmap(global_fs,
3153                                 &thread_ctx->inode_bb_map,
3154                                 &global_ctx->inode_bb_map);
3155         if (retval)
3156                 return retval;
3157         retval = e2fsck_pass1_merge_bitmap(global_fs,
3158                                 &thread_ctx->inode_imagic_map,
3159                                 &global_ctx->inode_imagic_map);
3160         if (retval)
3161                 return retval;
3162         retval = e2fsck_pass1_merge_bitmap(global_fs,
3163                                 &thread_ctx->inode_reg_map,
3164                                 &global_ctx->inode_reg_map);
3165         if (retval)
3166                 return retval;
3167         retval = e2fsck_pass1_merge_bitmap(global_fs,
3168                                 &thread_ctx->inodes_to_rebuild,
3169                                 &global_ctx->inodes_to_rebuild);
3170         if (retval)
3171                 return retval;
3172         retval = e2fsck_pass1_merge_bitmap(global_fs,
3173                                 &thread_ctx->block_ea_map,
3174                                 &global_ctx->block_ea_map);
3175         if (retval)
3176                 return retval;
3177
3178         if (ext2fs_has_feature_shared_blocks(global_fs->super) &&
3179             !(global_ctx->options & E2F_OPT_UNSHARE_BLOCKS))
3180                 return 0;
3181         /*
3182          * This need be done after merging block_ea_map
3183          * because ea block might be shared, we need exclude
3184          * them from dup blocks.
3185          */
3186         e2fsck_pass1_block_map_w_lock(thread_ctx);
3187         retval = ext2fs_merge_bitmap(thread_ctx->block_found_map,
3188                                      global_ctx->block_found_map,
3189                                      global_ctx->block_dup_map,
3190                                      global_ctx->block_ea_map);
3191         e2fsck_pass1_block_map_w_unlock(thread_ctx);
3192         if (retval == EEXIST)
3193                 global_ctx->flags |= E2F_FLAG_DUP_BLOCK;
3194
3195         return 0;
3196 }
3197
3198 static int e2fsck_pass1_thread_join(e2fsck_t global_ctx, e2fsck_t thread_ctx)
3199 {
3200         errcode_t       retval;
3201
3202         retval = e2fsck_pass1_merge_context(global_ctx, thread_ctx);
3203         ext2fs_free_mem(&thread_ctx->fs);
3204         if (thread_ctx->logf)
3205                 fclose(thread_ctx->logf);
3206         if (thread_ctx->problem_logf) {
3207                 fputs("</problem_log>\n", thread_ctx->problem_logf);
3208                 fclose(thread_ctx->problem_logf);
3209         }
3210
3211         quota_release_context(&thread_ctx->qctx);
3212         /*
3213          * @block_metadata_map and @block_dup_map are
3214          * shared, so we don't free them.
3215          */
3216         thread_ctx->block_metadata_map = NULL;
3217         thread_ctx->block_dup_map = NULL;
3218         e2fsck_reset_context(thread_ctx);
3219         ext2fs_free_mem(&thread_ctx);
3220
3221         return retval;
3222 }
3223
3224 static int e2fsck_pass1_threads_join(e2fsck_t global_ctx)
3225 {
3226         errcode_t rc;
3227         errcode_t ret = 0;
3228         struct e2fsck_thread_info *infos = global_ctx->infos;
3229         struct e2fsck_thread_info *pinfo;
3230         int num_threads = global_ctx->pfs_num_threads;
3231         int i;
3232
3233         /* merge invalid bitmaps will recalculate it */
3234         global_ctx->invalid_bitmaps = 0;
3235         for (i = 0; i < num_threads; i++) {
3236                 pinfo = &infos[i];
3237
3238                 if (!pinfo->eti_started)
3239                         continue;
3240
3241                 rc = pthread_join(pinfo->eti_thread_id, NULL);
3242                 if (rc) {
3243                         com_err(global_ctx->program_name, rc,
3244                                 _("while joining thread\n"));
3245                         if (ret == 0)
3246                                 ret = rc;
3247                 }
3248                 rc = e2fsck_pass1_thread_join(global_ctx, infos[i].eti_thread_ctx);
3249                 if (rc) {
3250                         com_err(global_ctx->program_name, rc,
3251                                 _("while joining pass1 thread\n"));
3252                         if (ret == 0)
3253                                 ret = rc;
3254                 }
3255         }
3256         free(infos);
3257         global_ctx->infos = NULL;
3258
3259         return ret;
3260 }
3261
3262 static void *e2fsck_pass1_thread(void *arg)
3263 {
3264         struct e2fsck_thread_info       *info = arg;
3265         e2fsck_t                         thread_ctx = info->eti_thread_ctx;
3266 #ifdef DEBUG_THREADS
3267         struct e2fsck_thread_debug      *thread_debug = info->eti_debug;
3268 #endif
3269
3270 #ifdef DEBUG_THREADS
3271         pthread_mutex_lock(&thread_debug->etd_mutex);
3272         while (info->eti_thread_index > thread_debug->etd_finished_threads) {
3273                 pthread_cond_wait(&thread_debug->etd_cond,
3274                                   &thread_debug->etd_mutex);
3275         }
3276         pthread_mutex_unlock(&thread_debug->etd_mutex);
3277 #endif
3278
3279 #ifdef HAVE_SETJMP_H
3280         /*
3281          * When fatal_error() happens, jump to here. The thread
3282          * context's flags will be saved, but its abort_loc will
3283          * be overwritten by original jump buffer for the later
3284          * tests.
3285          */
3286         if (setjmp(thread_ctx->abort_loc)) {
3287                 thread_ctx->flags &= ~E2F_FLAG_SETJMP_OK;
3288                 goto out;
3289         }
3290         thread_ctx->flags |= E2F_FLAG_SETJMP_OK;
3291 #endif
3292
3293         e2fsck_pass1_run(thread_ctx);
3294
3295 out:
3296         if (thread_ctx->options & E2F_OPT_MULTITHREAD)
3297                 log_out(thread_ctx,
3298                         _("Scanned group range [%u, %u), inodes %u\n"),
3299                         thread_ctx->thread_info.et_group_start,
3300                         thread_ctx->thread_info.et_group_end,
3301                         thread_ctx->thread_info.et_inode_number);
3302
3303 #ifdef DEBUG_THREADS
3304         pthread_mutex_lock(&thread_debug->etd_mutex);
3305         thread_debug->etd_finished_threads++;
3306         pthread_cond_broadcast(&thread_debug->etd_cond);
3307         pthread_mutex_unlock(&thread_debug->etd_mutex);
3308 #endif
3309
3310         return NULL;
3311 }
3312
3313 static dgrp_t ext2fs_get_avg_group(ext2_filsys fs)
3314 {
3315 #ifdef HAVE_PTHREAD
3316         dgrp_t average_group;
3317         unsigned flexbg_size;
3318
3319         if (fs->fs_num_threads <= 1)
3320                 return fs->group_desc_count;
3321
3322         average_group = fs->group_desc_count / fs->fs_num_threads;
3323         if (average_group <= 1)
3324                 return 1;
3325
3326         if (ext2fs_has_feature_flex_bg(fs->super)) {
3327                 int times = 1;
3328
3329                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
3330                 if (average_group % flexbg_size) {
3331                         times = average_group / flexbg_size;
3332                         average_group = times * flexbg_size;
3333                 }
3334         }
3335
3336         return average_group;
3337 #else
3338         return fs->group_desc_count;
3339 #endif
3340 }
3341
3342 static int e2fsck_pass1_threads_start(e2fsck_t global_ctx)
3343 {
3344         struct e2fsck_thread_info       *infos;
3345         pthread_attr_t                   attr;
3346         errcode_t                        retval;
3347         errcode_t                        ret;
3348         struct e2fsck_thread_info       *tmp_pinfo;
3349         int                              i;
3350         e2fsck_t                         thread_ctx;
3351         dgrp_t                           average_group;
3352         int num_threads = global_ctx->pfs_num_threads;
3353 #ifdef DEBUG_THREADS
3354         struct e2fsck_thread_debug       thread_debug =
3355                 {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER, 0};
3356
3357         thread_debug.etd_finished_threads = 0;
3358 #endif
3359
3360         retval = pthread_attr_init(&attr);
3361         if (retval) {
3362                 com_err(global_ctx->program_name, retval,
3363                         _("while setting pthread attribute\n"));
3364                 return retval;
3365         }
3366
3367         infos = calloc(num_threads, sizeof(struct e2fsck_thread_info));
3368         if (infos == NULL) {
3369                 retval = -ENOMEM;
3370                 com_err(global_ctx->program_name, retval,
3371                         _("while allocating memory for threads\n"));
3372                 pthread_attr_destroy(&attr);
3373                 return retval;
3374         }
3375         global_ctx->infos = infos;
3376
3377         average_group = ext2fs_get_avg_group(global_ctx->fs);
3378         for (i = 0; i < num_threads; i++) {
3379                 tmp_pinfo = &infos[i];
3380                 tmp_pinfo->eti_thread_index = i;
3381 #ifdef DEBUG_THREADS
3382                 tmp_pinfo->eti_debug = &thread_debug;
3383 #endif
3384                 retval = e2fsck_pass1_thread_prepare(global_ctx, &thread_ctx,
3385                                                      i, num_threads,
3386                                                      average_group);
3387                 if (retval) {
3388                         com_err(global_ctx->program_name, retval,
3389                                 _("while preparing pass1 thread\n"));
3390                         break;
3391                 }
3392                 tmp_pinfo->eti_thread_ctx = thread_ctx;
3393
3394                 retval = pthread_create(&tmp_pinfo->eti_thread_id, &attr,
3395                                         &e2fsck_pass1_thread, tmp_pinfo);
3396                 if (retval) {
3397                         com_err(global_ctx->program_name, retval,
3398                                 _("while creating thread\n"));
3399                         e2fsck_pass1_thread_join(global_ctx, thread_ctx);
3400                         break;
3401                 }
3402
3403                 tmp_pinfo->eti_started = 1;
3404         }
3405
3406         /* destroy the thread attribute object, since it is no longer needed */
3407         ret = pthread_attr_destroy(&attr);
3408         if (ret) {
3409                 com_err(global_ctx->program_name, ret,
3410                         _("while destroying thread attribute\n"));
3411                 if (retval == 0)
3412                         retval = ret;
3413         }
3414
3415         if (retval) {
3416                 e2fsck_pass1_threads_join(global_ctx);
3417                 return retval;
3418         }
3419         return 0;
3420 }
3421
3422 static void e2fsck_pass1_multithread(e2fsck_t global_ctx)
3423 {
3424         errcode_t retval;
3425
3426         retval = e2fsck_pass1_threads_start(global_ctx);
3427         if (retval) {
3428                 com_err(global_ctx->program_name, retval,
3429                         _("while starting pass1 threads\n"));
3430                 goto out_abort;
3431         }
3432
3433         retval = e2fsck_pass1_threads_join(global_ctx);
3434         if (retval) {
3435                 com_err(global_ctx->program_name, retval,
3436                         _("while joining pass1 threads\n"));
3437                 goto out_abort;
3438         }
3439         return;
3440 out_abort:
3441         global_ctx->flags |= E2F_FLAG_ABORT;
3442         return;
3443 }
3444 #endif
3445
3446 void e2fsck_pass1(e2fsck_t ctx)
3447 {
3448         errcode_t retval;
3449         int need_single = 1;
3450
3451         retval = e2fsck_pass1_prepare(ctx);
3452         if (retval)
3453                 return;
3454 #ifdef HAVE_PTHREAD
3455         if (ctx->pfs_num_threads > 1 || ctx->options & E2F_OPT_MULTITHREAD) {
3456                 need_single = 0;
3457                 e2fsck_pass1_multithread(ctx);
3458         }
3459         /* No lock is needed at this time */
3460         ctx->fs_need_locking = 0;
3461 #endif
3462         if (need_single)
3463                 e2fsck_pass1_run(ctx);
3464         e2fsck_pass1_post(ctx);
3465 }
3466
3467 #undef FINISH_INODE_LOOP
3468
3469 /*
3470  * When the inode_scan routines call this callback at the end of the
3471  * block group, call process_inodes.
3472  */
3473 static errcode_t scan_callback(ext2_filsys fs,
3474                                ext2_inode_scan scan EXT2FS_ATTR((unused)),
3475                                dgrp_t group, void * priv_data)
3476 {
3477         struct scan_callback_struct *scan_struct;
3478         e2fsck_t ctx;
3479         dgrp_t cur = group + 1;
3480         struct e2fsck_thread *tinfo;
3481         struct e2fsck_thread_info *pinfo, *infos;
3482         int i;
3483
3484         scan_struct = (struct scan_callback_struct *) priv_data;
3485         ctx = scan_struct->ctx;
3486
3487         process_inodes((e2fsck_t) fs->priv_data, scan_struct->block_buf,
3488                        scan_struct->inodes_to_process,
3489                        scan_struct->process_inode_count);
3490
3491 #ifdef HAVE_PTHREAD
3492         if (ctx->global_ctx) {
3493                 cur = 0;
3494                 infos = ctx->global_ctx->infos;
3495                 for (i = 0; i < ctx->global_ctx->pfs_num_threads; i++) {
3496                         pinfo = &infos[i];
3497
3498                         if (!pinfo->eti_started)
3499                                 continue;
3500
3501                         tinfo = &pinfo->eti_thread_ctx->thread_info;
3502                         if (ctx == pinfo->eti_thread_ctx)
3503                                 cur += group + 1 - tinfo->et_group_start;
3504                         else
3505                                 cur += tinfo->et_group_next -
3506                                         tinfo->et_group_start;
3507                 }
3508         }
3509 #endif
3510
3511         if (ctx->progress)
3512                 if ((ctx->progress)(ctx, 1, cur,
3513                                     ctx->fs->group_desc_count))
3514                         return EXT2_ET_CANCEL_REQUESTED;
3515
3516 #ifdef HAVE_PTHREAD
3517         if (ctx->global_ctx) {
3518                 tinfo = &ctx->thread_info;
3519                 tinfo->et_group_next++;
3520                 if (ctx->options & E2F_OPT_DEBUG &&
3521                     ctx->options & E2F_OPT_MULTITHREAD)
3522                         log_out(ctx, _("group %d finished\n"),
3523                                 tinfo->et_group_next);
3524                 if (tinfo->et_group_next >= tinfo->et_group_end)
3525                         return EXT2_ET_SCAN_FINISHED;
3526         }
3527 #endif
3528
3529         return 0;
3530 }
3531
3532 /*
3533  * Process the inodes in the "inodes to process" list.
3534  */
3535 static void process_inodes(e2fsck_t ctx, char *block_buf,
3536                            struct process_inode_block *inodes_to_process,
3537                            int *process_inode_count)
3538 {
3539         int                     i;
3540         struct ext2_inode       *old_stashed_inode;
3541         ext2_ino_t              old_stashed_ino;
3542         const char              *old_operation;
3543         char                    buf[80];
3544         struct problem_context  pctx;
3545
3546 #if 0
3547         printf("begin process_inodes: ");
3548 #endif
3549         if (*process_inode_count == 0)
3550                 return;
3551         old_operation = ehandler_operation(0);
3552         old_stashed_inode = ctx->stashed_inode;
3553         old_stashed_ino = ctx->stashed_ino;
3554         qsort(inodes_to_process, *process_inode_count,
3555                       sizeof(struct process_inode_block), process_inode_cmp);
3556         clear_problem_context(&pctx);
3557         for (i=0; i < *process_inode_count; i++) {
3558                 pctx.inode = ctx->stashed_inode =
3559                         (struct ext2_inode *) &inodes_to_process[i].inode;
3560                 pctx.ino = ctx->stashed_ino = inodes_to_process[i].ino;
3561
3562 #if 0
3563                 printf("%u ", pctx.ino);
3564 #endif
3565                 sprintf(buf, _("reading indirect blocks of inode %u"),
3566                         pctx.ino);
3567                 ehandler_operation(buf);
3568                 check_blocks(ctx, &pctx, block_buf,
3569                              &inodes_to_process[i].ea_ibody_quota);
3570                 if (e2fsck_should_abort(ctx))
3571                         break;
3572         }
3573         ctx->stashed_inode = old_stashed_inode;
3574         ctx->stashed_ino = old_stashed_ino;
3575         *process_inode_count = 0;
3576 #if 0
3577         printf("end process inodes\n");
3578 #endif
3579         ehandler_operation(old_operation);
3580 }
3581
3582 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b)
3583 {
3584         const struct process_inode_block *ib_a =
3585                 (const struct process_inode_block *) a;
3586         const struct process_inode_block *ib_b =
3587                 (const struct process_inode_block *) b;
3588         int     ret;
3589
3590         ret = (ib_a->inode.i_block[EXT2_IND_BLOCK] -
3591                ib_b->inode.i_block[EXT2_IND_BLOCK]);
3592         if (ret == 0)
3593                 /*
3594                  * We only call process_inodes() for non-extent
3595                  * inodes, so it's OK to pass NULL to
3596                  * ext2fs_file_acl_block() here.
3597                  */
3598                 ret = ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_a->inode)) -
3599                         ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_b->inode));
3600         if (ret == 0)
3601                 ret = ib_a->ino - ib_b->ino;
3602         return ret;
3603 }
3604
3605 /*
3606  * Mark an inode as being bad in some what
3607  */
3608 static void mark_inode_bad(e2fsck_t ctx, ext2_ino_t ino)
3609 {
3610         struct          problem_context pctx;
3611
3612         if (!ctx->inode_bad_map) {
3613                 clear_problem_context(&pctx);
3614
3615                 pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3616                                 _("bad inode map"), EXT2FS_BMAP64_RBTREE,
3617                                 "inode_bad_map", &ctx->inode_bad_map);
3618                 if (pctx.errcode) {
3619                         pctx.num = 3;
3620                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3621                         /* Should never get here */
3622                         ctx->flags |= E2F_FLAG_ABORT;
3623                         return;
3624                 }
3625         }
3626         ext2fs_mark_inode_bitmap2(ctx->inode_bad_map, ino);
3627 }
3628
3629 static void add_casefolded_dir(e2fsck_t ctx, ext2_ino_t ino)
3630 {
3631         struct          problem_context pctx;
3632
3633         if (!ctx->casefolded_dirs) {
3634                 pctx.errcode = ext2fs_u32_list_create(&ctx->casefolded_dirs, 0);
3635                 if (pctx.errcode)
3636                         goto error;
3637         }
3638         pctx.errcode = ext2fs_u32_list_add(ctx->casefolded_dirs, ino);
3639         if (pctx.errcode == 0)
3640                 return;
3641 error:
3642         fix_problem(ctx, PR_1_ALLOCATE_CASEFOLDED_DIRLIST, &pctx);
3643         /* Should never get here */
3644         ctx->flags |= E2F_FLAG_ABORT;
3645 }
3646
3647 /*
3648  * This procedure will allocate the inode "bb" (badblock) map table
3649  */
3650 static void alloc_bb_map(e2fsck_t ctx)
3651 {
3652         struct          problem_context pctx;
3653
3654         clear_problem_context(&pctx);
3655         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3656                         _("inode in bad block map"), EXT2FS_BMAP64_RBTREE,
3657                         "inode_bb_map", &ctx->inode_bb_map);
3658         if (pctx.errcode) {
3659                 pctx.num = 4;
3660                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3661                 /* Should never get here */
3662                 ctx->flags |= E2F_FLAG_ABORT;
3663                 return;
3664         }
3665 }
3666
3667 /*
3668  * This procedure will allocate the inode imagic table
3669  */
3670 static void alloc_imagic_map(e2fsck_t ctx)
3671 {
3672         struct          problem_context pctx;
3673
3674         clear_problem_context(&pctx);
3675         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3676                         _("imagic inode map"), EXT2FS_BMAP64_RBTREE,
3677                         "inode_imagic_map", &ctx->inode_imagic_map);
3678         if (pctx.errcode) {
3679                 pctx.num = 5;
3680                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3681                 /* Should never get here */
3682                 ctx->flags |= E2F_FLAG_ABORT;
3683                 return;
3684         }
3685 }
3686
3687 /*
3688  * Marks a block as in use, setting the dup_map if it's been set
3689  * already.  Called by process_block and process_bad_block.
3690  *
3691  * WARNING: Assumes checks have already been done to make sure block
3692  * is valid.  This is true in both process_block and process_bad_block.
3693  */
3694 static _INLINE_ void mark_block_used(e2fsck_t ctx, blk64_t block)
3695 {
3696         struct problem_context pctx;
3697         e2fsck_t global_ctx = ctx->global_ctx ? ctx->global_ctx : ctx;
3698
3699         clear_problem_context(&pctx);
3700
3701         if (is_blocks_used(ctx, block, 1)) {
3702                 if (ext2fs_has_feature_shared_blocks(ctx->fs->super) &&
3703                     !(ctx->options & E2F_OPT_UNSHARE_BLOCKS)) {
3704                         return;
3705                 }
3706                 ctx->flags |= E2F_FLAG_DUP_BLOCK;
3707                 e2fsck_pass1_block_map_w_lock(ctx);
3708                 ext2fs_fast_mark_block_bitmap2(global_ctx->block_dup_map, block);
3709                 e2fsck_pass1_block_map_w_unlock(ctx);
3710         } else {
3711                 ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, block);
3712         }
3713 }
3714
3715 /*
3716  * When cluster size is greater than one block, it is caller's responsibility
3717  * to make sure block parameter starts at a cluster boundary.
3718  */
3719 static _INLINE_ void mark_blocks_used(e2fsck_t ctx, blk64_t block,
3720                                       unsigned int num)
3721 {
3722         if (!is_blocks_used(ctx, block, num)) {
3723                 ext2fs_mark_block_bitmap_range2(ctx->block_found_map, block, num);
3724         } else {
3725                 unsigned int i;
3726
3727                 for (i = 0; i < num; i += EXT2FS_CLUSTER_RATIO(ctx->fs))
3728                         mark_block_used(ctx, block + i);
3729         }
3730 }
3731
3732 static errcode_t _INLINE_ e2fsck_write_ext_attr3(e2fsck_t ctx, blk64_t block,
3733                                                  void *inbuf, ext2_ino_t inum)
3734 {
3735         errcode_t retval;
3736         ext2_filsys fs = ctx->fs;
3737
3738         e2fsck_pass1_fix_lock(ctx);
3739         retval = ext2fs_write_ext_attr3(fs, block, inbuf, inum);
3740         e2fsck_pass1_fix_unlock(ctx);
3741
3742         return retval;
3743 }
3744 /*
3745  * Adjust the extended attribute block's reference counts at the end
3746  * of pass 1, either by subtracting out references for EA blocks that
3747  * are still referenced in ctx->refcount, or by adding references for
3748  * EA blocks that had extra references as accounted for in
3749  * ctx->refcount_extra.
3750  */
3751 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
3752                                     char *block_buf, int adjust_sign)
3753 {
3754         struct ext2_ext_attr_header     *header;
3755         struct problem_context          pctx;
3756         ext2_filsys                     fs = ctx->fs;
3757         blk64_t                         blk;
3758         __u32                           should_be;
3759         ea_value_t                      count;
3760
3761         clear_problem_context(&pctx);
3762
3763         ea_refcount_intr_begin(refcount);
3764         while (1) {
3765                 if ((blk = ea_refcount_intr_next(refcount, &count)) == 0)
3766                         break;
3767                 pctx.blk = blk;
3768                 pctx.errcode = ext2fs_read_ext_attr3(fs, blk, block_buf,
3769                                                      pctx.ino);
3770                 if (pctx.errcode) {
3771                         fix_problem(ctx, PR_1_EXTATTR_READ_ABORT, &pctx);
3772                         return;
3773                 }
3774                 header = (struct ext2_ext_attr_header *) block_buf;
3775                 pctx.blkcount = header->h_refcount;
3776                 should_be = header->h_refcount + adjust_sign * (int)count;
3777                 pctx.num = should_be;
3778                 if (fix_problem(ctx, PR_1_EXTATTR_REFCOUNT, &pctx)) {
3779                         header->h_refcount = should_be;
3780                         pctx.errcode = e2fsck_write_ext_attr3(ctx, blk,
3781                                                              block_buf,
3782                                                              pctx.ino);
3783                         if (pctx.errcode) {
3784                                 fix_problem(ctx, PR_1_EXTATTR_WRITE_ABORT,
3785                                             &pctx);
3786                                 continue;
3787                         }
3788                 }
3789         }
3790 }
3791
/*
 * Handle processing the extended attribute blocks
 *
 * Validates the external EA block referenced by the inode in pctx and
 * accounts for it in the EA bitmap / refcount tables.  The quota charge
 * for the block is reported through ea_block_quota (zeroed on entry).
 *
 * Returns 1 when the inode's EA block reference is accepted (either the
 * block was already validated for another inode, or it validated now).
 * Returns 0 when there is no EA block, the inode was marked bad, an
 * allocation or write failed, or the EA block reference was cleared
 * from the inode.
 */
static int check_ext_attr(e2fsck_t ctx, struct problem_context *pctx,
                           char *block_buf, struct ea_quota *ea_block_quota)
{
        ext2_filsys fs = ctx->fs;
        ext2_ino_t      ino = pctx->ino;
        struct ext2_inode *inode = pctx->inode;
        blk64_t         blk;
        char *          end;
        struct ext2_ext_attr_header *header;
        struct ext2_ext_attr_entry *first, *entry;
        /* Starts at one cluster for the EA block itself; EA inodes add more */
        blk64_t         quota_blocks = EXT2FS_C2B(fs, 1);
        __u64           quota_inodes = 0;
        /* Tracks which byte ranges of the block are claimed, to spot overlaps */
        region_t        region = 0;
        int             failed_csum = 0;

        ea_block_quota->blocks = 0;
        ea_block_quota->inodes = 0;

        blk = ext2fs_file_acl_block(fs, inode);
        if (blk == 0)
                return 0;

        /*
         * If the Extended attribute flag isn't set, then a non-zero
         * file acl means that the inode is corrupted.
         *
         * Or if the extended attribute block is an invalid block,
         * then the inode is also corrupted.
         */
        if (!ext2fs_has_feature_xattr(fs->super) ||
            (blk < fs->super->s_first_data_block) ||
            (blk >= ext2fs_blocks_count(fs->super))) {
                mark_inode_bad(ctx, ino);
                return 0;
        }

        /* If ea bitmap hasn't been allocated, create it */
        if (!ctx->block_ea_map) {
                pctx->errcode = e2fsck_allocate_block_bitmap(fs,
                                        _("ext attr block map"),
                                        EXT2FS_BMAP64_RBTREE, "block_ea_map",
                                        &ctx->block_ea_map);
                if (pctx->errcode) {
                        pctx->num = 2;
                        fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }
        }

        /* Create the EA refcount structure if necessary */
        if (!ctx->refcount) {
                /* refcount_orig and refcount are created together */
                pctx->errcode = ea_refcount_create(0,
                                        &ctx->refcount_orig);
                if (pctx->errcode) {
                        pctx->num = 1;
                        fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }

                pctx->errcode = ea_refcount_create(0, &ctx->refcount);
                if (pctx->errcode) {
                        pctx->num = 1;
                        fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }
        }

#if 0
        /* Debugging text */
        printf("Inode %u has EA block %u\n", ino, blk);
#endif

        /* Have we seen this EA block before? */
        if (ext2fs_fast_test_block_bitmap2(ctx->block_ea_map, blk)) {
                /* Default charge; overridden below if a value was stored */
                ea_block_quota->blocks = EXT2FS_C2B(fs, 1);
                ea_block_quota->inodes = 0;

                if (ctx->ea_block_quota_blocks) {
                        ea_refcount_fetch(ctx->ea_block_quota_blocks, blk,
                                          &quota_blocks);
                        if (quota_blocks)
                                ea_block_quota->blocks = quota_blocks;
                }

                if (ctx->ea_block_quota_inodes)
                        ea_refcount_fetch(ctx->ea_block_quota_inodes, blk,
                                          &ea_block_quota->inodes);

                /* Consume one of the references the block header declared */
                if (ea_refcount_decrement(ctx->refcount, blk, 0) == 0)
                        return 1;
                /* Ooops, this EA was referenced more than it stated */
                if (!ctx->refcount_extra) {
                        pctx->errcode = ea_refcount_create(0,
                                           &ctx->refcount_extra);
                        if (pctx->errcode) {
                                pctx->num = 2;
                                fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                                ctx->flags |= E2F_FLAG_ABORT;
                                return 0;
                        }
                }
                ea_refcount_increment(ctx->refcount_extra, blk, 0);
                return 1;
        }

        /*
         * OK, we haven't seen this EA block yet.  So we need to
         * validate it
         */
        pctx->blk = blk;
        pctx->errcode = ext2fs_read_ext_attr3(fs, blk, block_buf, pctx->ino);
        /*
         * A checksum failure is remembered and dealt with after the
         * content checks; a bad header is left for the checks below.
         */
        if (pctx->errcode == EXT2_ET_EXT_ATTR_CSUM_INVALID) {
                pctx->errcode = 0;
                failed_csum = 1;
        } else if (pctx->errcode == EXT2_ET_BAD_EA_HEADER)
                pctx->errcode = 0;

        if (pctx->errcode &&
            fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx)) {
                pctx->errcode = 0;
                goto clear_extattr;
        }
        header = (struct ext2_ext_attr_header *) block_buf;
        pctx->blk = ext2fs_file_acl_block(fs, inode);
        /* The magic number must match the EA format version in use */
        if (((ctx->ext_attr_ver == 1) &&
             (header->h_magic != EXT2_EXT_ATTR_MAGIC_v1)) ||
            ((ctx->ext_attr_ver == 2) &&
             (header->h_magic != EXT2_EXT_ATTR_MAGIC))) {
                if (fix_problem(ctx, PR_1_BAD_EA_BLOCK, pctx))
                        goto clear_extattr;
        }

        if (header->h_blocks != 1) {
                if (fix_problem(ctx, PR_1_EA_MULTI_BLOCK, pctx))
                        goto clear_extattr;
        }

        /*
         * Only reachable with errcode still set if the earlier
         * PR_1_READ_EA_BLOCK prompt was declined; the same problem is
         * raised again here.
         */
        if (pctx->errcode && fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx))
                goto clear_extattr;

        region = region_create(0, fs->blocksize);
        if (!region) {
                fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
                ctx->flags |= E2F_FLAG_ABORT;
                return 0;
        }
        /* Claim the header's bytes first */
        if (region_allocate(region, 0, sizeof(struct ext2_ext_attr_header))) {
                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                        goto clear_extattr;
        }

        first = (struct ext2_ext_attr_entry *)(header+1);
        end = block_buf + fs->blocksize;
        entry = first;
        /* Walk the entry table until a zero 32-bit word or the block end */
        while ((char *)entry < end && *(__u32 *)entry) {
                __u32 hash;

                /* Claim the bytes of the entry descriptor (incl. name) */
                if (region_allocate(region, (char *)entry - (char *)header,
                                   EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
                        if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                                goto clear_extattr;
                        break;
                }
                if ((ctx->ext_attr_ver == 1 &&
                     (entry->e_name_len == 0 || entry->e_name_index != 0)) ||
                    (ctx->ext_attr_ver == 2 &&
                     entry->e_name_index == 0)) {
                        if (fix_problem(ctx, PR_1_EA_BAD_NAME, pctx))
                                goto clear_extattr;
                        break;
                }
                if (entry->e_value_inum == 0) {
                        /* Value is stored in this block: check its bounds */
                        if (entry->e_value_size > EXT2_XATTR_SIZE_MAX ||
                            (entry->e_value_offs + entry->e_value_size >
                             fs->blocksize)) {
                                if (fix_problem(ctx, PR_1_EA_BAD_VALUE, pctx))
                                        goto clear_extattr;
                                break;
                        }
                        if (entry->e_value_size &&
                            region_allocate(region, entry->e_value_offs,
                                            EXT2_EXT_ATTR_SIZE(entry->e_value_size))) {
                                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION,
                                                pctx))
                                        goto clear_extattr;
                        }

                        /*
                         * Accept either hash variant: try the regular
                         * hash first and the "signed" one if it differs.
                         */
                        hash = ext2fs_ext_attr_hash_entry(entry, block_buf +
                                                          entry->e_value_offs);
                        if (entry->e_hash != hash)
                                hash = ext2fs_ext_attr_hash_entry_signed(entry,
                                        block_buf + entry->e_value_offs);

                        if (entry->e_hash != hash) {
                                pctx->num = entry->e_hash;
                                if (fix_problem(ctx, PR_1_ATTR_HASH, pctx))
                                        goto clear_extattr;
                                entry->e_hash = hash;
                        }
                } else {
                        /* Value lives in a separate EA inode */
                        problem_t problem;
                        blk64_t entry_quota_blocks;

                        problem = check_large_ea_inode(ctx, entry, pctx,
                                                       &entry_quota_blocks);
                        if (problem && fix_problem(ctx, problem, pctx))
                                goto clear_extattr;

                        quota_blocks += entry_quota_blocks;
                        quota_inodes++;
                }

                entry = EXT2_EXT_ATTR_NEXT(entry);
        }
        /* Claim the 4 bytes at the position where the walk stopped */
        if (region_allocate(region, (char *)entry - (char *)header, 4)) {
                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                        goto clear_extattr;
        }
        region_free(region);

        /*
         * We only get here if there was no other errors that were fixed.
         * If there was a checksum fail, ask to correct it.
         */
        if (failed_csum &&
            fix_problem(ctx, PR_1_EA_BLOCK_ONLY_CSUM_INVALID, pctx)) {
                pctx->errcode = e2fsck_write_ext_attr3(ctx, blk, block_buf,
                                                       pctx->ino);
                if (pctx->errcode)
                        return 0;
        }

        /* Only remember the block charge when it differs from the default */
        if (quota_blocks != EXT2FS_C2B(fs, 1U)) {
                if (!ctx->ea_block_quota_blocks) {
                        pctx->errcode = ea_refcount_create(0,
                                                &ctx->ea_block_quota_blocks);
                        if (pctx->errcode) {
                                pctx->num = 3;
                                goto refcount_fail;
                        }
                }
                ea_refcount_store(ctx->ea_block_quota_blocks, blk,
                                  quota_blocks);
        }

        if (quota_inodes) {
                if (!ctx->ea_block_quota_inodes) {
                        pctx->errcode = ea_refcount_create(0,
                                                &ctx->ea_block_quota_inodes);
                        if (pctx->errcode) {
                                pctx->num = 4;
/* Shared failure exit for both quota tables; pctx->num tells them apart */
refcount_fail:
                                fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                                ctx->flags |= E2F_FLAG_ABORT;
                                return 0;
                        }
                }

                ea_refcount_store(ctx->ea_block_quota_inodes, blk,
                                  quota_inodes);
        }
        ea_block_quota->blocks = quota_blocks;
        ea_block_quota->inodes = quota_inodes;

        inc_ea_inode_refs(ctx, pctx, first, end);
        /* This inode uses one of the references declared in the header */
        ea_refcount_store(ctx->refcount, blk, header->h_refcount - 1);
        ea_refcount_store(ctx->refcount_orig, blk, header->h_refcount);
        /**
         * It might be racy that this block has been merged in the
         * global found map.
         */
        if (!is_blocks_used(ctx, blk, 1))
                ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, blk);
        ext2fs_fast_mark_block_bitmap2(ctx->block_ea_map, blk);
        return 1;

/* Drop the EA block reference from the inode and write the inode back */
clear_extattr:
        if (region)
                region_free(region);
        ext2fs_file_acl_block_set(fs, inode, 0);
        e2fsck_write_inode(ctx, ino, inode, "check_ext_attr");
        return 0;
}
4081
/*
 * Sanity-check the htree (indexed directory) root of an inode.
 *
 * Each failed check is raised through fix_problem(); the function
 * returns 1 as soon as one of those prompts is answered "yes".
 * A directory that passes, and is either deeper than
 * EXT4_HTREE_LEVEL_COMPAT or large enough to need the large-file
 * feature, is counted in ctx->large_dirs.
 *
 * Returns 1 if bad htree, 0 if OK
 */
static int handle_htree(e2fsck_t ctx, struct problem_context *pctx,
                        ext2_ino_t ino, struct ext2_inode *inode,
                        char *block_buf)
{
        struct ext2_dx_root_info        *root;
        ext2_filsys                     fs = ctx->fs;
        errcode_t                       retval;
        blk64_t                         blk;

        /* Must be a directory on a filesystem with the dir_index feature */
        if ((!LINUX_S_ISDIR(inode->i_mode) &&
             fix_problem(ctx, PR_1_HTREE_NODIR, pctx)) ||
            (!ext2fs_has_feature_dir_index(fs->super) &&
             fix_problem(ctx, PR_1_HTREE_SET, pctx)))
                return 1;

        /* Map logical block 0 of the directory to its physical block */
        pctx->errcode = ext2fs_bmap2(fs, ino, inode, 0, 0, 0, 0, &blk);

        if ((pctx->errcode) ||
            (blk == 0) ||
            (blk < fs->super->s_first_data_block) ||
            (blk >= ext2fs_blocks_count(fs->super))) {
                if (fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                        return 1;
                else
                        return 0;
        }

        /*
         * NOTE(review): if the read fails and the prompt is declined, the
         * checks below run on whatever block_buf already holds.
         */
        retval = io_channel_read_blk64(fs->io, blk, 1, block_buf);
        if (retval && fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                return 1;

        /* XXX should check that beginning matches a directory */
        /*
         * The root info is read at byte offset 24; presumably this skips
         * the "." and ".." entries -- TODO confirm.
         */
        root = (struct ext2_dx_root_info *) (block_buf + 24);

        if ((root->reserved_zero || root->info_length < 8) &&
            fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                return 1;

        /* Only the hash versions listed here are accepted */
        pctx->num = root->hash_version;
        if ((root->hash_version != EXT2_HASH_LEGACY) &&
            (root->hash_version != EXT2_HASH_HALF_MD4) &&
            (root->hash_version != EXT2_HASH_TEA) &&
            (root->hash_version != EXT2_HASH_SIPHASH) &&
            fix_problem(ctx, PR_1_HTREE_HASHV, pctx))
                return 1;

        /* SipHash is required exactly when ext4_hash_in_dirent() holds */
        if (ext4_hash_in_dirent(inode)) {
                if (root->hash_version != EXT2_HASH_SIPHASH &&
                    fix_problem(ctx, PR_1_HTREE_NEEDS_SIPHASH, pctx))
                        return 1;
        } else {
                if (root->hash_version == EXT2_HASH_SIPHASH &&
                   fix_problem(ctx, PR_1_HTREE_CANNOT_SIPHASH, pctx))
                        return 1;
        }

        if ((root->unused_flags & EXT2_HASH_FLAG_INCOMPAT) &&
            fix_problem(ctx, PR_1_HTREE_INCOMPAT, pctx))
                return 1;

        pctx->num = root->indirect_levels;
        /* if htree level is clearly too high, consider it to be broken */
        if (root->indirect_levels > EXT4_HTREE_LEVEL &&
            fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
                return 1;

        /* if level is only maybe too high, LARGE_DIR feature could be unset */
        if (root->indirect_levels > ext2_dir_htree_level(fs) &&
            !ext2fs_has_feature_largedir(fs->super)) {
                int blockbits = EXT2_BLOCK_SIZE_BITS(fs->super) + 10;
                unsigned idx_pb = 1 << (blockbits - 3);

                /*
                 * NOTE(review): the products and shifts below are evaluated
                 * in unsigned int before being compared with the inode
                 * size/blocks, so they may wrap for larger blockbits
                 * values -- confirm the intended width and the value of
                 * blockbits.
                 */
                /* compare inode size/blocks vs. max-sized 2-level htree */
                if (EXT2_I_SIZE(pctx->inode) <
                    (idx_pb - 1) * (idx_pb - 2) << blockbits &&
                    pctx->inode->i_blocks <
                    (idx_pb - 1) * (idx_pb - 2) << (blockbits - 9) &&
                    fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
                        return 1;
        }

        /* Count directories that are unusually deep or unusually large */
        if (root->indirect_levels > EXT4_HTREE_LEVEL_COMPAT ||
            ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
                ctx->large_dirs++;

        return 0;
}
4170
4171 void e2fsck_clear_inode(e2fsck_t ctx, ext2_ino_t ino,
4172                         struct ext2_inode *inode, int restart_flag,
4173                         const char *source)
4174 {
4175         inode->i_flags = 0;
4176         inode->i_links_count = 0;
4177         ext2fs_icount_store(ctx->inode_link_info, ino, 0);
4178         inode->i_dtime = ctx->now;
4179
4180         /*
4181          * If a special inode has such rotten block mappings that we
4182          * want to clear the whole inode, be sure to actually zap
4183          * the block maps because i_links_count isn't checked for
4184          * special inodes, and we'll end up right back here the next
4185          * time we run fsck.
4186          */
4187         if (ino < EXT2_FIRST_INODE(ctx->fs->super))
4188                 memset(inode->i_block, 0, sizeof(inode->i_block));
4189
4190         ext2fs_unmark_inode_bitmap2(ctx->inode_dir_map, ino);
4191         ext2fs_unmark_inode_bitmap2(ctx->inode_used_map, ino);
4192         if (ctx->inode_reg_map)
4193                 ext2fs_unmark_inode_bitmap2(ctx->inode_reg_map, ino);
4194         if (ctx->inode_bad_map)
4195                 ext2fs_unmark_inode_bitmap2(ctx->inode_bad_map, ino);
4196
4197         /*
4198          * If the inode was partially accounted for before processing
4199          * was aborted, we need to restart the pass 1 scan.
4200          */
4201         ctx->flags |= restart_flag;
4202
4203         if (ino == EXT2_BAD_INO)
4204                 memset(inode, 0, sizeof(struct ext2_inode));
4205
4206         e2fsck_write_inode(ctx, ino, inode, source);
4207 }
4208
4209 /*
4210  * Use the multiple-blocks reclamation code to fix alignment problems in
4211  * a bigalloc filesystem.  We want a logical cluster to map to *only* one
4212  * physical cluster, and we want the block offsets within that cluster to
4213  * line up.
4214  */
4215 static int has_unaligned_cluster_map(e2fsck_t ctx,
4216                                      blk64_t last_pblk, blk64_t last_lblk,
4217                                      blk64_t pblk, blk64_t lblk)
4218 {
4219         blk64_t cluster_mask;
4220
4221         if (!ctx->fs->cluster_ratio_bits)
4222                 return 0;
4223         cluster_mask = EXT2FS_CLUSTER_MASK(ctx->fs);
4224
4225         /*
4226          * If the block in the logical cluster doesn't align with the block in
4227          * the physical cluster...
4228          */
4229         if ((lblk & cluster_mask) != (pblk & cluster_mask))
4230                 return 1;
4231
4232         /*
4233          * If we cross a physical cluster boundary within a logical cluster...
4234          */
4235         if (last_pblk && (lblk & cluster_mask) != 0 &&
4236             EXT2FS_B2C(ctx->fs, lblk) == EXT2FS_B2C(ctx->fs, last_lblk) &&
4237             EXT2FS_B2C(ctx->fs, pblk) != EXT2FS_B2C(ctx->fs, last_pblk))
4238                 return 1;
4239
4240         return 0;
4241 }
4242
4243 static void scan_extent_node(e2fsck_t ctx, struct problem_context *pctx,
4244                              struct process_block_struct *pb,
4245                              blk64_t start_block, blk64_t end_block,
4246                              blk64_t eof_block,
4247                              ext2_extent_handle_t ehandle,
4248                              int try_repairs)
4249 {
4250         struct ext2fs_extent    extent;
4251         blk64_t                 blk, last_lblk;
4252         unsigned int            i, n;
4253         int                     is_dir, is_leaf;
4254         problem_t               problem;
4255         struct ext2_extent_info info;
4256         int                     failed_csum = 0;
4257
4258         if (pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID)
4259                 failed_csum = 1;
4260
4261         pctx->errcode = ext2fs_extent_get_info(ehandle, &info);
4262         if (pctx->errcode)
4263                 return;
4264         if (!(ctx->options & E2F_OPT_FIXES_ONLY) &&
4265             !pb->eti.force_rebuild &&
4266             info.curr_level < MAX_EXTENT_DEPTH_COUNT) {
4267                 struct extent_tree_level *etl;
4268
4269                 etl = pb->eti.ext_info + info.curr_level;
4270                 etl->num_extents += info.num_entries;
4271                 etl->max_extents += info.max_entries;
4272                 /*
4273                  * Implementation wart: Splitting extent blocks when appending
4274                  * will leave the old block with one free entry.  Therefore
4275                  * unless the node is totally full, pretend that a non-root
4276                  * extent block can hold one fewer entry than it actually does,
4277                  * so that we don't repeatedly rebuild the extent tree.
4278                  */
4279                 if (info.curr_level && info.num_entries < info.max_entries)
4280                         etl->max_extents--;
4281         }
4282
4283         pctx->errcode = ext2fs_extent_get(ehandle, EXT2_EXTENT_FIRST_SIB,
4284                                           &extent);
4285         while ((pctx->errcode == 0 ||
4286                 pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID) &&
4287                info.num_entries-- > 0) {
4288                 is_leaf = extent.e_flags & EXT2_EXTENT_FLAGS_LEAF;
4289                 is_dir = LINUX_S_ISDIR(pctx->inode->i_mode);
4290                 last_lblk = extent.e_lblk + extent.e_len - 1;
4291
4292                 problem = 0;
4293                 pctx->blk = extent.e_pblk;
4294                 pctx->blk2 = extent.e_lblk;
4295                 pctx->num = extent.e_len;
4296                 pctx->blkcount = extent.e_lblk + extent.e_len;
4297
4298                 if (extent.e_pblk == 0 ||
4299                     extent.e_pblk < ctx->fs->super->s_first_data_block ||
4300                     extent.e_pblk >= ext2fs_blocks_count(ctx->fs->super))
4301                         problem = PR_1_EXTENT_BAD_START_BLK;
4302                 else if (extent.e_lblk < start_block)
4303                         problem = PR_1_OUT_OF_ORDER_EXTENTS;
4304                 else if ((end_block && last_lblk > end_block) &&
4305                          !(last_lblk > eof_block &&
4306                            ((extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) ||
4307                             (pctx->inode->i_flags & EXT4_VERITY_FL))))
4308                         problem = PR_1_EXTENT_END_OUT_OF_BOUNDS;
4309                 else if (is_leaf && extent.e_len == 0)
4310                         problem = PR_1_EXTENT_LENGTH_ZERO;
4311                 else if (is_leaf &&
4312                          (extent.e_pblk + extent.e_len) >
4313                          ext2fs_blocks_count(ctx->fs->super))
4314                         problem = PR_1_EXTENT_ENDS_BEYOND;
4315                 else if (is_leaf && is_dir && !pctx->inode->i_size_high &&
4316                          !ext2fs_has_feature_largedir(ctx->fs->super) &&
4317                          ((extent.e_lblk + extent.e_len) >
4318                           (1U << (21 - ctx->fs->super->s_log_block_size))))
4319                         problem = PR_1_TOOBIG_DIR;
4320
4321                 if (is_leaf && problem == 0 && extent.e_len > 0) {
4322 #if 0
4323                         printf("extent_region(ino=%u, expect=%llu, "
4324                                "lblk=%llu, len=%u)\n", pb->ino,
4325                                (unsigned long long) pb->next_lblock,
4326                                (unsigned long long) extent.e_lblk,
4327                                extent.e_len);
4328 #endif
4329                         if (extent.e_lblk < pb->next_lblock)
4330                                 problem = PR_1_EXTENT_COLLISION;
4331                         else if (extent.e_lblk + extent.e_len > pb->next_lblock)
4332                                 pb->next_lblock = extent.e_lblk + extent.e_len;
4333                 }
4334
4335                 /*
4336                  * Uninitialized blocks in a directory?  Clear the flag and
4337                  * we'll interpret the blocks later.
4338                  */
4339                 if (try_repairs && is_dir && problem == 0 &&
4340                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
4341                     fix_problem(ctx, PR_1_UNINIT_DBLOCK, pctx)) {
4342                         e2fsck_pass1_fix_lock(ctx);
4343                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
4344                         pb->inode_modified = 1;
4345                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
4346                                                               &extent);
4347                         e2fsck_pass1_fix_unlock(ctx);
4348                         if (pctx->errcode)
4349                                 return;
4350                         failed_csum = 0;
4351                 }
4352 #ifdef CONFIG_DEVELOPER_FEATURES
4353                 if (try_repairs && !is_dir && problem == 0 &&
4354                     (ctx->options & E2F_OPT_CLEAR_UNINIT) &&
4355                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
4356                     fix_problem(ctx, PR_1_CLEAR_UNINIT_EXTENT, pctx)) {
4357                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
4358                         pb->inode_modified = 1;
4359                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
4360                                                               &extent);
4361                         if (pctx->errcode)
4362                                 return;
4363                         failed_csum = 0;
4364                 }
4365 #endif
4366                 if (try_repairs && problem) {
4367 report_problem:
4368                         if (fix_problem(ctx, problem, pctx)) {
4369                                 if (ctx->invalid_bitmaps) {
4370                                         /*
4371                                          * If fsck knows the bitmaps are bad,
4372                                          * skip to the next extent and
4373                                          * try to clear this extent again
4374                                          * after fixing the bitmaps, by
4375                                          * restarting fsck.
4376                                          */
4377                                         pctx->errcode = ext2fs_extent_get(
4378                                                           ehandle,
4379                                                           EXT2_EXTENT_NEXT_SIB,
4380                                                           &extent);
4381                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4382                                         if (pctx->errcode ==
4383                                                     EXT2_ET_NO_CURRENT_NODE) {
4384                                                 pctx->errcode = 0;
4385                                                 break;
4386                                         }
4387                                         continue;
4388                                 }
4389                                 e2fsck_pass1_fix_lock(ctx);
4390                                 e2fsck_read_bitmaps(ctx);
4391                                 pb->inode_modified = 1;
4392                                 pctx->errcode =
4393                                         ext2fs_extent_delete(ehandle, 0);
4394                                 e2fsck_pass1_fix_unlock(ctx);
4395                                 if (pctx->errcode) {
4396                                         pctx->str = "ext2fs_extent_delete";
4397                                         return;
4398                                 }
4399                                 e2fsck_pass1_fix_lock(ctx);
4400                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
4401                                 e2fsck_pass1_fix_unlock(ctx);
4402                                 if (pctx->errcode &&
4403                                     pctx->errcode != EXT2_ET_NO_CURRENT_NODE) {
4404                                         pctx->str = "ext2fs_extent_fix_parents";
4405                                         return;
4406                                 }
4407                                 pctx->errcode = ext2fs_extent_get(ehandle,
4408                                                                   EXT2_EXTENT_CURRENT,
4409                                                                   &extent);
4410                                 if (pctx->errcode == EXT2_ET_NO_CURRENT_NODE) {
4411                                         pctx->errcode = 0;
4412                                         break;
4413                                 }
4414                                 failed_csum = 0;
4415                                 continue;
4416                         }
4417                         goto next;
4418                 }
4419
4420                 if (!is_leaf) {
4421                         blk64_t lblk = extent.e_lblk;
4422                         int next_try_repairs = 1;
4423
4424                         blk = extent.e_pblk;
4425
4426                         /*
4427                          * If this lower extent block collides with critical
4428                          * metadata, don't try to repair the damage.  Pass 1b
4429                          * will reallocate the block; then we can try again.
4430                          */
4431                         if (pb->ino != EXT2_RESIZE_INO &&
4432                             extent.e_pblk < ctx->fs->super->s_blocks_count &&
4433                             ext2fs_test_block_bitmap2(ctx->block_metadata_map,
4434                                                       extent.e_pblk)) {
4435                                 next_try_repairs = 0;
4436                                 pctx->blk = blk;
4437                                 fix_problem(ctx,
4438                                             PR_1_CRITICAL_METADATA_COLLISION,
4439                                             pctx);
4440                                 if ((ctx->options & E2F_OPT_NO) == 0)
4441                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4442                         }
4443                         pctx->errcode = ext2fs_extent_get(ehandle,
4444                                                   EXT2_EXTENT_DOWN, &extent);
4445                         if (pctx->errcode &&
4446                             pctx->errcode != EXT2_ET_EXTENT_CSUM_INVALID) {
4447                                 pctx->str = "EXT2_EXTENT_DOWN";
4448                                 problem = PR_1_EXTENT_HEADER_INVALID;
4449                                 if (!next_try_repairs)
4450                                         return;
4451                                 if (pctx->errcode == EXT2_ET_EXTENT_HEADER_BAD)
4452                                         goto report_problem;
4453                                 return;
4454                         }
4455                         /* The next extent should match this index's logical start */
4456                         if (extent.e_lblk != lblk) {
4457                                 struct ext2_extent_info e_info;
4458
4459                                 pctx->errcode = ext2fs_extent_get_info(ehandle,
4460                                                                        &e_info);
4461                                 if (pctx->errcode) {
4462                                         pctx->str = "ext2fs_extent_get_info";
4463                                         return;
4464                                 }
4465                                 pctx->blk = lblk;
4466                                 pctx->blk2 = extent.e_lblk;
4467                                 pctx->num = e_info.curr_level - 1;
4468                                 problem = PR_1_EXTENT_INDEX_START_INVALID;
4469                                 if (fix_problem(ctx, problem, pctx)) {
4470                                         e2fsck_pass1_fix_lock(ctx);
4471                                         pb->inode_modified = 1;
4472                                         pctx->errcode =
4473                                                 ext2fs_extent_fix_parents(ehandle);
4474                                         e2fsck_pass1_fix_unlock(ctx);
4475                                         if (pctx->errcode) {
4476                                                 pctx->str = "ext2fs_extent_fix_parents";
4477                                                 return;
4478                                         }
4479                                 }
4480                         }
4481                         scan_extent_node(ctx, pctx, pb, extent.e_lblk,
4482                                          last_lblk, eof_block, ehandle,
4483                                          next_try_repairs);
4484                         if (pctx->errcode)
4485                                 return;
4486                         pctx->errcode = ext2fs_extent_get(ehandle,
4487                                                   EXT2_EXTENT_UP, &extent);
4488                         if (pctx->errcode) {
4489                                 pctx->str = "EXT2_EXTENT_UP";
4490                                 return;
4491                         }
4492                         mark_block_used(ctx, blk);
4493                         pb->num_blocks++;
4494                         goto next;
4495                 }
4496
4497                 if ((pb->previous_block != 0) &&
4498                     (pb->previous_block+1 != extent.e_pblk)) {
4499                         if (ctx->options & E2F_OPT_FRAGCHECK) {
4500                                 char type = '?';
4501
4502                                 if (pb->is_dir)
4503                                         type = 'd';
4504                                 else if (pb->is_reg)
4505                                         type = 'f';
4506
4507                                 printf(("%6lu(%c): expecting %6lu "
4508                                         "actual extent "
4509                                         "phys %6lu log %lu len %lu\n"),
4510                                        (unsigned long) pctx->ino, type,
4511                                        (unsigned long) pb->previous_block+1,
4512                                        (unsigned long) extent.e_pblk,
4513                                        (unsigned long) extent.e_lblk,
4514                                        (unsigned long) extent.e_len);
4515                         }
4516                         pb->fragmented = 1;
4517                 }
4518                 /*
4519                  * If we notice a gap in the logical block mappings of an
4520                  * extent-mapped directory, offer to close the hole by
4521                  * moving the logical block down, otherwise we'll go mad in
4522                  * pass 3 allocating empty directory blocks to fill the hole.
4523                  */
4524                 if (try_repairs && is_dir &&
4525                     pb->last_block + 1 < extent.e_lblk) {
4526                         blk64_t new_lblk;
4527
4528                         new_lblk = pb->last_block + 1;
4529                         if (EXT2FS_CLUSTER_RATIO(ctx->fs) > 1)
4530                                 new_lblk = ((new_lblk +
4531                                              EXT2FS_CLUSTER_RATIO(ctx->fs) - 1) &
4532                                             ~EXT2FS_CLUSTER_MASK(ctx->fs)) |
4533                                            (extent.e_pblk &
4534                                             EXT2FS_CLUSTER_MASK(ctx->fs));
4535                         pctx->blk = extent.e_lblk;
4536                         pctx->blk2 = new_lblk;
4537                         if (fix_problem(ctx, PR_1_COLLAPSE_DBLOCK, pctx)) {
4538                                 e2fsck_pass1_fix_lock(ctx);
4539                                 extent.e_lblk = new_lblk;
4540                                 pb->inode_modified = 1;
4541                                 pctx->errcode = ext2fs_extent_replace(ehandle,
4542                                                                 0, &extent);
4543                                 e2fsck_pass1_fix_unlock(ctx);
4544                                 if (pctx->errcode) {
4545                                         pctx->errcode = 0;
4546                                         goto alloc_later;
4547                                 }
4548                                 e2fsck_pass1_fix_lock(ctx);
4549                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
4550                                 e2fsck_pass1_fix_unlock(ctx);
4551                                 if (pctx->errcode)
4552                                         goto failed_add_dir_block;
4553                                 pctx->errcode = ext2fs_extent_goto(ehandle,
4554                                                                 extent.e_lblk);
4555                                 if (pctx->errcode)
4556                                         goto failed_add_dir_block;
4557                                 last_lblk = extent.e_lblk + extent.e_len - 1;
4558                                 failed_csum = 0;
4559                         }
4560                 }
4561 alloc_later:
4562                 if (is_dir) {
4563                         while (++pb->last_db_block <
4564                                (e2_blkcnt_t) extent.e_lblk) {
4565                                 pctx->errcode = ext2fs_add_dir_block2(
4566                                                         ctx->fs->dblist,
4567                                                         pb->ino, 0,
4568                                                         pb->last_db_block);
4569                                 if (pctx->errcode) {
4570                                         pctx->blk = 0;
4571                                         pctx->num = pb->last_db_block;
4572                                         goto failed_add_dir_block;
4573                                 }
4574                         }
4575
4576                         for (i = 0; i < extent.e_len; i++) {
4577                                 pctx->errcode = ext2fs_add_dir_block2(
4578                                                         ctx->fs->dblist,
4579                                                         pctx->ino,
4580                                                         extent.e_pblk + i,
4581                                                         extent.e_lblk + i);
4582                                 if (pctx->errcode) {
4583                                         pctx->blk = extent.e_pblk + i;
4584                                         pctx->num = extent.e_lblk + i;
4585                                 failed_add_dir_block:
4586                                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4587                                         /* Should never get here */
4588                                         ctx->flags |= E2F_FLAG_ABORT;
4589                                         return;
4590                                 }
4591                         }
4592                         if (extent.e_len > 0)
4593                                 pb->last_db_block = extent.e_lblk + extent.e_len - 1;
4594                 }
4595                 if (has_unaligned_cluster_map(ctx, pb->previous_block,
4596                                               pb->last_block,
4597                                               extent.e_pblk,
4598                                               extent.e_lblk)) {
4599                         for (i = 0; i < extent.e_len; i++) {
4600                                 pctx->blk = extent.e_lblk + i;
4601                                 pctx->blk2 = extent.e_pblk + i;
4602                                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4603                                 mark_block_used(ctx, extent.e_pblk + i);
4604                                 mark_block_used(ctx, extent.e_pblk + i);
4605                         }
4606                 }
4607
4608                 /*
4609                  * Check whether first cluster got marked in previous iteration.
4610                  */
4611                 if (ctx->fs->cluster_ratio_bits &&
4612                     pb->previous_block &&
4613                     (EXT2FS_B2C(ctx->fs, extent.e_pblk) ==
4614                      EXT2FS_B2C(ctx->fs, pb->previous_block)))
4615                         /* Set blk to the beginning of next cluster. */
4616                         blk = EXT2FS_C2B(
4617                                 ctx->fs,
4618                                 EXT2FS_B2C(ctx->fs, extent.e_pblk) + 1);
4619                 else
4620                         /* Set blk to the beginning of current cluster. */
4621                         blk = EXT2FS_C2B(ctx->fs,
4622                                          EXT2FS_B2C(ctx->fs, extent.e_pblk));
4623
4624                 if (blk < extent.e_pblk + extent.e_len) {
4625                         mark_blocks_used(ctx, blk,
4626                                          extent.e_pblk + extent.e_len - blk);
4627                         n = DIV_ROUND_UP(extent.e_pblk + extent.e_len - blk,
4628                                          EXT2FS_CLUSTER_RATIO(ctx->fs));
4629                         pb->num_blocks += n;
4630                 }
4631                 pb->last_block = extent.e_lblk + extent.e_len - 1;
4632                 pb->previous_block = extent.e_pblk + extent.e_len - 1;
4633                 start_block = pb->last_block = last_lblk;
4634                 if (is_leaf && !is_dir &&
4635                     !(extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT))
4636                         pb->last_init_lblock = last_lblk;
4637         next:
4638                 pctx->errcode = ext2fs_extent_get(ehandle,
4639                                                   EXT2_EXTENT_NEXT_SIB,
4640                                                   &extent);
4641         }
4642
4643         /* Failed csum but passes checks?  Ask to fix checksum. */
4644         if (failed_csum &&
4645             fix_problem(ctx, PR_1_EXTENT_ONLY_CSUM_INVALID, pctx)) {
4646                 e2fsck_pass1_fix_lock(ctx);
4647                 pb->inode_modified = 1;
4648                 pctx->errcode = ext2fs_extent_replace(ehandle, 0, &extent);
4649                 e2fsck_pass1_fix_unlock(ctx);
4650                 if (pctx->errcode)
4651                         return;
4652         }
4653
4654         if (pctx->errcode == EXT2_ET_EXTENT_NO_NEXT)
4655                 pctx->errcode = 0;
4656 }
4657
4658 static void check_blocks_extents(e2fsck_t ctx, struct problem_context *pctx,
4659                                  struct process_block_struct *pb)
4660 {
4661         struct ext2_extent_info info;
4662         struct ext2_inode       *inode = pctx->inode;
4663         ext2_extent_handle_t    ehandle;
4664         ext2_filsys             fs = ctx->fs;
4665         ext2_ino_t              ino = pctx->ino;
4666         errcode_t               retval;
4667         blk64_t                 eof_lblk;
4668         struct ext3_extent_header       *eh;
4669
4670         /* Check for a proper extent header... */
4671         eh = (struct ext3_extent_header *) &inode->i_block[0];
4672         retval = ext2fs_extent_header_verify(eh, sizeof(inode->i_block));
4673         if (retval) {
4674                 if (fix_problem(ctx, PR_1_MISSING_EXTENT_HEADER, pctx))
4675                         e2fsck_clear_inode(ctx, ino, inode, 0,
4676                                            "check_blocks_extents");
4677                 pctx->errcode = 0;
4678                 return;
4679         }
4680
4681         /* ...since this function doesn't fail if i_block is zeroed. */
4682         pctx->errcode = ext2fs_extent_open2(fs, ino, inode, &ehandle);
4683         if (pctx->errcode) {
4684                 if (fix_problem(ctx, PR_1_READ_EXTENT, pctx))
4685                         e2fsck_clear_inode(ctx, ino, inode, 0,
4686                                            "check_blocks_extents");
4687                 pctx->errcode = 0;
4688                 return;
4689         }
4690
4691         retval = ext2fs_extent_get_info(ehandle, &info);
4692         if (retval == 0) {
4693                 int max_depth = info.max_depth;
4694
4695                 if (max_depth >= MAX_EXTENT_DEPTH_COUNT)
4696                         max_depth = MAX_EXTENT_DEPTH_COUNT-1;
4697                 ctx->extent_depth_count[max_depth]++;
4698         }
4699
4700         /* Check maximum extent depth */
4701         pctx->blk = info.max_depth;
4702         pctx->blk2 = ext2fs_max_extent_depth(ehandle);
4703         if (pctx->blk2 < pctx->blk &&
4704             fix_problem(ctx, PR_1_EXTENT_BAD_MAX_DEPTH, pctx))
4705                 pb->eti.force_rebuild = 1;
4706
4707         /* Can we collect extent tree level stats? */
4708         pctx->blk = MAX_EXTENT_DEPTH_COUNT;
4709         if (pctx->blk2 > pctx->blk)
4710                 fix_problem(ctx, PR_1E_MAX_EXTENT_TREE_DEPTH, pctx);
4711         memset(pb->eti.ext_info, 0, sizeof(pb->eti.ext_info));
4712         pb->eti.ino = pb->ino;
4713
4714         pb->next_lblock = 0;
4715
4716         eof_lblk = ((EXT2_I_SIZE(inode) + fs->blocksize - 1) >>
4717                 EXT2_BLOCK_SIZE_BITS(fs->super)) - 1;
4718         scan_extent_node(ctx, pctx, pb, 0, 0, eof_lblk, ehandle, 1);
4719         if (pctx->errcode &&
4720             fix_problem(ctx, PR_1_EXTENT_ITERATE_FAILURE, pctx)) {
4721                 pb->num_blocks = 0;
4722                 inode->i_blocks = 0;
4723                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4724                                    "check_blocks_extents");
4725                 pctx->errcode = 0;
4726         }
4727         ext2fs_extent_free(ehandle);
4728
4729         /* Rebuild unless it's a dir and we're rehashing it */
4730         if (LINUX_S_ISDIR(inode->i_mode) &&
4731             e2fsck_dir_will_be_rehashed(ctx, ino))
4732                 return;
4733
4734         if (ctx->options & E2F_OPT_CONVERT_BMAP)
4735                 e2fsck_rebuild_extents_later(ctx, ino);
4736         else
4737                 e2fsck_should_rebuild_extents(ctx, pctx, &pb->eti, &info);
4738 }
4739
4740 /*
4741  * In fact we don't need to check blocks for an inode with inline data
4742  * because this inode doesn't have any blocks.  In this function all
4743  * we need to do is add this inode into dblist when it is a directory.
4744  */
4745 static void check_blocks_inline_data(e2fsck_t ctx, struct problem_context *pctx,
4746                                      struct process_block_struct *pb)
4747 {
4748         int     flags;
4749         size_t  inline_data_size = 0;
4750
4751         if (!pb->is_dir) {
4752                 pctx->errcode = 0;
4753                 return;
4754         }
4755
4756         /* Process the dirents in i_block[] as the "first" block. */
4757         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 0);
4758         if (pctx->errcode)
4759                 goto err;
4760
4761         /* Process the dirents in the EA as a "second" block. */
4762         flags = ctx->fs->flags;
4763         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4764         pctx->errcode = ext2fs_inline_data_size(ctx->fs, pb->ino,
4765                                                 &inline_data_size);
4766         ctx->fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4767                          (ctx->fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4768         if (pctx->errcode) {
4769                 pctx->errcode = 0;
4770                 return;
4771         }
4772
4773         if (inline_data_size <= EXT4_MIN_INLINE_DATA_SIZE)
4774                 return;
4775
4776         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 1);
4777         if (pctx->errcode)
4778                 goto err;
4779
4780         return;
4781 err:
4782         pctx->blk = 0;
4783         pctx->num = 0;
4784         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4785         ctx->flags |= E2F_FLAG_ABORT;
4786 }
4787
4788 /*
4789  * This subroutine is called on each inode to account for all of the
4790  * blocks used by that inode.
4791  */
4792 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
4793                          char *block_buf, const struct ea_quota *ea_ibody_quota)
4794 {
4795         ext2_filsys fs = ctx->fs;
4796         struct process_block_struct pb;
4797         ext2_ino_t      ino = pctx->ino;
4798         struct ext2_inode *inode = pctx->inode;
4799         unsigned        bad_size = 0;
4800         int             dirty_inode = 0;
4801         int             extent_fs;
4802         int             inlinedata_fs;
4803         __u64           size;
4804         struct ea_quota ea_block_quota;
4805
4806         pb.ino = ino;
4807         pb.num_blocks = EXT2FS_B2C(ctx->fs,
4808                                    ea_ibody_quota ? ea_ibody_quota->blocks : 0);
4809         pb.last_block = ~0;
4810         pb.last_init_lblock = -1;
4811         pb.last_db_block = -1;
4812         pb.num_illegal_blocks = 0;
4813         pb.suppress = 0; pb.clear = 0;
4814         pb.fragmented = 0;
4815         pb.compressed = 0;
4816         pb.previous_block = 0;
4817         pb.is_dir = LINUX_S_ISDIR(inode->i_mode);
4818         pb.is_reg = LINUX_S_ISREG(inode->i_mode);
4819         pb.max_blocks = 1U << (31 - fs->super->s_log_block_size);
4820         pb.inode = inode;
4821         pb.pctx = pctx;
4822         pb.ctx = ctx;
4823         pb.inode_modified = 0;
4824         pb.eti.force_rebuild = 0;
4825         pctx->ino = ino;
4826         pctx->errcode = 0;
4827
4828         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
4829         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
4830
4831         if (check_ext_attr(ctx, pctx, block_buf, &ea_block_quota)) {
4832                 if (e2fsck_should_abort(ctx))
4833                         goto out;
4834                 pb.num_blocks += EXT2FS_B2C(ctx->fs, ea_block_quota.blocks);
4835         }
4836
4837         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL))
4838                 check_blocks_inline_data(ctx, pctx, &pb);
4839         else if (ext2fs_inode_has_valid_blocks2(fs, inode)) {
4840                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL))
4841                         check_blocks_extents(ctx, pctx, &pb);
4842                 else {
4843                         int flags;
4844                         /*
4845                          * If we've modified the inode, write it out before
4846                          * iterate() tries to use it.
4847                          */
4848                         if (dirty_inode) {
4849                                 e2fsck_write_inode(ctx, ino, inode,
4850                                                    "check_blocks");
4851                                 dirty_inode = 0;
4852                         }
4853                         flags = fs->flags;
4854                         fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4855                         pctx->errcode = ext2fs_block_iterate3(fs, ino,
4856                                                 pb.is_dir ? BLOCK_FLAG_HOLE : 0,
4857                                                 block_buf, process_block, &pb);
4858                         /*
4859                          * We do not have uninitialized extents in non extent
4860                          * files.
4861                          */
4862                         pb.last_init_lblock = pb.last_block;
4863                         /*
4864                          * If iterate() changed a block mapping, we have to
4865                          * re-read the inode.  If we decide to clear the
4866                          * inode after clearing some stuff, we'll re-write the
4867                          * bad mappings into the inode!
4868                          */
4869                         if (pb.inode_modified)
4870                                 e2fsck_read_inode(ctx, ino, inode,
4871                                                   "check_blocks");
4872                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4873                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4874
4875                         if (ctx->options & E2F_OPT_CONVERT_BMAP) {
4876 #ifdef DEBUG
4877                                 printf("bmap rebuild ino=%d\n", ino);
4878 #endif
4879                                 if (!LINUX_S_ISDIR(inode->i_mode) ||
4880                                     !e2fsck_dir_will_be_rehashed(ctx, ino))
4881                                         e2fsck_rebuild_extents_later(ctx, ino);
4882                         }
4883                 }
4884         }
4885         end_problem_latch(ctx, PR_LATCH_BLOCK);
4886         end_problem_latch(ctx, PR_LATCH_TOOBIG);
4887         if (e2fsck_should_abort(ctx))
4888                 goto out;
4889         if (pctx->errcode)
4890                 fix_problem(ctx, PR_1_BLOCK_ITERATE, pctx);
4891
4892         if (pb.fragmented && pb.num_blocks < fs->super->s_blocks_per_group) {
4893                 if (LINUX_S_ISDIR(inode->i_mode))
4894                         ctx->fs_fragmented_dir++;
4895                 else
4896                         ctx->fs_fragmented++;
4897         }
4898
4899         if (pb.clear) {
4900                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4901                                    "check_blocks");
4902                 return;
4903         }
4904
4905         if (inode->i_flags & EXT2_INDEX_FL) {
4906                 if (handle_htree(ctx, pctx, ino, inode, block_buf)) {
4907                         inode->i_flags &= ~EXT2_INDEX_FL;
4908                         dirty_inode++;
4909                 } else {
4910                         e2fsck_add_dx_dir(ctx, ino, inode, pb.last_block+1);
4911                 }
4912         }
4913
4914         if (!pb.num_blocks && pb.is_dir &&
4915             !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
4916                 if (fix_problem(ctx, PR_1_ZERO_LENGTH_DIR, pctx)) {
4917                         e2fsck_clear_inode(ctx, ino, inode, 0, "check_blocks");
4918                         ctx->fs_directory_count--;
4919                         return;
4920                 }
4921         }
4922
4923         if (ino != quota_type2inum(PRJQUOTA, fs->super) &&
4924             ino != fs->super->s_orphan_file_inum &&
4925             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INODE(ctx->fs->super)) &&
4926             !(inode->i_flags & EXT4_EA_INODE_FL)) {
4927                 quota_data_add(ctx->qctx, (struct ext2_inode_large *) inode,
4928                                ino,
4929                                pb.num_blocks * EXT2_CLUSTER_SIZE(fs->super));
4930                 quota_data_inodes(ctx->qctx, (struct ext2_inode_large *) inode,
4931                                   ino, (ea_ibody_quota ?
4932                                         ea_ibody_quota->inodes : 0) +
4933                                                 ea_block_quota.inodes + 1);
4934         }
4935
4936         if (!ext2fs_has_feature_huge_file(fs->super) ||
4937             !(inode->i_flags & EXT4_HUGE_FILE_FL))
4938                 pb.num_blocks *= (fs->blocksize / 512);
4939         pb.num_blocks *= EXT2FS_CLUSTER_RATIO(fs);
4940 #if 0
4941         printf("inode %u, i_size = %u, last_block = %llu, i_blocks=%llu, num_blocks = %llu\n",
4942                ino, inode->i_size, (unsigned long long) pb.last_block,
4943                (unsigned long long) ext2fs_inode_i_blocks(fs, inode),
4944                (unsigned long long) pb.num_blocks);
4945 #endif
4946         size = EXT2_I_SIZE(inode);
4947         if (pb.is_dir) {
4948                 unsigned nblock = size >> EXT2_BLOCK_SIZE_BITS(fs->super);
4949                 if (inode->i_flags & EXT4_INLINE_DATA_FL) {
4950                         int flags;
4951                         size_t sz = 0;
4952                         errcode_t err;
4953
4954                         flags = ctx->fs->flags;
4955                         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4956                         err = ext2fs_inline_data_size(ctx->fs, pctx->ino,
4957                                                       &sz);
4958                         ctx->fs->flags = (flags &
4959                                           EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4960                                          (ctx->fs->flags &
4961                                           ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4962                         if (err || sz != size) {
4963                                 bad_size = 7;
4964                                 pctx->num = sz;
4965                         }
4966                 } else if (size & (fs->blocksize - 1))
4967                         bad_size = 5;
4968                 else if (nblock > (pb.last_block + 1))
4969                         bad_size = 1;
4970                 else if (nblock < (pb.last_block + 1)) {
4971                         if (((pb.last_block + 1) - nblock) >
4972                             fs->super->s_prealloc_dir_blocks)
4973                                 bad_size = 2;
4974                 }
4975         } else {
4976                 if ((pb.last_init_lblock >= 0) &&
4977                     /* Do not allow initialized allocated blocks past i_size*/
4978                     (size < (__u64)pb.last_init_lblock * fs->blocksize) &&
4979                     !(inode->i_flags & EXT4_VERITY_FL))
4980                         bad_size = 3;
4981                 else if (!(extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4982                          size > ext2_max_sizes[fs->super->s_log_block_size])
4983                         /* too big for a direct/indirect-mapped file */
4984                         bad_size = 4;
4985                 else if ((extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4986                          size >
4987                          ((1ULL << (32 + EXT2_BLOCK_SIZE_BITS(fs->super))) - 1))
4988                         /* too big for an extent-based file - 32bit ee_block */
4989                         bad_size = 6;
4990         }
4991         /* i_size for symlinks is checked elsewhere */
4992         if (bad_size && !LINUX_S_ISLNK(inode->i_mode)) {
4993                 /* Did inline_data set pctx->num earlier? */
4994                 if (bad_size != 7)
4995                         pctx->num = (pb.last_block + 1) * fs->blocksize;
4996                 pctx->group = bad_size;
4997                 if (fix_problem(ctx, PR_1_BAD_I_SIZE, pctx)) {
4998                         ext2fs_inode_size_set(fs, inode, pctx->num);
4999                         if (EXT2_I_SIZE(inode) == 0 &&
5000                             (inode->i_flags & EXT4_INLINE_DATA_FL)) {
5001                                 memset(inode->i_block, 0,
5002                                        sizeof(inode->i_block));
5003                                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
5004                         }
5005                         dirty_inode++;
5006                 }
5007                 pctx->num = 0;
5008         }
5009         if (LINUX_S_ISREG(inode->i_mode) &&
5010             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
5011                 ctx->large_files++;
5012         if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
5013             ((pb.num_blocks != ext2fs_inode_i_blocks(fs, inode)) ||
5014              (ext2fs_has_feature_huge_file(fs->super) &&
5015               (inode->i_flags & EXT4_HUGE_FILE_FL) &&
5016               (inode->osd2.linux2.l_i_blocks_hi != 0)))) {
5017                 pctx->num = pb.num_blocks;
5018                 if (fix_problem(ctx, PR_1_BAD_I_BLOCKS, pctx)) {
5019                         inode->i_blocks = pb.num_blocks;
5020                         inode->osd2.linux2.l_i_blocks_hi = pb.num_blocks >> 32;
5021                         dirty_inode++;
5022                 }
5023                 pctx->num = 0;
5024         }
5025
5026         /*
5027          * The kernel gets mad if we ask it to allocate bigalloc clusters to
5028          * a block mapped file, so rebuild it as an extent file.  We can skip
5029          * symlinks because they're never rewritten.
5030          */
5031         if (ext2fs_has_feature_bigalloc(fs->super) &&
5032             (LINUX_S_ISREG(inode->i_mode) || LINUX_S_ISDIR(inode->i_mode)) &&
5033             ext2fs_inode_data_blocks2(fs, inode) > 0 &&
5034             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INO(fs->super)) &&
5035             !(inode->i_flags & (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)) &&
5036             fix_problem(ctx, PR_1_NO_BIGALLOC_BLOCKMAP_FILES, pctx)) {
5037                 pctx->errcode = e2fsck_rebuild_extents_later(ctx, ino);
5038                 if (pctx->errcode)
5039                         goto out;
5040         }
5041
5042         if (ctx->dirs_to_hash && pb.is_dir &&
5043             !(ctx->lost_and_found && ctx->lost_and_found == ino) &&
5044             !(inode->i_flags & EXT2_INDEX_FL) &&
5045             ((inode->i_size / fs->blocksize) >= 3))
5046                 e2fsck_rehash_dir_later(ctx, ino);
5047
5048 out:
5049         if (dirty_inode)
5050                 e2fsck_write_inode(ctx, ino, inode, "check_blocks");
5051 }
5052
#if 0
/*
 * Helper function called by process_block() when an illegal block is
 * found.  It returns a human-readable description of why the block is
 * illegal.
 *
 * fs    - the filesystem the block number belongs to
 * block - the offending physical block number
 *
 * The returned pointer refers to a static buffer that is overwritten by
 * the next call, so the caller must consume it before calling again.
 *
 * (This function is compiled out; it is kept for debugging.)
 */
static char *describe_illegal_block(ext2_filsys fs, blk64_t block)
{
	blk64_t	super;
	dgrp_t	i;
	static char	problem[80];

	super = fs->super->s_first_data_block;
	snprintf(problem, sizeof(problem), "%s",
		 "PROGRAMMING ERROR: Unknown reason for illegal block");
	if (block < super) {
		/* blk64_t is 64 bits wide: print it with %llu, not %u */
		snprintf(problem, sizeof(problem), "< FIRSTBLOCK (%llu)",
			 (unsigned long long) super);
		return(problem);
	} else if (block >= ext2fs_blocks_count(fs->super)) {
		snprintf(problem, sizeof(problem), "> BLOCKS (%llu)",
			 (unsigned long long) ext2fs_blocks_count(fs->super));
		return(problem);
	}
	/*
	 * Walk the groups; "super" tracks the first block of group i and
	 * is advanced by s_blocks_per_group at the end of every pass.
	 */
	for (i = 0; i < fs->group_desc_count; i++) {
		if (block == super) {
			snprintf(problem, sizeof(problem),
				 "is the superblock in group %u",
				 (unsigned) i);
			break;
		}
		if (block > super &&
		    block <= (super + fs->desc_blocks)) {
			snprintf(problem, sizeof(problem),
				 "is in the group descriptors "
				 "of group %u", (unsigned) i);
			break;
		}
		if (block == ext2fs_block_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the block bitmap of group %u",
				 (unsigned) i);
			break;
		}
		if (block == ext2fs_inode_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the inode bitmap of group %u",
				 (unsigned) i);
			break;
		}
		if (block >= ext2fs_inode_table_loc(fs, i) &&
		    (block < ext2fs_inode_table_loc(fs, i)
		     + fs->inode_blocks_per_group)) {
			snprintf(problem, sizeof(problem),
				 "is in the inode table of group %u",
				 (unsigned) i);
			break;
		}
		super += fs->super->s_blocks_per_group;
	}
	return(problem);
}
#endif
5104
5105 /*
5106  * This is a helper function for check_blocks().
5107  */
5108 static int process_block(ext2_filsys fs,
5109                   blk64_t       *block_nr,
5110                   e2_blkcnt_t blockcnt,
5111                   blk64_t ref_block EXT2FS_ATTR((unused)),
5112                   int ref_offset EXT2FS_ATTR((unused)),
5113                   void *priv_data)
5114 {
5115         struct process_block_struct *p;
5116         struct problem_context *pctx;
5117         blk64_t blk = *block_nr;
5118         int     ret_code = 0;
5119         problem_t       problem = 0;
5120         e2fsck_t        ctx;
5121
5122         p = (struct process_block_struct *) priv_data;
5123         pctx = p->pctx;
5124         ctx = p->ctx;
5125
5126         /*
5127          * For a directory, add logical block zero for processing even if it's
5128          * not mapped or we'll be perennially stuck with broken "." and ".."
5129          * entries.
5130          */
5131         if (p->is_dir && blockcnt == 0 && blk == 0) {
5132                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino, 0, 0);
5133                 if (pctx->errcode) {
5134                         pctx->blk = blk;
5135                         pctx->num = blockcnt;
5136                         goto failed_add_dir_block;
5137                 }
5138                 p->last_db_block++;
5139         }
5140
5141         if (blk == 0)
5142                 return 0;
5143
5144 #if 0
5145         printf("Process_block, inode %lu, block %u, #%d\n", p->ino, blk,
5146                blockcnt);
5147 #endif
5148
5149         /*
5150          * Simplistic fragmentation check.  We merely require that the
5151          * file be contiguous.  (Which can never be true for really
5152          * big files that are greater than a block group.)
5153          */
5154         if (p->previous_block && p->ino != EXT2_RESIZE_INO) {
5155                 if (p->previous_block+1 != blk) {
5156                         if (ctx->options & E2F_OPT_FRAGCHECK) {
5157                                 char type = '?';
5158
5159                                 if (p->is_dir)
5160                                         type = 'd';
5161                                 else if (p->is_reg)
5162                                         type = 'f';
5163
5164                                 printf(_("%6lu(%c): expecting %6lu "
5165                                          "got phys %6lu (blkcnt %lld)\n"),
5166                                        (unsigned long) pctx->ino, type,
5167                                        (unsigned long) p->previous_block+1,
5168                                        (unsigned long) blk,
5169                                        (long long) blockcnt);
5170                         }
5171                         p->fragmented = 1;
5172                 }
5173         }
5174
5175         if (p->is_dir && !ext2fs_has_feature_largedir(fs->super) &&
5176             !pctx->inode->i_size_high &&
5177             blockcnt > (1 << (21 - fs->super->s_log_block_size)))
5178                 problem = PR_1_TOOBIG_DIR;
5179         if (p->is_dir && p->num_blocks + 1 >= p->max_blocks)
5180                 problem = PR_1_TOOBIG_DIR;
5181         if (p->is_reg && p->num_blocks + 1 >= p->max_blocks)
5182                 problem = PR_1_TOOBIG_REG;
5183         if (!p->is_dir && !p->is_reg && blockcnt > 0)
5184                 problem = PR_1_TOOBIG_SYMLINK;
5185
5186         if (blk < fs->super->s_first_data_block ||
5187             blk >= ext2fs_blocks_count(fs->super))
5188                 problem = PR_1_ILLEGAL_BLOCK_NUM;
5189
5190         /*
5191          * If this IND/DIND/TIND block is squatting atop some critical metadata
5192          * (group descriptors, superblock, bitmap, inode table), any write to
5193          * "fix" mapping problems will destroy the metadata.  We'll let pass 1b
5194          * fix that and restart fsck.
5195          */
5196         if (blockcnt < 0 &&
5197             p->ino != EXT2_RESIZE_INO &&
5198             blk < ctx->fs->super->s_blocks_count &&
5199             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk)) {
5200                 pctx->blk = blk;
5201                 fix_problem(ctx, PR_1_CRITICAL_METADATA_COLLISION, pctx);
5202                 if ((ctx->options & E2F_OPT_NO) == 0)
5203                         ctx->flags |= E2F_FLAG_RESTART_LATER;
5204         }
5205
5206         if (problem) {
5207                 p->num_illegal_blocks++;
5208                 /*
5209                  * A bit of subterfuge here -- we're trying to fix a block
5210                  * mapping, but the IND/DIND/TIND block could have collided
5211                  * with some critical metadata.  So, fix the in-core mapping so
5212                  * iterate won't go insane, but return 0 instead of
5213                  * BLOCK_CHANGED so that it won't write the remapping out to
5214                  * our multiply linked block.
5215                  *
5216                  * Even if we previously determined that an *IND block
5217                  * conflicts with critical metadata, we must still try to
5218                  * iterate the *IND block as if it is an *IND block to find and
5219                  * mark the blocks it points to.  Better to be overly cautious
5220                  * with the used_blocks map so that we don't move the *IND
5221                  * block to a block that's really in use!
5222                  */
5223                 if (p->ino != EXT2_RESIZE_INO &&
5224                     ref_block != 0 &&
5225                     ext2fs_test_block_bitmap2(ctx->block_metadata_map,
5226                                               ref_block)) {
5227                         *block_nr = 0;
5228                         return 0;
5229                 }
5230                 if (!p->suppress && (p->num_illegal_blocks % 12) == 0) {
5231                         if (fix_problem(ctx, PR_1_TOO_MANY_BAD_BLOCKS, pctx)) {
5232                                 p->clear = 1;
5233                                 return BLOCK_ABORT;
5234                         }
5235                         if (fix_problem(ctx, PR_1_SUPPRESS_MESSAGES, pctx)) {
5236                                 p->suppress = 1;
5237                                 set_latch_flags(PR_LATCH_BLOCK,
5238                                                 PRL_SUPPRESS, 0);
5239                         }
5240                 }
5241                 pctx->blk = blk;
5242                 pctx->blkcount = blockcnt;
5243                 if (fix_problem(ctx, problem, pctx)) {
5244                         blk = *block_nr = 0;
5245                         ret_code = BLOCK_CHANGED;
5246                         p->inode_modified = 1;
5247                         /*
5248                          * If the directory block is too big and is beyond the
5249                          * end of the FS, don't bother trying to add it for
5250                          * processing -- the kernel would never have created a
5251                          * directory this large, and we risk an ENOMEM abort.
5252                          * In any case, the toobig handler for extent-based
5253                          * directories also doesn't feed toobig blocks to
5254                          * pass 2.
5255                          */
5256                         if (problem == PR_1_TOOBIG_DIR)
5257                                 return ret_code;
5258                         goto mark_dir;
5259                 } else
5260                         return 0;
5261         }
5262
5263         if (p->ino == EXT2_RESIZE_INO) {
5264                 /*
5265                  * The resize inode has already be sanity checked
5266                  * during pass #0 (the superblock checks).  All we
5267                  * have to do is mark the double indirect block as
5268                  * being in use; all of the other blocks are handled
5269                  * by mark_table_blocks()).
5270                  */
5271                 if (blockcnt == BLOCK_COUNT_DIND)
5272                         mark_block_used(ctx, blk);
5273                 p->num_blocks++;
5274         } else if (!(ctx->fs->cluster_ratio_bits &&
5275                      p->previous_block &&
5276                      (EXT2FS_B2C(ctx->fs, blk) ==
5277                       EXT2FS_B2C(ctx->fs, p->previous_block)) &&
5278                      (blk & EXT2FS_CLUSTER_MASK(ctx->fs)) ==
5279                      ((unsigned) blockcnt & EXT2FS_CLUSTER_MASK(ctx->fs)))) {
5280                 mark_block_used(ctx, blk);
5281                 p->num_blocks++;
5282         } else if (has_unaligned_cluster_map(ctx, p->previous_block,
5283                                              p->last_block, blk, blockcnt)) {
5284                 pctx->blk = blockcnt;
5285                 pctx->blk2 = blk;
5286                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
5287                 mark_block_used(ctx, blk);
5288                 mark_block_used(ctx, blk);
5289         }
5290         if (blockcnt >= 0)
5291                 p->last_block = blockcnt;
5292         p->previous_block = blk;
5293 mark_dir:
5294         if (p->is_dir && (blockcnt >= 0)) {
5295                 while (++p->last_db_block < blockcnt) {
5296                         pctx->errcode = ext2fs_add_dir_block2(fs->dblist,
5297                                                               p->ino, 0,
5298                                                               p->last_db_block);
5299                         if (pctx->errcode) {
5300                                 pctx->blk = 0;
5301                                 pctx->num = p->last_db_block;
5302                                 goto failed_add_dir_block;
5303                         }
5304                 }
5305                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino,
5306                                                       blk, blockcnt);
5307                 if (pctx->errcode) {
5308                         pctx->blk = blk;
5309                         pctx->num = blockcnt;
5310                 failed_add_dir_block:
5311                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
5312                         /* Should never get here */
5313                         ctx->flags |= E2F_FLAG_ABORT;
5314                         return BLOCK_ABORT;
5315                 }
5316         }
5317         return ret_code;
5318 }
5319
5320 static int process_bad_block(ext2_filsys fs,
5321                       blk64_t *block_nr,
5322                       e2_blkcnt_t blockcnt,
5323                       blk64_t ref_block EXT2FS_ATTR((unused)),
5324                       int ref_offset EXT2FS_ATTR((unused)),
5325                       void *priv_data)
5326 {
5327         struct process_block_struct *p;
5328         blk64_t         blk = *block_nr;
5329         blk64_t         first_block;
5330         dgrp_t          i;
5331         struct problem_context *pctx;
5332         e2fsck_t        ctx;
5333
5334         if (!blk)
5335                 return 0;
5336
5337         p = (struct process_block_struct *) priv_data;
5338         ctx = p->ctx;
5339         pctx = p->pctx;
5340
5341         pctx->ino = EXT2_BAD_INO;
5342         pctx->blk = blk;
5343         pctx->blkcount = blockcnt;
5344
5345         if ((blk < fs->super->s_first_data_block) ||
5346             (blk >= ext2fs_blocks_count(fs->super))) {
5347                 if (fix_problem(ctx, PR_1_BB_ILLEGAL_BLOCK_NUM, pctx)) {
5348                         *block_nr = 0;
5349                         return BLOCK_CHANGED;
5350                 } else
5351                         return 0;
5352         }
5353
5354         if (blockcnt < 0) {
5355                 if (ext2fs_test_block_bitmap2(p->fs_meta_blocks, blk)) {
5356                         p->bbcheck = 1;
5357                         if (fix_problem(ctx, PR_1_BB_FS_BLOCK, pctx)) {
5358                                 *block_nr = 0;
5359                                 return BLOCK_CHANGED;
5360                         }
5361                 } else if (is_blocks_used(ctx, blk, 1)) {
5362                         p->bbcheck = 1;
5363                         if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK,
5364                                         pctx)) {
5365                                 *block_nr = 0;
5366                                 return BLOCK_CHANGED;
5367                         }
5368                         if (e2fsck_should_abort(ctx))
5369                                 return BLOCK_ABORT;
5370                 } else {
5371                         mark_block_used(ctx, blk);
5372                 }
5373                 return 0;
5374         }
5375 #if 0
5376         printf ("DEBUG: Marking %u as bad.\n", blk);
5377 #endif
5378         ctx->fs_badblocks_count++;
5379         /*
5380          * If the block is not used, then mark it as used and return.
5381          * If it is already marked as found, this must mean that
5382          * there's an overlap between the filesystem table blocks
5383          * (bitmaps and inode table) and the bad block list.
5384          */
5385         if (!is_blocks_used(ctx, blk, 1)) {
5386                 ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5387                 return 0;
5388         }
5389         /*
5390          * Try to find the where the filesystem block was used...
5391          */
5392         first_block = fs->super->s_first_data_block;
5393
5394         for (i = 0; i < fs->group_desc_count; i++ ) {
5395                 pctx->group = i;
5396                 pctx->blk = blk;
5397                 if (!ext2fs_bg_has_super(fs, i))
5398                         goto skip_super;
5399                 if (blk == first_block) {
5400                         if (i == 0) {
5401                                 if (fix_problem(ctx,
5402                                                 PR_1_BAD_PRIMARY_SUPERBLOCK,
5403                                                 pctx)) {
5404                                         *block_nr = 0;
5405                                         return BLOCK_CHANGED;
5406                                 }
5407                                 return 0;
5408                         }
5409                         fix_problem(ctx, PR_1_BAD_SUPERBLOCK, pctx);
5410                         return 0;
5411                 }
5412                 if ((blk > first_block) &&
5413                     (blk <= first_block + fs->desc_blocks)) {
5414                         if (i == 0) {
5415                                 pctx->blk = *block_nr;
5416                                 if (fix_problem(ctx,
5417                         PR_1_BAD_PRIMARY_GROUP_DESCRIPTOR, pctx)) {
5418                                         *block_nr = 0;
5419                                         return BLOCK_CHANGED;
5420                                 }
5421                                 return 0;
5422                         }
5423                         fix_problem(ctx, PR_1_BAD_GROUP_DESCRIPTORS, pctx);
5424                         return 0;
5425                 }
5426         skip_super:
5427                 if (blk == ext2fs_block_bitmap_loc(fs, i)) {
5428                         if (fix_problem(ctx, PR_1_BB_BAD_BLOCK, pctx)) {
5429                                 ctx->invalid_block_bitmap_flag[i]++;
5430                                 ctx->invalid_bitmaps++;
5431                         }
5432                         return 0;
5433                 }
5434                 if (blk == ext2fs_inode_bitmap_loc(fs, i)) {
5435                         if (fix_problem(ctx, PR_1_IB_BAD_BLOCK, pctx)) {
5436                                 ctx->invalid_inode_bitmap_flag[i]++;
5437                                 ctx->invalid_bitmaps++;
5438                         }
5439                         return 0;
5440                 }
5441                 if ((blk >= ext2fs_inode_table_loc(fs, i)) &&
5442                     (blk < (ext2fs_inode_table_loc(fs, i) +
5443                             fs->inode_blocks_per_group))) {
5444                         /*
5445                          * If there are bad blocks in the inode table,
5446                          * the inode scan code will try to do
5447                          * something reasonable automatically.
5448                          */
5449                         return 0;
5450                 }
5451                 first_block += fs->super->s_blocks_per_group;
5452         }
5453         /*
5454          * If we've gotten to this point, then the only
5455          * possibility is that the bad block inode meta data
5456          * is using a bad block.
5457          */
5458         if ((blk == p->inode->i_block[EXT2_IND_BLOCK]) ||
5459             (blk == p->inode->i_block[EXT2_DIND_BLOCK]) ||
5460             (blk == p->inode->i_block[EXT2_TIND_BLOCK])) {
5461                 p->bbcheck = 1;
5462                 if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK, pctx)) {
5463                         *block_nr = 0;
5464                         return BLOCK_CHANGED;
5465                 }
5466                 if (e2fsck_should_abort(ctx))
5467                         return BLOCK_ABORT;
5468                 return 0;
5469         }
5470
5471         pctx->group = -1;
5472
5473         /* Warn user that the block wasn't claimed */
5474         fix_problem(ctx, PR_1_PROGERR_CLAIMED_BLOCK, pctx);
5475
5476         return 0;
5477 }
5478
5479 static void new_table_block(e2fsck_t ctx, blk64_t first_block, dgrp_t group,
5480                             const char *name, int num, blk64_t *new_block)
5481 {
5482         ext2_filsys fs = ctx->fs;
5483         dgrp_t          last_grp;
5484         blk64_t         old_block = *new_block;
5485         blk64_t         last_block;
5486         dgrp_t          flexbg;
5487         unsigned        flexbg_size;
5488         int             i, is_flexbg;
5489         char            *buf;
5490         struct problem_context  pctx;
5491
5492         clear_problem_context(&pctx);
5493
5494         pctx.group = group;
5495         pctx.blk = old_block;
5496         pctx.str = name;
5497
5498         /*
5499          * For flex_bg filesystems, first try to allocate the metadata
5500          * within the flex_bg, and if that fails then try finding the
5501          * space anywhere in the filesystem.
5502          */
5503         is_flexbg = ext2fs_has_feature_flex_bg(fs->super);
5504         if (is_flexbg) {
5505                 flexbg_size = 1U << fs->super->s_log_groups_per_flex;
5506                 flexbg = group / flexbg_size;
5507                 first_block = ext2fs_group_first_block2(fs,
5508                                                         flexbg_size * flexbg);
5509                 last_grp = group | (flexbg_size - 1);
5510                 if (last_grp >= fs->group_desc_count)
5511                         last_grp = fs->group_desc_count - 1;
5512                 last_block = ext2fs_group_last_block2(fs, last_grp);
5513         } else
5514                 last_block = ext2fs_group_last_block2(fs, group);
5515         pctx.errcode = ext2fs_get_free_blocks2(fs, first_block, last_block,
5516                                                num, ctx->block_found_map,
5517                                                new_block);
5518         if (is_flexbg && (pctx.errcode == EXT2_ET_BLOCK_ALLOC_FAIL))
5519                 pctx.errcode = ext2fs_get_free_blocks2(fs,
5520                                 fs->super->s_first_data_block,
5521                                 ext2fs_blocks_count(fs->super),
5522                                 num, ctx->block_found_map, new_block);
5523         if (pctx.errcode) {
5524                 pctx.num = num;
5525                 fix_problem(ctx, PR_1_RELOC_BLOCK_ALLOCATE, &pctx);
5526                 ext2fs_unmark_valid(fs);
5527                 ctx->flags |= E2F_FLAG_ABORT;
5528                 return;
5529         }
5530         pctx.errcode = ext2fs_get_mem(fs->blocksize, &buf);
5531         if (pctx.errcode) {
5532                 fix_problem(ctx, PR_1_RELOC_MEMORY_ALLOCATE, &pctx);
5533                 ext2fs_unmark_valid(fs);
5534                 ctx->flags |= E2F_FLAG_ABORT;
5535                 return;
5536         }
5537         ext2fs_mark_super_dirty(fs);
5538         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
5539         pctx.blk2 = *new_block;
5540         fix_problem(ctx, (old_block ? PR_1_RELOC_FROM_TO :
5541                           PR_1_RELOC_TO), &pctx);
5542         pctx.blk2 = 0;
5543         for (i = 0; i < num; i++) {
5544                 pctx.blk = i;
5545                 ext2fs_mark_block_bitmap2(ctx->block_found_map, (*new_block)+i);
5546                 if (old_block) {
5547                         pctx.errcode = io_channel_read_blk64(fs->io,
5548                                    old_block + i, 1, buf);
5549                         if (pctx.errcode)
5550                                 fix_problem(ctx, PR_1_RELOC_READ_ERR, &pctx);
5551                         pctx.blk = (*new_block) + i;
5552                         pctx.errcode = io_channel_write_blk64(fs->io, pctx.blk,
5553                                                               1, buf);
5554                 } else {
5555                         pctx.blk = (*new_block) + i;
5556                         pctx.errcode = ext2fs_zero_blocks2(fs, pctx.blk, 1,
5557                                                            NULL, NULL);
5558                 }
5559
5560                 if (pctx.errcode)
5561                         fix_problem(ctx, PR_1_RELOC_WRITE_ERR, &pctx);
5562         }
5563         ext2fs_free_mem(&buf);
5564 }
5565
5566 /*
5567  * This routine gets called at the end of pass 1 if bad blocks are
5568  * detected in the superblock, group descriptors, inode_bitmaps, or
5569  * block bitmaps.  At this point, all of the blocks have been mapped
5570  * out, so we can try to allocate new block(s) to replace the bad
5571  * blocks.
5572  */
5573 static void handle_fs_bad_blocks(e2fsck_t ctx)
5574 {
5575         ext2_filsys fs = ctx->fs;
5576         dgrp_t          i;
5577         blk64_t         first_block;
5578         blk64_t         new_blk;
5579
5580         for (i = 0; i < fs->group_desc_count; i++) {
5581                 first_block = ext2fs_group_first_block2(fs, i);
5582
5583                 if (ctx->invalid_block_bitmap_flag[i]) {
5584                         new_blk = ext2fs_block_bitmap_loc(fs, i);
5585                         new_table_block(ctx, first_block, i, _("block bitmap"),
5586                                         1, &new_blk);
5587                         ext2fs_block_bitmap_loc_set(fs, i, new_blk);
5588                 }
5589                 if (ctx->invalid_inode_bitmap_flag[i]) {
5590                         new_blk = ext2fs_inode_bitmap_loc(fs, i);
5591                         new_table_block(ctx, first_block, i, _("inode bitmap"),
5592                                         1, &new_blk);
5593                         ext2fs_inode_bitmap_loc_set(fs, i, new_blk);
5594                 }
5595                 if (ctx->invalid_inode_table_flag[i]) {
5596                         new_blk = ext2fs_inode_table_loc(fs, i);
5597                         new_table_block(ctx, first_block, i, _("inode table"),
5598                                         fs->inode_blocks_per_group,
5599                                         &new_blk);
5600                         ext2fs_inode_table_loc_set(fs, i, new_blk);
5601                         ctx->flags |= E2F_FLAG_RESTART;
5602                 }
5603         }
5604         ctx->invalid_bitmaps = 0;
5605 }
5606
5607 /*
5608  * This routine marks all blocks which are used by the superblock,
5609  * group descriptors, inode bitmaps, and block bitmaps.
5610  */
5611 static void mark_table_blocks(e2fsck_t ctx)
5612 {
5613         ext2_filsys fs = ctx->fs;
5614         blk64_t b;
5615         dgrp_t  i;
5616         unsigned int    j;
5617         struct problem_context pctx;
5618
5619         clear_problem_context(&pctx);
5620
5621         for (i = 0; i < fs->group_desc_count; i++) {
5622                 pctx.group = i;
5623
5624                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_found_map);
5625                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_metadata_map);
5626
5627                 /*
5628                  * Mark the blocks used for the inode table
5629                  */
5630                 if (ext2fs_inode_table_loc(fs, i)) {
5631                         for (j = 0, b = ext2fs_inode_table_loc(fs, i);
5632                              j < fs->inode_blocks_per_group;
5633                              j++, b++) {
5634                                 if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5635                                                              b)) {
5636                                         pctx.blk = b;
5637                                         if (!ctx->invalid_inode_table_flag[i] &&
5638                                             fix_problem(ctx,
5639                                                 PR_1_ITABLE_CONFLICT, &pctx)) {
5640                                                 ctx->invalid_inode_table_flag[i]++;
5641                                                 ctx->invalid_bitmaps++;
5642                                         }
5643                                 } else {
5644                                     ext2fs_mark_block_bitmap2(
5645                                                 ctx->block_found_map, b);
5646                                     ext2fs_mark_block_bitmap2(
5647                                                 ctx->block_metadata_map, b);
5648                                 }
5649                         }
5650                 }
5651
5652                 /*
5653                  * Mark block used for the block bitmap
5654                  */
5655                 if (ext2fs_block_bitmap_loc(fs, i)) {
5656                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5657                                      ext2fs_block_bitmap_loc(fs, i))) {
5658                                 pctx.blk = ext2fs_block_bitmap_loc(fs, i);
5659                                 if (fix_problem(ctx, PR_1_BB_CONFLICT, &pctx)) {
5660                                         ctx->invalid_block_bitmap_flag[i]++;
5661                                         ctx->invalid_bitmaps++;
5662                                 }
5663                         } else {
5664                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5665                                      ext2fs_block_bitmap_loc(fs, i));
5666                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5667                                      ext2fs_block_bitmap_loc(fs, i));
5668                         }
5669                 }
5670                 /*
5671                  * Mark block used for the inode bitmap
5672                  */
5673                 if (ext2fs_inode_bitmap_loc(fs, i)) {
5674                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5675                                      ext2fs_inode_bitmap_loc(fs, i))) {
5676                                 pctx.blk = ext2fs_inode_bitmap_loc(fs, i);
5677                                 if (fix_problem(ctx, PR_1_IB_CONFLICT, &pctx)) {
5678                                         ctx->invalid_inode_bitmap_flag[i]++;
5679                                         ctx->invalid_bitmaps++;
5680                                 }
5681                         } else {
5682                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5683                                      ext2fs_inode_bitmap_loc(fs, i));
5684                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5685                                      ext2fs_inode_bitmap_loc(fs, i));
5686                         }
5687                 }
5688         }
5689 }
5690
/*
 * These subroutines short-circuit ext2fs_get_blocks and
 * ext2fs_check_directory; we use them since we already have the inode
 * structure, so there's no point in letting the ext2fs library read
 * the inode again.
 */
5697 static errcode_t pass1_get_blocks(ext2_filsys fs, ext2_ino_t ino,
5698                                   blk_t *blocks)
5699 {
5700         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5701         int     i;
5702
5703         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5704                 return EXT2_ET_CALLBACK_NOTHANDLED;
5705
5706         for (i=0; i < EXT2_N_BLOCKS; i++)
5707                 blocks[i] = ctx->stashed_inode->i_block[i];
5708         return 0;
5709 }
5710
5711 static errcode_t pass1_read_inode(ext2_filsys fs, ext2_ino_t ino,
5712                                   struct ext2_inode *inode)
5713 {
5714         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5715
5716         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5717                 return EXT2_ET_CALLBACK_NOTHANDLED;
5718         *inode = *ctx->stashed_inode;
5719         return 0;
5720 }
5721
5722 static errcode_t pass1_write_inode(ext2_filsys fs, ext2_ino_t ino,
5723                             struct ext2_inode *inode)
5724 {
5725         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5726
5727         if ((ino == ctx->stashed_ino) && ctx->stashed_inode &&
5728                 (inode != ctx->stashed_inode))
5729                 *ctx->stashed_inode = *inode;
5730         return EXT2_ET_CALLBACK_NOTHANDLED;
5731 }
5732
5733 static errcode_t pass1_check_directory(ext2_filsys fs, ext2_ino_t ino)
5734 {
5735         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5736
5737         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5738                 return EXT2_ET_CALLBACK_NOTHANDLED;
5739
5740         if (!LINUX_S_ISDIR(ctx->stashed_inode->i_mode))
5741                 return EXT2_ET_NO_DIRECTORY;
5742         return 0;
5743 }
5744
5745 static errcode_t e2fsck_get_alloc_block(ext2_filsys fs, blk64_t goal,
5746                                         blk64_t *ret)
5747 {
5748         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5749         errcode_t       retval;
5750         blk64_t         new_block;
5751
5752         if (ctx->block_found_map) {
5753                 retval = ext2fs_new_block2(fs, goal, ctx->block_found_map,
5754                                            &new_block);
5755                 if (retval)
5756                         return retval;
5757                 if (fs->block_map) {
5758                         ext2fs_mark_block_bitmap2(fs->block_map, new_block);
5759                         ext2fs_mark_bb_dirty(fs);
5760                 }
5761         } else {
5762                 if (!fs->block_map) {
5763                         retval = ext2fs_read_block_bitmap(fs);
5764                         if (retval)
5765                                 return retval;
5766                 }
5767
5768                 retval = ext2fs_new_block2(fs, goal, fs->block_map, &new_block);
5769                 if (retval)
5770                         return retval;
5771         }
5772
5773         *ret = new_block;
5774         return (0);
5775 }
5776
5777 static errcode_t e2fsck_new_range(ext2_filsys fs, int flags, blk64_t goal,
5778                                   blk64_t len, blk64_t *pblk, blk64_t *plen)
5779 {
5780         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5781         errcode_t       retval;
5782
5783         if (ctx->block_found_map)
5784                 return ext2fs_new_range(fs, flags, goal, len,
5785                                         ctx->block_found_map, pblk, plen);
5786
5787         if (!fs->block_map) {
5788                 retval = ext2fs_read_block_bitmap(fs);
5789                 if (retval)
5790                         return retval;
5791         }
5792
5793         return ext2fs_new_range(fs, flags, goal, len, fs->block_map,
5794                                 pblk, plen);
5795 }
5796
5797 static void e2fsck_block_alloc_stats(ext2_filsys fs, blk64_t blk, int inuse)
5798 {
5799         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5800
5801         /* Never free a critical metadata block */
5802         if (ctx->block_found_map &&
5803             ctx->block_metadata_map &&
5804             inuse < 0 &&
5805             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk))
5806                 return;
5807
5808         if (ctx->block_found_map) {
5809                 if (inuse > 0)
5810                         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5811                 else
5812                         ext2fs_unmark_block_bitmap2(ctx->block_found_map, blk);
5813         }
5814 }
5815
5816 static void e2fsck_block_alloc_stats_range(ext2_filsys fs, blk64_t blk,
5817                                            blk_t num, int inuse)
5818 {
5819         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5820
5821         /* Never free a critical metadata block */
5822         if (ctx->block_found_map &&
5823             ctx->block_metadata_map &&
5824             inuse < 0 &&
5825             ext2fs_test_block_bitmap_range2(ctx->block_metadata_map, blk, num))
5826                 return;
5827
5828         if (ctx->block_found_map) {
5829                 if (inuse > 0)
5830                         ext2fs_mark_block_bitmap_range2(ctx->block_found_map,
5831                                                         blk, num);
5832                 else
5833                         ext2fs_unmark_block_bitmap_range2(ctx->block_found_map,
5834                                                         blk, num);
5835         }
5836 }
5837
5838 void e2fsck_use_inode_shortcuts(e2fsck_t ctx, int use_shortcuts)
5839 {
5840         ext2_filsys fs = ctx->fs;
5841
5842         if (use_shortcuts) {
5843                 fs->get_blocks = pass1_get_blocks;
5844                 fs->check_directory = pass1_check_directory;
5845                 fs->read_inode = pass1_read_inode;
5846                 fs->write_inode = pass1_write_inode;
5847                 ctx->stashed_ino = 0;
5848         } else {
5849                 fs->get_blocks = 0;
5850                 fs->check_directory = 0;
5851                 fs->read_inode = 0;
5852                 fs->write_inode = 0;
5853         }
5854 }
5855
5856 void e2fsck_intercept_block_allocations(e2fsck_t ctx)
5857 {
5858         ext2fs_set_alloc_block_callback(ctx->fs, e2fsck_get_alloc_block, 0);
5859         ext2fs_set_block_alloc_stats_callback(ctx->fs,
5860                                                 e2fsck_block_alloc_stats, 0);
5861         ext2fs_set_new_range_callback(ctx->fs, e2fsck_new_range, NULL);
5862         ext2fs_set_block_alloc_stats_range_callback(ctx->fs,
5863                                         e2fsck_block_alloc_stats_range, NULL);
5864 }