Whamcloud - gitweb
e2fsck: merge quota context after threads finish
[tools/e2fsprogs.git] / e2fsck / pass1.c
1 /*
2  * pass1.c -- pass #1 of e2fsck: sequential scan of the inode table
3  *
4  * Copyright (C) 1993, 1994, 1995, 1996, 1997 Theodore Ts'o.
5  *
6  * %Begin-Header%
7  * This file may be redistributed under the terms of the GNU Public
8  * License.
9  * %End-Header%
10  *
11  * Pass 1 of e2fsck iterates over all the inodes in the filesystems,
12  * and applies the following tests to each inode:
13  *
14  *      - The mode field of the inode must be legal.
15  *      - The size and block count fields of the inode are correct.
16  *      - A data block must not be used by another inode
17  *
 * Pass 1 also collects the following information:
19  *
20  *      - A bitmap of which inodes are in use.          (inode_used_map)
21  *      - A bitmap of which inodes are directories.     (inode_dir_map)
22  *      - A bitmap of which inodes are regular files.   (inode_reg_map)
23  *      - A bitmap of which inodes have bad fields.     (inode_bad_map)
24  *      - A bitmap of which inodes are in bad blocks.   (inode_bb_map)
25  *      - A bitmap of which inodes are imagic inodes.   (inode_imagic_map)
26  *      - A bitmap of which inodes are casefolded.      (inode_casefold_map)
27  *      - A bitmap of which blocks are in use.          (block_found_map)
28  *      - A bitmap of which blocks are in use by two inodes     (block_dup_map)
29  *      - The data blocks of the directory inodes.      (dir_map)
30  *      - Ref counts for ea_inodes.                     (ea_inode_refs)
31  *      - The encryption policy ID of each encrypted inode. (encrypted_files)
32  *
33  * Pass 1 is designed to stash away enough information so that the
34  * other passes should not need to read in the inode information
35  * during the normal course of a filesystem check.  (Although if an
36  * inconsistency is detected, other passes may need to read in an
37  * inode to fix it.)
38  *
39  * Note that pass 1B will be invoked if there are any duplicate blocks
40  * found.
41  */
42
43 #define _GNU_SOURCE 1 /* get strnlen() */
44 #include "config.h"
45 #include <string.h>
46 #include <time.h>
47 #ifdef HAVE_ERRNO_H
48 #include <errno.h>
49 #endif
50 #include <assert.h>
51 #ifdef HAVE_PTHREAD
52 #include <pthread.h>
53 #endif
54
55 #include "e2fsck.h"
56 #include <ext2fs/ext2_ext_attr.h>
57 /* todo remove this finally */
58 #include <ext2fs/ext2fsP.h>
59 #include <e2p/e2p.h>
60
61 #include "problem.h"
62
63 #ifdef NO_INLINE_FUNCS
64 #define _INLINE_
65 #else
66 #define _INLINE_ inline
67 #endif
68
69 #undef DEBUG
70
/*
 * Quota charge attributed to extended attributes whose values live in
 * separate EA inodes.
 */
struct ea_quota {
        blk64_t blocks;         /* quota blocks charged for EA inode values */
        __u64 inodes;           /* number of EA inode references counted */
};
75
/*
 * Forward declarations of file-local helpers.  Their definitions are
 * not next to these prototypes (presumably further down in this file).
 */
static int process_block(ext2_filsys fs, blk64_t        *blocknr,
                         e2_blkcnt_t blockcnt, blk64_t ref_blk,
                         int ref_offset, void *priv_data);
static int process_bad_block(ext2_filsys fs, blk64_t *block_nr,
                             e2_blkcnt_t blockcnt, blk64_t ref_blk,
                             int ref_offset, void *priv_data);
static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
                         char *block_buf,
                         const struct ea_quota *ea_ibody_quota);
static void mark_table_blocks(e2fsck_t ctx);
static void alloc_bb_map(e2fsck_t ctx);
static void alloc_imagic_map(e2fsck_t ctx);
static void mark_inode_bad(e2fsck_t ctx, ino_t ino);
static void add_casefolded_dir(e2fsck_t ctx, ino_t ino);
static void handle_fs_bad_blocks(e2fsck_t ctx);
static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b);
static errcode_t scan_callback(ext2_filsys fs, ext2_inode_scan scan,
                                  dgrp_t group, void * priv_data);
static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
                                    char *block_buf, int adjust_sign);
/* static char *describe_illegal_block(ext2_filsys fs, blk64_t block); */
97
/*
 * Per-inode state used while walking an inode's blocks.
 * NOTE(review): presumably handed to process_block() and
 * process_bad_block() through their priv_data argument -- confirm
 * against the callers, which are not visible from here.
 */
struct process_block_struct {
        ext2_ino_t      ino;
        /* one-bit status flags describing the inode being walked */
        unsigned        is_dir:1, is_reg:1, clear:1, suppress:1,
                                fragmented:1, compressed:1, bbcheck:1,
                                inode_modified:1;
        blk64_t         num_blocks;
        blk64_t         max_blocks;
        blk64_t         last_block;
        e2_blkcnt_t     last_init_lblock;
        e2_blkcnt_t     last_db_block;
        int             num_illegal_blocks;
        blk64_t         previous_block;
        struct ext2_inode *inode;
        struct problem_context *pctx;
        ext2fs_block_bitmap fs_meta_blocks;
        e2fsck_t        ctx;
        blk64_t         next_lblock;
        struct extent_tree_info eti;
};
117
/*
 * An inode queued for later processing: its number, the in-inode EA
 * quota already computed for it, and a copy of the (large) inode.
 */
struct process_inode_block {
        ext2_ino_t ino;
        struct ea_quota ea_ibody_quota;
        struct ext2_inode_large inode;
};
123
/*
 * Bundle of the arguments that process_inodes() takes.
 * NOTE(review): presumably passed as priv_data to scan_callback() --
 * confirm at the registration site.
 */
struct scan_callback_struct {
        e2fsck_t                         ctx;
        char                            *block_buf;
        struct process_inode_block      *inodes_to_process;
        int                             *process_inode_count;
};
130
/* Forward declaration; takes the same fields as scan_callback_struct. */
static void process_inodes(e2fsck_t ctx, char *block_buf,
                           struct process_inode_block *inodes_to_process,
                           int *process_inode_count);

/*
 * One slot per block log size from EXT2_MIN_BLOCK_LOG_SIZE through
 * EXT2_MAX_BLOCK_LOG_SIZE inclusive.
 * NOTE(review): presumably the maximum file size for each block size --
 * confirm where the table is filled in.
 */
static __u64 ext2_max_sizes[EXT2_MAX_BLOCK_LOG_SIZE -
                            EXT2_MIN_BLOCK_LOG_SIZE + 1];
137
138 /*
139  * Check to make sure a device inode is real.  Returns 1 if the device
140  * checks out, 0 if not.
141  *
142  * Note: this routine is now also used to check FIFO's and Sockets,
143  * since they have the same requirement; the i_block fields should be
144  * zero.
145  */
146 int e2fsck_pass1_check_device_inode(ext2_filsys fs EXT2FS_ATTR((unused)),
147                                     struct ext2_inode *inode)
148 {
149         int     i;
150
151         /*
152          * If the index or extents flag is set, then this is a bogus
153          * device/fifo/socket
154          */
155         if (inode->i_flags & (EXT2_INDEX_FL | EXT4_EXTENTS_FL))
156                 return 0;
157
158         /*
159          * We should be able to do the test below all the time, but
160          * because the kernel doesn't forcibly clear the device
161          * inode's additional i_block fields, there are some rare
162          * occasions when a legitimate device inode will have non-zero
163          * additional i_block fields.  So for now, we only complain
164          * when the immutable flag is set, which should never happen
165          * for devices.  (And that's when the problem is caused, since
166          * you can't set or clear immutable flags for devices.)  Once
167          * the kernel has been fixed we can change this...
168          */
169         if (inode->i_flags & (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)) {
170                 for (i=4; i < EXT2_N_BLOCKS; i++)
171                         if (inode->i_block[i])
172                                 return 0;
173         }
174         return 1;
175 }
176
177 /*
178  * Check to make sure a symlink inode is real.  Returns 1 if the symlink
179  * checks out, 0 if not.
180  */
181 int e2fsck_pass1_check_symlink(ext2_filsys fs, ext2_ino_t ino,
182                                struct ext2_inode *inode, char *buf)
183 {
184         unsigned int buflen;
185         unsigned int len;
186
187         if ((inode->i_size_high || inode->i_size == 0) ||
188             (inode->i_flags & EXT2_INDEX_FL))
189                 return 0;
190
191         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
192                 size_t inline_size;
193
194                 if (inode->i_flags & EXT4_EXTENTS_FL)
195                         return 0;
196                 if (ext2fs_inline_data_size(fs, ino, &inline_size))
197                         return 0;
198                 if (inode->i_size != inline_size)
199                         return 0;
200
201                 return 1;
202         }
203
204         if (ext2fs_is_fast_symlink(inode)) {
205                 if (inode->i_flags & EXT4_EXTENTS_FL)
206                         return 0;
207                 buf = (char *)inode->i_block;
208                 buflen = sizeof(inode->i_block);
209         } else {
210                 ext2_extent_handle_t    handle;
211                 struct ext2_extent_info info;
212                 struct ext2fs_extent    extent;
213                 blk64_t blk;
214                 int i;
215
216                 if (inode->i_flags & EXT4_EXTENTS_FL) {
217                         if (ext2fs_extent_open2(fs, ino, inode, &handle))
218                                 return 0;
219                         if (ext2fs_extent_get_info(handle, &info) ||
220                             (info.num_entries != 1) ||
221                             (info.max_depth != 0)) {
222                                 ext2fs_extent_free(handle);
223                                 return 0;
224                         }
225                         if (ext2fs_extent_get(handle, EXT2_EXTENT_ROOT,
226                                               &extent) ||
227                             (extent.e_lblk != 0) ||
228                             (extent.e_len != 1)) {
229                                 ext2fs_extent_free(handle);
230                                 return 0;
231                         }
232                         blk = extent.e_pblk;
233                         ext2fs_extent_free(handle);
234                 } else {
235                         blk = inode->i_block[0];
236
237                         for (i = 1; i < EXT2_N_BLOCKS; i++)
238                                 if (inode->i_block[i])
239                                         return 0;
240                 }
241
242                 if (blk < fs->super->s_first_data_block ||
243                     blk >= ext2fs_blocks_count(fs->super))
244                         return 0;
245
246                 if (io_channel_read_blk64(fs->io, blk, 1, buf))
247                         return 0;
248
249                 buflen = fs->blocksize;
250         }
251
252         if (inode->i_flags & EXT4_ENCRYPT_FL)
253                 len = ext2fs_le16_to_cpu(*(__u16 *)buf) + 2;
254         else
255                 len = strnlen(buf, buflen);
256
257         if (len >= buflen)
258                 return 0;
259
260         if (len != inode->i_size)
261                 return 0;
262         return 1;
263 }
264
265 /*
266  * If the extents or inlinedata flags are set on the inode, offer to clear 'em.
267  */
268 #define BAD_SPECIAL_FLAGS (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)
269 static void check_extents_inlinedata(e2fsck_t ctx,
270                                      struct problem_context *pctx)
271 {
272         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
273                 return;
274
275         if (!fix_problem(ctx, PR_1_SPECIAL_EXTENTS_IDATA, pctx))
276                 return;
277
278         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
279         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
280 }
281 #undef BAD_SPECIAL_FLAGS
282
283 /*
284  * If the immutable (or append-only) flag is set on the inode, offer
285  * to clear it.
286  */
287 #define BAD_SPECIAL_FLAGS (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)
288 static void check_immutable(e2fsck_t ctx, struct problem_context *pctx)
289 {
290         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
291                 return;
292
293         if (!fix_problem(ctx, PR_1_SET_IMMUTABLE, pctx))
294                 return;
295
296         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
297         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
298 }
299
300 /*
301  * If device, fifo or socket, check size is zero -- if not offer to
302  * clear it
303  */
304 static void check_size(e2fsck_t ctx, struct problem_context *pctx)
305 {
306         struct ext2_inode *inode = pctx->inode;
307
308         if (EXT2_I_SIZE(inode) == 0)
309                 return;
310
311         if (!fix_problem(ctx, PR_1_SET_NONZSIZE, pctx))
312                 return;
313
314         ext2fs_inode_size_set(ctx->fs, inode, 0);
315         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
316 }
317
318 /*
319  * For a given size, calculate how many blocks would be charged towards quota.
320  */
321 static blk64_t size_to_quota_blocks(ext2_filsys fs, size_t size)
322 {
323         blk64_t clusters;
324
325         clusters = DIV_ROUND_UP(size, fs->blocksize << fs->cluster_ratio_bits);
326         return EXT2FS_C2B(fs, clusters);
327 }
328
329 /*
330  * Check validity of EA inode. Return 0 if EA inode is valid, otherwise return
331  * the problem code.
332  */
333 static problem_t check_large_ea_inode(e2fsck_t ctx,
334                                       struct ext2_ext_attr_entry *entry,
335                                       struct problem_context *pctx,
336                                       blk64_t *quota_blocks)
337 {
338         struct ext2_inode inode;
339         __u32 hash;
340         errcode_t retval;
341
342         /* Check if inode is within valid range */
343         if ((entry->e_value_inum < EXT2_FIRST_INODE(ctx->fs->super)) ||
344             (entry->e_value_inum > ctx->fs->super->s_inodes_count)) {
345                 pctx->num = entry->e_value_inum;
346                 return PR_1_ATTR_VALUE_EA_INODE;
347         }
348
349         e2fsck_read_inode(ctx, entry->e_value_inum, &inode, "pass1");
350
351         retval = ext2fs_ext_attr_hash_entry2(ctx->fs, entry, NULL, &hash);
352         if (retval) {
353                 com_err("check_large_ea_inode", retval,
354                         _("while hashing entry with e_value_inum = %u"),
355                         entry->e_value_inum);
356                 fatal_error(ctx, 0);
357         }
358
359         if (hash == entry->e_hash) {
360                 *quota_blocks = size_to_quota_blocks(ctx->fs,
361                                                      entry->e_value_size);
362         } else {
363                 /* This might be an old Lustre-style ea_inode reference. */
364                 if (inode.i_mtime == pctx->ino &&
365                     inode.i_generation == pctx->inode->i_generation) {
366                         *quota_blocks = 0;
367                 } else {
368                         /* If target inode is also missing EA_INODE flag,
369                          * this is likely to be a bad reference.
370                          */
371                         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
372                                 pctx->num = entry->e_value_inum;
373                                 return PR_1_ATTR_VALUE_EA_INODE;
374                         } else {
375                                 pctx->num = entry->e_hash;
376                                 return PR_1_ATTR_HASH;
377                         }
378                 }
379         }
380
381         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
382                 pctx->num = entry->e_value_inum;
383                 if (fix_problem(ctx, PR_1_ATTR_SET_EA_INODE_FL, pctx)) {
384                         inode.i_flags |= EXT4_EA_INODE_FL;
385                         ext2fs_write_inode(ctx->fs, entry->e_value_inum,
386                                            &inode);
387                 } else {
388                         return PR_1_ATTR_NO_EA_INODE_FL;
389                 }
390         }
391         return 0;
392 }
393
394 static void inc_ea_inode_refs(e2fsck_t ctx, struct problem_context *pctx,
395                               struct ext2_ext_attr_entry *first, void *end)
396 {
397         struct ext2_ext_attr_entry *entry = first;
398         struct ext2_ext_attr_entry *np = EXT2_EXT_ATTR_NEXT(entry);
399
400         while ((void *) entry < end && (void *) np < end &&
401                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
402                 if (!entry->e_value_inum)
403                         goto next;
404                 if (!ctx->ea_inode_refs) {
405                         pctx->errcode = ea_refcount_create(0,
406                                                            &ctx->ea_inode_refs);
407                         if (pctx->errcode) {
408                                 pctx->num = 4;
409                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
410                                 ctx->flags |= E2F_FLAG_ABORT;
411                                 return;
412                         }
413                 }
414                 ea_refcount_increment(ctx->ea_inode_refs, entry->e_value_inum,
415                                       0);
416         next:
417                 entry = np;
418                 np = EXT2_EXT_ATTR_NEXT(entry);
419         }
420 }
421
/*
 * Validate the extended attributes stored in the inode body, i.e. in
 * the space after the fixed inode fields and i_extra_isize.
 *
 * Each entry is checked for overlapping regions, a name and value that
 * fit in the remaining space, and a matching hash; entries whose value
 * lives in a separate EA inode are checked by check_large_ea_inode()
 * and charged to *ea_ibody_quota.
 *
 * If no problem is found, or the user declines the fix, EA inode
 * references are counted via inc_ea_inode_refs().  If a problem is
 * found and the fix is accepted, the word at the start of the EA area
 * is zeroed (dropping all in-inode EAs), the inode is written back and
 * the quota is reset to zero.
 */
static void check_ea_in_inode(e2fsck_t ctx, struct problem_context *pctx,
                              struct ea_quota *ea_ibody_quota)
{
        struct ext2_super_block *sb = ctx->fs->super;
        struct ext2_inode_large *inode;
        struct ext2_ext_attr_entry *entry;
        char *start, *header, *end;
        unsigned int storage_size, remain;
        problem_t problem = 0;
        region_t region = 0;

        ea_ibody_quota->blocks = 0;
        ea_ibody_quota->inodes = 0;

        inode = (struct ext2_inode_large *) pctx->inode;
        /* bytes available for EAs after the fixed and extra inode fields */
        storage_size = EXT2_INODE_SIZE(ctx->fs->super) - EXT2_GOOD_OLD_INODE_SIZE -
                inode->i_extra_isize;
        header = ((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
                 inode->i_extra_isize;
        end = header + storage_size;
        /* entries begin right after the leading 32-bit word */
        start = header + sizeof(__u32);
        entry = (struct ext2_ext_attr_entry *) start;

        /* scan all entry's headers first */

        /* take finish entry 0UL into account */
        remain = storage_size - sizeof(__u32);

        /* the region tracks which byte ranges of the EA area are claimed */
        region = region_create(0, storage_size);
        if (!region) {
                fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
                problem = 0;
                ctx->flags |= E2F_FLAG_ABORT;
                return;
        }
        /* claim the leading 32-bit word itself */
        if (region_allocate(region, 0, sizeof(__u32))) {
                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                goto fix;
        }

        while (remain >= sizeof(struct ext2_ext_attr_entry) &&
               !EXT2_EXT_IS_LAST_ENTRY(entry)) {
                __u32 hash;

                /* claim the entry header plus its name */
                if (region_allocate(region, (char *)entry - (char *)header,
                                    EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
                        problem = PR_1_INODE_EA_ALLOC_COLLISION;
                        goto fix;
                }

                /* header eats this space */
                remain -= sizeof(struct ext2_ext_attr_entry);

                /* is attribute name valid? */
                if (EXT2_EXT_ATTR_SIZE(entry->e_name_len) > remain) {
                        pctx->num = entry->e_name_len;
                        problem = PR_1_ATTR_NAME_LEN;
                        goto fix;
                }

                /* attribute len eats this space */
                remain -= EXT2_EXT_ATTR_SIZE(entry->e_name_len);

                if (entry->e_value_inum == 0) {
                        /* value is stored in the inode body */
                        /* check value size */
                        if (entry->e_value_size > remain) {
                                pctx->num = entry->e_value_size;
                                problem = PR_1_ATTR_VALUE_SIZE;
                                goto fix;
                        }

                        /* e_value_offs is relative to start, hence the + 4 */
                        if (entry->e_value_size &&
                            region_allocate(region,
                                            sizeof(__u32) + entry->e_value_offs,
                                            EXT2_EXT_ATTR_SIZE(
                                                entry->e_value_size))) {
                                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                                goto fix;
                        }

                        hash = ext2fs_ext_attr_hash_entry(entry,
                                                          start + entry->e_value_offs);

                        /* e_hash may be 0 in older inode's ea */
                        if (entry->e_hash != 0 && entry->e_hash != hash) {
                                pctx->num = entry->e_hash;
                                problem = PR_1_ATTR_HASH;
                                goto fix;
                        }
                } else {
                        /* value is stored in a separate EA inode */
                        blk64_t quota_blocks;

                        problem = check_large_ea_inode(ctx, entry, pctx,
                                                       &quota_blocks);
                        if (problem != 0)
                                goto fix;

                        ea_ibody_quota->blocks += quota_blocks;
                        ea_ibody_quota->inodes++;
                }

                /* If EA value is stored in external inode then it does not
                 * consume space here */
                if (entry->e_value_inum == 0)
                        remain -= entry->e_value_size;

                entry = EXT2_EXT_ATTR_NEXT(entry);
        }

        /* claim the 32-bit word at the position where the scan stopped */
        if (region_allocate(region, (char *)entry - (char *)header,
                            sizeof(__u32))) {
                problem = PR_1_INODE_EA_ALLOC_COLLISION;
                goto fix;
        }
fix:
        /* reached on success as well as on every error path above */
        if (region)
                region_free(region);
        /*
         * it seems like a corruption. it's very unlikely we could repair
         * EA(s) in automatic fashion -bzzz
         */
        if (problem == 0 || !fix_problem(ctx, problem, pctx)) {
                /* EAs are kept: count the EA inodes they reference */
                inc_ea_inode_refs(ctx, pctx,
                                  (struct ext2_ext_attr_entry *)start, end);
                return;
        }

        /* simply remove all possible EA(s) */
        *((__u32 *)header) = 0UL;
        e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
                                EXT2_INODE_SIZE(sb), "pass1");
        ea_ibody_quota->blocks = 0;
        ea_ibody_quota->inodes = 0;
}
556
557 static int check_inode_extra_negative_epoch(__u32 xtime, __u32 extra) {
558         return (xtime & (1U << 31)) != 0 &&
559                 (extra & EXT4_EPOCH_MASK) == EXT4_EPOCH_MASK;
560 }
561
562 #define CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, xtime) \
563         check_inode_extra_negative_epoch(inode->i_##xtime, \
564                                          inode->i_##xtime##_extra)
565
/* When today's date is earlier than 2242, we assume that atimes,
 * ctimes, crtimes, and mtimes with years in the range 2310..2378 are
 * actually pre-1970 dates mis-encoded.
 *
 * The value is 2 * 2^32 seconds.  The expansion is parenthesized so
 * that it stays a single operand next to any operator at the use site.
 */
#define EXT4_EXTRA_NEGATIVE_DATE_CUTOFF (2 * (1LL << 32))
571
572 static void check_inode_extra_space(e2fsck_t ctx, struct problem_context *pctx,
573                                     struct ea_quota *ea_ibody_quota)
574 {
575         struct ext2_super_block *sb = ctx->fs->super;
576         struct ext2_inode_large *inode;
577         __u32 *eamagic;
578         int min, max;
579
580         ea_ibody_quota->blocks = 0;
581         ea_ibody_quota->inodes = 0;
582
583         inode = (struct ext2_inode_large *) pctx->inode;
584         if (EXT2_INODE_SIZE(sb) == EXT2_GOOD_OLD_INODE_SIZE) {
585                 /* this isn't large inode. so, nothing to check */
586                 return;
587         }
588
589 #if 0
590         printf("inode #%u, i_extra_size %d\n", pctx->ino,
591                         inode->i_extra_isize);
592 #endif
593         /* i_extra_isize must cover i_extra_isize + i_checksum_hi at least */
594         min = sizeof(inode->i_extra_isize) + sizeof(inode->i_checksum_hi);
595         max = EXT2_INODE_SIZE(sb) - EXT2_GOOD_OLD_INODE_SIZE;
596         /*
597          * For now we will allow i_extra_isize to be 0, but really
598          * implementations should never allow i_extra_isize to be 0
599          */
600         if (inode->i_extra_isize &&
601             (inode->i_extra_isize < min || inode->i_extra_isize > max ||
602              inode->i_extra_isize & 3)) {
603                 if (!fix_problem(ctx, PR_1_EXTRA_ISIZE, pctx))
604                         return;
605                 if (inode->i_extra_isize < min || inode->i_extra_isize > max)
606                         inode->i_extra_isize = sb->s_want_extra_isize;
607                 else
608                         inode->i_extra_isize = (inode->i_extra_isize + 3) & ~3;
609                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
610                                         EXT2_INODE_SIZE(sb), "pass1");
611         }
612
613         /* check if there is no place for an EA header */
614         if (inode->i_extra_isize >= max - sizeof(__u32))
615                 return;
616
617         eamagic = (__u32 *) (((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
618                         inode->i_extra_isize);
619         if (*eamagic == EXT2_EXT_ATTR_MAGIC) {
620                 /* it seems inode has an extended attribute(s) in body */
621                 check_ea_in_inode(ctx, pctx, ea_ibody_quota);
622         }
623
624         /*
625          * If the inode's extended atime (ctime, crtime, mtime) is stored in
626          * the old, invalid format, repair it.
627          */
628         if (((sizeof(time_t) <= 4) ||
629              (((sizeof(time_t) > 4) &&
630                ctx->now < EXT4_EXTRA_NEGATIVE_DATE_CUTOFF))) &&
631             (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime) ||
632              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime) ||
633              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime) ||
634              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))) {
635
636                 if (!fix_problem(ctx, PR_1_EA_TIME_OUT_OF_RANGE, pctx))
637                         return;
638
639                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime))
640                         inode->i_atime_extra &= ~EXT4_EPOCH_MASK;
641                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime))
642                         inode->i_ctime_extra &= ~EXT4_EPOCH_MASK;
643                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime))
644                         inode->i_crtime_extra &= ~EXT4_EPOCH_MASK;
645                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))
646                         inode->i_mtime_extra &= ~EXT4_EPOCH_MASK;
647                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
648                                         EXT2_INODE_SIZE(sb), "pass1");
649         }
650
651 }
652
653 /*
654  * Check to see if the inode might really be a directory, despite i_mode
655  *
656  * This is a lot of complexity for something for which I'm not really
657  * convinced happens frequently in the wild.  If for any reason this
658  * causes any problems, take this code out.
659  * [tytso:20070331.0827EDT]
660  */
661 static void check_is_really_dir(e2fsck_t ctx, struct problem_context *pctx,
662                                 char *buf)
663 {
664         struct ext2_inode *inode = pctx->inode;
665         struct ext2_dir_entry   *dirent;
666         errcode_t               retval;
667         blk64_t                 blk;
668         unsigned int            i, rec_len, not_device = 0;
669         int                     extent_fs;
670         int                     inlinedata_fs;
671
672         /*
673          * If the mode looks OK, we believe it.  If the first block in
674          * the i_block array is 0, this cannot be a directory. If the
675          * inode is extent-mapped, it is still the case that the latter
676          * cannot be 0 - the magic number in the extent header would make
677          * it nonzero.
678          */
679         if (LINUX_S_ISDIR(inode->i_mode) || LINUX_S_ISREG(inode->i_mode) ||
680             LINUX_S_ISLNK(inode->i_mode) || inode->i_block[0] == 0)
681                 return;
682
683         /* 
684          * Check the block numbers in the i_block array for validity:
685          * zero blocks are skipped (but the first one cannot be zero -
686          * see above), other blocks are checked against the first and
687          * max data blocks (from the the superblock) and against the
688          * block bitmap. Any invalid block found means this cannot be
689          * a directory.
690          * 
691          * If there are non-zero blocks past the fourth entry, then
692          * this cannot be a device file: we remember that for the next
693          * check.
694          *
695          * For extent mapped files, we don't do any sanity checking:
696          * just try to get the phys block of logical block 0 and run
697          * with it.
698          *
699          * For inline data files, we just try to get the size of inline
700          * data.  If it's true, we will treat it as a directory.
701          */
702
703         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
704         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
705         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL)) {
706                 size_t size;
707                 __u32 dotdot;
708                 unsigned int rec_len2;
709                 struct ext2_dir_entry de;
710
711                 if (ext2fs_inline_data_size(ctx->fs, pctx->ino, &size))
712                         return;
713                 /*
714                  * If the size isn't a multiple of 4, it's probably not a
715                  * directory??
716                  */
717                 if (size & 3)
718                         return;
719                 /*
720                  * If the first 10 bytes don't look like a directory entry,
721                  * it's probably not a directory.
722                  */
723                 memcpy(&dotdot, inode->i_block, sizeof(dotdot));
724                 memcpy(&de, ((char *)inode->i_block) + EXT4_INLINE_DATA_DOTDOT_SIZE,
725                        EXT2_DIR_REC_LEN(0));
726                 dotdot = ext2fs_le32_to_cpu(dotdot);
727                 de.inode = ext2fs_le32_to_cpu(de.inode);
728                 de.rec_len = ext2fs_le16_to_cpu(de.rec_len);
729                 ext2fs_get_rec_len(ctx->fs, &de, &rec_len2);
730                 if (dotdot >= ctx->fs->super->s_inodes_count ||
731                     (dotdot < EXT2_FIRST_INO(ctx->fs->super) &&
732                      dotdot != EXT2_ROOT_INO) ||
733                     de.inode >= ctx->fs->super->s_inodes_count ||
734                     (de.inode < EXT2_FIRST_INO(ctx->fs->super) &&
735                      de.inode != 0) ||
736                     rec_len2 > EXT4_MIN_INLINE_DATA_SIZE -
737                               EXT4_INLINE_DATA_DOTDOT_SIZE)
738                         return;
739                 /* device files never have a "system.data" entry */
740                 goto isdir;
741         } else if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) {
742                 /* extent mapped */
743                 if  (ext2fs_bmap2(ctx->fs, pctx->ino, inode, 0, 0, 0, 0,
744                                  &blk))
745                         return;
746                 /* device files are never extent mapped */
747                 not_device++;
748         } else {
749                 for (i=0; i < EXT2_N_BLOCKS; i++) {
750                         blk = inode->i_block[i];
751                         if (!blk)
752                                 continue;
753                         if (i >= 4)
754                                 not_device++;
755
756                         if (blk < ctx->fs->super->s_first_data_block ||
757                             blk >= ext2fs_blocks_count(ctx->fs->super) ||
758                             ext2fs_fast_test_block_bitmap2(ctx->block_found_map,
759                                                            blk))
760                                 return; /* Invalid block, can't be dir */
761                 }
762                 blk = inode->i_block[0];
763         }
764
765         /*
766          * If the mode says this is a device file and the i_links_count field
767          * is sane and we have not ruled it out as a device file previously,
768          * we declare it a device file, not a directory.
769          */
770         if ((LINUX_S_ISCHR(inode->i_mode) || LINUX_S_ISBLK(inode->i_mode)) &&
771             (inode->i_links_count == 1) && !not_device)
772                 return;
773
774         /* read the first block */
775         ehandler_operation(_("reading directory block"));
776         retval = ext2fs_read_dir_block4(ctx->fs, blk, buf, 0, pctx->ino);
777         ehandler_operation(0);
778         if (retval)
779                 return;
780
781         dirent = (struct ext2_dir_entry *) buf;
782         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
783         if (retval)
784                 return;
785         if ((ext2fs_dirent_name_len(dirent) != 1) ||
786             (dirent->name[0] != '.') ||
787             (dirent->inode != pctx->ino) ||
788             (rec_len < 12) ||
789             (rec_len % 4) ||
790             (rec_len >= ctx->fs->blocksize - 12))
791                 return;
792
793         dirent = (struct ext2_dir_entry *) (buf + rec_len);
794         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
795         if (retval)
796                 return;
797         if ((ext2fs_dirent_name_len(dirent) != 2) ||
798             (dirent->name[0] != '.') ||
799             (dirent->name[1] != '.') ||
800             (rec_len < 12) ||
801             (rec_len % 4))
802                 return;
803
804 isdir:
805         if (fix_problem(ctx, PR_1_TREAT_AS_DIRECTORY, pctx)) {
806                 inode->i_mode = (inode->i_mode & 07777) | LINUX_S_IFDIR;
807                 e2fsck_write_inode_full(ctx, pctx->ino, inode,
808                                         EXT2_INODE_SIZE(ctx->fs->super),
809                                         "check_is_really_dir");
810         }
811 }
812
813 extern errcode_t e2fsck_setup_icount(e2fsck_t ctx, const char *icount_name,
814                                      int flags, ext2_icount_t hint,
815                                      ext2_icount_t *ret)
816 {
817         unsigned int            threshold;
818         unsigned int            save_type;
819         ext2_ino_t              num_dirs;
820         errcode_t               retval;
821         char                    *tdb_dir;
822         int                     enable;
823
824         *ret = 0;
825
826         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
827                            &tdb_dir);
828         profile_get_uint(ctx->profile, "scratch_files",
829                          "numdirs_threshold", 0, 0, &threshold);
830         profile_get_boolean(ctx->profile, "scratch_files",
831                             "icount", 0, 1, &enable);
832
833         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
834         if (retval)
835                 num_dirs = 1024;        /* Guess */
836
837         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
838             (!threshold || num_dirs > threshold)) {
839                 retval = ext2fs_create_icount_tdb(ctx->fs, tdb_dir,
840                                                   flags, ret);
841                 if (retval == 0)
842                         return 0;
843         }
844         e2fsck_set_bitmap_type(ctx->fs, EXT2FS_BMAP64_RBTREE, icount_name,
845                                &save_type);
846         if (ctx->options & E2F_OPT_ICOUNT_FULLMAP)
847                 flags |= EXT2_ICOUNT_OPT_FULLMAP;
848         retval = ext2fs_create_icount2(ctx->fs, flags, 0, hint, ret);
849         ctx->fs->default_bitmap_type = save_type;
850         return retval;
851 }
852
853 static errcode_t recheck_bad_inode_checksum(ext2_filsys fs, ext2_ino_t ino,
854                                             e2fsck_t ctx,
855                                             struct problem_context *pctx)
856 {
857         errcode_t retval;
858         struct ext2_inode_large inode;
859
860         /*
861          * Reread inode.  If we don't see checksum error, then this inode
862          * has been fixed elsewhere.
863          */
864         ctx->stashed_ino = 0;
865         retval = ext2fs_read_inode_full(fs, ino, (struct ext2_inode *)&inode,
866                                         sizeof(inode));
867         if (retval && retval != EXT2_ET_INODE_CSUM_INVALID)
868                 return retval;
869         if (!retval)
870                 return 0;
871
872         /*
873          * Checksum still doesn't match.  That implies that the inode passes
874          * all the sanity checks, so maybe the checksum is simply corrupt.
875          * See if the user will go for fixing that.
876          */
877         if (!fix_problem(ctx, PR_1_INODE_ONLY_CSUM_INVALID, pctx))
878                 return 0;
879
880         retval = ext2fs_write_inode_full(fs, ino, (struct ext2_inode *)&inode,
881                                          sizeof(inode));
882         return retval;
883 }
884
885 static void reserve_block_for_root_repair(e2fsck_t ctx)
886 {
887         blk64_t         blk = 0;
888         errcode_t       err;
889         ext2_filsys     fs = ctx->fs;
890
891         ctx->root_repair_block = 0;
892         if (ext2fs_test_inode_bitmap2(ctx->inode_used_map, EXT2_ROOT_INO))
893                 return;
894
895         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
896         if (err)
897                 return;
898         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
899         ctx->root_repair_block = blk;
900 }
901
902 static void reserve_block_for_lnf_repair(e2fsck_t ctx)
903 {
904         blk64_t         blk = 0;
905         errcode_t       err;
906         ext2_filsys     fs = ctx->fs;
907         static const char name[] = "lost+found";
908         ext2_ino_t      ino;
909
910         ctx->lnf_repair_block = 0;
911         if (!ext2fs_lookup(fs, EXT2_ROOT_INO, name, sizeof(name)-1, 0, &ino))
912                 return;
913
914         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
915         if (err)
916                 return;
917         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
918         ctx->lnf_repair_block = blk;
919 }
920
921 static errcode_t get_inline_data_ea_size(ext2_filsys fs, ext2_ino_t ino,
922                                          size_t *sz)
923 {
924         void *p;
925         struct ext2_xattr_handle *handle;
926         errcode_t retval;
927
928         retval = ext2fs_xattrs_open(fs, ino, &handle);
929         if (retval)
930                 return retval;
931
932         retval = ext2fs_xattrs_read(handle);
933         if (retval)
934                 goto err;
935
936         retval = ext2fs_xattr_get(handle, "system.data", &p, sz);
937         if (retval)
938                 goto err;
939         ext2fs_free_mem(&p);
940 err:
941         (void) ext2fs_xattrs_close(&handle);
942         return retval;
943 }
944
945 static void finish_processing_inode(e2fsck_t ctx, ext2_ino_t ino,
946                                     struct problem_context *pctx,
947                                     int failed_csum)
948 {
949         if (!failed_csum)
950                 return;
951
952         /*
953          * If the inode failed the checksum and the user didn't
954          * clear the inode, test the checksum again -- if it still
955          * fails, ask the user if the checksum should be corrected.
956          */
957         pctx->errcode = recheck_bad_inode_checksum(ctx->fs, ino, ctx, pctx);
958         if (pctx->errcode)
959                 ctx->flags |= E2F_FLAG_ABORT;
960 }
/*
 * Run finish_processing_inode() and leave the calling function if that (or
 * anything earlier) has set E2F_FLAG_ABORT in ctx->flags.  The expansion
 * contains a bare "return;", so it can only be used inside functions that
 * return void.
 */
#define FINISH_INODE_LOOP(ctx, ino, pctx, failed_csum)			\
	do {								\
		finish_processing_inode((ctx), (ino), (pctx),		\
					(failed_csum));			\
		if (((ctx)->flags & E2F_FLAG_ABORT) != 0)		\
			return;						\
	} while (0)
967
968 static int could_be_block_map(ext2_filsys fs, struct ext2_inode *inode)
969 {
970         __u32 x;
971         int i;
972
973         for (i = 0; i < EXT2_N_BLOCKS; i++) {
974                 x = inode->i_block[i];
975 #ifdef WORDS_BIGENDIAN
976                 x = ext2fs_swab32(x);
977 #endif
978                 if (x >= ext2fs_blocks_count(fs->super))
979                         return 0;
980         }
981
982         return 1;
983 }
984
985 /*
986  * Figure out what to do with an inode that has both extents and inline data
987  * inode flags set.  Returns -1 if we decide to erase the inode, 0 otherwise.
988  */
989 static int fix_inline_data_extents_file(e2fsck_t ctx,
990                                         ext2_ino_t ino,
991                                         struct ext2_inode *inode,
992                                         int inode_size,
993                                         struct problem_context *pctx)
994 {
995         size_t max_inline_ea_size;
996         ext2_filsys fs = ctx->fs;
997         int dirty = 0;
998
999         /* Both feature flags not set?  Just run the regular checks */
1000         if (!ext2fs_has_feature_extents(fs->super) &&
1001             !ext2fs_has_feature_inline_data(fs->super))
1002                 return 0;
1003
1004         /* Clear both flags if it's a special file */
1005         if (LINUX_S_ISCHR(inode->i_mode) ||
1006             LINUX_S_ISBLK(inode->i_mode) ||
1007             LINUX_S_ISFIFO(inode->i_mode) ||
1008             LINUX_S_ISSOCK(inode->i_mode)) {
1009                 check_extents_inlinedata(ctx, pctx);
1010                 return 0;
1011         }
1012
1013         /* If it looks like an extent tree, try to clear inlinedata */
1014         if (ext2fs_extent_header_verify(inode->i_block,
1015                                  sizeof(inode->i_block)) == 0 &&
1016             fix_problem(ctx, PR_1_CLEAR_INLINE_DATA_FOR_EXTENT, pctx)) {
1017                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1018                 dirty = 1;
1019                 goto out;
1020         }
1021
1022         /* If it looks short enough to be inline data, try to clear extents */
1023         if (inode_size > EXT2_GOOD_OLD_INODE_SIZE)
1024                 max_inline_ea_size = inode_size -
1025                                      (EXT2_GOOD_OLD_INODE_SIZE +
1026                                       ((struct ext2_inode_large *)inode)->i_extra_isize);
1027         else
1028                 max_inline_ea_size = 0;
1029         if (EXT2_I_SIZE(inode) <
1030             EXT4_MIN_INLINE_DATA_SIZE + max_inline_ea_size &&
1031             fix_problem(ctx, PR_1_CLEAR_EXTENT_FOR_INLINE_DATA, pctx)) {
1032                 inode->i_flags &= ~EXT4_EXTENTS_FL;
1033                 dirty = 1;
1034                 goto out;
1035         }
1036
1037         /*
1038          * Too big for inline data, but no evidence of extent tree -
1039          * maybe it's a block map file?  If the mappings all look valid?
1040          */
1041         if (could_be_block_map(fs, inode) &&
1042             fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_FLAGS, pctx)) {
1043 #ifdef WORDS_BIGENDIAN
1044                 int i;
1045
1046                 for (i = 0; i < EXT2_N_BLOCKS; i++)
1047                         inode->i_block[i] = ext2fs_swab32(inode->i_block[i]);
1048 #endif
1049
1050                 inode->i_flags &= ~(EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL);
1051                 dirty = 1;
1052                 goto out;
1053         }
1054
1055         /* Oh well, just clear the busted inode. */
1056         if (fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_INODE, pctx)) {
1057                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1058                 return -1;
1059         }
1060
1061 out:
1062         if (dirty)
1063                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1064
1065         return 0;
1066 }
1067
1068 static void pass1_readahead(e2fsck_t ctx, dgrp_t *group, ext2_ino_t *next_ino)
1069 {
1070         ext2_ino_t inodes_in_group = 0, inodes_per_block, inodes_per_buffer;
1071         dgrp_t start = *group, grp;
1072         blk64_t blocks_to_read = 0;
1073         errcode_t err = EXT2_ET_INVALID_ARGUMENT;
1074
1075         if (ctx->readahead_kb == 0)
1076                 goto out;
1077
1078         /* Keep iterating groups until we have enough to readahead */
1079         inodes_per_block = EXT2_INODES_PER_BLOCK(ctx->fs->super);
1080         for (grp = start; grp < ctx->fs->group_desc_count; grp++) {
1081                 if (ext2fs_bg_flags_test(ctx->fs, grp, EXT2_BG_INODE_UNINIT))
1082                         continue;
1083                 inodes_in_group = ctx->fs->super->s_inodes_per_group -
1084                                         ext2fs_bg_itable_unused(ctx->fs, grp);
1085                 blocks_to_read += (inodes_in_group + inodes_per_block - 1) /
1086                                         inodes_per_block;
1087                 if (blocks_to_read * ctx->fs->blocksize >
1088                     ctx->readahead_kb * 1024)
1089                         break;
1090         }
1091
1092         err = e2fsck_readahead(ctx->fs, E2FSCK_READA_ITABLE, start,
1093                                grp - start + 1);
1094         if (err == EAGAIN) {
1095                 ctx->readahead_kb /= 2;
1096                 err = 0;
1097         }
1098
1099 out:
1100         if (err) {
1101                 /* Error; disable itable readahead */
1102                 *group = ctx->fs->group_desc_count;
1103                 *next_ino = ctx->fs->super->s_inodes_count;
1104         } else {
1105                 /*
1106                  * Don't do more readahead until we've reached the first inode
1107                  * of the last inode scan buffer block for the last group.
1108                  */
1109                 *group = grp + 1;
1110                 inodes_per_buffer = (ctx->inode_buffer_blocks ?
1111                                      ctx->inode_buffer_blocks :
1112                                      EXT2_INODE_SCAN_DEFAULT_BUFFER_BLOCKS) *
1113                                     ctx->fs->blocksize /
1114                                     EXT2_INODE_SIZE(ctx->fs->super);
1115                 inodes_in_group--;
1116                 *next_ino = inodes_in_group -
1117                             (inodes_in_group % inodes_per_buffer) + 1 +
1118                             (grp * ctx->fs->super->s_inodes_per_group);
1119         }
1120 }
1121
1122 /*
1123  * Check if the passed ino is one of the used superblock quota inodes.
1124  *
1125  * Before the quota inodes were journaled, older superblock quota inodes
1126  * were just regular files in the filesystem and not reserved inodes.  This
1127  * checks if the passed ino is one of the s_*_quota_inum superblock fields,
1128  * which may not always be the same as the EXT4_*_QUOTA_INO fields.
1129  */
1130 static int quota_inum_is_super(struct ext2_super_block *sb, ext2_ino_t ino)
1131 {
1132         enum quota_type qtype;
1133
1134         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1135                 if (*quota_sb_inump(sb, qtype) == ino)
1136                         return 1;
1137
1138         return 0;
1139 }
1140
1141 /*
1142  * Check if the passed ino is one of the reserved quota inodes.
1143  * This checks if the inode number is one of the reserved EXT4_*_QUOTA_INO
1144  * inodes.  These inodes may or may not be in use by the quota feature.
1145  */
1146 static int quota_inum_is_reserved(ext2_filsys fs, ext2_ino_t ino)
1147 {
1148         enum quota_type qtype;
1149
1150         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1151                 if (quota_type2inum(qtype, fs->super) == ino)
1152                         return 1;
1153
1154         return 0;
1155 }
1156
1157 static int e2fsck_should_abort(e2fsck_t ctx)
1158 {
1159         e2fsck_t global_ctx;
1160
1161         if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1162                 return 1;
1163
1164         if (ctx->global_ctx) {
1165                 global_ctx = ctx->global_ctx;
1166                 if (global_ctx->flags & E2F_FLAG_SIGNAL_MASK)
1167                         return 1;
1168         }
1169         return 0;
1170 }
1171
1172 void e2fsck_pass1_run(e2fsck_t ctx)
1173 {
1174         int     i;
1175         ext2_filsys fs = ctx->fs;
1176         ext2_ino_t      ino = 0;
1177         struct ext2_inode *inode = NULL;
1178         ext2_inode_scan scan = NULL;
1179         char            *block_buf = NULL;
1180 #ifdef RESOURCE_TRACK
1181         struct resource_track   rtrack;
1182 #endif
1183         unsigned char   frag, fsize;
1184         struct          problem_context pctx;
1185         struct          scan_callback_struct scan_struct;
1186         struct ext2_super_block *sb = ctx->fs->super;
1187         const char      *old_op;
1188         const char      *eop_next_inode = _("getting next inode from scan");
1189         int             imagic_fs, extent_fs, inlinedata_fs, casefold_fs;
1190         int             low_dtime_check = 1;
1191         unsigned int    inode_size = EXT2_INODE_SIZE(fs->super);
1192         unsigned int    bufsize;
1193         int             failed_csum = 0;
1194         ext2_ino_t      ino_threshold = 0;
1195         dgrp_t          ra_group = 0;
1196         struct ea_quota ea_ibody_quota;
1197         struct process_inode_block *inodes_to_process;
1198         int             process_inode_count;
1199
1200         init_resource_track(&rtrack, ctx->fs->io);
1201         clear_problem_context(&pctx);
1202
1203         /* If we can do readahead, figure out how many groups to pull in. */
1204         if (!e2fsck_can_readahead(ctx->fs))
1205                 ctx->readahead_kb = 0;
1206         else if (ctx->readahead_kb == ~0ULL)
1207                 ctx->readahead_kb = e2fsck_guess_readahead(ctx->fs);
1208         pass1_readahead(ctx, &ra_group, &ino_threshold);
1209
1210         if (!(ctx->options & E2F_OPT_PREEN))
1211                 fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1212
1213         if (ext2fs_has_feature_dir_index(fs->super) &&
1214             !(ctx->options & E2F_OPT_NO)) {
1215                 if (ext2fs_u32_list_create(&ctx->dirs_to_hash, 50))
1216                         ctx->dirs_to_hash = 0;
1217         }
1218
1219 #ifdef MTRACE
1220         mtrace_print("Pass 1");
1221 #endif
1222
1223         imagic_fs = ext2fs_has_feature_imagic_inodes(sb);
1224         extent_fs = ext2fs_has_feature_extents(sb);
1225         inlinedata_fs = ext2fs_has_feature_inline_data(sb);
1226         casefold_fs = ext2fs_has_feature_casefold(sb);
1227
1228         /*
1229          * Allocate bitmaps structures
1230          */
1231         pctx.errcode = e2fsck_allocate_inode_bitmap(fs, _("in-use inode map"),
1232                                                     EXT2FS_BMAP64_RBTREE,
1233                                                     "inode_used_map",
1234                                                     &ctx->inode_used_map);
1235         if (pctx.errcode) {
1236                 pctx.num = 1;
1237                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1238                 ctx->flags |= E2F_FLAG_ABORT;
1239                 return;
1240         }
1241         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1242                         _("directory inode map"),
1243                         ctx->global_ctx ? EXT2FS_BMAP64_RBTREE :
1244                         EXT2FS_BMAP64_AUTODIR,
1245                         "inode_dir_map", &ctx->inode_dir_map);
1246         if (pctx.errcode) {
1247                 pctx.num = 2;
1248                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1249                 ctx->flags |= E2F_FLAG_ABORT;
1250                 return;
1251         }
1252         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1253                         _("regular file inode map"), EXT2FS_BMAP64_RBTREE,
1254                         "inode_reg_map", &ctx->inode_reg_map);
1255         if (pctx.errcode) {
1256                 pctx.num = 6;
1257                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1258                 ctx->flags |= E2F_FLAG_ABORT;
1259                 return;
1260         }
1261         pctx.errcode = e2fsck_allocate_subcluster_bitmap(fs,
1262                         _("in-use block map"), EXT2FS_BMAP64_RBTREE,
1263                         "block_found_map", &ctx->block_found_map);
1264         if (pctx.errcode) {
1265                 pctx.num = 1;
1266                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1267                 ctx->flags |= E2F_FLAG_ABORT;
1268                 return;
1269         }
1270         pctx.errcode = e2fsck_allocate_block_bitmap(fs,
1271                         _("metadata block map"), EXT2FS_BMAP64_RBTREE,
1272                         "block_metadata_map", &ctx->block_metadata_map);
1273         if (pctx.errcode) {
1274                 pctx.num = 1;
1275                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1276                 ctx->flags |= E2F_FLAG_ABORT;
1277                 return;
1278         }
1279         if (casefold_fs) {
1280                 pctx.errcode =
1281                         e2fsck_allocate_inode_bitmap(fs,
1282                                                      _("inode casefold map"),
1283                                                      EXT2FS_BMAP64_RBTREE,
1284                                                      "inode_casefold_map",
1285                                                      &ctx->inode_casefold_map);
1286                 if (pctx.errcode) {
1287                         pctx.num = 1;
1288                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1289                         ctx->flags |= E2F_FLAG_ABORT;
1290                         return;
1291                 }
1292         }
1293         pctx.errcode = e2fsck_setup_icount(ctx, "inode_link_info", 0, NULL,
1294                                            &ctx->inode_link_info);
1295         if (pctx.errcode) {
1296                 fix_problem(ctx, PR_1_ALLOCATE_ICOUNT, &pctx);
1297                 ctx->flags |= E2F_FLAG_ABORT;
1298                 return;
1299         }
1300         bufsize = inode_size;
1301         if (bufsize < sizeof(struct ext2_inode_large))
1302                 bufsize = sizeof(struct ext2_inode_large);
1303         inode = (struct ext2_inode *)
1304                 e2fsck_allocate_memory(ctx, bufsize, "scratch inode");
1305
1306         inodes_to_process = (struct process_inode_block *)
1307                 e2fsck_allocate_memory(ctx,
1308                                        (ctx->process_inode_size *
1309                                         sizeof(struct process_inode_block)),
1310                                        "array of inodes to process");
1311         process_inode_count = 0;
1312
1313         pctx.errcode = ext2fs_init_dblist(fs, 0);
1314         if (pctx.errcode) {
1315                 fix_problem(ctx, PR_1_ALLOCATE_DBCOUNT, &pctx);
1316                 ctx->flags |= E2F_FLAG_ABORT;
1317                 goto endit;
1318         }
1319
1320         /*
1321          * If the last orphan field is set, clear it, since the pass1
1322          * processing will automatically find and clear the orphans.
1323          * In the future, we may want to try using the last_orphan
1324          * linked list ourselves, but for now, we clear it so that the
1325          * ext3 mount code won't get confused.
1326          */
1327         if (!(ctx->options & E2F_OPT_READONLY)) {
1328                 if (fs->super->s_last_orphan) {
1329                         fs->super->s_last_orphan = 0;
1330                         ext2fs_mark_super_dirty(fs);
1331                 }
1332         }
1333
1334         mark_table_blocks(ctx);
1335         pctx.errcode = ext2fs_convert_subcluster_bitmap(fs,
1336                                                 &ctx->block_found_map);
1337         if (pctx.errcode) {
1338                 fix_problem(ctx, PR_1_CONVERT_SUBCLUSTER, &pctx);
1339                 ctx->flags |= E2F_FLAG_ABORT;
1340                 goto endit;
1341         }
1342         block_buf = (char *) e2fsck_allocate_memory(ctx, fs->blocksize * 3,
1343                                                     "block interate buffer");
1344         if (EXT2_INODE_SIZE(fs->super) == EXT2_GOOD_OLD_INODE_SIZE)
1345                 e2fsck_use_inode_shortcuts(ctx, 1);
1346         e2fsck_intercept_block_allocations(ctx);
1347         old_op = ehandler_operation(_("opening inode scan"));
1348         pctx.errcode = ext2fs_open_inode_scan(fs, ctx->inode_buffer_blocks,
1349                                               &scan);
1350         ehandler_operation(old_op);
1351         if (pctx.errcode) {
1352                 fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1353                 ctx->flags |= E2F_FLAG_ABORT;
1354                 goto endit;
1355         }
1356         ext2fs_inode_scan_flags(scan, EXT2_SF_SKIP_MISSING_ITABLE |
1357                                       EXT2_SF_WARN_GARBAGE_INODES, 0);
1358         ctx->stashed_inode = inode;
1359         scan_struct.ctx = ctx;
1360         scan_struct.block_buf = block_buf;
1361         scan_struct.inodes_to_process = inodes_to_process;
1362         scan_struct.process_inode_count = &process_inode_count;
1363         ext2fs_set_inode_callback(scan, scan_callback, &scan_struct);
1364         if (ctx->progress && ((ctx->progress)(ctx, 1, 0,
1365                                               ctx->fs->group_desc_count)))
1366                 goto endit;
1367         if ((fs->super->s_wtime &&
1368              fs->super->s_wtime < fs->super->s_inodes_count) ||
1369             (fs->super->s_mtime &&
1370              fs->super->s_mtime < fs->super->s_inodes_count) ||
1371             (fs->super->s_mkfs_time &&
1372              fs->super->s_mkfs_time < fs->super->s_inodes_count))
1373                 low_dtime_check = 0;
1374
1375         if (ext2fs_has_feature_mmp(fs->super) &&
1376             fs->super->s_mmp_block > fs->super->s_first_data_block &&
1377             fs->super->s_mmp_block < ext2fs_blocks_count(fs->super))
1378                 ext2fs_mark_block_bitmap2(ctx->block_found_map,
1379                                           fs->super->s_mmp_block);
1380
1381         /* Set up ctx->lost_and_found if possible */
1382         (void) e2fsck_get_lost_and_found(ctx, 0);
1383
1384 #ifdef HAVE_PTHREAD
1385         if (ctx->global_ctx) {
1386                 if (ctx->options & E2F_OPT_DEBUG &&
1387                     ctx->options & E2F_OPT_MULTITHREAD)
1388                         fprintf(stderr, "thread %d jumping to group %d\n",
1389                                         ctx->thread_info.et_thread_index,
1390                                         ctx->thread_info.et_group_start);
1391                 pctx.errcode = ext2fs_inode_scan_goto_blockgroup(scan,
1392                                         ctx->thread_info.et_group_start);
1393                 if (pctx.errcode) {
1394                         fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1395                         ctx->flags |= E2F_FLAG_ABORT;
1396                         goto endit;
1397                 }
1398         }
1399 #endif
1400
1401         while (1) {
1402                 if (ino % (fs->super->s_inodes_per_group * 4) == 1) {
1403                         if (e2fsck_mmp_update(fs))
1404                                 fatal_error(ctx, 0);
1405                 }
1406                 old_op = ehandler_operation(eop_next_inode);
1407                 pctx.errcode = ext2fs_get_next_inode_full(scan, &ino,
1408                                                           inode, inode_size);
1409                 if (ino > ino_threshold)
1410                         pass1_readahead(ctx, &ra_group, &ino_threshold);
1411                 ehandler_operation(old_op);
1412                 if (e2fsck_should_abort(ctx))
1413                         goto endit;
1414                 if (pctx.errcode == EXT2_ET_BAD_BLOCK_IN_INODE_TABLE) {
1415                         /*
1416                          * If badblocks says badblocks is bad, offer to clear
1417                          * the list, update the in-core bb list, and restart
1418                          * the inode scan.
1419                          */
1420                         if (ino == EXT2_BAD_INO &&
1421                             fix_problem(ctx, PR_1_BADBLOCKS_IN_BADBLOCKS,
1422                                         &pctx)) {
1423                                 errcode_t err;
1424
1425                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1426                                 ext2fs_badblocks_list_free(ctx->fs->badblocks);
1427                                 ctx->fs->badblocks = NULL;
1428                                 err = ext2fs_read_bb_inode(ctx->fs,
1429                                                         &ctx->fs->badblocks);
1430                                 if (err) {
1431                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1432                                                     &pctx);
1433                                         ctx->flags |= E2F_FLAG_ABORT;
1434                                 } else
1435                                         ctx->flags |= E2F_FLAG_RESTART;
1436                                 goto endit;
1437                         }
1438                         if (!ctx->inode_bb_map)
1439                                 alloc_bb_map(ctx);
1440                         ext2fs_mark_inode_bitmap2(ctx->inode_bb_map, ino);
1441                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1442                         continue;
1443                 }
1444                 if (pctx.errcode == EXT2_ET_SCAN_FINISHED)
1445                         break;
1446                 if (pctx.errcode &&
1447                     pctx.errcode != EXT2_ET_INODE_CSUM_INVALID &&
1448                     pctx.errcode != EXT2_ET_INODE_IS_GARBAGE) {
1449                         fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1450                         ctx->flags |= E2F_FLAG_ABORT;
1451                         goto endit;
1452                 }
1453                 if (!ino)
1454                         break;
1455 #ifdef HAVE_PTHREAD
1456                 if (ctx->global_ctx)
1457                         ctx->thread_info.et_inode_number++;
1458 #endif
1459                 pctx.ino = ino;
1460                 pctx.inode = inode;
1461                 ctx->stashed_ino = ino;
1462
1463                 /* Clear trashed inode? */
1464                 if (pctx.errcode == EXT2_ET_INODE_IS_GARBAGE &&
1465                     inode->i_links_count > 0 &&
1466                     fix_problem(ctx, PR_1_INODE_IS_GARBAGE, &pctx)) {
1467                         pctx.errcode = 0;
1468                         e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1469                 }
1470                 failed_csum = pctx.errcode != 0;
1471
1472                 /*
1473                  * Check for inodes which might have been part of the
1474                  * orphaned inode linked list.  They should have gotten
1475                  * dealt with by now, unless the list had somehow been
1476                  * corrupted.
1477                  *
1478                  * FIXME: In the future, inodes which are still in use
1479                  * (and which are therefore pending truncation) should
1480                  * be handled specially.  Right now we just clear the
1481                  * dtime field, and the normal e2fsck handling of
1482                  * inodes where i_size and the inode blocks are
1483                  * inconsistent is to fix i_size, instead of releasing
1484                  * the extra blocks.  This won't catch the inode that
1485                  * was at the end of the orphan list, but it's better
1486                  * than nothing.  The right answer is that there
1487                  * shouldn't be any bugs in the orphan list handling.  :-)
1488                  */
1489                 if (inode->i_dtime && low_dtime_check &&
1490                     inode->i_dtime < ctx->fs->super->s_inodes_count) {
1491                         if (fix_problem(ctx, PR_1_LOW_DTIME, &pctx)) {
1492                                 inode->i_dtime = inode->i_links_count ?
1493                                         0 : ctx->now;
1494                                 e2fsck_write_inode(ctx, ino, inode,
1495                                                    "pass1");
1496                                 failed_csum = 0;
1497                         }
1498                 }
1499
1500                 if (inode->i_links_count) {
1501                         pctx.errcode = ext2fs_icount_store(ctx->inode_link_info,
1502                                            ino, inode->i_links_count);
1503                         if (pctx.errcode) {
1504                                 pctx.num = inode->i_links_count;
1505                                 fix_problem(ctx, PR_1_ICOUNT_STORE, &pctx);
1506                                 ctx->flags |= E2F_FLAG_ABORT;
1507                                 goto endit;
1508                         }
1509                 } else if ((ino >= EXT2_FIRST_INODE(fs->super)) &&
1510                            !quota_inum_is_reserved(fs, ino)) {
1511                         if (!inode->i_dtime && inode->i_mode) {
1512                                 if (fix_problem(ctx,
1513                                             PR_1_ZERO_DTIME, &pctx)) {
1514                                         inode->i_dtime = ctx->now;
1515                                         e2fsck_write_inode(ctx, ino, inode,
1516                                                            "pass1");
1517                                         failed_csum = 0;
1518                                 }
1519                         }
1520                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1521                         continue;
1522                 }
1523
1524                 if ((inode->i_flags & EXT4_CASEFOLD_FL) &&
1525                     ((!LINUX_S_ISDIR(inode->i_mode) &&
1526                       fix_problem(ctx, PR_1_CASEFOLD_NONDIR, &pctx)) ||
1527                      (!casefold_fs &&
1528                       fix_problem(ctx, PR_1_CASEFOLD_FEATURE, &pctx)))) {
1529                         inode->i_flags &= ~EXT4_CASEFOLD_FL;
1530                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1531                 }
1532
1533                 /* Conflicting inlinedata/extents inode flags? */
1534                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) &&
1535                     (inode->i_flags & EXT4_EXTENTS_FL)) {
1536                         int res = fix_inline_data_extents_file(ctx, ino, inode,
1537                                                                inode_size,
1538                                                                &pctx);
1539                         if (res < 0) {
1540                                 /* skip FINISH_INODE_LOOP */
1541                                 continue;
1542                         }
1543                 }
1544
1545                 /* Test for incorrect inline_data flags settings. */
1546                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && !inlinedata_fs &&
1547                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1548                         size_t size = 0;
1549
1550                         pctx.errcode = get_inline_data_ea_size(fs, ino, &size);
1551                         if (!pctx.errcode &&
1552                             fix_problem(ctx, PR_1_INLINE_DATA_FEATURE, &pctx)) {
1553                                 ext2fs_set_feature_inline_data(sb);
1554                                 ext2fs_mark_super_dirty(fs);
1555                                 inlinedata_fs = 1;
1556                         } else if (fix_problem(ctx, PR_1_INLINE_DATA_SET, &pctx)) {
1557                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1558                                 /* skip FINISH_INODE_LOOP */
1559                                 continue;
1560                         }
1561                 }
1562
1563                 /* Test for inline data flag but no attr */
1564                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && inlinedata_fs &&
1565                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1566                         size_t size = 0;
1567                         errcode_t err;
1568                         int flags;
1569
1570                         flags = fs->flags;
1571                         if (failed_csum)
1572                                 fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
1573                         err = get_inline_data_ea_size(fs, ino, &size);
1574                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
1575                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
1576
1577                         switch (err) {
1578                         case 0:
1579                                 /* Everything is awesome... */
1580                                 break;
1581                         case EXT2_ET_BAD_EA_BLOCK_NUM:
1582                         case EXT2_ET_BAD_EA_HASH:
1583                         case EXT2_ET_BAD_EA_HEADER:
1584                         case EXT2_ET_EA_BAD_NAME_LEN:
1585                         case EXT2_ET_EA_BAD_VALUE_SIZE:
1586                         case EXT2_ET_EA_KEY_NOT_FOUND:
1587                         case EXT2_ET_EA_NO_SPACE:
1588                         case EXT2_ET_MISSING_EA_FEATURE:
1589                         case EXT2_ET_INLINE_DATA_CANT_ITERATE:
1590                         case EXT2_ET_INLINE_DATA_NO_BLOCK:
1591                         case EXT2_ET_INLINE_DATA_NO_SPACE:
1592                         case EXT2_ET_NO_INLINE_DATA:
1593                         case EXT2_ET_EXT_ATTR_CSUM_INVALID:
1594                         case EXT2_ET_EA_BAD_VALUE_OFFSET:
1595                         case EXT2_ET_EA_INODE_CORRUPTED:
1596                                 /* broken EA or no system.data EA; truncate */
1597                                 if (fix_problem(ctx, PR_1_INLINE_DATA_NO_ATTR,
1598                                                 &pctx)) {
1599                                         err = ext2fs_inode_size_set(fs, inode, 0);
1600                                         if (err) {
1601                                                 pctx.errcode = err;
1602                                                 ctx->flags |= E2F_FLAG_ABORT;
1603                                                 goto endit;
1604                                         }
1605                                         inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1606                                         memset(&inode->i_block, 0,
1607                                                sizeof(inode->i_block));
1608                                         e2fsck_write_inode(ctx, ino, inode,
1609                                                            "pass1");
1610                                         failed_csum = 0;
1611                                 }
1612                                 break;
1613                         default:
1614                                 /* Some other kind of non-xattr error? */
1615                                 pctx.errcode = err;
1616                                 ctx->flags |= E2F_FLAG_ABORT;
1617                                 goto endit;
1618                         }
1619                 }
1620
1621                 /*
1622                  * Test for incorrect extent flag settings.
1623                  *
1624                  * On big-endian machines we must be careful:
1625                  * When the inode is read, the i_block array is not swapped
1626                  * if the extent flag is set.  Therefore if we are testing
1627                  * for or fixing a wrongly-set flag, we must potentially
1628                  * (un)swap before testing, or after fixing.
1629                  */
1630
1631                 /*
1632                  * In this case the extents flag was set when read, so
1633                  * extent_header_verify is ok.  If the inode is cleared,
1634                  * no need to swap... so no extra swapping here.
1635                  */
1636                 if ((inode->i_flags & EXT4_EXTENTS_FL) && !extent_fs &&
1637                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1638                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO))) {
1639                         if ((ext2fs_extent_header_verify(inode->i_block,
1640                                                  sizeof(inode->i_block)) == 0) &&
1641                             fix_problem(ctx, PR_1_EXTENT_FEATURE, &pctx)) {
1642                                 ext2fs_set_feature_extents(sb);
1643                                 ext2fs_mark_super_dirty(fs);
1644                                 extent_fs = 1;
1645                         } else if (fix_problem(ctx, PR_1_EXTENTS_SET, &pctx)) {
1646                         clear_inode:
1647                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1648                                 if (ino == EXT2_BAD_INO)
1649                                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map,
1650                                                                  ino);
1651                                 /* skip FINISH_INODE_LOOP */
1652                                 continue;
1653                         }
1654                 }
1655
1656                 /*
1657                  * For big-endian machines:
1658                  * If the inode didn't have the extents flag set when it
1659                  * was read, then the i_block array was swapped.  To test
1660                  * as an extents header, we must swap it back first.
1661                  * IF we then set the extents flag, the entire i_block
1662                  * array must be un/re-swapped to make it proper extents data.
1663                  */
1664                 if (extent_fs && !(inode->i_flags & EXT4_EXTENTS_FL) &&
1665                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1666                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO)) &&
1667                     (LINUX_S_ISREG(inode->i_mode) ||
1668                      LINUX_S_ISDIR(inode->i_mode))) {
1669                         void *ehp;
1670 #ifdef WORDS_BIGENDIAN
1671                         __u32 tmp_block[EXT2_N_BLOCKS];
1672
1673                         for (i = 0; i < EXT2_N_BLOCKS; i++)
1674                                 tmp_block[i] = ext2fs_swab32(inode->i_block[i]);
1675                         ehp = tmp_block;
1676 #else
1677                         ehp = inode->i_block;
1678 #endif
1679                         if ((ext2fs_extent_header_verify(ehp,
1680                                          sizeof(inode->i_block)) == 0) &&
1681                             (fix_problem(ctx, PR_1_UNSET_EXTENT_FL, &pctx))) {
1682                                 inode->i_flags |= EXT4_EXTENTS_FL;
1683 #ifdef WORDS_BIGENDIAN
1684                                 memcpy(inode->i_block, tmp_block,
1685                                        sizeof(inode->i_block));
1686 #endif
1687                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1688                                 failed_csum = 0;
1689                         }
1690                 }
1691
1692                 if (ino == EXT2_BAD_INO) {
1693                         struct process_block_struct pb;
1694
1695                         if ((failed_csum || inode->i_mode || inode->i_uid ||
1696                              inode->i_gid || inode->i_links_count ||
1697                              (inode->i_flags & EXT4_INLINE_DATA_FL) ||
1698                              inode->i_file_acl) &&
1699                             fix_problem(ctx, PR_1_INVALID_BAD_INODE, &pctx)) {
1700                                 memset(inode, 0, sizeof(struct ext2_inode));
1701                                 e2fsck_write_inode(ctx, ino, inode,
1702                                                    "clear bad inode");
1703                                 failed_csum = 0;
1704                         }
1705
1706                         pctx.errcode = ext2fs_copy_bitmap(ctx->block_found_map,
1707                                                           &pb.fs_meta_blocks);
1708                         if (pctx.errcode) {
1709                                 pctx.num = 4;
1710                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1711                                 ctx->flags |= E2F_FLAG_ABORT;
1712                                 goto endit;
1713                         }
1714                         pb.ino = EXT2_BAD_INO;
1715                         pb.num_blocks = pb.last_block = 0;
1716                         pb.last_db_block = -1;
1717                         pb.num_illegal_blocks = 0;
1718                         pb.suppress = 0; pb.clear = 0; pb.is_dir = 0;
1719                         pb.is_reg = 0; pb.fragmented = 0; pb.bbcheck = 0;
1720                         pb.inode = inode;
1721                         pb.pctx = &pctx;
1722                         pb.ctx = ctx;
1723                         pctx.errcode = ext2fs_block_iterate3(fs, ino, 0,
1724                                      block_buf, process_bad_block, &pb);
1725                         ext2fs_free_block_bitmap(pb.fs_meta_blocks);
1726                         if (pctx.errcode) {
1727                                 fix_problem(ctx, PR_1_BLOCK_ITERATE, &pctx);
1728                                 ctx->flags |= E2F_FLAG_ABORT;
1729                                 goto endit;
1730                         }
1731                         if (pb.bbcheck)
1732                                 if (!fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK_PROMPT, &pctx)) {
1733                                 ctx->flags |= E2F_FLAG_ABORT;
1734                                 goto endit;
1735                         }
1736                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1737                         clear_problem_context(&pctx);
1738                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1739                         continue;
1740                 } else if (ino == EXT2_ROOT_INO) {
1741                         /*
1742                          * Make sure the root inode is a directory; if
1743                          * not, offer to clear it.  It will be
1744                          * regenerated in pass #3.
1745                          */
1746                         if (!LINUX_S_ISDIR(inode->i_mode)) {
1747                                 if (fix_problem(ctx, PR_1_ROOT_NO_DIR, &pctx))
1748                                         goto clear_inode;
1749                         }
1750                         /*
1751                          * If dtime is set, offer to clear it.  mke2fs
1752                          * version 0.2b created filesystems with the
1753                          * dtime field set for the root and lost+found
1754                          * directories.  We won't worry about
1755                          * /lost+found, since that can be regenerated
1756                          * easily.  But we will fix the root directory
1757                          * as a special case.
1758                          */
1759                         if (inode->i_dtime && inode->i_links_count) {
1760                                 if (fix_problem(ctx, PR_1_ROOT_DTIME, &pctx)) {
1761                                         inode->i_dtime = 0;
1762                                         e2fsck_write_inode(ctx, ino, inode,
1763                                                            "pass1");
1764                                         failed_csum = 0;
1765                                 }
1766                         }
1767                 } else if (ino == EXT2_JOURNAL_INO) {
1768                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1769                         if (fs->super->s_journal_inum == EXT2_JOURNAL_INO) {
1770                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1771                                     fix_problem(ctx, PR_1_JOURNAL_BAD_MODE,
1772                                                 &pctx)) {
1773                                         inode->i_mode = LINUX_S_IFREG;
1774                                         e2fsck_write_inode(ctx, ino, inode,
1775                                                            "pass1");
1776                                         failed_csum = 0;
1777                                 }
1778                                 check_blocks(ctx, &pctx, block_buf, NULL);
1779                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1780                                 continue;
1781                         }
1782                         if ((inode->i_links_count ||
1783                              inode->i_blocks || inode->i_block[0]) &&
1784                             fix_problem(ctx, PR_1_JOURNAL_INODE_NOT_CLEAR,
1785                                         &pctx)) {
1786                                 memset(inode, 0, inode_size);
1787                                 ext2fs_icount_store(ctx->inode_link_info,
1788                                                     ino, 0);
1789                                 e2fsck_write_inode_full(ctx, ino, inode,
1790                                                         inode_size, "pass1");
1791                                 failed_csum = 0;
1792                         }
1793                 } else if (quota_inum_is_reserved(fs, ino)) {
1794                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1795                         if (ext2fs_has_feature_quota(fs->super) &&
1796                             quota_inum_is_super(fs->super, ino)) {
1797                                 if (!LINUX_S_ISREG(inode->i_mode) &&
1798                                     fix_problem(ctx, PR_1_QUOTA_BAD_MODE,
1799                                                         &pctx)) {
1800                                         inode->i_mode = LINUX_S_IFREG;
1801                                         e2fsck_write_inode(ctx, ino, inode,
1802                                                         "pass1");
1803                                         failed_csum = 0;
1804                                 }
1805                                 check_blocks(ctx, &pctx, block_buf, NULL);
1806                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1807                                 continue;
1808                         }
1809                         if ((inode->i_links_count ||
1810                              inode->i_blocks || inode->i_block[0]) &&
1811                             fix_problem(ctx, PR_1_QUOTA_INODE_NOT_CLEAR,
1812                                         &pctx)) {
1813                                 memset(inode, 0, inode_size);
1814                                 ext2fs_icount_store(ctx->inode_link_info,
1815                                                     ino, 0);
1816                                 e2fsck_write_inode_full(ctx, ino, inode,
1817                                                         inode_size, "pass1");
1818                                 failed_csum = 0;
1819                         }
1820                 } else if (ino < EXT2_FIRST_INODE(fs->super)) {
1821                         problem_t problem = 0;
1822
1823                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1824                         if (ino == EXT2_BOOT_LOADER_INO) {
1825                                 if (LINUX_S_ISDIR(inode->i_mode))
1826                                         problem = PR_1_RESERVED_BAD_MODE;
1827                         } else if (ino == EXT2_RESIZE_INO) {
1828                                 if (inode->i_mode &&
1829                                     !LINUX_S_ISREG(inode->i_mode))
1830                                         problem = PR_1_RESERVED_BAD_MODE;
1831                         } else {
1832                                 if (inode->i_mode != 0)
1833                                         problem = PR_1_RESERVED_BAD_MODE;
1834                         }
1835                         if (problem) {
1836                                 if (fix_problem(ctx, problem, &pctx)) {
1837                                         inode->i_mode = 0;
1838                                         e2fsck_write_inode(ctx, ino, inode,
1839                                                            "pass1");
1840                                         failed_csum = 0;
1841                                 }
1842                         }
1843                         check_blocks(ctx, &pctx, block_buf, NULL);
1844                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1845                         continue;
1846                 }
1847
1848                 if (!inode->i_links_count) {
1849                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1850                         continue;
1851                 }
1852                 /*
1853                  * n.b.  0.3c ext2fs code didn't clear i_links_count for
1854                  * deleted files.  Oops.
1855                  *
1856                  * Since all new ext2 implementations get this right,
1857                  * we now assume that the case of non-zero
1858                  * i_links_count and non-zero dtime means that we
1859                  * should keep the file, not delete it.
1860                  *
1861                  */
1862                 if (inode->i_dtime) {
1863                         if (fix_problem(ctx, PR_1_SET_DTIME, &pctx)) {
1864                                 inode->i_dtime = 0;
1865                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1866                                 failed_csum = 0;
1867                         }
1868                 }
1869
1870                 ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1871                 switch (fs->super->s_creator_os) {
1872                     case EXT2_OS_HURD:
1873                         frag = inode->osd2.hurd2.h_i_frag;
1874                         fsize = inode->osd2.hurd2.h_i_fsize;
1875                         break;
1876                     default:
1877                         frag = fsize = 0;
1878                 }
1879
1880                 if (inode->i_faddr || frag || fsize ||
1881                     (!ext2fs_has_feature_largedir(fs->super) &&
1882                     (LINUX_S_ISDIR(inode->i_mode) && inode->i_size_high)))
1883                         mark_inode_bad(ctx, ino);
1884                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1885                     !ext2fs_has_feature_64bit(fs->super) &&
1886                     inode->osd2.linux2.l_i_file_acl_high != 0)
1887                         mark_inode_bad(ctx, ino);
1888                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
1889                     !ext2fs_has_feature_huge_file(fs->super) &&
1890                     (inode->osd2.linux2.l_i_blocks_hi != 0))
1891                         mark_inode_bad(ctx, ino);
1892                 if (inode->i_flags & EXT2_IMAGIC_FL) {
1893                         if (imagic_fs) {
1894                                 if (!ctx->inode_imagic_map)
1895                                         alloc_imagic_map(ctx);
1896                                 ext2fs_mark_inode_bitmap2(ctx->inode_imagic_map,
1897                                                          ino);
1898                         } else {
1899                                 if (fix_problem(ctx, PR_1_SET_IMAGIC, &pctx)) {
1900                                         inode->i_flags &= ~EXT2_IMAGIC_FL;
1901                                         e2fsck_write_inode(ctx, ino,
1902                                                            inode, "pass1");
1903                                         failed_csum = 0;
1904                                 }
1905                         }
1906                 }
1907
1908                 check_inode_extra_space(ctx, &pctx, &ea_ibody_quota);
1909                 check_is_really_dir(ctx, &pctx, block_buf);
1910
1911                 /*
1912                  * ext2fs_inode_has_valid_blocks2 does not actually look
1913                  * at i_block[] values, so not endian-sensitive here.
1914                  */
1915                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL) &&
1916                     LINUX_S_ISLNK(inode->i_mode) &&
1917                     !ext2fs_inode_has_valid_blocks2(fs, inode) &&
1918                     fix_problem(ctx, PR_1_FAST_SYMLINK_EXTENT_FL, &pctx)) {
1919                         inode->i_flags &= ~EXT4_EXTENTS_FL;
1920                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1921                         failed_csum = 0;
1922                 }
1923
1924                 if ((inode->i_flags & EXT4_ENCRYPT_FL) &&
1925                     add_encrypted_file(ctx, &pctx) < 0)
1926                         goto clear_inode;
1927
1928                 if (casefold_fs && inode->i_flags & EXT4_CASEFOLD_FL)
1929                         ext2fs_mark_inode_bitmap2(ctx->inode_casefold_map, ino);
1930
1931                 if (LINUX_S_ISDIR(inode->i_mode)) {
1932                         ext2fs_mark_inode_bitmap2(ctx->inode_dir_map, ino);
1933                         e2fsck_add_dir_info(ctx, ino, 0);
1934                         ctx->fs_directory_count++;
1935                         if (inode->i_flags & EXT4_CASEFOLD_FL)
1936                                 add_casefolded_dir(ctx, ino);
1937                 } else if (LINUX_S_ISREG (inode->i_mode)) {
1938                         ext2fs_mark_inode_bitmap2(ctx->inode_reg_map, ino);
1939                         ctx->fs_regular_count++;
1940                 } else if (LINUX_S_ISCHR (inode->i_mode) &&
1941                            e2fsck_pass1_check_device_inode(fs, inode)) {
1942                         check_extents_inlinedata(ctx, &pctx);
1943                         check_immutable(ctx, &pctx);
1944                         check_size(ctx, &pctx);
1945                         ctx->fs_chardev_count++;
1946                 } else if (LINUX_S_ISBLK (inode->i_mode) &&
1947                            e2fsck_pass1_check_device_inode(fs, inode)) {
1948                         check_extents_inlinedata(ctx, &pctx);
1949                         check_immutable(ctx, &pctx);
1950                         check_size(ctx, &pctx);
1951                         ctx->fs_blockdev_count++;
1952                 } else if (LINUX_S_ISLNK (inode->i_mode) &&
1953                            e2fsck_pass1_check_symlink(fs, ino, inode,
1954                                                       block_buf)) {
1955                         check_immutable(ctx, &pctx);
1956                         ctx->fs_symlinks_count++;
1957                         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
1958                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1959                                 continue;
1960                         } else if (ext2fs_is_fast_symlink(inode)) {
1961                                 ctx->fs_fast_symlinks_count++;
1962                                 check_blocks(ctx, &pctx, block_buf,
1963                                              &ea_ibody_quota);
1964                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1965                                 continue;
1966                         }
1967                 }
1968                 else if (LINUX_S_ISFIFO (inode->i_mode) &&
1969                          e2fsck_pass1_check_device_inode(fs, inode)) {
1970                         check_extents_inlinedata(ctx, &pctx);
1971                         check_immutable(ctx, &pctx);
1972                         check_size(ctx, &pctx);
1973                         ctx->fs_fifo_count++;
1974                 } else if ((LINUX_S_ISSOCK (inode->i_mode)) &&
1975                            e2fsck_pass1_check_device_inode(fs, inode)) {
1976                         check_extents_inlinedata(ctx, &pctx);
1977                         check_immutable(ctx, &pctx);
1978                         check_size(ctx, &pctx);
1979                         ctx->fs_sockets_count++;
1980                 } else
1981                         mark_inode_bad(ctx, ino);
1982                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1983                     !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
1984                         if (inode->i_block[EXT2_IND_BLOCK])
1985                                 ctx->fs_ind_count++;
1986                         if (inode->i_block[EXT2_DIND_BLOCK])
1987                                 ctx->fs_dind_count++;
1988                         if (inode->i_block[EXT2_TIND_BLOCK])
1989                                 ctx->fs_tind_count++;
1990                 }
1991                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
1992                     !(inode->i_flags & EXT4_INLINE_DATA_FL) &&
1993                     (inode->i_block[EXT2_IND_BLOCK] ||
1994                      inode->i_block[EXT2_DIND_BLOCK] ||
1995                      inode->i_block[EXT2_TIND_BLOCK] ||
1996                      ext2fs_file_acl_block(fs, inode))) {
1997                         struct process_inode_block *itp;
1998
1999                         itp = &inodes_to_process[process_inode_count];
2000                         itp->ino = ino;
2001                         itp->ea_ibody_quota = ea_ibody_quota;
2002                         if (inode_size < sizeof(struct ext2_inode_large))
2003                                 memcpy(&itp->inode, inode, inode_size);
2004                         else
2005                                 memcpy(&itp->inode, inode, sizeof(itp->inode));
2006                         process_inode_count++;
2007                 } else
2008                         check_blocks(ctx, &pctx, block_buf, &ea_ibody_quota);
2009
2010                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2011
2012                 if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
2013                         goto endit;
2014
2015                 if (process_inode_count >= ctx->process_inode_size) {
2016                         process_inodes(ctx, block_buf, inodes_to_process,
2017                                        &process_inode_count);
2018
2019                         if (e2fsck_should_abort(ctx))
2020                                 goto endit;
2021                 }
2022         }
2023         process_inodes(ctx, block_buf, inodes_to_process,
2024                        &process_inode_count);
2025         ext2fs_close_inode_scan(scan);
2026         scan = NULL;
2027
2028         reserve_block_for_root_repair(ctx);
2029         reserve_block_for_lnf_repair(ctx);
2030
2031         /*
2032          * If any extended attribute blocks' reference counts need to
2033          * be adjusted, either up (ctx->refcount_extra), or down
2034          * (ctx->refcount), then fix them.
2035          */
2036         if (ctx->refcount) {
2037                 adjust_extattr_refcount(ctx, ctx->refcount, block_buf, -1);
2038                 ea_refcount_free(ctx->refcount);
2039                 ctx->refcount = 0;
2040         }
2041         if (ctx->refcount_extra) {
2042                 adjust_extattr_refcount(ctx, ctx->refcount_extra,
2043                                         block_buf, +1);
2044                 ea_refcount_free(ctx->refcount_extra);
2045                 ctx->refcount_extra = 0;
2046         }
2047
2048         if (ctx->ea_block_quota_blocks) {
2049                 ea_refcount_free(ctx->ea_block_quota_blocks);
2050                 ctx->ea_block_quota_blocks = 0;
2051         }
2052
2053         if (ctx->ea_block_quota_inodes) {
2054                 ea_refcount_free(ctx->ea_block_quota_inodes);
2055                 ctx->ea_block_quota_inodes = 0;
2056         }
2057
2058         if (ctx->invalid_bitmaps)
2059                 handle_fs_bad_blocks(ctx);
2060
2061         /* We don't need the block_ea_map any more */
2062         if (ctx->block_ea_map) {
2063                 ext2fs_free_block_bitmap(ctx->block_ea_map);
2064                 ctx->block_ea_map = 0;
2065         }
2066
2067         /* We don't need the encryption policy => ID map any more */
2068         destroy_encryption_policy_map(ctx);
2069
2070         if (ctx->flags & E2F_FLAG_RESIZE_INODE) {
2071                 clear_problem_context(&pctx);
2072                 pctx.errcode = ext2fs_create_resize_inode(fs);
2073                 if (pctx.errcode) {
2074                         if (!fix_problem(ctx, PR_1_RESIZE_INODE_CREATE,
2075                                          &pctx)) {
2076                                 ctx->flags |= E2F_FLAG_ABORT;
2077                                 goto endit;
2078                         }
2079                         pctx.errcode = 0;
2080                 }
2081                 if (!pctx.errcode) {
2082                         e2fsck_read_inode(ctx, EXT2_RESIZE_INO, inode,
2083                                           "recreate inode");
2084                         inode->i_mtime = ctx->now;
2085                         e2fsck_write_inode(ctx, EXT2_RESIZE_INO, inode,
2086                                            "recreate inode");
2087                 }
2088                 ctx->flags &= ~E2F_FLAG_RESIZE_INODE;
2089         }
2090
2091         if (ctx->flags & E2F_FLAG_RESTART) {
2092                 /*
2093                  * Only the master copy of the superblock and block
2094                  * group descriptors are going to be written during a
2095                  * restart, so set the superblock to be used to be the
2096                  * master superblock.
2097                  */
2098                 ctx->use_superblock = 0;
2099                 goto endit;
2100         }
2101
2102         if (ctx->large_dirs && !ext2fs_has_feature_largedir(fs->super)) {
2103                 if (fix_problem(ctx, PR_2_FEATURE_LARGE_DIRS, &pctx)) {
2104                         ext2fs_set_feature_largedir(fs->super);
2105                         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
2106                         ext2fs_mark_super_dirty(fs);
2107                 }
2108                 if (fs->super->s_rev_level == EXT2_GOOD_OLD_REV &&
2109                     fix_problem(ctx, PR_1_FS_REV_LEVEL, &pctx)) {
2110                         ext2fs_update_dynamic_rev(fs);
2111                         ext2fs_mark_super_dirty(fs);
2112                 }
2113         }
2114
2115         if (ctx->block_dup_map) {
2116                 if (ctx->options & E2F_OPT_PREEN) {
2117                         clear_problem_context(&pctx);
2118                         fix_problem(ctx, PR_1_DUP_BLOCKS_PREENSTOP, &pctx);
2119                 }
2120                 e2fsck_pass1_dupblocks(ctx, block_buf);
2121         }
2122         ctx->flags |= E2F_FLAG_ALLOC_OK;
2123 endit:
2124         e2fsck_use_inode_shortcuts(ctx, 0);
2125         ext2fs_free_mem(&inodes_to_process);
2126         inodes_to_process = 0;
2127
2128         if (scan)
2129                 ext2fs_close_inode_scan(scan);
2130         if (block_buf)
2131                 ext2fs_free_mem(&block_buf);
2132         if (inode)
2133                 ext2fs_free_mem(&inode);
2134
2135         /*
2136          * The l+f inode may have been cleared, so zap it now and
2137          * later passes will recalculate it if necessary
2138          */
2139         ctx->lost_and_found = 0;
2140
2141         if ((ctx->flags & E2F_FLAG_SIGNAL_MASK) == 0)
2142                 print_resource_track(ctx, _("Pass 1"), &rtrack, ctx->fs->io);
2143         else
2144                 ctx->invalid_bitmaps++;
2145 }
2146
2147 static void init_ext2_max_sizes()
2148 {
2149         int     i;
2150         __u64   max_sizes;
2151
2152         /*
2153          * Init ext2_max_sizes which will be immutable and shared between
2154          * threads
2155          */
2156 #define EXT2_BPP(bits) (1ULL << ((bits) - 2))
2157
2158         for (i = EXT2_MIN_BLOCK_LOG_SIZE; i <= EXT2_MAX_BLOCK_LOG_SIZE; i++) {
2159                 max_sizes = EXT2_NDIR_BLOCKS + EXT2_BPP(i);
2160                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i);
2161                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i) * EXT2_BPP(i);
2162                 max_sizes = (max_sizes * (1UL << i));
2163                 ext2_max_sizes[i - EXT2_MIN_BLOCK_LOG_SIZE] = max_sizes;
2164         }
2165 #undef EXT2_BPP
2166 }
2167
2168 #ifdef HAVE_PTHREAD
2169 static errcode_t e2fsck_pass1_copy_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2170                                           ext2fs_generic_bitmap *dest)
2171 {
2172         errcode_t ret;
2173
2174         ret = ext2fs_copy_bitmap(*src, dest);
2175         if (ret)
2176                 return ret;
2177
2178         (*dest)->fs = fs;
2179
2180         return 0;
2181 }
2182
2183 static void e2fsck_pass1_free_bitmap(ext2fs_generic_bitmap *bitmap)
2184 {
2185         if (*bitmap) {
2186                 ext2fs_free_generic_bmap(*bitmap);
2187                 *bitmap = NULL;
2188         }
2189
2190 }
2191
2192 static errcode_t e2fsck_pass1_merge_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2193                                           ext2fs_generic_bitmap *dest)
2194 {
2195         errcode_t ret = 0;
2196
2197         if (*src) {
2198                 if (*dest == NULL) {
2199                         *dest = *src;
2200                         *src = NULL;
2201                 } else {
2202                         ret = ext2fs_merge_bitmap(*src, *dest, NULL, NULL);
2203                         if (ret)
2204                                 return ret;
2205                 }
2206                 (*dest)->fs = fs;
2207         }
2208
2209         return 0;
2210 }
2211
2212 static errcode_t e2fsck_pass1_copy_fs(ext2_filsys dest, e2fsck_t src_context,
2213                                       ext2_filsys src)
2214 {
2215         errcode_t       retval;
2216
2217         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2218         dest->inode_map = NULL;
2219         dest->block_map = NULL;
2220         dest->badblocks = NULL;
2221         if (dest->dblist)
2222                 dest->dblist->fs = dest;
2223         if (src->block_map) {
2224                 retval = e2fsck_pass1_copy_bitmap(dest, &src->block_map,
2225                                                   &dest->block_map);
2226                 if (retval)
2227                         return retval;
2228         }
2229         if (src->inode_map) {
2230                 retval = e2fsck_pass1_copy_bitmap(dest, &src->inode_map,
2231                                                   &dest->inode_map);
2232                 if (retval)
2233                         return retval;
2234         }
2235
2236         if (src->badblocks) {
2237                 retval = ext2fs_badblocks_copy(src->badblocks,
2238                                                &dest->badblocks);
2239                 if (retval)
2240                         return retval;
2241         }
2242
2243         /* disable it for now */
2244         src_context->openfs_flags &= ~EXT2_FLAG_EXCLUSIVE;
2245         retval = ext2fs_open_channel(dest, src_context->io_options,
2246                                      src_context->io_manager,
2247                                      src_context->openfs_flags,
2248                                      src->io->block_size);
2249         if (retval)
2250                 return retval;
2251
2252         /* Block size might not be default */
2253         io_channel_set_blksize(dest->io, src->io->block_size);
2254         ehandler_init(dest->io);
2255
2256         assert(dest->io->magic == src->io->magic);
2257         assert(dest->io->manager == src->io->manager);
2258         assert(strcmp(dest->io->name, src->io->name) == 0);
2259         assert(dest->io->block_size == src->io->block_size);
2260         assert(dest->io->read_error == src->io->read_error);
2261         assert(dest->io->write_error == src->io->write_error);
2262         assert(dest->io->refcount == src->io->refcount);
2263         assert(dest->io->flags == src->io->flags);
2264         assert(dest->io->app_data == dest);
2265         assert(src->io->app_data == src);
2266         assert(dest->io->align == src->io->align);
2267
2268         /* The data should be written to disk immediately */
2269         dest->io->flags |= CHANNEL_FLAGS_WRITETHROUGH;
2270         /* icache will be rebuilt if needed, so do not copy from @src */
2271         src->icache = NULL;
2272         return 0;
2273 }
2274
2275 static int e2fsck_pass1_merge_fs(ext2_filsys dest, ext2_filsys src)
2276 {
2277         struct ext2_inode_cache *icache = dest->icache;
2278         errcode_t retval = 0;
2279         io_channel dest_io;
2280         io_channel dest_image_io;
2281         ext2fs_inode_bitmap inode_map;
2282         ext2fs_block_bitmap block_map;
2283         ext2_badblocks_list badblocks;
2284         ext2_dblist dblist;
2285         int flags;
2286
2287         dest_io = dest->io;
2288         dest_image_io = dest->image_io;
2289         inode_map = dest->inode_map;
2290         block_map = dest->block_map;
2291         badblocks = dest->badblocks;
2292         dblist = dest->dblist;
2293         flags = dest->flags;
2294
2295         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2296         dest->io = dest_io;
2297         dest->image_io = dest_image_io;
2298         dest->icache = icache;
2299         dest->inode_map = inode_map;
2300         dest->block_map = block_map;
2301         dest->badblocks = badblocks;
2302         dest->dblist = dblist;
2303         if (dest->dblist)
2304                 dest->dblist->fs = dest;
2305         dest->flags = src->flags | flags;
2306         if (!(src->flags & EXT2_FLAG_VALID) || !(flags & EXT2_FLAG_VALID))
2307                 ext2fs_unmark_valid(dest);
2308
2309         if (src->icache) {
2310                 ext2fs_free_inode_cache(src->icache);
2311                 src->icache = NULL;
2312         }
2313
2314         retval = e2fsck_pass1_merge_bitmap(dest, &src->inode_map,
2315                                            &dest->inode_map);
2316         if (retval)
2317                 goto out;
2318
2319         retval = e2fsck_pass1_merge_bitmap(dest, &src->block_map,
2320                                           &dest->block_map);
2321         if (retval)
2322                 goto out;
2323
2324         if (src->dblist) {
2325                 if (dest->dblist) {
2326                         retval = ext2fs_merge_dblist(src->dblist,
2327                                                      dest->dblist);
2328                         if (retval)
2329                                 goto out;
2330                 } else {
2331                         dest->dblist = src->dblist;
2332                         dest->dblist->fs = dest;
2333                         src->dblist = NULL;
2334                 }
2335         }
2336
2337         if (src->badblocks) {
2338                 if (dest->badblocks == NULL)
2339                         retval = ext2fs_badblocks_copy(src->badblocks,
2340                                                        &dest->badblocks);
2341                 else
2342                         retval = ext2fs_badblocks_merge(src->badblocks,
2343                                                         dest->badblocks);
2344         }
2345 out:
2346         io_channel_close(src->io);
2347         if (src->inode_map)
2348                 ext2fs_free_generic_bmap(src->inode_map);
2349         if (src->block_map)
2350                 ext2fs_free_generic_bmap(src->block_map);
2351         if (src->badblocks)
2352                 ext2fs_badblocks_list_free(src->badblocks);
2353         if (src->dblist)
2354                 ext2fs_free_dblist(src->dblist);
2355
2356         return retval;
2357 }
2358
2359 static errcode_t e2fsck_pass1_thread_prepare(e2fsck_t global_ctx, e2fsck_t *thread_ctx,
2360                                              int thread_index, int num_threads)
2361 {
2362         errcode_t               retval;
2363         e2fsck_t                thread_context;
2364         ext2_filsys             thread_fs;
2365         ext2_filsys             global_fs = global_ctx->fs;
2366         struct e2fsck_thread    *tinfo;
2367         dgrp_t                  average_group;
2368
2369         assert(global_ctx->inode_used_map == NULL);
2370         assert(global_ctx->inode_dir_map == NULL);
2371         assert(global_ctx->inode_bb_map == NULL);
2372         assert(global_ctx->inode_imagic_map == NULL);
2373         assert(global_ctx->inode_reg_map == NULL);
2374         assert(global_ctx->inodes_to_rebuild == NULL);
2375
2376         assert(global_ctx->block_found_map == NULL);
2377         assert(global_ctx->block_dup_map == NULL);
2378         assert(global_ctx->block_ea_map == NULL);
2379         assert(global_ctx->block_metadata_map == NULL);
2380         assert(global_ctx->fs->dblist == NULL);
2381
2382         retval = ext2fs_get_mem(sizeof(struct e2fsck_struct), &thread_context);
2383         if (retval) {
2384                 com_err(global_ctx->program_name, retval, "while allocating memory");
2385                 return retval;
2386         }
2387         memcpy(thread_context, global_ctx, sizeof(struct e2fsck_struct));
2388         thread_context->global_ctx = global_ctx;
2389
2390         retval = ext2fs_get_mem(sizeof(struct struct_ext2_filsys), &thread_fs);
2391         if (retval) {
2392                 com_err(global_ctx->program_name, retval, "while allocating memory");
2393                 goto out_context;
2394         }
2395
2396         io_channel_flush_cleanup(global_fs->io);
2397         retval = e2fsck_pass1_copy_fs(thread_fs, global_ctx, global_fs);
2398         if (retval) {
2399                 com_err(global_ctx->program_name, retval, "while copying fs");
2400                 goto out_fs;
2401         }
2402         thread_fs->priv_data = thread_context;
2403
2404         thread_context->thread_info.et_thread_index = thread_index;
2405         set_up_logging(thread_context);
2406
2407         /*
2408          * Distribute work to multiple threads:
2409          * Each thread work on fs->group_desc_count / nthread groups.
2410          */
2411         tinfo = &thread_context->thread_info;
2412         average_group = thread_fs->group_desc_count / num_threads;
2413         if (average_group == 0)
2414                 average_group = 1;
2415         tinfo->et_group_start = average_group * thread_index;
2416         if (thread_index == num_threads - 1)
2417                 tinfo->et_group_end = thread_fs->group_desc_count;
2418         else
2419                 tinfo->et_group_end = average_group * (thread_index + 1);
2420         tinfo->et_group_next = tinfo->et_group_start;
2421         tinfo->et_inode_number = 0;
2422         tinfo->et_log_buf[0] = '\0';
2423         tinfo->et_log_length = 0;
2424         if (thread_context->options & E2F_OPT_MULTITHREAD)
2425                 log_out(thread_context, _("Scan group range [%d, %d)\n"),
2426                         tinfo->et_group_start, tinfo->et_group_end);
2427         thread_context->fs = thread_fs;
2428         retval = quota_init_context(&thread_context->qctx, thread_fs, 0);
2429         if (retval) {
2430                 com_err(global_ctx->program_name, retval,
2431                         "while init quota context");
2432                 goto out_fs;
2433         }
2434         *thread_ctx = thread_context;
2435         return 0;
2436 out_fs:
2437         ext2fs_free_mem(&thread_fs);
2438 out_context:
2439         ext2fs_free_mem(&thread_context);
2440         return retval;
2441 }
2442
2443 static void e2fsck_pass1_merge_dir_info(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2444 {
2445         if (thread_ctx->dir_info == NULL)
2446                 return;
2447
2448         if (global_ctx->dir_info == NULL) {
2449                 global_ctx->dir_info = thread_ctx->dir_info;
2450                 thread_ctx->dir_info = NULL;
2451                 return;
2452         }
2453
2454         e2fsck_merge_dir_info(global_ctx, thread_ctx->dir_info,
2455                               global_ctx->dir_info);
2456 }
2457
2458 static void e2fsck_pass1_merge_dx_dir(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2459 {
2460         if (thread_ctx->dx_dir_info == NULL)
2461                 return;
2462
2463         if (global_ctx->dx_dir_info == NULL) {
2464                 global_ctx->dx_dir_info = thread_ctx->dx_dir_info;
2465                 global_ctx->dx_dir_info_size = thread_ctx->dx_dir_info_size;
2466                 global_ctx->dx_dir_info_count = thread_ctx->dx_dir_info_count;
2467                 thread_ctx->dx_dir_info = NULL;
2468                 return;
2469         }
2470
2471         e2fsck_merge_dx_dir(global_ctx, thread_ctx);
2472 }
2473
2474 static inline errcode_t
2475 e2fsck_pass1_merge_icount(ext2_icount_t *dest_icount,
2476                           ext2_icount_t *src_icount)
2477 {
2478         if (*src_icount) {
2479                 if (*dest_icount == NULL) {
2480                         *dest_icount = *src_icount;
2481                         *src_icount = NULL;
2482                 } else {
2483                         errcode_t ret;
2484
2485                         ret = ext2fs_icount_merge(*src_icount,
2486                                                   *dest_icount);
2487                         if (ret)
2488                                 return ret;
2489                 }
2490         }
2491
2492         return 0;
2493 }
2494
2495 static errcode_t e2fsck_pass1_merge_icounts(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2496 {
2497         errcode_t ret;
2498
2499         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_count,
2500                                         &thread_ctx->inode_count);
2501         if (ret)
2502                 return ret;
2503         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_link_info,
2504                                         &thread_ctx->inode_link_info);
2505
2506         return ret;
2507 }
2508
2509 static errcode_t e2fsck_pass1_merge_dirs_to_hash(e2fsck_t global_ctx,
2510                                                  e2fsck_t thread_ctx)
2511 {
2512         errcode_t retval = 0;
2513
2514         if (!thread_ctx->dirs_to_hash)
2515                 return 0;
2516
2517         if (!global_ctx->dirs_to_hash)
2518                 retval = ext2fs_badblocks_copy(thread_ctx->dirs_to_hash,
2519                                                &global_ctx->dirs_to_hash);
2520         else
2521                 retval = ext2fs_badblocks_merge(thread_ctx->dirs_to_hash,
2522                                                 global_ctx->dirs_to_hash);
2523
2524         return retval;
2525 }
2526
2527 static int e2fsck_pass1_thread_join_one(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2528 {
2529         errcode_t        retval;
2530         int              flags = global_ctx->flags;
2531         ext2_filsys      thread_fs = thread_ctx->fs;
2532         ext2_filsys      global_fs = global_ctx->fs;
2533         FILE            *global_logf = global_ctx->logf;
2534         FILE            *global_problem_logf = global_ctx->problem_logf;
2535         ext2fs_inode_bitmap inode_bad_map = global_ctx->inode_bad_map;
2536         struct dir_info_db *dir_info = global_ctx->dir_info;
2537         struct dx_dir_info *dx_dir_info = global_ctx->dx_dir_info;
2538         ext2fs_inode_bitmap inode_used_map = global_ctx->inode_used_map;
2539         ext2fs_inode_bitmap inode_dir_map = global_ctx->inode_dir_map;
2540         ext2fs_inode_bitmap inode_bb_map = global_ctx->inode_bb_map;
2541         ext2fs_inode_bitmap inode_imagic_map = global_ctx->inode_imagic_map;
2542         ext2fs_inode_bitmap inode_reg_map = global_ctx->inode_reg_map;
2543         ext2fs_block_bitmap block_found_map = global_ctx->block_found_map;
2544         ext2fs_block_bitmap block_dup_map = global_ctx->block_dup_map;
2545         ext2fs_block_bitmap block_ea_map = global_ctx->block_ea_map;
2546         ext2fs_block_bitmap block_metadata_map = global_ctx->block_metadata_map;
2547         ext2fs_block_bitmap inodes_to_rebuild = global_ctx->inodes_to_rebuild;
2548         ext2_icount_t inode_count = global_ctx->inode_count;
2549         ext2_icount_t inode_link_info = global_ctx->inode_link_info;
2550         __u32 fs_directory_count = global_ctx->fs_directory_count;
2551         __u32 fs_regular_count = global_ctx->fs_regular_count;
2552         __u32 fs_blockdev_count = global_ctx->fs_blockdev_count;
2553         __u32 fs_chardev_count = global_ctx->fs_chardev_count;
2554         __u32 fs_links_count = global_ctx->fs_links_count;
2555         __u32 fs_symlinks_count = global_ctx->fs_symlinks_count;
2556         __u32 fs_fast_symlinks_count = global_ctx->fs_fast_symlinks_count;
2557         __u32 fs_fifo_count = global_ctx->fs_fifo_count;
2558         __u32 fs_total_count = global_ctx->fs_total_count;
2559         __u32 fs_badblocks_count = global_ctx->fs_badblocks_count;
2560         __u32 fs_sockets_count = global_ctx->fs_sockets_count;
2561         __u32 fs_ind_count = global_ctx->fs_ind_count;
2562         __u32 fs_dind_count = global_ctx->fs_dind_count;
2563         __u32 fs_tind_count = global_ctx->fs_tind_count;
2564         __u32 fs_fragmented = global_ctx->fs_fragmented;
2565         __u32 fs_fragmented_dir = global_ctx->fs_fragmented_dir;
2566         __u32 large_files = global_ctx->large_files;
2567         ext2_ino_t dx_dir_info_size = global_ctx->dx_dir_info_size;
2568         ext2_ino_t dx_dir_info_count = global_ctx->dx_dir_info_count;
2569         ext2_u32_list dirs_to_hash = global_ctx->dirs_to_hash;
2570         quota_ctx_t qctx = global_ctx->qctx;
2571
2572 #ifdef HAVE_SETJMP_H
2573         jmp_buf          old_jmp;
2574
2575         memcpy(old_jmp, global_ctx->abort_loc, sizeof(jmp_buf));
2576 #endif
2577         memcpy(global_ctx, thread_ctx, sizeof(struct e2fsck_struct));
2578 #ifdef HAVE_SETJMP_H
2579         memcpy(global_ctx->abort_loc, old_jmp, sizeof(jmp_buf));
2580 #endif
2581
2582         global_ctx->inode_used_map = inode_used_map;
2583         global_ctx->inode_bad_map = inode_bad_map;
2584         global_ctx->inode_dir_map = inode_dir_map;
2585         global_ctx->inode_bb_map = inode_bb_map;
2586         global_ctx->inode_imagic_map = inode_imagic_map;
2587         global_ctx->inodes_to_rebuild = inodes_to_rebuild;
2588         global_ctx->inode_reg_map = inode_reg_map;
2589         global_ctx->block_found_map = block_found_map;
2590         global_ctx->block_dup_map = block_dup_map;
2591         global_ctx->block_ea_map = block_ea_map;
2592         global_ctx->block_metadata_map = block_metadata_map;
2593         global_ctx->dir_info = dir_info;
2594         e2fsck_pass1_merge_dir_info(global_ctx, thread_ctx);
2595         global_ctx->dx_dir_info = dx_dir_info;
2596         global_ctx->dx_dir_info_count = dx_dir_info_count;
2597         global_ctx->dx_dir_info_size = dx_dir_info_size;
2598         e2fsck_pass1_merge_dx_dir(global_ctx, thread_ctx);
2599         global_ctx->inode_count = inode_count;
2600         global_ctx->inode_link_info = inode_link_info;
2601         global_ctx->fs_directory_count += fs_directory_count;
2602         global_ctx->fs_regular_count += fs_regular_count;
2603         global_ctx->fs_blockdev_count += fs_blockdev_count;
2604         global_ctx->fs_chardev_count += fs_chardev_count;
2605         global_ctx->fs_links_count += fs_links_count;
2606         global_ctx->fs_symlinks_count += fs_symlinks_count;
2607         global_ctx->fs_fast_symlinks_count += fs_fast_symlinks_count;
2608         global_ctx->fs_fifo_count += fs_fifo_count;
2609         global_ctx->fs_total_count += fs_total_count;
2610         global_ctx->fs_badblocks_count += fs_badblocks_count;
2611         global_ctx->fs_sockets_count += fs_sockets_count;
2612         global_ctx->fs_ind_count += fs_ind_count;
2613         global_ctx->fs_dind_count += fs_dind_count;
2614         global_ctx->fs_tind_count += fs_tind_count;
2615         global_ctx->fs_fragmented += fs_fragmented;
2616         global_ctx->fs_fragmented_dir += fs_fragmented_dir;
2617         global_ctx->large_files += large_files;
2618
2619         global_ctx->flags |= flags;
2620
2621         retval = e2fsck_pass1_merge_fs(global_fs, thread_fs);
2622         if (retval) {
2623                 com_err(global_ctx->program_name, 0, _("while merging fs\n"));
2624                 return retval;
2625         }
2626         global_fs->priv_data = global_ctx;
2627         global_ctx->fs = global_fs;
2628         global_ctx->logf = global_logf;
2629         global_ctx->problem_logf = global_problem_logf;
2630         global_ctx->global_ctx = NULL;
2631         retval = e2fsck_pass1_merge_icounts(global_ctx, thread_ctx);
2632         if (retval) {
2633                 com_err(global_ctx->program_name, 0,
2634                         _("while merging icounts\n"));
2635                 return retval;
2636         }
2637
2638         global_ctx->dirs_to_hash = dirs_to_hash;
2639         retval = e2fsck_pass1_merge_dirs_to_hash(global_ctx, thread_ctx);
2640         if (retval) {
2641                 com_err(global_ctx->program_name, 0,
2642                         _("while merging dirs to hash\n"));
2643                 return retval;
2644         }
2645
2646         global_ctx->qctx = qctx;
2647         retval = quota_merge_and_update_usage(global_ctx->qctx,
2648                                               thread_ctx->qctx);
2649         if (retval)
2650                 return retval;
2651
2652         retval = e2fsck_pass1_merge_bitmap(global_fs,
2653                                 &thread_ctx->inode_used_map,
2654                                 &global_ctx->inode_used_map);
2655         if (retval)
2656                 return retval;
2657
2658         retval = e2fsck_pass1_merge_bitmap(global_fs,
2659                                 &thread_ctx->inode_bad_map,
2660                                 &global_ctx->inode_bad_map);
2661         if (retval)
2662                 return retval;
2663         retval = e2fsck_pass1_merge_bitmap(global_fs,
2664                                         &thread_ctx->inode_dir_map,
2665                                         &global_ctx->inode_dir_map);
2666         if (retval)
2667                 return retval;
2668         retval = e2fsck_pass1_merge_bitmap(global_fs,
2669                                 &thread_ctx->inode_bb_map,
2670                                 &global_ctx->inode_bb_map);
2671         if (retval)
2672                 return retval;
2673         retval = e2fsck_pass1_merge_bitmap(global_fs,
2674                                 &thread_ctx->inode_imagic_map,
2675                                 &global_ctx->inode_imagic_map);
2676         if (retval)
2677                 return retval;
2678         retval = e2fsck_pass1_merge_bitmap(global_fs,
2679                                 &thread_ctx->inode_reg_map,
2680                                 &global_ctx->inode_reg_map);
2681         if (retval)
2682                 return retval;
2683         retval = e2fsck_pass1_merge_bitmap(global_fs,
2684                                 &thread_ctx->inodes_to_rebuild,
2685                                 &global_ctx->inodes_to_rebuild);
2686         if (retval)
2687                 return retval;
2688         retval = e2fsck_pass1_merge_bitmap(global_fs,
2689                                 &thread_ctx->block_found_map,
2690                                 &global_ctx->block_found_map);
2691         if (retval)
2692                 return retval;
2693         retval = e2fsck_pass1_merge_bitmap(global_fs,
2694                                 &thread_ctx->block_dup_map,
2695                                 &global_ctx->block_dup_map);
2696         if (retval)
2697                 return retval;
2698         retval = e2fsck_pass1_merge_bitmap(global_fs,
2699                                 &thread_ctx->block_ea_map,
2700                                 &global_ctx->block_ea_map);
2701         if (retval)
2702                 return retval;
2703         retval = e2fsck_pass1_merge_bitmap(global_fs,
2704                                 &thread_ctx->block_metadata_map,
2705                                 &global_ctx->block_metadata_map);
2706         if (retval)
2707                 return retval;
2708
2709         return 0;
2710 }
2711
2712 static int e2fsck_pass1_thread_join(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2713 {
2714         errcode_t       retval;
2715
2716         retval = e2fsck_pass1_thread_join_one(global_ctx, thread_ctx);
2717         ext2fs_free_mem(&thread_ctx->fs);
2718         if (thread_ctx->logf)
2719                 fclose(thread_ctx->logf);
2720         if (thread_ctx->problem_logf) {
2721                 fputs("</problem_log>\n", thread_ctx->problem_logf);
2722                 fclose(thread_ctx->problem_logf);
2723         }
2724         e2fsck_pass1_free_bitmap(&thread_ctx->inode_used_map);
2725         e2fsck_pass1_free_bitmap(&thread_ctx->inode_bad_map);
2726         e2fsck_pass1_free_bitmap(&thread_ctx->inode_dir_map);
2727         e2fsck_pass1_free_bitmap(&thread_ctx->inode_bb_map);
2728         e2fsck_pass1_free_bitmap(&thread_ctx->inode_imagic_map);
2729         e2fsck_pass1_free_bitmap(&thread_ctx->inode_reg_map);
2730         e2fsck_pass1_free_bitmap(&thread_ctx->inodes_to_rebuild);
2731         e2fsck_pass1_free_bitmap(&thread_ctx->block_found_map);
2732         e2fsck_pass1_free_bitmap(&thread_ctx->block_dup_map);
2733         e2fsck_pass1_free_bitmap(&thread_ctx->block_ea_map);
2734         e2fsck_pass1_free_bitmap(&thread_ctx->block_metadata_map);
2735         e2fsck_free_dir_info(thread_ctx);
2736         ext2fs_free_icount(thread_ctx->inode_count);
2737         ext2fs_free_icount(thread_ctx->inode_link_info);
2738         if (thread_ctx->dirs_to_hash)
2739                 ext2fs_badblocks_list_free(thread_ctx->dirs_to_hash);
2740         quota_release_context(&thread_ctx->qctx);
2741         ext2fs_free_mem(&thread_ctx);
2742
2743         return retval;
2744 }
2745
2746 static int e2fsck_pass1_threads_join(struct e2fsck_thread_info *infos,
2747                                       int num_threads, e2fsck_t global_ctx)
2748 {
2749         errcode_t                        rc;
2750         errcode_t                        ret = 0;
2751         int                              i;
2752         struct e2fsck_thread_info       *pinfo;
2753
2754         for (i = 0; i < num_threads; i++) {
2755                 pinfo = &infos[i];
2756
2757                 if (!pinfo->eti_started)
2758                         continue;
2759
2760                 rc = pthread_join(pinfo->eti_thread_id, NULL);
2761                 if (rc) {
2762                         com_err(global_ctx->program_name, rc,
2763                                 _("while joining thread\n"));
2764                         if (ret == 0)
2765                                 ret = rc;
2766                 }
2767                 rc = e2fsck_pass1_thread_join(global_ctx, infos[i].eti_thread_ctx);
2768                 if (rc) {
2769                         com_err(global_ctx->program_name, rc,
2770                                 _("while joining pass1 thread\n"));
2771                         if (ret == 0)
2772                                 ret = rc;
2773                 }
2774         }
2775         free(infos);
2776
2777         return ret;
2778 }
2779
2780 static void *e2fsck_pass1_thread(void *arg)
2781 {
2782         struct e2fsck_thread_info       *info = arg;
2783         e2fsck_t                         thread_ctx = info->eti_thread_ctx;
2784 #ifdef DEBUG_THREADS
2785         struct e2fsck_thread_debug      *thread_debug = info->eti_debug;
2786 #endif
2787
2788 #ifdef DEBUG_THREADS
2789         pthread_mutex_lock(&thread_debug->etd_mutex);
2790         while (info->eti_thread_index > thread_debug->etd_finished_threads) {
2791                 pthread_cond_wait(&thread_debug->etd_cond,
2792                                   &thread_debug->etd_mutex);
2793         }
2794         pthread_mutex_unlock(&thread_debug->etd_mutex);
2795 #endif
2796
2797 #ifdef HAVE_SETJMP_H
2798         /*
2799          * When fatal_error() happens, jump to here. The thread
2800          * context's flags will be saved, but its abort_loc will
2801          * be overwritten by original jump buffer for the later
2802          * tests.
2803          */
2804         if (setjmp(thread_ctx->abort_loc)) {
2805                 thread_ctx->flags &= ~E2F_FLAG_SETJMP_OK;
2806                 goto out;
2807         }
2808         thread_ctx->flags |= E2F_FLAG_SETJMP_OK;
2809 #endif
2810
2811         e2fsck_pass1_run(thread_ctx);
2812
2813 out:
2814         if (thread_ctx->options & E2F_OPT_MULTITHREAD)
2815                 log_out(thread_ctx,
2816                         _("Scanned group range [%lu, %lu), inodes %lu\n"),
2817                         thread_ctx->thread_info.et_group_start,
2818                         thread_ctx->thread_info.et_group_end,
2819                         thread_ctx->thread_info.et_inode_number);
2820
2821 #ifdef DEBUG_THREADS
2822         pthread_mutex_lock(&thread_debug->etd_mutex);
2823         thread_debug->etd_finished_threads++;
2824         pthread_cond_broadcast(&thread_debug->etd_cond);
2825         pthread_mutex_unlock(&thread_debug->etd_mutex);
2826 #endif
2827
2828         return NULL;
2829 }
2830
2831 static int e2fsck_pass1_threads_start(struct e2fsck_thread_info **pinfo,
2832                                       int num_threads, e2fsck_t global_ctx)
2833 {
2834         struct e2fsck_thread_info       *infos;
2835         pthread_attr_t                   attr;
2836         errcode_t                        retval;
2837         errcode_t                        ret;
2838         struct e2fsck_thread_info       *tmp_pinfo;
2839         int                              i;
2840         e2fsck_t                         thread_ctx;
2841 #ifdef DEBUG_THREADS
2842         struct e2fsck_thread_debug       thread_debug =
2843                 {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER, 0};
2844
2845         thread_debug.etd_finished_threads = 0;
2846 #endif
2847
2848         retval = pthread_attr_init(&attr);
2849         if (retval) {
2850                 com_err(global_ctx->program_name, retval,
2851                         _("while setting pthread attribute\n"));
2852                 return retval;
2853         }
2854
2855         infos = calloc(num_threads, sizeof(struct e2fsck_thread_info));
2856         if (infos == NULL) {
2857                 retval = -ENOMEM;
2858                 com_err(global_ctx->program_name, retval,
2859                         _("while allocating memory for threads\n"));
2860                 pthread_attr_destroy(&attr);
2861                 return retval;
2862         }
2863
2864         for (i = 0; i < num_threads; i++) {
2865                 tmp_pinfo = &infos[i];
2866                 tmp_pinfo->eti_thread_index = i;
2867 #ifdef DEBUG_THREADS
2868                 tmp_pinfo->eti_debug = &thread_debug;
2869 #endif
2870                 retval = e2fsck_pass1_thread_prepare(global_ctx, &thread_ctx,
2871                                                      i, num_threads);
2872                 if (retval) {
2873                         com_err(global_ctx->program_name, retval,
2874                                 _("while preparing pass1 thread\n"));
2875                         break;
2876                 }
2877                 tmp_pinfo->eti_thread_ctx = thread_ctx;
2878
2879                 retval = pthread_create(&tmp_pinfo->eti_thread_id, &attr,
2880                                         &e2fsck_pass1_thread, tmp_pinfo);
2881                 if (retval) {
2882                         com_err(global_ctx->program_name, retval,
2883                                 _("while creating thread\n"));
2884                         e2fsck_pass1_thread_join(global_ctx, thread_ctx);
2885                         break;
2886                 }
2887
2888                 tmp_pinfo->eti_started = 1;
2889         }
2890
2891         /* destroy the thread attribute object, since it is no longer needed */
2892         ret = pthread_attr_destroy(&attr);
2893         if (ret) {
2894                 com_err(global_ctx->program_name, ret,
2895                         _("while destroying thread attribute\n"));
2896                 if (retval == 0)
2897                         retval = ret;
2898         }
2899
2900         if (retval) {
2901                 e2fsck_pass1_threads_join(infos, num_threads, global_ctx);
2902                 return retval;
2903         }
2904         *pinfo = infos;
2905         return 0;
2906 }
2907
2908 static void e2fsck_pass1_multithread(e2fsck_t global_ctx)
2909 {
2910         struct e2fsck_thread_info       *infos = NULL;
2911         int                              num_threads = 1;
2912         errcode_t                        retval;
2913
2914         retval = e2fsck_pass1_threads_start(&infos, num_threads, global_ctx);
2915         if (retval) {
2916                 com_err(global_ctx->program_name, retval,
2917                         _("while starting pass1 threads\n"));
2918                 goto out_abort;
2919         }
2920
2921         retval = e2fsck_pass1_threads_join(infos, num_threads, global_ctx);
2922         if (retval) {
2923                 com_err(global_ctx->program_name, retval,
2924                         _("while joining pass1 threads\n"));
2925                 goto out_abort;
2926         }
2927         return;
2928 out_abort:
2929         global_ctx->flags |= E2F_FLAG_ABORT;
2930         return;
2931 }
2932 #endif
2933
2934 /* TODO: tdb needs to be handled properly for multiple threads*/
2935 static int multiple_threads_supported(e2fsck_t ctx)
2936 {
2937 #ifdef  CONFIG_TDB
2938         unsigned int            threshold;
2939         ext2_ino_t              num_dirs;
2940         errcode_t               retval;
2941         char                    *tdb_dir;
2942         int                     enable;
2943
2944         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
2945                            &tdb_dir);
2946         profile_get_uint(ctx->profile, "scratch_files",
2947                          "numdirs_threshold", 0, 0, &threshold);
2948         profile_get_boolean(ctx->profile, "scratch_files",
2949                             "icount", 0, 1, &enable);
2950
2951         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
2952         if (retval)
2953                 num_dirs = 1024;        /* Guess */
2954
2955         /* tdb is unsupported now */
2956         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
2957             (!threshold || num_dirs > threshold))
2958                 return 0;
2959  #endif
2960         return 1;
2961 }
2962
2963 void e2fsck_pass1(e2fsck_t ctx)
2964 {
2965
2966         init_ext2_max_sizes();
2967 #ifdef HAVE_PTHREAD
2968         if (multiple_threads_supported(ctx)) {
2969                 e2fsck_pass1_multithread(ctx);
2970                 return;
2971         }
2972         fprintf(stderr, "Fall through single thread for pass1 "
2973                         "because tdb could not handle properly\n");
2974 #endif
2975         e2fsck_pass1_run(ctx);
2976 }
2977
2978 #undef FINISH_INODE_LOOP
2979
2980 /*
2981  * When the inode_scan routines call this callback at the end of the
2982  * glock group, call process_inodes.
2983  */
2984 static errcode_t scan_callback(ext2_filsys fs,
2985                                ext2_inode_scan scan EXT2FS_ATTR((unused)),
2986                                dgrp_t group, void * priv_data)
2987 {
2988         struct scan_callback_struct *scan_struct;
2989         e2fsck_t ctx;
2990         struct e2fsck_thread *tinfo;
2991
2992         scan_struct = (struct scan_callback_struct *) priv_data;
2993         ctx = scan_struct->ctx;
2994
2995         process_inodes((e2fsck_t) fs->priv_data, scan_struct->block_buf,
2996                        scan_struct->inodes_to_process,
2997                        scan_struct->process_inode_count);
2998
2999         if (ctx->progress)
3000                 if ((ctx->progress)(ctx, 1, group+1,
3001                                     ctx->fs->group_desc_count))
3002                         return EXT2_ET_CANCEL_REQUESTED;
3003
3004 #ifdef HAVE_PTHREAD
3005         if (ctx->global_ctx) {
3006                 tinfo = &ctx->thread_info;
3007                 tinfo->et_group_next++;
3008                 if (ctx->options & E2F_OPT_DEBUG &&
3009                     ctx->options & E2F_OPT_MULTITHREAD)
3010                         log_out(ctx, _("group %d finished\n"),
3011                                 tinfo->et_group_next);
3012                 if (tinfo->et_group_next >= tinfo->et_group_end)
3013                         return EXT2_ET_SCAN_FINISHED;
3014         }
3015 #endif
3016
3017         return 0;
3018 }
3019
3020 /*
3021  * Process the inodes in the "inodes to process" list.
3022  */
3023 static void process_inodes(e2fsck_t ctx, char *block_buf,
3024                            struct process_inode_block *inodes_to_process,
3025                            int *process_inode_count)
3026 {
3027         int                     i;
3028         struct ext2_inode       *old_stashed_inode;
3029         ext2_ino_t              old_stashed_ino;
3030         const char              *old_operation;
3031         char                    buf[80];
3032         struct problem_context  pctx;
3033
3034 #if 0
3035         printf("begin process_inodes: ");
3036 #endif
3037         if (*process_inode_count == 0)
3038                 return;
3039         old_operation = ehandler_operation(0);
3040         old_stashed_inode = ctx->stashed_inode;
3041         old_stashed_ino = ctx->stashed_ino;
3042         qsort(inodes_to_process, *process_inode_count,
3043                       sizeof(struct process_inode_block), process_inode_cmp);
3044         clear_problem_context(&pctx);
3045         for (i=0; i < *process_inode_count; i++) {
3046                 pctx.inode = ctx->stashed_inode =
3047                         (struct ext2_inode *) &inodes_to_process[i].inode;
3048                 pctx.ino = ctx->stashed_ino = inodes_to_process[i].ino;
3049
3050 #if 0
3051                 printf("%u ", pctx.ino);
3052 #endif
3053                 sprintf(buf, _("reading indirect blocks of inode %u"),
3054                         pctx.ino);
3055                 ehandler_operation(buf);
3056                 check_blocks(ctx, &pctx, block_buf,
3057                              &inodes_to_process[i].ea_ibody_quota);
3058                 if (e2fsck_should_abort(ctx))
3059                         break;
3060         }
3061         ctx->stashed_inode = old_stashed_inode;
3062         ctx->stashed_ino = old_stashed_ino;
3063         *process_inode_count = 0;
3064 #if 0
3065         printf("end process inodes\n");
3066 #endif
3067         ehandler_operation(old_operation);
3068 }
3069
3070 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b)
3071 {
3072         const struct process_inode_block *ib_a =
3073                 (const struct process_inode_block *) a;
3074         const struct process_inode_block *ib_b =
3075                 (const struct process_inode_block *) b;
3076         int     ret;
3077
3078         ret = (ib_a->inode.i_block[EXT2_IND_BLOCK] -
3079                ib_b->inode.i_block[EXT2_IND_BLOCK]);
3080         if (ret == 0)
3081                 /*
3082                  * We only call process_inodes() for non-extent
3083                  * inodes, so it's OK to pass NULL to
3084                  * ext2fs_file_acl_block() here.
3085                  */
3086                 ret = ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_a->inode)) -
3087                         ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_b->inode));
3088         if (ret == 0)
3089                 ret = ib_a->ino - ib_b->ino;
3090         return ret;
3091 }
3092
3093 /*
3094  * Mark an inode as being bad in some what
3095  */
3096 static void mark_inode_bad(e2fsck_t ctx, ino_t ino)
3097 {
3098         struct          problem_context pctx;
3099
3100         if (!ctx->inode_bad_map) {
3101                 clear_problem_context(&pctx);
3102
3103                 pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3104                                 _("bad inode map"), EXT2FS_BMAP64_RBTREE,
3105                                 "inode_bad_map", &ctx->inode_bad_map);
3106                 if (pctx.errcode) {
3107                         pctx.num = 3;
3108                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3109                         /* Should never get here */
3110                         ctx->flags |= E2F_FLAG_ABORT;
3111                         return;
3112                 }
3113         }
3114         ext2fs_mark_inode_bitmap2(ctx->inode_bad_map, ino);
3115 }
3116
3117 static void add_casefolded_dir(e2fsck_t ctx, ino_t ino)
3118 {
3119         struct          problem_context pctx;
3120
3121         if (!ctx->casefolded_dirs) {
3122                 pctx.errcode = ext2fs_u32_list_create(&ctx->casefolded_dirs, 0);
3123                 if (pctx.errcode)
3124                         goto error;
3125         }
3126         pctx.errcode = ext2fs_u32_list_add(ctx->casefolded_dirs, ino);
3127         if (pctx.errcode == 0)
3128                 return;
3129 error:
3130         fix_problem(ctx, PR_1_ALLOCATE_CASEFOLDED_DIRLIST, &pctx);
3131         /* Should never get here */
3132         ctx->flags |= E2F_FLAG_ABORT;
3133 }
3134
3135 /*
3136  * This procedure will allocate the inode "bb" (badblock) map table
3137  */
3138 static void alloc_bb_map(e2fsck_t ctx)
3139 {
3140         struct          problem_context pctx;
3141
3142         clear_problem_context(&pctx);
3143         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3144                         _("inode in bad block map"), EXT2FS_BMAP64_RBTREE,
3145                         "inode_bb_map", &ctx->inode_bb_map);
3146         if (pctx.errcode) {
3147                 pctx.num = 4;
3148                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3149                 /* Should never get here */
3150                 ctx->flags |= E2F_FLAG_ABORT;
3151                 return;
3152         }
3153 }
3154
3155 /*
3156  * This procedure will allocate the inode imagic table
3157  */
3158 static void alloc_imagic_map(e2fsck_t ctx)
3159 {
3160         struct          problem_context pctx;
3161
3162         clear_problem_context(&pctx);
3163         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3164                         _("imagic inode map"), EXT2FS_BMAP64_RBTREE,
3165                         "inode_imagic_map", &ctx->inode_imagic_map);
3166         if (pctx.errcode) {
3167                 pctx.num = 5;
3168                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3169                 /* Should never get here */
3170                 ctx->flags |= E2F_FLAG_ABORT;
3171                 return;
3172         }
3173 }
3174
3175 /*
3176  * Marks a block as in use, setting the dup_map if it's been set
3177  * already.  Called by process_block and process_bad_block.
3178  *
3179  * WARNING: Assumes checks have already been done to make sure block
3180  * is valid.  This is true in both process_block and process_bad_block.
3181  */
3182 static _INLINE_ void mark_block_used(e2fsck_t ctx, blk64_t block)
3183 {
3184         struct          problem_context pctx;
3185
3186         clear_problem_context(&pctx);
3187
3188         if (ext2fs_fast_test_block_bitmap2(ctx->block_found_map, block)) {
3189                 if (ext2fs_has_feature_shared_blocks(ctx->fs->super) &&
3190                     !(ctx->options & E2F_OPT_UNSHARE_BLOCKS)) {
3191                         return;
3192                 }
3193                 if (!ctx->block_dup_map) {
3194                         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
3195                                         _("multiply claimed block map"),
3196                                         EXT2FS_BMAP64_RBTREE, "block_dup_map",
3197                                         &ctx->block_dup_map);
3198                         if (pctx.errcode) {
3199                                 pctx.num = 3;
3200                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR,
3201                                             &pctx);
3202                                 /* Should never get here */
3203                                 ctx->flags |= E2F_FLAG_ABORT;
3204                                 return;
3205                         }
3206                 }
3207                 ext2fs_fast_mark_block_bitmap2(ctx->block_dup_map, block);
3208         } else {
3209                 ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, block);
3210         }
3211 }
3212
3213 /*
3214  * When cluster size is greater than one block, it is caller's responsibility
3215  * to make sure block parameter starts at a cluster boundary.
3216  */
3217 static _INLINE_ void mark_blocks_used(e2fsck_t ctx, blk64_t block,
3218                                       unsigned int num)
3219 {
3220         if (ext2fs_test_block_bitmap_range2(ctx->block_found_map, block, num))
3221                 ext2fs_mark_block_bitmap_range2(ctx->block_found_map, block, num);
3222         else {
3223                 unsigned int i;
3224
3225                 for (i = 0; i < num; i += EXT2FS_CLUSTER_RATIO(ctx->fs))
3226                         mark_block_used(ctx, block + i);
3227         }
3228 }
3229
3230 /*
3231  * Adjust the extended attribute block's reference counts at the end
3232  * of pass 1, either by subtracting out references for EA blocks that
3233  * are still referenced in ctx->refcount, or by adding references for
3234  * EA blocks that had extra references as accounted for in
3235  * ctx->refcount_extra.
3236  */
3237 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
3238                                     char *block_buf, int adjust_sign)
3239 {
3240         struct ext2_ext_attr_header     *header;
3241         struct problem_context          pctx;
3242         ext2_filsys                     fs = ctx->fs;
3243         blk64_t                         blk;
3244         __u32                           should_be;
3245         ea_value_t                      count;
3246
3247         clear_problem_context(&pctx);
3248
3249         ea_refcount_intr_begin(refcount);
3250         while (1) {
3251                 if ((blk = ea_refcount_intr_next(refcount, &count)) == 0)
3252                         break;
3253                 pctx.blk = blk;
3254                 pctx.errcode = ext2fs_read_ext_attr3(fs, blk, block_buf,
3255                                                      pctx.ino);
3256                 if (pctx.errcode) {
3257                         fix_problem(ctx, PR_1_EXTATTR_READ_ABORT, &pctx);
3258                         return;
3259                 }
3260                 header = (struct ext2_ext_attr_header *) block_buf;
3261                 pctx.blkcount = header->h_refcount;
3262                 should_be = header->h_refcount + adjust_sign * (int)count;
3263                 pctx.num = should_be;
3264                 if (fix_problem(ctx, PR_1_EXTATTR_REFCOUNT, &pctx)) {
3265                         header->h_refcount = should_be;
3266                         pctx.errcode = ext2fs_write_ext_attr3(fs, blk,
3267                                                              block_buf,
3268                                                              pctx.ino);
3269                         if (pctx.errcode) {
3270                                 fix_problem(ctx, PR_1_EXTATTR_WRITE_ABORT,
3271                                             &pctx);
3272                                 continue;
3273                         }
3274                 }
3275         }
3276 }
3277
3278 /*
3279  * Handle processing the extended attribute blocks
3280  */
3281 static int check_ext_attr(e2fsck_t ctx, struct problem_context *pctx,
3282                            char *block_buf, struct ea_quota *ea_block_quota)
3283 {
3284         ext2_filsys fs = ctx->fs;
3285         ext2_ino_t      ino = pctx->ino;
3286         struct ext2_inode *inode = pctx->inode;
3287         blk64_t         blk;
3288         char *          end;
3289         struct ext2_ext_attr_header *header;
3290         struct ext2_ext_attr_entry *first, *entry;
3291         blk64_t         quota_blocks = EXT2FS_C2B(fs, 1);
3292         __u64           quota_inodes = 0;
3293         region_t        region = 0;
3294         int             failed_csum = 0;
3295
3296         ea_block_quota->blocks = 0;
3297         ea_block_quota->inodes = 0;
3298
3299         blk = ext2fs_file_acl_block(fs, inode);
3300         if (blk == 0)
3301                 return 0;
3302
3303         /*
3304          * If the Extended attribute flag isn't set, then a non-zero
3305          * file acl means that the inode is corrupted.
3306          *
3307          * Or if the extended attribute block is an invalid block,
3308          * then the inode is also corrupted.
3309          */
3310         if (!ext2fs_has_feature_xattr(fs->super) ||
3311             (blk < fs->super->s_first_data_block) ||
3312             (blk >= ext2fs_blocks_count(fs->super))) {
3313                 mark_inode_bad(ctx, ino);
3314                 return 0;
3315         }
3316
3317         /* If ea bitmap hasn't been allocated, create it */
3318         if (!ctx->block_ea_map) {
3319                 pctx->errcode = e2fsck_allocate_block_bitmap(fs,
3320                                         _("ext attr block map"),
3321                                         EXT2FS_BMAP64_RBTREE, "block_ea_map",
3322                                         &ctx->block_ea_map);
3323                 if (pctx->errcode) {
3324                         pctx->num = 2;
3325                         fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, pctx);
3326                         ctx->flags |= E2F_FLAG_ABORT;
3327                         return 0;
3328                 }
3329         }
3330
3331         /* Create the EA refcount structure if necessary */
3332         if (!ctx->refcount) {
3333                 pctx->errcode = ea_refcount_create(0, &ctx->refcount);
3334                 if (pctx->errcode) {
3335                         pctx->num = 1;
3336                         fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3337                         ctx->flags |= E2F_FLAG_ABORT;
3338                         return 0;
3339                 }
3340         }
3341
3342 #if 0
3343         /* Debugging text */
3344         printf("Inode %u has EA block %u\n", ino, blk);
3345 #endif
3346
3347         /* Have we seen this EA block before? */
3348         if (ext2fs_fast_test_block_bitmap2(ctx->block_ea_map, blk)) {
3349                 ea_block_quota->blocks = EXT2FS_C2B(fs, 1);
3350                 ea_block_quota->inodes = 0;
3351
3352                 if (ctx->ea_block_quota_blocks) {
3353                         ea_refcount_fetch(ctx->ea_block_quota_blocks, blk,
3354                                           &quota_blocks);
3355                         if (quota_blocks)
3356                                 ea_block_quota->blocks = quota_blocks;
3357                 }
3358
3359                 if (ctx->ea_block_quota_inodes)
3360                         ea_refcount_fetch(ctx->ea_block_quota_inodes, blk,
3361                                           &ea_block_quota->inodes);
3362
3363                 if (ea_refcount_decrement(ctx->refcount, blk, 0) == 0)
3364                         return 1;
3365                 /* Ooops, this EA was referenced more than it stated */
3366                 if (!ctx->refcount_extra) {
3367                         pctx->errcode = ea_refcount_create(0,
3368                                            &ctx->refcount_extra);
3369                         if (pctx->errcode) {
3370                                 pctx->num = 2;
3371                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3372                                 ctx->flags |= E2F_FLAG_ABORT;
3373                                 return 0;
3374                         }
3375                 }
3376                 ea_refcount_increment(ctx->refcount_extra, blk, 0);
3377                 return 1;
3378         }
3379
3380         /*
3381          * OK, we haven't seen this EA block yet.  So we need to
3382          * validate it
3383          */
3384         pctx->blk = blk;
3385         pctx->errcode = ext2fs_read_ext_attr3(fs, blk, block_buf, pctx->ino);
3386         if (pctx->errcode == EXT2_ET_EXT_ATTR_CSUM_INVALID) {
3387                 pctx->errcode = 0;
3388                 failed_csum = 1;
3389         } else if (pctx->errcode == EXT2_ET_BAD_EA_HEADER)
3390                 pctx->errcode = 0;
3391
3392         if (pctx->errcode &&
3393             fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx)) {
3394                 pctx->errcode = 0;
3395                 goto clear_extattr;
3396         }
3397         header = (struct ext2_ext_attr_header *) block_buf;
3398         pctx->blk = ext2fs_file_acl_block(fs, inode);
3399         if (((ctx->ext_attr_ver == 1) &&
3400              (header->h_magic != EXT2_EXT_ATTR_MAGIC_v1)) ||
3401             ((ctx->ext_attr_ver == 2) &&
3402              (header->h_magic != EXT2_EXT_ATTR_MAGIC))) {
3403                 if (fix_problem(ctx, PR_1_BAD_EA_BLOCK, pctx))
3404                         goto clear_extattr;
3405         }
3406
3407         if (header->h_blocks != 1) {
3408                 if (fix_problem(ctx, PR_1_EA_MULTI_BLOCK, pctx))
3409                         goto clear_extattr;
3410         }
3411
3412         if (pctx->errcode && fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx))
3413                 goto clear_extattr;
3414
3415         region = region_create(0, fs->blocksize);
3416         if (!region) {
3417                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
3418                 ctx->flags |= E2F_FLAG_ABORT;
3419                 return 0;
3420         }
3421         if (region_allocate(region, 0, sizeof(struct ext2_ext_attr_header))) {
3422                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3423                         goto clear_extattr;
3424         }
3425
3426         first = (struct ext2_ext_attr_entry *)(header+1);
3427         end = block_buf + fs->blocksize;
3428         entry = first;
3429         while ((char *)entry < end && *(__u32 *)entry) {
3430                 __u32 hash;
3431
3432                 if (region_allocate(region, (char *)entry - (char *)header,
3433                                    EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
3434                         if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3435                                 goto clear_extattr;
3436                         break;
3437                 }
3438                 if ((ctx->ext_attr_ver == 1 &&
3439                      (entry->e_name_len == 0 || entry->e_name_index != 0)) ||
3440                     (ctx->ext_attr_ver == 2 &&
3441                      entry->e_name_index == 0)) {
3442                         if (fix_problem(ctx, PR_1_EA_BAD_NAME, pctx))
3443                                 goto clear_extattr;
3444                         break;
3445                 }
3446                 if (entry->e_value_inum == 0) {
3447                         if (entry->e_value_size > EXT2_XATTR_SIZE_MAX ||
3448                             (entry->e_value_offs + entry->e_value_size >
3449                              fs->blocksize)) {
3450                                 if (fix_problem(ctx, PR_1_EA_BAD_VALUE, pctx))
3451                                         goto clear_extattr;
3452                                 break;
3453                         }
3454                         if (entry->e_value_size &&
3455                             region_allocate(region, entry->e_value_offs,
3456                                             EXT2_EXT_ATTR_SIZE(entry->e_value_size))) {
3457                                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION,
3458                                                 pctx))
3459                                         goto clear_extattr;
3460                         }
3461
3462                         hash = ext2fs_ext_attr_hash_entry(entry, block_buf +
3463                                                           entry->e_value_offs);
3464
3465                         if (entry->e_hash != hash) {
3466                                 pctx->num = entry->e_hash;
3467                                 if (fix_problem(ctx, PR_1_ATTR_HASH, pctx))
3468                                         goto clear_extattr;
3469                                 entry->e_hash = hash;
3470                         }
3471                 } else {
3472                         problem_t problem;
3473                         blk64_t entry_quota_blocks;
3474
3475                         problem = check_large_ea_inode(ctx, entry, pctx,
3476                                                        &entry_quota_blocks);
3477                         if (problem && fix_problem(ctx, problem, pctx))
3478                                 goto clear_extattr;
3479
3480                         quota_blocks += entry_quota_blocks;
3481                         quota_inodes++;
3482                 }
3483
3484                 entry = EXT2_EXT_ATTR_NEXT(entry);
3485         }
3486         if (region_allocate(region, (char *)entry - (char *)header, 4)) {
3487                 if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
3488                         goto clear_extattr;
3489         }
3490         region_free(region);
3491
3492         /*
3493          * We only get here if there was no other errors that were fixed.
3494          * If there was a checksum fail, ask to correct it.
3495          */
3496         if (failed_csum &&
3497             fix_problem(ctx, PR_1_EA_BLOCK_ONLY_CSUM_INVALID, pctx)) {
3498                 pctx->errcode = ext2fs_write_ext_attr3(fs, blk, block_buf,
3499                                                        pctx->ino);
3500                 if (pctx->errcode)
3501                         return 0;
3502         }
3503
3504         if (quota_blocks != EXT2FS_C2B(fs, 1U)) {
3505                 if (!ctx->ea_block_quota_blocks) {
3506                         pctx->errcode = ea_refcount_create(0,
3507                                                 &ctx->ea_block_quota_blocks);
3508                         if (pctx->errcode) {
3509                                 pctx->num = 3;
3510                                 goto refcount_fail;
3511                         }
3512                 }
3513                 ea_refcount_store(ctx->ea_block_quota_blocks, blk,
3514                                   quota_blocks);
3515         }
3516
3517         if (quota_inodes) {
3518                 if (!ctx->ea_block_quota_inodes) {
3519                         pctx->errcode = ea_refcount_create(0,
3520                                                 &ctx->ea_block_quota_inodes);
3521                         if (pctx->errcode) {
3522                                 pctx->num = 4;
3523 refcount_fail:
3524                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
3525                                 ctx->flags |= E2F_FLAG_ABORT;
3526                                 return 0;
3527                         }
3528                 }
3529
3530                 ea_refcount_store(ctx->ea_block_quota_inodes, blk,
3531                                   quota_inodes);
3532         }
3533         ea_block_quota->blocks = quota_blocks;
3534         ea_block_quota->inodes = quota_inodes;
3535
3536         inc_ea_inode_refs(ctx, pctx, first, end);
3537         ea_refcount_store(ctx->refcount, blk, header->h_refcount - 1);
3538         mark_block_used(ctx, blk);
3539         ext2fs_fast_mark_block_bitmap2(ctx->block_ea_map, blk);
3540         return 1;
3541
3542 clear_extattr:
3543         if (region)
3544                 region_free(region);
3545         ext2fs_file_acl_block_set(fs, inode, 0);
3546         e2fsck_write_inode(ctx, ino, inode, "check_ext_attr");
3547         return 0;
3548 }
3549
3550 /* Returns 1 if bad htree, 0 if OK */
3551 static int handle_htree(e2fsck_t ctx, struct problem_context *pctx,
3552                         ext2_ino_t ino, struct ext2_inode *inode,
3553                         char *block_buf)
3554 {
3555         struct ext2_dx_root_info        *root;
3556         ext2_filsys                     fs = ctx->fs;
3557         errcode_t                       retval;
3558         blk64_t                         blk;
3559
3560         if ((!LINUX_S_ISDIR(inode->i_mode) &&
3561              fix_problem(ctx, PR_1_HTREE_NODIR, pctx)) ||
3562             (!ext2fs_has_feature_dir_index(fs->super) &&
3563              fix_problem(ctx, PR_1_HTREE_SET, pctx)))
3564                 return 1;
3565
3566         pctx->errcode = ext2fs_bmap2(fs, ino, inode, 0, 0, 0, 0, &blk);
3567
3568         if ((pctx->errcode) ||
3569             (blk == 0) ||
3570             (blk < fs->super->s_first_data_block) ||
3571             (blk >= ext2fs_blocks_count(fs->super))) {
3572                 if (fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3573                         return 1;
3574                 else
3575                         return 0;
3576         }
3577
3578         retval = io_channel_read_blk64(fs->io, blk, 1, block_buf);
3579         if (retval && fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3580                 return 1;
3581
3582         /* XXX should check that beginning matches a directory */
3583         root = (struct ext2_dx_root_info *) (block_buf + 24);
3584
3585         if ((root->reserved_zero || root->info_length < 8) &&
3586             fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
3587                 return 1;
3588
3589         pctx->num = root->hash_version;
3590         if ((root->hash_version != EXT2_HASH_LEGACY) &&
3591             (root->hash_version != EXT2_HASH_HALF_MD4) &&
3592             (root->hash_version != EXT2_HASH_TEA) &&
3593             (root->hash_version != EXT2_HASH_SIPHASH) &&
3594             fix_problem(ctx, PR_1_HTREE_HASHV, pctx))
3595                 return 1;
3596
3597         if (ext4_hash_in_dirent(inode)) {
3598                 if (root->hash_version != EXT2_HASH_SIPHASH &&
3599                     fix_problem(ctx, PR_1_HTREE_NEEDS_SIPHASH, pctx))
3600                         return 1;
3601         } else {
3602                 if (root->hash_version == EXT2_HASH_SIPHASH &&
3603                    fix_problem(ctx, PR_1_HTREE_CANNOT_SIPHASH, pctx))
3604                         return 1;
3605         }
3606
3607         if ((root->unused_flags & EXT2_HASH_FLAG_INCOMPAT) &&
3608             fix_problem(ctx, PR_1_HTREE_INCOMPAT, pctx))
3609                 return 1;
3610
3611         pctx->num = root->indirect_levels;
3612         /* if htree level is clearly too high, consider it to be broken */
3613         if (root->indirect_levels > EXT4_HTREE_LEVEL &&
3614             fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
3615                 return 1;
3616
3617         /* if level is only maybe too high, LARGE_DIR feature could be unset */
3618         if (root->indirect_levels > ext2_dir_htree_level(fs) &&
3619             !ext2fs_has_feature_largedir(fs->super)) {
3620                 int blockbits = EXT2_BLOCK_SIZE_BITS(fs->super) + 10;
3621                 unsigned idx_pb = 1 << (blockbits - 3);
3622
3623                 /* compare inode size/blocks vs. max-sized 2-level htree */
3624                 if (EXT2_I_SIZE(pctx->inode) <
3625                     (idx_pb - 1) * (idx_pb - 2) << blockbits &&
3626                     pctx->inode->i_blocks <
3627                     (idx_pb - 1) * (idx_pb - 2) << (blockbits - 9) &&
3628                     fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
3629                         return 1;
3630         }
3631
3632         if (root->indirect_levels > EXT4_HTREE_LEVEL_COMPAT ||
3633             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
3634                 ctx->large_dirs++;
3635
3636         return 0;
3637 }
3638
3639 void e2fsck_clear_inode(e2fsck_t ctx, ext2_ino_t ino,
3640                         struct ext2_inode *inode, int restart_flag,
3641                         const char *source)
3642 {
3643         inode->i_flags = 0;
3644         inode->i_links_count = 0;
3645         ext2fs_icount_store(ctx->inode_link_info, ino, 0);
3646         inode->i_dtime = ctx->now;
3647
3648         /*
3649          * If a special inode has such rotten block mappings that we
3650          * want to clear the whole inode, be sure to actually zap
3651          * the block maps because i_links_count isn't checked for
3652          * special inodes, and we'll end up right back here the next
3653          * time we run fsck.
3654          */
3655         if (ino < EXT2_FIRST_INODE(ctx->fs->super))
3656                 memset(inode->i_block, 0, sizeof(inode->i_block));
3657
3658         ext2fs_unmark_inode_bitmap2(ctx->inode_dir_map, ino);
3659         ext2fs_unmark_inode_bitmap2(ctx->inode_used_map, ino);
3660         if (ctx->inode_reg_map)
3661                 ext2fs_unmark_inode_bitmap2(ctx->inode_reg_map, ino);
3662         if (ctx->inode_bad_map)
3663                 ext2fs_unmark_inode_bitmap2(ctx->inode_bad_map, ino);
3664
3665         /*
3666          * If the inode was partially accounted for before processing
3667          * was aborted, we need to restart the pass 1 scan.
3668          */
3669         ctx->flags |= restart_flag;
3670
3671         if (ino == EXT2_BAD_INO)
3672                 memset(inode, 0, sizeof(struct ext2_inode));
3673
3674         e2fsck_write_inode(ctx, ino, inode, source);
3675 }
3676
3677 /*
3678  * Use the multiple-blocks reclamation code to fix alignment problems in
3679  * a bigalloc filesystem.  We want a logical cluster to map to *only* one
3680  * physical cluster, and we want the block offsets within that cluster to
3681  * line up.
3682  */
3683 static int has_unaligned_cluster_map(e2fsck_t ctx,
3684                                      blk64_t last_pblk, blk64_t last_lblk,
3685                                      blk64_t pblk, blk64_t lblk)
3686 {
3687         blk64_t cluster_mask;
3688
3689         if (!ctx->fs->cluster_ratio_bits)
3690                 return 0;
3691         cluster_mask = EXT2FS_CLUSTER_MASK(ctx->fs);
3692
3693         /*
3694          * If the block in the logical cluster doesn't align with the block in
3695          * the physical cluster...
3696          */
3697         if ((lblk & cluster_mask) != (pblk & cluster_mask))
3698                 return 1;
3699
3700         /*
3701          * If we cross a physical cluster boundary within a logical cluster...
3702          */
3703         if (last_pblk && (lblk & cluster_mask) != 0 &&
3704             EXT2FS_B2C(ctx->fs, lblk) == EXT2FS_B2C(ctx->fs, last_lblk) &&
3705             EXT2FS_B2C(ctx->fs, pblk) != EXT2FS_B2C(ctx->fs, last_pblk))
3706                 return 1;
3707
3708         return 0;
3709 }
3710
3711 static void scan_extent_node(e2fsck_t ctx, struct problem_context *pctx,
3712                              struct process_block_struct *pb,
3713                              blk64_t start_block, blk64_t end_block,
3714                              blk64_t eof_block,
3715                              ext2_extent_handle_t ehandle,
3716                              int try_repairs)
3717 {
3718         struct ext2fs_extent    extent;
3719         blk64_t                 blk, last_lblk;
3720         unsigned int            i, n;
3721         int                     is_dir, is_leaf;
3722         problem_t               problem;
3723         struct ext2_extent_info info;
3724         int                     failed_csum = 0;
3725
3726         if (pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID)
3727                 failed_csum = 1;
3728
3729         pctx->errcode = ext2fs_extent_get_info(ehandle, &info);
3730         if (pctx->errcode)
3731                 return;
3732         if (!(ctx->options & E2F_OPT_FIXES_ONLY) &&
3733             !pb->eti.force_rebuild &&
3734             info.curr_level < MAX_EXTENT_DEPTH_COUNT) {
3735                 struct extent_tree_level *etl;
3736
3737                 etl = pb->eti.ext_info + info.curr_level;
3738                 etl->num_extents += info.num_entries;
3739                 etl->max_extents += info.max_entries;
3740                 /*
3741                  * Implementation wart: Splitting extent blocks when appending
3742                  * will leave the old block with one free entry.  Therefore
3743                  * unless the node is totally full, pretend that a non-root
3744                  * extent block can hold one fewer entry than it actually does,
3745                  * so that we don't repeatedly rebuild the extent tree.
3746                  */
3747                 if (info.curr_level && info.num_entries < info.max_entries)
3748                         etl->max_extents--;
3749         }
3750
3751         pctx->errcode = ext2fs_extent_get(ehandle, EXT2_EXTENT_FIRST_SIB,
3752                                           &extent);
3753         while ((pctx->errcode == 0 ||
3754                 pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID) &&
3755                info.num_entries-- > 0) {
3756                 is_leaf = extent.e_flags & EXT2_EXTENT_FLAGS_LEAF;
3757                 is_dir = LINUX_S_ISDIR(pctx->inode->i_mode);
3758                 last_lblk = extent.e_lblk + extent.e_len - 1;
3759
3760                 problem = 0;
3761                 pctx->blk = extent.e_pblk;
3762                 pctx->blk2 = extent.e_lblk;
3763                 pctx->num = extent.e_len;
3764                 pctx->blkcount = extent.e_lblk + extent.e_len;
3765
3766                 if (extent.e_pblk == 0 ||
3767                     extent.e_pblk < ctx->fs->super->s_first_data_block ||
3768                     extent.e_pblk >= ext2fs_blocks_count(ctx->fs->super))
3769                         problem = PR_1_EXTENT_BAD_START_BLK;
3770                 else if (extent.e_lblk < start_block)
3771                         problem = PR_1_OUT_OF_ORDER_EXTENTS;
3772                 else if ((end_block && last_lblk > end_block) &&
3773                          !(last_lblk > eof_block &&
3774                            ((extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) ||
3775                             (pctx->inode->i_flags & EXT4_VERITY_FL))))
3776                         problem = PR_1_EXTENT_END_OUT_OF_BOUNDS;
3777                 else if (is_leaf && extent.e_len == 0)
3778                         problem = PR_1_EXTENT_LENGTH_ZERO;
3779                 else if (is_leaf &&
3780                          (extent.e_pblk + extent.e_len) >
3781                          ext2fs_blocks_count(ctx->fs->super))
3782                         problem = PR_1_EXTENT_ENDS_BEYOND;
3783                 else if (is_leaf && is_dir && !pctx->inode->i_size_high &&
3784                          !ext2fs_has_feature_largedir(ctx->fs->super) &&
3785                          ((extent.e_lblk + extent.e_len) >
3786                           (1U << (21 - ctx->fs->super->s_log_block_size))))
3787                         problem = PR_1_TOOBIG_DIR;
3788
3789                 if (is_leaf && problem == 0 && extent.e_len > 0) {
3790 #if 0
3791                         printf("extent_region(ino=%u, expect=%llu, "
3792                                "lblk=%llu, len=%u)\n", pb->ino,
3793                                (unsigned long long) pb->next_lblock,
3794                                (unsigned long long) extent.e_lblk,
3795                                extent.e_len);
3796 #endif
3797                         if (extent.e_lblk < pb->next_lblock)
3798                                 problem = PR_1_EXTENT_COLLISION;
3799                         else if (extent.e_lblk + extent.e_len > pb->next_lblock)
3800                                 pb->next_lblock = extent.e_lblk + extent.e_len;
3801                 }
3802
3803                 /*
3804                  * Uninitialized blocks in a directory?  Clear the flag and
3805                  * we'll interpret the blocks later.
3806                  */
3807                 if (try_repairs && is_dir && problem == 0 &&
3808                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3809                     fix_problem(ctx, PR_1_UNINIT_DBLOCK, pctx)) {
3810                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3811                         pb->inode_modified = 1;
3812                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3813                                                               &extent);
3814                         if (pctx->errcode)
3815                                 return;
3816                         failed_csum = 0;
3817                 }
3818 #ifdef CONFIG_DEVELOPER_FEATURES
3819                 if (try_repairs && !is_dir && problem == 0 &&
3820                     (ctx->options & E2F_OPT_CLEAR_UNINIT) &&
3821                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
3822                     fix_problem(ctx, PR_1_CLEAR_UNINIT_EXTENT, pctx)) {
3823                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
3824                         pb->inode_modified = 1;
3825                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
3826                                                               &extent);
3827                         if (pctx->errcode)
3828                                 return;
3829                         failed_csum = 0;
3830                 }
3831 #endif
3832                 if (try_repairs && problem) {
3833 report_problem:
3834                         if (fix_problem(ctx, problem, pctx)) {
3835                                 if (ctx->invalid_bitmaps) {
3836                                         /*
3837                                          * If fsck knows the bitmaps are bad,
3838                                          * skip to the next extent and
3839                                          * try to clear this extent again
3840                                          * after fixing the bitmaps, by
3841                                          * restarting fsck.
3842                                          */
3843                                         pctx->errcode = ext2fs_extent_get(
3844                                                           ehandle,
3845                                                           EXT2_EXTENT_NEXT_SIB,
3846                                                           &extent);
3847                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3848                                         if (pctx->errcode ==
3849                                                     EXT2_ET_NO_CURRENT_NODE) {
3850                                                 pctx->errcode = 0;
3851                                                 break;
3852                                         }
3853                                         continue;
3854                                 }
3855                                 e2fsck_read_bitmaps(ctx);
3856                                 pb->inode_modified = 1;
3857                                 pctx->errcode =
3858                                         ext2fs_extent_delete(ehandle, 0);
3859                                 if (pctx->errcode) {
3860                                         pctx->str = "ext2fs_extent_delete";
3861                                         return;
3862                                 }
3863                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
3864                                 if (pctx->errcode &&
3865                                     pctx->errcode != EXT2_ET_NO_CURRENT_NODE) {
3866                                         pctx->str = "ext2fs_extent_fix_parents";
3867                                         return;
3868                                 }
3869                                 pctx->errcode = ext2fs_extent_get(ehandle,
3870                                                                   EXT2_EXTENT_CURRENT,
3871                                                                   &extent);
3872                                 if (pctx->errcode == EXT2_ET_NO_CURRENT_NODE) {
3873                                         pctx->errcode = 0;
3874                                         break;
3875                                 }
3876                                 failed_csum = 0;
3877                                 continue;
3878                         }
3879                         goto next;
3880                 }
3881
3882                 if (!is_leaf) {
3883                         blk64_t lblk = extent.e_lblk;
3884                         int next_try_repairs = 1;
3885
3886                         blk = extent.e_pblk;
3887
3888                         /*
3889                          * If this lower extent block collides with critical
3890                          * metadata, don't try to repair the damage.  Pass 1b
3891                          * will reallocate the block; then we can try again.
3892                          */
3893                         if (pb->ino != EXT2_RESIZE_INO &&
3894                             extent.e_pblk < ctx->fs->super->s_blocks_count &&
3895                             ext2fs_test_block_bitmap2(ctx->block_metadata_map,
3896                                                       extent.e_pblk)) {
3897                                 next_try_repairs = 0;
3898                                 pctx->blk = blk;
3899                                 fix_problem(ctx,
3900                                             PR_1_CRITICAL_METADATA_COLLISION,
3901                                             pctx);
3902                                 if ((ctx->options & E2F_OPT_NO) == 0)
3903                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
3904                         }
3905                         pctx->errcode = ext2fs_extent_get(ehandle,
3906                                                   EXT2_EXTENT_DOWN, &extent);
3907                         if (pctx->errcode &&
3908                             pctx->errcode != EXT2_ET_EXTENT_CSUM_INVALID) {
3909                                 pctx->str = "EXT2_EXTENT_DOWN";
3910                                 problem = PR_1_EXTENT_HEADER_INVALID;
3911                                 if (!next_try_repairs)
3912                                         return;
3913                                 if (pctx->errcode == EXT2_ET_EXTENT_HEADER_BAD)
3914                                         goto report_problem;
3915                                 return;
3916                         }
3917                         /* The next extent should match this index's logical start */
3918                         if (extent.e_lblk != lblk) {
3919                                 struct ext2_extent_info e_info;
3920
3921                                 pctx->errcode = ext2fs_extent_get_info(ehandle,
3922                                                                        &e_info);
3923                                 if (pctx->errcode) {
3924                                         pctx->str = "ext2fs_extent_get_info";
3925                                         return;
3926                                 }
3927                                 pctx->blk = lblk;
3928                                 pctx->blk2 = extent.e_lblk;
3929                                 pctx->num = e_info.curr_level - 1;
3930                                 problem = PR_1_EXTENT_INDEX_START_INVALID;
3931                                 if (fix_problem(ctx, problem, pctx)) {
3932                                         pb->inode_modified = 1;
3933                                         pctx->errcode =
3934                                                 ext2fs_extent_fix_parents(ehandle);
3935                                         if (pctx->errcode) {
3936                                                 pctx->str = "ext2fs_extent_fix_parents";
3937                                                 return;
3938                                         }
3939                                 }
3940                         }
3941                         scan_extent_node(ctx, pctx, pb, extent.e_lblk,
3942                                          last_lblk, eof_block, ehandle,
3943                                          next_try_repairs);
3944                         if (pctx->errcode)
3945                                 return;
3946                         pctx->errcode = ext2fs_extent_get(ehandle,
3947                                                   EXT2_EXTENT_UP, &extent);
3948                         if (pctx->errcode) {
3949                                 pctx->str = "EXT2_EXTENT_UP";
3950                                 return;
3951                         }
3952                         mark_block_used(ctx, blk);
3953                         pb->num_blocks++;
3954                         goto next;
3955                 }
3956
3957                 if ((pb->previous_block != 0) &&
3958                     (pb->previous_block+1 != extent.e_pblk)) {
3959                         if (ctx->options & E2F_OPT_FRAGCHECK) {
3960                                 char type = '?';
3961
3962                                 if (pb->is_dir)
3963                                         type = 'd';
3964                                 else if (pb->is_reg)
3965                                         type = 'f';
3966
3967                                 printf(("%6lu(%c): expecting %6lu "
3968                                         "actual extent "
3969                                         "phys %6lu log %lu len %lu\n"),
3970                                        (unsigned long) pctx->ino, type,
3971                                        (unsigned long) pb->previous_block+1,
3972                                        (unsigned long) extent.e_pblk,
3973                                        (unsigned long) extent.e_lblk,
3974                                        (unsigned long) extent.e_len);
3975                         }
3976                         pb->fragmented = 1;
3977                 }
3978                 /*
3979                  * If we notice a gap in the logical block mappings of an
3980                  * extent-mapped directory, offer to close the hole by
3981                  * moving the logical block down, otherwise we'll go mad in
3982                  * pass 3 allocating empty directory blocks to fill the hole.
3983                  */
3984                 if (try_repairs && is_dir &&
3985                     pb->last_block + 1 < extent.e_lblk) {
3986                         blk64_t new_lblk;
3987
3988                         new_lblk = pb->last_block + 1;
3989                         if (EXT2FS_CLUSTER_RATIO(ctx->fs) > 1)
3990                                 new_lblk = ((new_lblk +
3991                                              EXT2FS_CLUSTER_RATIO(ctx->fs) - 1) &
3992                                             ~EXT2FS_CLUSTER_MASK(ctx->fs)) |
3993                                            (extent.e_pblk &
3994                                             EXT2FS_CLUSTER_MASK(ctx->fs));
3995                         pctx->blk = extent.e_lblk;
3996                         pctx->blk2 = new_lblk;
3997                         if (fix_problem(ctx, PR_1_COLLAPSE_DBLOCK, pctx)) {
3998                                 extent.e_lblk = new_lblk;
3999                                 pb->inode_modified = 1;
4000                                 pctx->errcode = ext2fs_extent_replace(ehandle,
4001                                                                 0, &extent);
4002                                 if (pctx->errcode) {
4003                                         pctx->errcode = 0;
4004                                         goto alloc_later;
4005                                 }
4006                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
4007                                 if (pctx->errcode)
4008                                         goto failed_add_dir_block;
4009                                 pctx->errcode = ext2fs_extent_goto(ehandle,
4010                                                                 extent.e_lblk);
4011                                 if (pctx->errcode)
4012                                         goto failed_add_dir_block;
4013                                 last_lblk = extent.e_lblk + extent.e_len - 1;
4014                                 failed_csum = 0;
4015                         }
4016                 }
4017 alloc_later:
4018                 if (is_dir) {
4019                         while (++pb->last_db_block <
4020                                (e2_blkcnt_t) extent.e_lblk) {
4021                                 pctx->errcode = ext2fs_add_dir_block2(
4022                                                         ctx->fs->dblist,
4023                                                         pb->ino, 0,
4024                                                         pb->last_db_block);
4025                                 if (pctx->errcode) {
4026                                         pctx->blk = 0;
4027                                         pctx->num = pb->last_db_block;
4028                                         goto failed_add_dir_block;
4029                                 }
4030                         }
4031
4032                         for (i = 0; i < extent.e_len; i++) {
4033                                 pctx->errcode = ext2fs_add_dir_block2(
4034                                                         ctx->fs->dblist,
4035                                                         pctx->ino,
4036                                                         extent.e_pblk + i,
4037                                                         extent.e_lblk + i);
4038                                 if (pctx->errcode) {
4039                                         pctx->blk = extent.e_pblk + i;
4040                                         pctx->num = extent.e_lblk + i;
4041                                 failed_add_dir_block:
4042                                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4043                                         /* Should never get here */
4044                                         ctx->flags |= E2F_FLAG_ABORT;
4045                                         return;
4046                                 }
4047                         }
4048                         if (extent.e_len > 0)
4049                                 pb->last_db_block = extent.e_lblk + extent.e_len - 1;
4050                 }
4051                 if (has_unaligned_cluster_map(ctx, pb->previous_block,
4052                                               pb->last_block,
4053                                               extent.e_pblk,
4054                                               extent.e_lblk)) {
4055                         for (i = 0; i < extent.e_len; i++) {
4056                                 pctx->blk = extent.e_lblk + i;
4057                                 pctx->blk2 = extent.e_pblk + i;
4058                                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4059                                 mark_block_used(ctx, extent.e_pblk + i);
4060                                 mark_block_used(ctx, extent.e_pblk + i);
4061                         }
4062                 }
4063
4064                 /*
4065                  * Check whether first cluster got marked in previous iteration.
4066                  */
4067                 if (ctx->fs->cluster_ratio_bits &&
4068                     pb->previous_block &&
4069                     (EXT2FS_B2C(ctx->fs, extent.e_pblk) ==
4070                      EXT2FS_B2C(ctx->fs, pb->previous_block)))
4071                         /* Set blk to the beginning of next cluster. */
4072                         blk = EXT2FS_C2B(
4073                                 ctx->fs,
4074                                 EXT2FS_B2C(ctx->fs, extent.e_pblk) + 1);
4075                 else
4076                         /* Set blk to the beginning of current cluster. */
4077                         blk = EXT2FS_C2B(ctx->fs,
4078                                          EXT2FS_B2C(ctx->fs, extent.e_pblk));
4079
4080                 if (blk < extent.e_pblk + extent.e_len) {
4081                         mark_blocks_used(ctx, blk,
4082                                          extent.e_pblk + extent.e_len - blk);
4083                         n = DIV_ROUND_UP(extent.e_pblk + extent.e_len - blk,
4084                                          EXT2FS_CLUSTER_RATIO(ctx->fs));
4085                         pb->num_blocks += n;
4086                 }
4087                 pb->last_block = extent.e_lblk + extent.e_len - 1;
4088                 pb->previous_block = extent.e_pblk + extent.e_len - 1;
4089                 start_block = pb->last_block = last_lblk;
4090                 if (is_leaf && !is_dir &&
4091                     !(extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT))
4092                         pb->last_init_lblock = last_lblk;
4093         next:
4094                 pctx->errcode = ext2fs_extent_get(ehandle,
4095                                                   EXT2_EXTENT_NEXT_SIB,
4096                                                   &extent);
4097         }
4098
4099         /* Failed csum but passes checks?  Ask to fix checksum. */
4100         if (failed_csum &&
4101             fix_problem(ctx, PR_1_EXTENT_ONLY_CSUM_INVALID, pctx)) {
4102                 pb->inode_modified = 1;
4103                 pctx->errcode = ext2fs_extent_replace(ehandle, 0, &extent);
4104                 if (pctx->errcode)
4105                         return;
4106         }
4107
4108         if (pctx->errcode == EXT2_ET_EXTENT_NO_NEXT)
4109                 pctx->errcode = 0;
4110 }
4111
4112 static void check_blocks_extents(e2fsck_t ctx, struct problem_context *pctx,
4113                                  struct process_block_struct *pb)
4114 {
4115         struct ext2_extent_info info;
4116         struct ext2_inode       *inode = pctx->inode;
4117         ext2_extent_handle_t    ehandle;
4118         ext2_filsys             fs = ctx->fs;
4119         ext2_ino_t              ino = pctx->ino;
4120         errcode_t               retval;
4121         blk64_t                 eof_lblk;
4122         struct ext3_extent_header       *eh;
4123
4124         /* Check for a proper extent header... */
4125         eh = (struct ext3_extent_header *) &inode->i_block[0];
4126         retval = ext2fs_extent_header_verify(eh, sizeof(inode->i_block));
4127         if (retval) {
4128                 if (fix_problem(ctx, PR_1_MISSING_EXTENT_HEADER, pctx))
4129                         e2fsck_clear_inode(ctx, ino, inode, 0,
4130                                            "check_blocks_extents");
4131                 pctx->errcode = 0;
4132                 return;
4133         }
4134
4135         /* ...since this function doesn't fail if i_block is zeroed. */
4136         pctx->errcode = ext2fs_extent_open2(fs, ino, inode, &ehandle);
4137         if (pctx->errcode) {
4138                 if (fix_problem(ctx, PR_1_READ_EXTENT, pctx))
4139                         e2fsck_clear_inode(ctx, ino, inode, 0,
4140                                            "check_blocks_extents");
4141                 pctx->errcode = 0;
4142                 return;
4143         }
4144
4145         retval = ext2fs_extent_get_info(ehandle, &info);
4146         if (retval == 0) {
4147                 int max_depth = info.max_depth;
4148
4149                 if (max_depth >= MAX_EXTENT_DEPTH_COUNT)
4150                         max_depth = MAX_EXTENT_DEPTH_COUNT-1;
4151                 ctx->extent_depth_count[max_depth]++;
4152         }
4153
4154         /* Check maximum extent depth */
4155         pctx->blk = info.max_depth;
4156         pctx->blk2 = ext2fs_max_extent_depth(ehandle);
4157         if (pctx->blk2 < pctx->blk &&
4158             fix_problem(ctx, PR_1_EXTENT_BAD_MAX_DEPTH, pctx))
4159                 pb->eti.force_rebuild = 1;
4160
4161         /* Can we collect extent tree level stats? */
4162         pctx->blk = MAX_EXTENT_DEPTH_COUNT;
4163         if (pctx->blk2 > pctx->blk)
4164                 fix_problem(ctx, PR_1E_MAX_EXTENT_TREE_DEPTH, pctx);
4165         memset(pb->eti.ext_info, 0, sizeof(pb->eti.ext_info));
4166         pb->eti.ino = pb->ino;
4167
4168         pb->next_lblock = 0;
4169
4170         eof_lblk = ((EXT2_I_SIZE(inode) + fs->blocksize - 1) >>
4171                 EXT2_BLOCK_SIZE_BITS(fs->super)) - 1;
4172         scan_extent_node(ctx, pctx, pb, 0, 0, eof_lblk, ehandle, 1);
4173         if (pctx->errcode &&
4174             fix_problem(ctx, PR_1_EXTENT_ITERATE_FAILURE, pctx)) {
4175                 pb->num_blocks = 0;
4176                 inode->i_blocks = 0;
4177                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4178                                    "check_blocks_extents");
4179                 pctx->errcode = 0;
4180         }
4181         ext2fs_extent_free(ehandle);
4182
4183         /* Rebuild unless it's a dir and we're rehashing it */
4184         if (LINUX_S_ISDIR(inode->i_mode) &&
4185             e2fsck_dir_will_be_rehashed(ctx, ino))
4186                 return;
4187
4188         if (ctx->options & E2F_OPT_CONVERT_BMAP)
4189                 e2fsck_rebuild_extents_later(ctx, ino);
4190         else
4191                 e2fsck_should_rebuild_extents(ctx, pctx, &pb->eti, &info);
4192 }
4193
4194 /*
4195  * In fact we don't need to check blocks for an inode with inline data
4196  * because this inode doesn't have any blocks.  In this function all
4197  * we need to do is add this inode into dblist when it is a directory.
4198  */
4199 static void check_blocks_inline_data(e2fsck_t ctx, struct problem_context *pctx,
4200                                      struct process_block_struct *pb)
4201 {
4202         int     flags;
4203         size_t  inline_data_size = 0;
4204
4205         if (!pb->is_dir) {
4206                 pctx->errcode = 0;
4207                 return;
4208         }
4209
4210         /* Process the dirents in i_block[] as the "first" block. */
4211         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 0);
4212         if (pctx->errcode)
4213                 goto err;
4214
4215         /* Process the dirents in the EA as a "second" block. */
4216         flags = ctx->fs->flags;
4217         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4218         pctx->errcode = ext2fs_inline_data_size(ctx->fs, pb->ino,
4219                                                 &inline_data_size);
4220         ctx->fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4221                          (ctx->fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4222         if (pctx->errcode) {
4223                 pctx->errcode = 0;
4224                 return;
4225         }
4226
4227         if (inline_data_size <= EXT4_MIN_INLINE_DATA_SIZE)
4228                 return;
4229
4230         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 1);
4231         if (pctx->errcode)
4232                 goto err;
4233
4234         return;
4235 err:
4236         pctx->blk = 0;
4237         pctx->num = 0;
4238         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4239         ctx->flags |= E2F_FLAG_ABORT;
4240 }
4241
4242 /*
4243  * This subroutine is called on each inode to account for all of the
4244  * blocks used by that inode.
4245  */
4246 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
4247                          char *block_buf, const struct ea_quota *ea_ibody_quota)
4248 {
4249         ext2_filsys fs = ctx->fs;
4250         struct process_block_struct pb;
4251         ext2_ino_t      ino = pctx->ino;
4252         struct ext2_inode *inode = pctx->inode;
4253         unsigned        bad_size = 0;
4254         int             dirty_inode = 0;
4255         int             extent_fs;
4256         int             inlinedata_fs;
4257         __u64           size;
4258         struct ea_quota ea_block_quota;
4259
4260         pb.ino = ino;
4261         pb.num_blocks = EXT2FS_B2C(ctx->fs,
4262                                    ea_ibody_quota ? ea_ibody_quota->blocks : 0);
4263         pb.last_block = ~0;
4264         pb.last_init_lblock = -1;
4265         pb.last_db_block = -1;
4266         pb.num_illegal_blocks = 0;
4267         pb.suppress = 0; pb.clear = 0;
4268         pb.fragmented = 0;
4269         pb.compressed = 0;
4270         pb.previous_block = 0;
4271         pb.is_dir = LINUX_S_ISDIR(inode->i_mode);
4272         pb.is_reg = LINUX_S_ISREG(inode->i_mode);
4273         pb.max_blocks = 1U << (31 - fs->super->s_log_block_size);
4274         pb.inode = inode;
4275         pb.pctx = pctx;
4276         pb.ctx = ctx;
4277         pb.inode_modified = 0;
4278         pb.eti.force_rebuild = 0;
4279         pctx->ino = ino;
4280         pctx->errcode = 0;
4281
4282         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
4283         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
4284
4285         if (check_ext_attr(ctx, pctx, block_buf, &ea_block_quota)) {
4286                 if (e2fsck_should_abort(ctx))
4287                         goto out;
4288                 pb.num_blocks += EXT2FS_B2C(ctx->fs, ea_block_quota.blocks);
4289         }
4290
4291         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL))
4292                 check_blocks_inline_data(ctx, pctx, &pb);
4293         else if (ext2fs_inode_has_valid_blocks2(fs, inode)) {
4294                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL))
4295                         check_blocks_extents(ctx, pctx, &pb);
4296                 else {
4297                         int flags;
4298                         /*
4299                          * If we've modified the inode, write it out before
4300                          * iterate() tries to use it.
4301                          */
4302                         if (dirty_inode) {
4303                                 e2fsck_write_inode(ctx, ino, inode,
4304                                                    "check_blocks");
4305                                 dirty_inode = 0;
4306                         }
4307                         flags = fs->flags;
4308                         fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4309                         pctx->errcode = ext2fs_block_iterate3(fs, ino,
4310                                                 pb.is_dir ? BLOCK_FLAG_HOLE : 0,
4311                                                 block_buf, process_block, &pb);
4312                         /*
4313                          * We do not have uninitialized extents in non extent
4314                          * files.
4315                          */
4316                         pb.last_init_lblock = pb.last_block;
4317                         /*
4318                          * If iterate() changed a block mapping, we have to
4319                          * re-read the inode.  If we decide to clear the
4320                          * inode after clearing some stuff, we'll re-write the
4321                          * bad mappings into the inode!
4322                          */
4323                         if (pb.inode_modified)
4324                                 e2fsck_read_inode(ctx, ino, inode,
4325                                                   "check_blocks");
4326                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4327                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4328
4329                         if (ctx->options & E2F_OPT_CONVERT_BMAP) {
4330 #ifdef DEBUG
4331                                 printf("bmap rebuild ino=%d\n", ino);
4332 #endif
4333                                 if (!LINUX_S_ISDIR(inode->i_mode) ||
4334                                     !e2fsck_dir_will_be_rehashed(ctx, ino))
4335                                         e2fsck_rebuild_extents_later(ctx, ino);
4336                         }
4337                 }
4338         }
4339         end_problem_latch(ctx, PR_LATCH_BLOCK);
4340         end_problem_latch(ctx, PR_LATCH_TOOBIG);
4341         if (e2fsck_should_abort(ctx))
4342                 goto out;
4343         if (pctx->errcode)
4344                 fix_problem(ctx, PR_1_BLOCK_ITERATE, pctx);
4345
4346         if (pb.fragmented && pb.num_blocks < fs->super->s_blocks_per_group) {
4347                 if (LINUX_S_ISDIR(inode->i_mode))
4348                         ctx->fs_fragmented_dir++;
4349                 else
4350                         ctx->fs_fragmented++;
4351         }
4352
4353         if (pb.clear) {
4354                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4355                                    "check_blocks");
4356                 return;
4357         }
4358
4359         if (inode->i_flags & EXT2_INDEX_FL) {
4360                 if (handle_htree(ctx, pctx, ino, inode, block_buf)) {
4361                         inode->i_flags &= ~EXT2_INDEX_FL;
4362                         dirty_inode++;
4363                 } else {
4364                         e2fsck_add_dx_dir(ctx, ino, inode, pb.last_block+1);
4365                 }
4366         }
4367
4368         if (!pb.num_blocks && pb.is_dir &&
4369             !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
4370                 if (fix_problem(ctx, PR_1_ZERO_LENGTH_DIR, pctx)) {
4371                         e2fsck_clear_inode(ctx, ino, inode, 0, "check_blocks");
4372                         ctx->fs_directory_count--;
4373                         return;
4374                 }
4375         }
4376
4377         if (ino != quota_type2inum(PRJQUOTA, fs->super) &&
4378             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INODE(ctx->fs->super)) &&
4379             !(inode->i_flags & EXT4_EA_INODE_FL)) {
4380                 quota_data_add(ctx->qctx, (struct ext2_inode_large *) inode,
4381                                ino,
4382                                pb.num_blocks * EXT2_CLUSTER_SIZE(fs->super));
4383                 quota_data_inodes(ctx->qctx, (struct ext2_inode_large *) inode,
4384                                   ino, (ea_ibody_quota ?
4385                                         ea_ibody_quota->inodes : 0) +
4386                                                 ea_block_quota.inodes + 1);
4387         }
4388
4389         if (!ext2fs_has_feature_huge_file(fs->super) ||
4390             !(inode->i_flags & EXT4_HUGE_FILE_FL))
4391                 pb.num_blocks *= (fs->blocksize / 512);
4392         pb.num_blocks *= EXT2FS_CLUSTER_RATIO(fs);
4393 #if 0
4394         printf("inode %u, i_size = %u, last_block = %llu, i_blocks=%llu, num_blocks = %llu\n",
4395                ino, inode->i_size, (unsigned long long) pb.last_block,
4396                (unsigned long long) ext2fs_inode_i_blocks(fs, inode),
4397                (unsigned long long) pb.num_blocks);
4398 #endif
4399         size = EXT2_I_SIZE(inode);
4400         if (pb.is_dir) {
4401                 unsigned nblock = size >> EXT2_BLOCK_SIZE_BITS(fs->super);
4402                 if (inode->i_flags & EXT4_INLINE_DATA_FL) {
4403                         int flags;
4404                         size_t sz = 0;
4405                         errcode_t err;
4406
4407                         flags = ctx->fs->flags;
4408                         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4409                         err = ext2fs_inline_data_size(ctx->fs, pctx->ino,
4410                                                       &sz);
4411                         ctx->fs->flags = (flags &
4412                                           EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4413                                          (ctx->fs->flags &
4414                                           ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4415                         if (err || sz != size) {
4416                                 bad_size = 7;
4417                                 pctx->num = sz;
4418                         }
4419                 } else if (size & (fs->blocksize - 1))
4420                         bad_size = 5;
4421                 else if (nblock > (pb.last_block + 1))
4422                         bad_size = 1;
4423                 else if (nblock < (pb.last_block + 1)) {
4424                         if (((pb.last_block + 1) - nblock) >
4425                             fs->super->s_prealloc_dir_blocks)
4426                                 bad_size = 2;
4427                 }
4428         } else {
4429                 if ((pb.last_init_lblock >= 0) &&
4430                     /* Do not allow initialized allocated blocks past i_size*/
4431                     (size < (__u64)pb.last_init_lblock * fs->blocksize) &&
4432                     !(inode->i_flags & EXT4_VERITY_FL))
4433                         bad_size = 3;
4434                 else if (!(extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4435                          size > ext2_max_sizes[fs->super->s_log_block_size])
4436                         /* too big for a direct/indirect-mapped file */
4437                         bad_size = 4;
4438                 else if ((extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4439                          size >
4440                          ((1ULL << (32 + EXT2_BLOCK_SIZE_BITS(fs->super))) - 1))
4441                         /* too big for an extent-based file - 32bit ee_block */
4442                         bad_size = 6;
4443         }
4444         /* i_size for symlinks is checked elsewhere */
4445         if (bad_size && !LINUX_S_ISLNK(inode->i_mode)) {
4446                 /* Did inline_data set pctx->num earlier? */
4447                 if (bad_size != 7)
4448                         pctx->num = (pb.last_block + 1) * fs->blocksize;
4449                 pctx->group = bad_size;
4450                 if (fix_problem(ctx, PR_1_BAD_I_SIZE, pctx)) {
4451                         ext2fs_inode_size_set(fs, inode, pctx->num);
4452                         if (EXT2_I_SIZE(inode) == 0 &&
4453                             (inode->i_flags & EXT4_INLINE_DATA_FL)) {
4454                                 memset(inode->i_block, 0,
4455                                        sizeof(inode->i_block));
4456                                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
4457                         }
4458                         dirty_inode++;
4459                 }
4460                 pctx->num = 0;
4461         }
4462         if (LINUX_S_ISREG(inode->i_mode) &&
4463             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
4464                 ctx->large_files++;
4465         if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
4466             ((pb.num_blocks != ext2fs_inode_i_blocks(fs, inode)) ||
4467              (ext2fs_has_feature_huge_file(fs->super) &&
4468               (inode->i_flags & EXT4_HUGE_FILE_FL) &&
4469               (inode->osd2.linux2.l_i_blocks_hi != 0)))) {
4470                 pctx->num = pb.num_blocks;
4471                 if (fix_problem(ctx, PR_1_BAD_I_BLOCKS, pctx)) {
4472                         inode->i_blocks = pb.num_blocks;
4473                         inode->osd2.linux2.l_i_blocks_hi = pb.num_blocks >> 32;
4474                         dirty_inode++;
4475                 }
4476                 pctx->num = 0;
4477         }
4478
4479         /*
4480          * The kernel gets mad if we ask it to allocate bigalloc clusters to
4481          * a block mapped file, so rebuild it as an extent file.  We can skip
4482          * symlinks because they're never rewritten.
4483          */
4484         if (ext2fs_has_feature_bigalloc(fs->super) &&
4485             (LINUX_S_ISREG(inode->i_mode) || LINUX_S_ISDIR(inode->i_mode)) &&
4486             ext2fs_inode_data_blocks2(fs, inode) > 0 &&
4487             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INO(fs->super)) &&
4488             !(inode->i_flags & (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)) &&
4489             fix_problem(ctx, PR_1_NO_BIGALLOC_BLOCKMAP_FILES, pctx)) {
4490                 pctx->errcode = e2fsck_rebuild_extents_later(ctx, ino);
4491                 if (pctx->errcode)
4492                         goto out;
4493         }
4494
4495         if (ctx->dirs_to_hash && pb.is_dir &&
4496             !(ctx->lost_and_found && ctx->lost_and_found == ino) &&
4497             !(inode->i_flags & EXT2_INDEX_FL) &&
4498             ((inode->i_size / fs->blocksize) >= 3))
4499                 e2fsck_rehash_dir_later(ctx, ino);
4500
4501 out:
4502         if (dirty_inode)
4503                 e2fsck_write_inode(ctx, ino, inode, "check_blocks");
4504 }
4505
#if 0
/*
 * Helper function called by process block when an illegal block is
 * found.  It returns a description about why the block is illegal.
 *
 * The returned pointer refers to a static buffer that is overwritten by
 * the next call.  (This code is currently compiled out.)
 */
static char *describe_illegal_block(ext2_filsys fs, blk64_t block)
{
	blk64_t	super;
	dgrp_t	i;
	static char	problem[80];

	super = fs->super->s_first_data_block;
	snprintf(problem, sizeof(problem), "%s",
		 "PROGRAMMING ERROR: Unknown reason for illegal block");
	/* Block numbers are 64-bit; print them as unsigned long long. */
	if (block < super) {
		snprintf(problem, sizeof(problem), "< FIRSTBLOCK (%llu)",
			 (unsigned long long) super);
		return(problem);
	} else if (block >= ext2fs_blocks_count(fs->super)) {
		snprintf(problem, sizeof(problem), "> BLOCKS (%llu)",
			 (unsigned long long) ext2fs_blocks_count(fs->super));
		return(problem);
	}
	/* "super" tracks the first block of the group being examined. */
	for (i = 0; i < fs->group_desc_count; i++) {
		if (block == super) {
			snprintf(problem, sizeof(problem),
				 "is the superblock in group %u", i);
			break;
		}
		if (block > super &&
		    block <= (super + fs->desc_blocks)) {
			snprintf(problem, sizeof(problem),
				 "is in the group descriptors "
				 "of group %u", i);
			break;
		}
		if (block == ext2fs_block_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the block bitmap of group %u", i);
			break;
		}
		if (block == ext2fs_inode_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the inode bitmap of group %u", i);
			break;
		}
		if (block >= ext2fs_inode_table_loc(fs, i) &&
		    (block < ext2fs_inode_table_loc(fs, i)
		     + fs->inode_blocks_per_group)) {
			snprintf(problem, sizeof(problem),
				 "is in the inode table of group %u", i);
			break;
		}
		super += fs->super->s_blocks_per_group;
	}
	return(problem);
}
#endif
4557
4558 /*
4559  * This is a helper function for check_blocks().
4560  */
4561 static int process_block(ext2_filsys fs,
4562                   blk64_t       *block_nr,
4563                   e2_blkcnt_t blockcnt,
4564                   blk64_t ref_block EXT2FS_ATTR((unused)),
4565                   int ref_offset EXT2FS_ATTR((unused)),
4566                   void *priv_data)
4567 {
4568         struct process_block_struct *p;
4569         struct problem_context *pctx;
4570         blk64_t blk = *block_nr;
4571         int     ret_code = 0;
4572         problem_t       problem = 0;
4573         e2fsck_t        ctx;
4574
4575         p = (struct process_block_struct *) priv_data;
4576         pctx = p->pctx;
4577         ctx = p->ctx;
4578
4579         /*
4580          * For a directory, add logical block zero for processing even if it's
4581          * not mapped or we'll be perennially stuck with broken "." and ".."
4582          * entries.
4583          */
4584         if (p->is_dir && blockcnt == 0 && blk == 0) {
4585                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino, 0, 0);
4586                 if (pctx->errcode) {
4587                         pctx->blk = blk;
4588                         pctx->num = blockcnt;
4589                         goto failed_add_dir_block;
4590                 }
4591                 p->last_db_block++;
4592         }
4593
4594         if (blk == 0)
4595                 return 0;
4596
4597 #if 0
4598         printf("Process_block, inode %lu, block %u, #%d\n", p->ino, blk,
4599                blockcnt);
4600 #endif
4601
4602         /*
4603          * Simplistic fragmentation check.  We merely require that the
4604          * file be contiguous.  (Which can never be true for really
4605          * big files that are greater than a block group.)
4606          */
4607         if (p->previous_block && p->ino != EXT2_RESIZE_INO) {
4608                 if (p->previous_block+1 != blk) {
4609                         if (ctx->options & E2F_OPT_FRAGCHECK) {
4610                                 char type = '?';
4611
4612                                 if (p->is_dir)
4613                                         type = 'd';
4614                                 else if (p->is_reg)
4615                                         type = 'f';
4616
4617                                 printf(_("%6lu(%c): expecting %6lu "
4618                                          "got phys %6lu (blkcnt %lld)\n"),
4619                                        (unsigned long) pctx->ino, type,
4620                                        (unsigned long) p->previous_block+1,
4621                                        (unsigned long) blk,
4622                                        (long long) blockcnt);
4623                         }
4624                         p->fragmented = 1;
4625                 }
4626         }
4627
4628         if (p->is_dir && !ext2fs_has_feature_largedir(fs->super) &&
4629             !pctx->inode->i_size_high &&
4630             blockcnt > (1 << (21 - fs->super->s_log_block_size)))
4631                 problem = PR_1_TOOBIG_DIR;
4632         if (p->is_dir && p->num_blocks + 1 >= p->max_blocks)
4633                 problem = PR_1_TOOBIG_DIR;
4634         if (p->is_reg && p->num_blocks + 1 >= p->max_blocks)
4635                 problem = PR_1_TOOBIG_REG;
4636         if (!p->is_dir && !p->is_reg && blockcnt > 0)
4637                 problem = PR_1_TOOBIG_SYMLINK;
4638
4639         if (blk < fs->super->s_first_data_block ||
4640             blk >= ext2fs_blocks_count(fs->super))
4641                 problem = PR_1_ILLEGAL_BLOCK_NUM;
4642
4643         /*
4644          * If this IND/DIND/TIND block is squatting atop some critical metadata
4645          * (group descriptors, superblock, bitmap, inode table), any write to
4646          * "fix" mapping problems will destroy the metadata.  We'll let pass 1b
4647          * fix that and restart fsck.
4648          */
4649         if (blockcnt < 0 &&
4650             p->ino != EXT2_RESIZE_INO &&
4651             blk < ctx->fs->super->s_blocks_count &&
4652             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk)) {
4653                 pctx->blk = blk;
4654                 fix_problem(ctx, PR_1_CRITICAL_METADATA_COLLISION, pctx);
4655                 if ((ctx->options & E2F_OPT_NO) == 0)
4656                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4657         }
4658
4659         if (problem) {
4660                 p->num_illegal_blocks++;
4661                 /*
4662                  * A bit of subterfuge here -- we're trying to fix a block
4663                  * mapping, but the IND/DIND/TIND block could have collided
4664                  * with some critical metadata.  So, fix the in-core mapping so
4665                  * iterate won't go insane, but return 0 instead of
4666                  * BLOCK_CHANGED so that it won't write the remapping out to
4667                  * our multiply linked block.
4668                  *
4669                  * Even if we previously determined that an *IND block
4670                  * conflicts with critical metadata, we must still try to
4671                  * iterate the *IND block as if it is an *IND block to find and
4672                  * mark the blocks it points to.  Better to be overly cautious
4673                  * with the used_blocks map so that we don't move the *IND
4674                  * block to a block that's really in use!
4675                  */
4676                 if (p->ino != EXT2_RESIZE_INO &&
4677                     ref_block != 0 &&
4678                     ext2fs_test_block_bitmap2(ctx->block_metadata_map,
4679                                               ref_block)) {
4680                         *block_nr = 0;
4681                         return 0;
4682                 }
4683                 if (!p->suppress && (p->num_illegal_blocks % 12) == 0) {
4684                         if (fix_problem(ctx, PR_1_TOO_MANY_BAD_BLOCKS, pctx)) {
4685                                 p->clear = 1;
4686                                 return BLOCK_ABORT;
4687                         }
4688                         if (fix_problem(ctx, PR_1_SUPPRESS_MESSAGES, pctx)) {
4689                                 p->suppress = 1;
4690                                 set_latch_flags(PR_LATCH_BLOCK,
4691                                                 PRL_SUPPRESS, 0);
4692                         }
4693                 }
4694                 pctx->blk = blk;
4695                 pctx->blkcount = blockcnt;
4696                 if (fix_problem(ctx, problem, pctx)) {
4697                         blk = *block_nr = 0;
4698                         ret_code = BLOCK_CHANGED;
4699                         p->inode_modified = 1;
4700                         /*
4701                          * If the directory block is too big and is beyond the
4702                          * end of the FS, don't bother trying to add it for
4703                          * processing -- the kernel would never have created a
4704                          * directory this large, and we risk an ENOMEM abort.
4705                          * In any case, the toobig handler for extent-based
4706                          * directories also doesn't feed toobig blocks to
4707                          * pass 2.
4708                          */
4709                         if (problem == PR_1_TOOBIG_DIR)
4710                                 return ret_code;
4711                         goto mark_dir;
4712                 } else
4713                         return 0;
4714         }
4715
4716         if (p->ino == EXT2_RESIZE_INO) {
4717                 /*
4718                  * The resize inode has already be sanity checked
4719                  * during pass #0 (the superblock checks).  All we
4720                  * have to do is mark the double indirect block as
4721                  * being in use; all of the other blocks are handled
4722                  * by mark_table_blocks()).
4723                  */
4724                 if (blockcnt == BLOCK_COUNT_DIND)
4725                         mark_block_used(ctx, blk);
4726                 p->num_blocks++;
4727         } else if (!(ctx->fs->cluster_ratio_bits &&
4728                      p->previous_block &&
4729                      (EXT2FS_B2C(ctx->fs, blk) ==
4730                       EXT2FS_B2C(ctx->fs, p->previous_block)) &&
4731                      (blk & EXT2FS_CLUSTER_MASK(ctx->fs)) ==
4732                      ((unsigned) blockcnt & EXT2FS_CLUSTER_MASK(ctx->fs)))) {
4733                 mark_block_used(ctx, blk);
4734                 p->num_blocks++;
4735         } else if (has_unaligned_cluster_map(ctx, p->previous_block,
4736                                              p->last_block, blk, blockcnt)) {
4737                 pctx->blk = blockcnt;
4738                 pctx->blk2 = blk;
4739                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4740                 mark_block_used(ctx, blk);
4741                 mark_block_used(ctx, blk);
4742         }
4743         if (blockcnt >= 0)
4744                 p->last_block = blockcnt;
4745         p->previous_block = blk;
4746 mark_dir:
4747         if (p->is_dir && (blockcnt >= 0)) {
4748                 while (++p->last_db_block < blockcnt) {
4749                         pctx->errcode = ext2fs_add_dir_block2(fs->dblist,
4750                                                               p->ino, 0,
4751                                                               p->last_db_block);
4752                         if (pctx->errcode) {
4753                                 pctx->blk = 0;
4754                                 pctx->num = p->last_db_block;
4755                                 goto failed_add_dir_block;
4756                         }
4757                 }
4758                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino,
4759                                                       blk, blockcnt);
4760                 if (pctx->errcode) {
4761                         pctx->blk = blk;
4762                         pctx->num = blockcnt;
4763                 failed_add_dir_block:
4764                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4765                         /* Should never get here */
4766                         ctx->flags |= E2F_FLAG_ABORT;
4767                         return BLOCK_ABORT;
4768                 }
4769         }
4770         return ret_code;
4771 }
4772
4773 static int process_bad_block(ext2_filsys fs,
4774                       blk64_t *block_nr,
4775                       e2_blkcnt_t blockcnt,
4776                       blk64_t ref_block EXT2FS_ATTR((unused)),
4777                       int ref_offset EXT2FS_ATTR((unused)),
4778                       void *priv_data)
4779 {
4780         struct process_block_struct *p;
4781         blk64_t         blk = *block_nr;
4782         blk64_t         first_block;
4783         dgrp_t          i;
4784         struct problem_context *pctx;
4785         e2fsck_t        ctx;
4786
4787         if (!blk)
4788                 return 0;
4789
4790         p = (struct process_block_struct *) priv_data;
4791         ctx = p->ctx;
4792         pctx = p->pctx;
4793
4794         pctx->ino = EXT2_BAD_INO;
4795         pctx->blk = blk;
4796         pctx->blkcount = blockcnt;
4797
4798         if ((blk < fs->super->s_first_data_block) ||
4799             (blk >= ext2fs_blocks_count(fs->super))) {
4800                 if (fix_problem(ctx, PR_1_BB_ILLEGAL_BLOCK_NUM, pctx)) {
4801                         *block_nr = 0;
4802                         return BLOCK_CHANGED;
4803                 } else
4804                         return 0;
4805         }
4806
4807         if (blockcnt < 0) {
4808                 if (ext2fs_test_block_bitmap2(p->fs_meta_blocks, blk)) {
4809                         p->bbcheck = 1;
4810                         if (fix_problem(ctx, PR_1_BB_FS_BLOCK, pctx)) {
4811                                 *block_nr = 0;
4812                                 return BLOCK_CHANGED;
4813                         }
4814                 } else if (ext2fs_test_block_bitmap2(ctx->block_found_map,
4815                                                     blk)) {
4816                         p->bbcheck = 1;
4817                         if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK,
4818                                         pctx)) {
4819                                 *block_nr = 0;
4820                                 return BLOCK_CHANGED;
4821                         }
4822                         if (e2fsck_should_abort(ctx))
4823                                 return BLOCK_ABORT;
4824                 } else
4825                         mark_block_used(ctx, blk);
4826                 return 0;
4827         }
4828 #if 0
4829         printf ("DEBUG: Marking %u as bad.\n", blk);
4830 #endif
4831         ctx->fs_badblocks_count++;
4832         /*
4833          * If the block is not used, then mark it as used and return.
4834          * If it is already marked as found, this must mean that
4835          * there's an overlap between the filesystem table blocks
4836          * (bitmaps and inode table) and the bad block list.
4837          */
4838         if (!ext2fs_test_block_bitmap2(ctx->block_found_map, blk)) {
4839                 ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
4840                 return 0;
4841         }
4842         /*
4843          * Try to find the where the filesystem block was used...
4844          */
4845         first_block = fs->super->s_first_data_block;
4846
4847         for (i = 0; i < fs->group_desc_count; i++ ) {
4848                 pctx->group = i;
4849                 pctx->blk = blk;
4850                 if (!ext2fs_bg_has_super(fs, i))
4851                         goto skip_super;
4852                 if (blk == first_block) {
4853                         if (i == 0) {
4854                                 if (fix_problem(ctx,
4855                                                 PR_1_BAD_PRIMARY_SUPERBLOCK,
4856                                                 pctx)) {
4857                                         *block_nr = 0;
4858                                         return BLOCK_CHANGED;
4859                                 }
4860                                 return 0;
4861                         }
4862                         fix_problem(ctx, PR_1_BAD_SUPERBLOCK, pctx);
4863                         return 0;
4864                 }
4865                 if ((blk > first_block) &&
4866                     (blk <= first_block + fs->desc_blocks)) {
4867                         if (i == 0) {
4868                                 pctx->blk = *block_nr;
4869                                 if (fix_problem(ctx,
4870                         PR_1_BAD_PRIMARY_GROUP_DESCRIPTOR, pctx)) {
4871                                         *block_nr = 0;
4872                                         return BLOCK_CHANGED;
4873                                 }
4874                                 return 0;
4875                         }
4876                         fix_problem(ctx, PR_1_BAD_GROUP_DESCRIPTORS, pctx);
4877                         return 0;
4878                 }
4879         skip_super:
4880                 if (blk == ext2fs_block_bitmap_loc(fs, i)) {
4881                         if (fix_problem(ctx, PR_1_BB_BAD_BLOCK, pctx)) {
4882                                 ctx->invalid_block_bitmap_flag[i]++;
4883                                 ctx->invalid_bitmaps++;
4884                         }
4885                         return 0;
4886                 }
4887                 if (blk == ext2fs_inode_bitmap_loc(fs, i)) {
4888                         if (fix_problem(ctx, PR_1_IB_BAD_BLOCK, pctx)) {
4889                                 ctx->invalid_inode_bitmap_flag[i]++;
4890                                 ctx->invalid_bitmaps++;
4891                         }
4892                         return 0;
4893                 }
4894                 if ((blk >= ext2fs_inode_table_loc(fs, i)) &&
4895                     (blk < (ext2fs_inode_table_loc(fs, i) +
4896                             fs->inode_blocks_per_group))) {
4897                         /*
4898                          * If there are bad blocks in the inode table,
4899                          * the inode scan code will try to do
4900                          * something reasonable automatically.
4901                          */
4902                         return 0;
4903                 }
4904                 first_block += fs->super->s_blocks_per_group;
4905         }
4906         /*
4907          * If we've gotten to this point, then the only
4908          * possibility is that the bad block inode meta data
4909          * is using a bad block.
4910          */
4911         if ((blk == p->inode->i_block[EXT2_IND_BLOCK]) ||
4912             (blk == p->inode->i_block[EXT2_DIND_BLOCK]) ||
4913             (blk == p->inode->i_block[EXT2_TIND_BLOCK])) {
4914                 p->bbcheck = 1;
4915                 if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK, pctx)) {
4916                         *block_nr = 0;
4917                         return BLOCK_CHANGED;
4918                 }
4919                 if (e2fsck_should_abort(ctx))
4920                         return BLOCK_ABORT;
4921                 return 0;
4922         }
4923
4924         pctx->group = -1;
4925
4926         /* Warn user that the block wasn't claimed */
4927         fix_problem(ctx, PR_1_PROGERR_CLAIMED_BLOCK, pctx);
4928
4929         return 0;
4930 }
4931
4932 static void new_table_block(e2fsck_t ctx, blk64_t first_block, dgrp_t group,
4933                             const char *name, int num, blk64_t *new_block)
4934 {
4935         ext2_filsys fs = ctx->fs;
4936         dgrp_t          last_grp;
4937         blk64_t         old_block = *new_block;
4938         blk64_t         last_block;
4939         dgrp_t          flexbg;
4940         unsigned        flexbg_size;
4941         int             i, is_flexbg;
4942         char            *buf;
4943         struct problem_context  pctx;
4944
4945         clear_problem_context(&pctx);
4946
4947         pctx.group = group;
4948         pctx.blk = old_block;
4949         pctx.str = name;
4950
4951         /*
4952          * For flex_bg filesystems, first try to allocate the metadata
4953          * within the flex_bg, and if that fails then try finding the
4954          * space anywhere in the filesystem.
4955          */
4956         is_flexbg = ext2fs_has_feature_flex_bg(fs->super);
4957         if (is_flexbg) {
4958                 flexbg_size = 1U << fs->super->s_log_groups_per_flex;
4959                 flexbg = group / flexbg_size;
4960                 first_block = ext2fs_group_first_block2(fs,
4961                                                         flexbg_size * flexbg);
4962                 last_grp = group | (flexbg_size - 1);
4963                 if (last_grp >= fs->group_desc_count)
4964                         last_grp = fs->group_desc_count - 1;
4965                 last_block = ext2fs_group_last_block2(fs, last_grp);
4966         } else
4967                 last_block = ext2fs_group_last_block2(fs, group);
4968         pctx.errcode = ext2fs_get_free_blocks2(fs, first_block, last_block,
4969                                                num, ctx->block_found_map,
4970                                                new_block);
4971         if (is_flexbg && (pctx.errcode == EXT2_ET_BLOCK_ALLOC_FAIL))
4972                 pctx.errcode = ext2fs_get_free_blocks2(fs,
4973                                 fs->super->s_first_data_block,
4974                                 ext2fs_blocks_count(fs->super),
4975                                 num, ctx->block_found_map, new_block);
4976         if (pctx.errcode) {
4977                 pctx.num = num;
4978                 fix_problem(ctx, PR_1_RELOC_BLOCK_ALLOCATE, &pctx);
4979                 ext2fs_unmark_valid(fs);
4980                 ctx->flags |= E2F_FLAG_ABORT;
4981                 return;
4982         }
4983         pctx.errcode = ext2fs_get_mem(fs->blocksize, &buf);
4984         if (pctx.errcode) {
4985                 fix_problem(ctx, PR_1_RELOC_MEMORY_ALLOCATE, &pctx);
4986                 ext2fs_unmark_valid(fs);
4987                 ctx->flags |= E2F_FLAG_ABORT;
4988                 return;
4989         }
4990         ext2fs_mark_super_dirty(fs);
4991         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
4992         pctx.blk2 = *new_block;
4993         fix_problem(ctx, (old_block ? PR_1_RELOC_FROM_TO :
4994                           PR_1_RELOC_TO), &pctx);
4995         pctx.blk2 = 0;
4996         for (i = 0; i < num; i++) {
4997                 pctx.blk = i;
4998                 ext2fs_mark_block_bitmap2(ctx->block_found_map, (*new_block)+i);
4999                 if (old_block) {
5000                         pctx.errcode = io_channel_read_blk64(fs->io,
5001                                    old_block + i, 1, buf);
5002                         if (pctx.errcode)
5003                                 fix_problem(ctx, PR_1_RELOC_READ_ERR, &pctx);
5004                         pctx.blk = (*new_block) + i;
5005                         pctx.errcode = io_channel_write_blk64(fs->io, pctx.blk,
5006                                                               1, buf);
5007                 } else {
5008                         pctx.blk = (*new_block) + i;
5009                         pctx.errcode = ext2fs_zero_blocks2(fs, pctx.blk, 1,
5010                                                            NULL, NULL);
5011                 }
5012
5013                 if (pctx.errcode)
5014                         fix_problem(ctx, PR_1_RELOC_WRITE_ERR, &pctx);
5015         }
5016         ext2fs_free_mem(&buf);
5017 }
5018
5019 /*
5020  * This routine gets called at the end of pass 1 if bad blocks are
5021  * detected in the superblock, group descriptors, inode_bitmaps, or
5022  * block bitmaps.  At this point, all of the blocks have been mapped
5023  * out, so we can try to allocate new block(s) to replace the bad
5024  * blocks.
5025  */
5026 static void handle_fs_bad_blocks(e2fsck_t ctx)
5027 {
5028         ext2_filsys fs = ctx->fs;
5029         dgrp_t          i;
5030         blk64_t         first_block;
5031         blk64_t         new_blk;
5032
5033         for (i = 0; i < fs->group_desc_count; i++) {
5034                 first_block = ext2fs_group_first_block2(fs, i);
5035
5036                 if (ctx->invalid_block_bitmap_flag[i]) {
5037                         new_blk = ext2fs_block_bitmap_loc(fs, i);
5038                         new_table_block(ctx, first_block, i, _("block bitmap"),
5039                                         1, &new_blk);
5040                         ext2fs_block_bitmap_loc_set(fs, i, new_blk);
5041                 }
5042                 if (ctx->invalid_inode_bitmap_flag[i]) {
5043                         new_blk = ext2fs_inode_bitmap_loc(fs, i);
5044                         new_table_block(ctx, first_block, i, _("inode bitmap"),
5045                                         1, &new_blk);
5046                         ext2fs_inode_bitmap_loc_set(fs, i, new_blk);
5047                 }
5048                 if (ctx->invalid_inode_table_flag[i]) {
5049                         new_blk = ext2fs_inode_table_loc(fs, i);
5050                         new_table_block(ctx, first_block, i, _("inode table"),
5051                                         fs->inode_blocks_per_group,
5052                                         &new_blk);
5053                         ext2fs_inode_table_loc_set(fs, i, new_blk);
5054                         ctx->flags |= E2F_FLAG_RESTART;
5055                 }
5056         }
5057         ctx->invalid_bitmaps = 0;
5058 }
5059
5060 /*
5061  * This routine marks all blocks which are used by the superblock,
5062  * group descriptors, inode bitmaps, and block bitmaps.
5063  */
5064 static void mark_table_blocks(e2fsck_t ctx)
5065 {
5066         ext2_filsys fs = ctx->fs;
5067         blk64_t b;
5068         dgrp_t  i;
5069         unsigned int    j;
5070         struct problem_context pctx;
5071
5072         clear_problem_context(&pctx);
5073
5074         for (i = 0; i < fs->group_desc_count; i++) {
5075                 pctx.group = i;
5076
5077                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_found_map);
5078                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_metadata_map);
5079
5080                 /*
5081                  * Mark the blocks used for the inode table
5082                  */
5083                 if (ext2fs_inode_table_loc(fs, i)) {
5084                         for (j = 0, b = ext2fs_inode_table_loc(fs, i);
5085                              j < fs->inode_blocks_per_group;
5086                              j++, b++) {
5087                                 if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5088                                                              b)) {
5089                                         pctx.blk = b;
5090                                         if (!ctx->invalid_inode_table_flag[i] &&
5091                                             fix_problem(ctx,
5092                                                 PR_1_ITABLE_CONFLICT, &pctx)) {
5093                                                 ctx->invalid_inode_table_flag[i]++;
5094                                                 ctx->invalid_bitmaps++;
5095                                         }
5096                                 } else {
5097                                     ext2fs_mark_block_bitmap2(
5098                                                 ctx->block_found_map, b);
5099                                     ext2fs_mark_block_bitmap2(
5100                                                 ctx->block_metadata_map, b);
5101                                 }
5102                         }
5103                 }
5104
5105                 /*
5106                  * Mark block used for the block bitmap
5107                  */
5108                 if (ext2fs_block_bitmap_loc(fs, i)) {
5109                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5110                                      ext2fs_block_bitmap_loc(fs, i))) {
5111                                 pctx.blk = ext2fs_block_bitmap_loc(fs, i);
5112                                 if (fix_problem(ctx, PR_1_BB_CONFLICT, &pctx)) {
5113                                         ctx->invalid_block_bitmap_flag[i]++;
5114                                         ctx->invalid_bitmaps++;
5115                                 }
5116                         } else {
5117                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5118                                      ext2fs_block_bitmap_loc(fs, i));
5119                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5120                                      ext2fs_block_bitmap_loc(fs, i));
5121                         }
5122                 }
5123                 /*
5124                  * Mark block used for the inode bitmap
5125                  */
5126                 if (ext2fs_inode_bitmap_loc(fs, i)) {
5127                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5128                                      ext2fs_inode_bitmap_loc(fs, i))) {
5129                                 pctx.blk = ext2fs_inode_bitmap_loc(fs, i);
5130                                 if (fix_problem(ctx, PR_1_IB_CONFLICT, &pctx)) {
5131                                         ctx->invalid_inode_bitmap_flag[i]++;
5132                                         ctx->invalid_bitmaps++;
5133                                 }
5134                         } else {
5135                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5136                                      ext2fs_inode_bitmap_loc(fs, i));
5137                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5138                                      ext2fs_inode_bitmap_loc(fs, i));
5139                         }
5140                 }
5141         }
5142 }
5143
5144 /*
5145  * These subroutines short circuits ext2fs_get_blocks and
5146  * ext2fs_check_directory; we use them since we already have the inode
5147  * structure, so there's no point in letting the ext2fs library read
5148  * the inode again.
5149  */
5150 static errcode_t pass1_get_blocks(ext2_filsys fs, ext2_ino_t ino,
5151                                   blk_t *blocks)
5152 {
5153         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5154         int     i;
5155
5156         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5157                 return EXT2_ET_CALLBACK_NOTHANDLED;
5158
5159         for (i=0; i < EXT2_N_BLOCKS; i++)
5160                 blocks[i] = ctx->stashed_inode->i_block[i];
5161         return 0;
5162 }
5163
5164 static errcode_t pass1_read_inode(ext2_filsys fs, ext2_ino_t ino,
5165                                   struct ext2_inode *inode)
5166 {
5167         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5168
5169         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5170                 return EXT2_ET_CALLBACK_NOTHANDLED;
5171         *inode = *ctx->stashed_inode;
5172         return 0;
5173 }
5174
5175 static errcode_t pass1_write_inode(ext2_filsys fs, ext2_ino_t ino,
5176                             struct ext2_inode *inode)
5177 {
5178         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5179
5180         if ((ino == ctx->stashed_ino) && ctx->stashed_inode &&
5181                 (inode != ctx->stashed_inode))
5182                 *ctx->stashed_inode = *inode;
5183         return EXT2_ET_CALLBACK_NOTHANDLED;
5184 }
5185
5186 static errcode_t pass1_check_directory(ext2_filsys fs, ext2_ino_t ino)
5187 {
5188         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5189
5190         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5191                 return EXT2_ET_CALLBACK_NOTHANDLED;
5192
5193         if (!LINUX_S_ISDIR(ctx->stashed_inode->i_mode))
5194                 return EXT2_ET_NO_DIRECTORY;
5195         return 0;
5196 }
5197
5198 static errcode_t e2fsck_get_alloc_block(ext2_filsys fs, blk64_t goal,
5199                                         blk64_t *ret)
5200 {
5201         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5202         errcode_t       retval;
5203         blk64_t         new_block;
5204
5205         if (ctx->block_found_map) {
5206                 retval = ext2fs_new_block2(fs, goal, ctx->block_found_map,
5207                                            &new_block);
5208                 if (retval)
5209                         return retval;
5210                 if (fs->block_map) {
5211                         ext2fs_mark_block_bitmap2(fs->block_map, new_block);
5212                         ext2fs_mark_bb_dirty(fs);
5213                 }
5214         } else {
5215                 if (!fs->block_map) {
5216                         retval = ext2fs_read_block_bitmap(fs);
5217                         if (retval)
5218                                 return retval;
5219                 }
5220
5221                 retval = ext2fs_new_block2(fs, goal, fs->block_map, &new_block);
5222                 if (retval)
5223                         return retval;
5224         }
5225
5226         *ret = new_block;
5227         return (0);
5228 }
5229
5230 static errcode_t e2fsck_new_range(ext2_filsys fs, int flags, blk64_t goal,
5231                                   blk64_t len, blk64_t *pblk, blk64_t *plen)
5232 {
5233         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5234         errcode_t       retval;
5235
5236         if (ctx->block_found_map)
5237                 return ext2fs_new_range(fs, flags, goal, len,
5238                                         ctx->block_found_map, pblk, plen);
5239
5240         if (!fs->block_map) {
5241                 retval = ext2fs_read_block_bitmap(fs);
5242                 if (retval)
5243                         return retval;
5244         }
5245
5246         return ext2fs_new_range(fs, flags, goal, len, fs->block_map,
5247                                 pblk, plen);
5248 }
5249
5250 static void e2fsck_block_alloc_stats(ext2_filsys fs, blk64_t blk, int inuse)
5251 {
5252         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5253
5254         /* Never free a critical metadata block */
5255         if (ctx->block_found_map &&
5256             ctx->block_metadata_map &&
5257             inuse < 0 &&
5258             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk))
5259                 return;
5260
5261         if (ctx->block_found_map) {
5262                 if (inuse > 0)
5263                         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5264                 else
5265                         ext2fs_unmark_block_bitmap2(ctx->block_found_map, blk);
5266         }
5267 }
5268
5269 static void e2fsck_block_alloc_stats_range(ext2_filsys fs, blk64_t blk,
5270                                            blk_t num, int inuse)
5271 {
5272         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5273
5274         /* Never free a critical metadata block */
5275         if (ctx->block_found_map &&
5276             ctx->block_metadata_map &&
5277             inuse < 0 &&
5278             ext2fs_test_block_bitmap_range2(ctx->block_metadata_map, blk, num))
5279                 return;
5280
5281         if (ctx->block_found_map) {
5282                 if (inuse > 0)
5283                         ext2fs_mark_block_bitmap_range2(ctx->block_found_map,
5284                                                         blk, num);
5285                 else
5286                         ext2fs_unmark_block_bitmap_range2(ctx->block_found_map,
5287                                                         blk, num);
5288         }
5289 }
5290
5291 void e2fsck_use_inode_shortcuts(e2fsck_t ctx, int use_shortcuts)
5292 {
5293         ext2_filsys fs = ctx->fs;
5294
5295         if (use_shortcuts) {
5296                 fs->get_blocks = pass1_get_blocks;
5297                 fs->check_directory = pass1_check_directory;
5298                 fs->read_inode = pass1_read_inode;
5299                 fs->write_inode = pass1_write_inode;
5300                 ctx->stashed_ino = 0;
5301         } else {
5302                 fs->get_blocks = 0;
5303                 fs->check_directory = 0;
5304                 fs->read_inode = 0;
5305                 fs->write_inode = 0;
5306         }
5307 }
5308
5309 void e2fsck_intercept_block_allocations(e2fsck_t ctx)
5310 {
5311         ext2fs_set_alloc_block_callback(ctx->fs, e2fsck_get_alloc_block, 0);
5312         ext2fs_set_block_alloc_stats_callback(ctx->fs,
5313                                                 e2fsck_block_alloc_stats, 0);
5314         ext2fs_set_new_range_callback(ctx->fs, e2fsck_new_range, NULL);
5315         ext2fs_set_block_alloc_stats_range_callback(ctx->fs,
5316                                         e2fsck_block_alloc_stats_range, NULL);
5317 }