Whamcloud - gitweb
e2fsck: cleanup e2fsck_pass1_thread_join()
[tools/e2fsprogs.git] / e2fsck / pass1.c
1 /*
2  * pass1.c -- pass #1 of e2fsck: sequential scan of the inode table
3  *
4  * Copyright (C) 1993, 1994, 1995, 1996, 1997 Theodore Ts'o.
5  *
6  * %Begin-Header%
7  * This file may be redistributed under the terms of the GNU Public
8  * License.
9  * %End-Header%
10  *
11  * Pass 1 of e2fsck iterates over all the inodes in the filesystems,
12  * and applies the following tests to each inode:
13  *
14  *      - The mode field of the inode must be legal.
15  *      - The size and block count fields of the inode are correct.
16  *      - A data block must not be used by another inode
17  *
18  * Pass 1 also gathers the following information:
19  *
20  *      - A bitmap of which inodes are in use.          (inode_used_map)
21  *      - A bitmap of which inodes are directories.     (inode_dir_map)
22  *      - A bitmap of which inodes are regular files.   (inode_reg_map)
23  *      - A bitmap of which inodes have bad fields.     (inode_bad_map)
24  *      - A bitmap of which inodes are in bad blocks.   (inode_bb_map)
25  *      - A bitmap of which inodes are imagic inodes.   (inode_imagic_map)
26  *      - A bitmap of which inodes are casefolded.      (inode_casefold_map)
27  *      - A bitmap of which blocks are in use.          (block_found_map)
28  *      - A bitmap of which blocks are in use by two inodes     (block_dup_map)
29  *      - The data blocks of the directory inodes.      (dir_map)
30  *      - Ref counts for ea_inodes.                     (ea_inode_refs)
31  *      - The encryption policy ID of each encrypted inode. (encrypted_files)
32  *
33  * Pass 1 is designed to stash away enough information so that the
34  * other passes should not need to read in the inode information
35  * during the normal course of a filesystem check.  (Although if an
36  * inconsistency is detected, other passes may need to read in an
37  * inode to fix it.)
38  *
39  * Note that pass 1B will be invoked if there are any duplicate blocks
40  * found.
41  */
42
43 #define _GNU_SOURCE 1 /* get strnlen() */
44 #include "config.h"
45 #include <string.h>
46 #include <time.h>
47 #ifdef HAVE_ERRNO_H
48 #include <errno.h>
49 #endif
50 #include <assert.h>
51 #ifdef HAVE_PTHREAD
52 #include <pthread.h>
53 #endif
54
55 #include "e2fsck.h"
56 #include <ext2fs/ext2_ext_attr.h>
57 /* todo remove this finally */
58 #include <ext2fs/ext2fsP.h>
59 #include <e2p/e2p.h>
60
61 #include "problem.h"
62
63 #ifdef NO_INLINE_FUNCS
64 #define _INLINE_
65 #else
66 #define _INLINE_ inline
67 #endif
68
69 #undef DEBUG
70
71 struct ea_quota {
72         blk64_t blocks;
73         __u64 inodes;
74 };
75
76 static int process_block(ext2_filsys fs, blk64_t        *blocknr,
77                          e2_blkcnt_t blockcnt, blk64_t ref_blk,
78                          int ref_offset, void *priv_data);
79 static int process_bad_block(ext2_filsys fs, blk64_t *block_nr,
80                              e2_blkcnt_t blockcnt, blk64_t ref_blk,
81                              int ref_offset, void *priv_data);
82 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
83                          char *block_buf,
84                          const struct ea_quota *ea_ibody_quota);
85 static void mark_table_blocks(e2fsck_t ctx);
86 static void alloc_bb_map(e2fsck_t ctx);
87 static void alloc_imagic_map(e2fsck_t ctx);
88 static void mark_inode_bad(e2fsck_t ctx, ext2_ino_t ino);
89 static void add_casefolded_dir(e2fsck_t ctx, ext2_ino_t ino);
90 static void handle_fs_bad_blocks(e2fsck_t ctx);
91 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b);
92 static errcode_t scan_callback(ext2_filsys fs, ext2_inode_scan scan,
93                                   dgrp_t group, void * priv_data);
94 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
95                                     char *block_buf, int adjust_sign);
96 /* static char *describe_illegal_block(ext2_filsys fs, blk64_t block); */
97
98 struct process_block_struct {
99         ext2_ino_t      ino;
100         unsigned        is_dir:1, is_reg:1, clear:1, suppress:1,
101                                 fragmented:1, compressed:1, bbcheck:1,
102                                 inode_modified:1;
103         blk64_t         num_blocks;
104         blk64_t         max_blocks;
105         blk64_t         last_block;
106         e2_blkcnt_t     last_init_lblock;
107         e2_blkcnt_t     last_db_block;
108         int             num_illegal_blocks;
109         blk64_t         previous_block;
110         struct ext2_inode *inode;
111         struct problem_context *pctx;
112         ext2fs_block_bitmap fs_meta_blocks;
113         e2fsck_t        ctx;
114         blk64_t         next_lblock;
115         struct extent_tree_info eti;
116 };
117
118 struct process_inode_block {
119         ext2_ino_t ino;
120         struct ea_quota ea_ibody_quota;
121         struct ext2_inode_large inode;
122 };
123
124 struct scan_callback_struct {
125         e2fsck_t                         ctx;
126         char                            *block_buf;
127         struct process_inode_block      *inodes_to_process;
128         int                             *process_inode_count;
129 };
130
131 static void process_inodes(e2fsck_t ctx, char *block_buf,
132                            struct process_inode_block *inodes_to_process,
133                            int *process_inode_count);
134
135 static __u64 ext2_max_sizes[EXT2_MAX_BLOCK_LOG_SIZE -
136                             EXT2_MIN_BLOCK_LOG_SIZE + 1];
137
138 /*
139  * Check to make sure a device inode is real.  Returns 1 if the device
140  * checks out, 0 if not.
141  *
142  * Note: this routine is now also used to check FIFO's and Sockets,
143  * since they have the same requirement; the i_block fields should be
144  * zero.
145  */
146 int e2fsck_pass1_check_device_inode(ext2_filsys fs EXT2FS_ATTR((unused)),
147                                     struct ext2_inode *inode)
148 {
149         int     i;
150
151         /*
152          * If the index or extents flag is set, then this is a bogus
153          * device/fifo/socket
154          */
155         if (inode->i_flags & (EXT2_INDEX_FL | EXT4_EXTENTS_FL))
156                 return 0;
157
158         /*
159          * We should be able to do the test below all the time, but
160          * because the kernel doesn't forcibly clear the device
161          * inode's additional i_block fields, there are some rare
162          * occasions when a legitimate device inode will have non-zero
163          * additional i_block fields.  So for now, we only complain
164          * when the immutable flag is set, which should never happen
165          * for devices.  (And that's when the problem is caused, since
166          * you can't set or clear immutable flags for devices.)  Once
167          * the kernel has been fixed we can change this...
168          */
169         if (inode->i_flags & (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)) {
170                 for (i=4; i < EXT2_N_BLOCKS; i++)
171                         if (inode->i_block[i])
172                                 return 0;
173         }
174         return 1;
175 }
176
177 /*
178  * Check to make sure a symlink inode is real.  Returns 1 if the symlink
179  * checks out, 0 if not.
180  */
181 int e2fsck_pass1_check_symlink(ext2_filsys fs, ext2_ino_t ino,
182                                struct ext2_inode *inode, char *buf)
183 {
184         unsigned int buflen;
185         unsigned int len;
186
187         if ((inode->i_size_high || inode->i_size == 0) ||
188             (inode->i_flags & EXT2_INDEX_FL))
189                 return 0;
190
191         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
192                 size_t inline_size;
193
194                 if (inode->i_flags & EXT4_EXTENTS_FL)
195                         return 0;
196                 if (ext2fs_inline_data_size(fs, ino, &inline_size))
197                         return 0;
198                 if (inode->i_size != inline_size)
199                         return 0;
200
201                 return 1;
202         }
203
204         if (ext2fs_is_fast_symlink(inode)) {
205                 if (inode->i_flags & EXT4_EXTENTS_FL)
206                         return 0;
207                 buf = (char *)inode->i_block;
208                 buflen = sizeof(inode->i_block);
209         } else {
210                 ext2_extent_handle_t    handle;
211                 struct ext2_extent_info info;
212                 struct ext2fs_extent    extent;
213                 blk64_t blk;
214                 int i;
215
216                 if (inode->i_flags & EXT4_EXTENTS_FL) {
217                         if (ext2fs_extent_open2(fs, ino, inode, &handle))
218                                 return 0;
219                         if (ext2fs_extent_get_info(handle, &info) ||
220                             (info.num_entries != 1) ||
221                             (info.max_depth != 0)) {
222                                 ext2fs_extent_free(handle);
223                                 return 0;
224                         }
225                         if (ext2fs_extent_get(handle, EXT2_EXTENT_ROOT,
226                                               &extent) ||
227                             (extent.e_lblk != 0) ||
228                             (extent.e_len != 1)) {
229                                 ext2fs_extent_free(handle);
230                                 return 0;
231                         }
232                         blk = extent.e_pblk;
233                         ext2fs_extent_free(handle);
234                 } else {
235                         blk = inode->i_block[0];
236
237                         for (i = 1; i < EXT2_N_BLOCKS; i++)
238                                 if (inode->i_block[i])
239                                         return 0;
240                 }
241
242                 if (blk < fs->super->s_first_data_block ||
243                     blk >= ext2fs_blocks_count(fs->super))
244                         return 0;
245
246                 if (io_channel_read_blk64(fs->io, blk, 1, buf))
247                         return 0;
248
249                 buflen = fs->blocksize;
250         }
251
252         if (inode->i_flags & EXT4_ENCRYPT_FL)
253                 len = ext2fs_le16_to_cpu(*(__u16 *)buf) + 2;
254         else
255                 len = strnlen(buf, buflen);
256
257         if (len >= buflen)
258                 return 0;
259
260         if (len != inode->i_size)
261                 return 0;
262         return 1;
263 }
264
265 /*
266  * If the extents or inlinedata flags are set on the inode, offer to clear 'em.
267  */
268 #define BAD_SPECIAL_FLAGS (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)
269 static void check_extents_inlinedata(e2fsck_t ctx,
270                                      struct problem_context *pctx)
271 {
272         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
273                 return;
274
275         if (!fix_problem(ctx, PR_1_SPECIAL_EXTENTS_IDATA, pctx))
276                 return;
277
278         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
279         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
280 }
281 #undef BAD_SPECIAL_FLAGS
282
283 /*
284  * If the immutable (or append-only) flag is set on the inode, offer
285  * to clear it.
286  */
287 #define BAD_SPECIAL_FLAGS (EXT2_IMMUTABLE_FL | EXT2_APPEND_FL)
288 static void check_immutable(e2fsck_t ctx, struct problem_context *pctx)
289 {
290         if (!(pctx->inode->i_flags & BAD_SPECIAL_FLAGS))
291                 return;
292
293         if (!fix_problem(ctx, PR_1_SET_IMMUTABLE, pctx))
294                 return;
295
296         pctx->inode->i_flags &= ~BAD_SPECIAL_FLAGS;
297         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
298 }
299
300 /*
301  * If device, fifo or socket, check size is zero -- if not offer to
302  * clear it
303  */
304 static void check_size(e2fsck_t ctx, struct problem_context *pctx)
305 {
306         struct ext2_inode *inode = pctx->inode;
307
308         if (EXT2_I_SIZE(inode) == 0)
309                 return;
310
311         if (!fix_problem(ctx, PR_1_SET_NONZSIZE, pctx))
312                 return;
313
314         ext2fs_inode_size_set(ctx->fs, inode, 0);
315         e2fsck_write_inode(ctx, pctx->ino, pctx->inode, "pass1");
316 }
317
318 /*
319  * For a given size, calculate how many blocks would be charged towards quota.
320  */
321 static blk64_t size_to_quota_blocks(ext2_filsys fs, size_t size)
322 {
323         blk64_t clusters;
324
325         clusters = DIV_ROUND_UP(size, fs->blocksize << fs->cluster_ratio_bits);
326         return EXT2FS_C2B(fs, clusters);
327 }
328
329 /*
330  * Check validity of EA inode. Return 0 if EA inode is valid, otherwise return
331  * the problem code.
332  */
333 static problem_t check_large_ea_inode(e2fsck_t ctx,
334                                       struct ext2_ext_attr_entry *entry,
335                                       struct problem_context *pctx,
336                                       blk64_t *quota_blocks)
337 {
338         struct ext2_inode inode;
339         __u32 hash, signed_hash;
340         errcode_t retval;
341
342         /* Check if inode is within valid range */
343         if ((entry->e_value_inum < EXT2_FIRST_INODE(ctx->fs->super)) ||
344             (entry->e_value_inum > ctx->fs->super->s_inodes_count)) {
345                 pctx->num = entry->e_value_inum;
346                 return PR_1_ATTR_VALUE_EA_INODE;
347         }
348
349         e2fsck_read_inode(ctx, entry->e_value_inum, &inode, "pass1");
350
351         retval = ext2fs_ext_attr_hash_entry3(ctx->fs, entry, NULL, &hash,
352                                              &signed_hash);
353         if (retval) {
354                 com_err("check_large_ea_inode", retval,
355                         _("while hashing entry with e_value_inum = %u"),
356                         entry->e_value_inum);
357                 fatal_error(ctx, 0);
358         }
359
360         if ((hash == entry->e_hash) || (signed_hash == entry->e_hash)) {
361                 *quota_blocks = size_to_quota_blocks(ctx->fs,
362                                                      entry->e_value_size);
363         } else {
364                 /* This might be an old Lustre-style ea_inode reference. */
365                 if (inode.i_mtime == pctx->ino &&
366                     inode.i_generation == pctx->inode->i_generation) {
367                         *quota_blocks = 0;
368                 } else {
369                         /* If target inode is also missing EA_INODE flag,
370                          * this is likely to be a bad reference.
371                          */
372                         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
373                                 pctx->num = entry->e_value_inum;
374                                 return PR_1_ATTR_VALUE_EA_INODE;
375                         } else {
376                                 pctx->num = entry->e_hash;
377                                 return PR_1_ATTR_HASH;
378                         }
379                 }
380         }
381
382         if (!(inode.i_flags & EXT4_EA_INODE_FL)) {
383                 pctx->num = entry->e_value_inum;
384                 if (fix_problem(ctx, PR_1_ATTR_SET_EA_INODE_FL, pctx)) {
385                         inode.i_flags |= EXT4_EA_INODE_FL;
386                         e2fsck_pass1_fix_lock(ctx);
387                         ext2fs_write_inode(ctx->fs, entry->e_value_inum,
388                                            &inode);
389                         e2fsck_pass1_fix_unlock(ctx);
390                 } else {
391                         return PR_1_ATTR_NO_EA_INODE_FL;
392                 }
393         }
394         return 0;
395 }
396
397 static void inc_ea_inode_refs(e2fsck_t ctx, struct problem_context *pctx,
398                               struct ext2_ext_attr_entry *first, void *end)
399 {
400         struct ext2_ext_attr_entry *entry = first;
401         struct ext2_ext_attr_entry *np = EXT2_EXT_ATTR_NEXT(entry);
402
403         while ((void *) entry < end && (void *) np < end &&
404                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
405                 if (!entry->e_value_inum)
406                         goto next;
407                 if (!ctx->ea_inode_refs) {
408                         pctx->errcode = ea_refcount_create(0,
409                                                            &ctx->ea_inode_refs);
410                         if (pctx->errcode) {
411                                 pctx->num = 4;
412                                 fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
413                                 ctx->flags |= E2F_FLAG_ABORT;
414                                 return;
415                         }
416                 }
417                 ea_refcount_increment(ctx->ea_inode_refs, entry->e_value_inum,
418                                       0);
419         next:
420                 entry = np;
421                 np = EXT2_EXT_ATTR_NEXT(entry);
422         }
423 }
424
425 static void check_ea_in_inode(e2fsck_t ctx, struct problem_context *pctx,
426                               struct ea_quota *ea_ibody_quota)
427 {
428         struct ext2_super_block *sb = ctx->fs->super;
429         struct ext2_inode_large *inode;
430         struct ext2_ext_attr_entry *entry;
431         char *start, *header, *end;
432         unsigned int storage_size, remain;
433         problem_t problem = 0;
434         region_t region = 0;
435
436         ea_ibody_quota->blocks = 0;
437         ea_ibody_quota->inodes = 0;
438
439         inode = (struct ext2_inode_large *) pctx->inode;
440         storage_size = EXT2_INODE_SIZE(ctx->fs->super) - EXT2_GOOD_OLD_INODE_SIZE -
441                 inode->i_extra_isize;
442         header = ((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
443                  inode->i_extra_isize;
444         end = header + storage_size;
445         start = header + sizeof(__u32);
446         entry = (struct ext2_ext_attr_entry *) start;
447
448         /* scan all entry's headers first */
449
450         /* take finish entry 0UL into account */
451         remain = storage_size - sizeof(__u32);
452
453         region = region_create(0, storage_size);
454         if (!region) {
455                 fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
456                 problem = 0;
457                 ctx->flags |= E2F_FLAG_ABORT;
458                 return;
459         }
460         if (region_allocate(region, 0, sizeof(__u32))) {
461                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
462                 goto fix;
463         }
464
465         while (remain >= sizeof(struct ext2_ext_attr_entry) &&
466                !EXT2_EXT_IS_LAST_ENTRY(entry)) {
467                 __u32 hash;
468
469                 if (region_allocate(region, (char *)entry - (char *)header,
470                                     EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
471                         problem = PR_1_INODE_EA_ALLOC_COLLISION;
472                         goto fix;
473                 }
474
475                 /* header eats this space */
476                 remain -= sizeof(struct ext2_ext_attr_entry);
477
478                 /* is attribute name valid? */
479                 if (EXT2_EXT_ATTR_SIZE(entry->e_name_len) > remain) {
480                         pctx->num = entry->e_name_len;
481                         problem = PR_1_ATTR_NAME_LEN;
482                         goto fix;
483                 }
484
485                 /* attribute len eats this space */
486                 remain -= EXT2_EXT_ATTR_SIZE(entry->e_name_len);
487
488                 if (entry->e_value_inum == 0) {
489                         /* check value size */
490                         if (entry->e_value_size > remain) {
491                                 pctx->num = entry->e_value_size;
492                                 problem = PR_1_ATTR_VALUE_SIZE;
493                                 goto fix;
494                         }
495
496                         if (entry->e_value_size &&
497                             region_allocate(region,
498                                             sizeof(__u32) + entry->e_value_offs,
499                                             EXT2_EXT_ATTR_SIZE(
500                                                 entry->e_value_size))) {
501                                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
502                                 goto fix;
503                         }
504
505                         hash = ext2fs_ext_attr_hash_entry(entry,
506                                                 start + entry->e_value_offs);
507                         if (entry->e_hash != 0 && entry->e_hash != hash)
508                                 hash = ext2fs_ext_attr_hash_entry_signed(entry,
509                                                 start + entry->e_value_offs);
510
511                         /* e_hash may be 0 in older inode's ea */
512                         if (entry->e_hash != 0 && entry->e_hash != hash) {
513                                 pctx->num = entry->e_hash;
514                                 problem = PR_1_ATTR_HASH;
515                                 goto fix;
516                         }
517                 } else {
518                         blk64_t quota_blocks;
519
520                         problem = check_large_ea_inode(ctx, entry, pctx,
521                                                        &quota_blocks);
522                         if (problem != 0)
523                                 goto fix;
524
525                         ea_ibody_quota->blocks += quota_blocks;
526                         ea_ibody_quota->inodes++;
527                 }
528
529                 /* If EA value is stored in external inode then it does not
530                  * consume space here */
531                 if (entry->e_value_inum == 0)
532                         remain -= entry->e_value_size;
533
534                 entry = EXT2_EXT_ATTR_NEXT(entry);
535         }
536
537         if (region_allocate(region, (char *)entry - (char *)header,
538                             sizeof(__u32))) {
539                 problem = PR_1_INODE_EA_ALLOC_COLLISION;
540                 goto fix;
541         }
542 fix:
543         if (region)
544                 region_free(region);
545         /*
546          * it seems like a corruption. it's very unlikely we could repair
547          * EA(s) in automatic fashion -bzzz
548          */
549         if (problem == 0 || !fix_problem(ctx, problem, pctx)) {
550                 inc_ea_inode_refs(ctx, pctx,
551                                   (struct ext2_ext_attr_entry *)start, end);
552                 return;
553         }
554
555         /* simply remove all possible EA(s) */
556         *((__u32 *)header) = 0UL;
557         e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
558                                 EXT2_INODE_SIZE(sb), "pass1");
559         ea_ibody_quota->blocks = 0;
560         ea_ibody_quota->inodes = 0;
561 }
562
563 static int check_inode_extra_negative_epoch(__u32 xtime, __u32 extra) {
564         return (xtime & (1U << 31)) != 0 &&
565                 (extra & EXT4_EPOCH_MASK) == EXT4_EPOCH_MASK;
566 }
567
568 #define CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, xtime) \
569         check_inode_extra_negative_epoch(inode->i_##xtime, \
570                                          inode->i_##xtime##_extra)
571
/* When today's date is earlier than 2242, we assume that atimes,
 * ctimes, crtimes, and mtimes with years in the range 2310..2378 are
 * actually pre-1970 dates mis-encoded.
 *
 * The value is 2 * 2^32 seconds after the epoch.  The replacement list
 * is parenthesized so that the macro expands as a single operand no
 * matter which operators surround it.
 */
#define EXT4_EXTRA_NEGATIVE_DATE_CUTOFF (2 * (1LL << 32))
577
578 static void check_inode_extra_space(e2fsck_t ctx, struct problem_context *pctx,
579                                     struct ea_quota *ea_ibody_quota)
580 {
581         struct ext2_super_block *sb = ctx->fs->super;
582         struct ext2_inode_large *inode;
583         __u32 *eamagic;
584         int min, max;
585
586         ea_ibody_quota->blocks = 0;
587         ea_ibody_quota->inodes = 0;
588
589         inode = (struct ext2_inode_large *) pctx->inode;
590         if (EXT2_INODE_SIZE(sb) == EXT2_GOOD_OLD_INODE_SIZE) {
591                 /* this isn't large inode. so, nothing to check */
592                 return;
593         }
594
595 #if 0
596         printf("inode #%u, i_extra_size %d\n", pctx->ino,
597                         inode->i_extra_isize);
598 #endif
599         /* i_extra_isize must cover i_extra_isize + i_checksum_hi at least */
600         min = sizeof(inode->i_extra_isize) + sizeof(inode->i_checksum_hi);
601         max = EXT2_INODE_SIZE(sb) - EXT2_GOOD_OLD_INODE_SIZE;
602         /*
603          * For now we will allow i_extra_isize to be 0, but really
604          * implementations should never allow i_extra_isize to be 0
605          */
606         if (inode->i_extra_isize &&
607             (inode->i_extra_isize < min || inode->i_extra_isize > max ||
608              inode->i_extra_isize & 3)) {
609                 if (!fix_problem(ctx, PR_1_EXTRA_ISIZE, pctx))
610                         return;
611                 if (inode->i_extra_isize < min || inode->i_extra_isize > max)
612                         inode->i_extra_isize = sb->s_want_extra_isize;
613                 else
614                         inode->i_extra_isize = (inode->i_extra_isize + 3) & ~3;
615                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
616                                         EXT2_INODE_SIZE(sb), "pass1");
617         }
618
619         /* check if there is no place for an EA header */
620         if (inode->i_extra_isize >= max - sizeof(__u32))
621                 return;
622
623         eamagic = (__u32 *) (((char *) inode) + EXT2_GOOD_OLD_INODE_SIZE +
624                         inode->i_extra_isize);
625         if (*eamagic == EXT2_EXT_ATTR_MAGIC) {
626                 /* it seems inode has an extended attribute(s) in body */
627                 check_ea_in_inode(ctx, pctx, ea_ibody_quota);
628         }
629
630         /*
631          * If the inode's extended atime (ctime, crtime, mtime) is stored in
632          * the old, invalid format, repair it.
633          */
634         if (((sizeof(time_t) <= 4) ||
635              (((sizeof(time_t) > 4) &&
636                ctx->now < EXT4_EXTRA_NEGATIVE_DATE_CUTOFF))) &&
637             (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime) ||
638              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime) ||
639              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime) ||
640              CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))) {
641
642                 if (!fix_problem(ctx, PR_1_EA_TIME_OUT_OF_RANGE, pctx))
643                         return;
644
645                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, atime))
646                         inode->i_atime_extra &= ~EXT4_EPOCH_MASK;
647                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, ctime))
648                         inode->i_ctime_extra &= ~EXT4_EPOCH_MASK;
649                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, crtime))
650                         inode->i_crtime_extra &= ~EXT4_EPOCH_MASK;
651                 if (CHECK_INODE_EXTRA_NEGATIVE_EPOCH(inode, mtime))
652                         inode->i_mtime_extra &= ~EXT4_EPOCH_MASK;
653                 e2fsck_write_inode_full(ctx, pctx->ino, pctx->inode,
654                                         EXT2_INODE_SIZE(sb), "pass1");
655         }
656
657 }
658
659 static _INLINE_ int is_blocks_used(e2fsck_t ctx, blk64_t block,
660                                    unsigned int num)
661 {
662         int retval;
663
664         /* used to avoid duplicate output from below */
665         retval = ext2fs_test_block_bitmap_range2_valid(ctx->block_found_map,
666                                                        block, num);
667         if (!retval)
668                 return 0;
669
670         retval = ext2fs_test_block_bitmap_range2(ctx->block_found_map, block, num);
671         if (retval) {
672                 e2fsck_pass1_block_map_r_lock(ctx);
673                 if (ctx->global_ctx)
674                         retval = ext2fs_test_block_bitmap_range2(
675                                         ctx->global_ctx->block_found_map, block, num);
676                 e2fsck_pass1_block_map_r_unlock(ctx);
677                 if (retval)
678                         return 0;
679         }
680
681         return 1;
682 }
683
684 /*
685  * Check to see if the inode might really be a directory, despite i_mode
686  *
687  * This is a lot of complexity for something for which I'm not really
688  * convinced happens frequently in the wild.  If for any reason this
689  * causes any problems, take this code out.
690  * [tytso:20070331.0827EDT]
691  */
692 static void check_is_really_dir(e2fsck_t ctx, struct problem_context *pctx,
693                                 char *buf)
694 {
695         struct ext2_inode *inode = pctx->inode;
696         struct ext2_dir_entry   *dirent;
697         errcode_t               retval;
698         blk64_t                 blk;
699         unsigned int            i, rec_len, not_device = 0;
700         int                     extent_fs;
701         int                     inlinedata_fs;
702
703         /*
704          * If the mode looks OK, we believe it.  If the first block in
705          * the i_block array is 0, this cannot be a directory. If the
706          * inode is extent-mapped, it is still the case that the latter
707          * cannot be 0 - the magic number in the extent header would make
708          * it nonzero.
709          */
710         if (LINUX_S_ISDIR(inode->i_mode) || LINUX_S_ISREG(inode->i_mode) ||
711             LINUX_S_ISLNK(inode->i_mode) || inode->i_block[0] == 0)
712                 return;
713
714         /*
715          * Check the block numbers in the i_block array for validity:
716          * zero blocks are skipped (but the first one cannot be zero -
717          * see above), other blocks are checked against the first and
718          * max data blocks (from the superblock) and against the
719          * block bitmap. Any invalid block found means this cannot be
720          * a directory.
721          *
722          * If there are non-zero blocks past the fourth entry, then
723          * this cannot be a device file: we remember that for the next
724          * check.
725          *
726          * For extent mapped files, we don't do any sanity checking:
727          * just try to get the phys block of logical block 0 and run
728          * with it.
729          *
730          * For inline data files, we just try to get the size of inline
731          * data.  If it's true, we will treat it as a directory.
732          */
733
734         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
735         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
736         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL)) {
737                 size_t size;
738                 __u32 dotdot;
739                 unsigned int rec_len2;
740                 struct ext2_dir_entry de;
741
742                 if (ext2fs_inline_data_size(ctx->fs, pctx->ino, &size))
743                         return;
744                 /*
745                  * If the size isn't a multiple of 4, it's probably not a
746                  * directory??
747                  */
748                 if (size & 3)
749                         return;
750                 /*
751                  * If the first 10 bytes don't look like a directory entry,
752                  * it's probably not a directory.
753                  */
754                 memcpy(&dotdot, inode->i_block, sizeof(dotdot));
755                 memcpy(&de, ((char *)inode->i_block) + EXT4_INLINE_DATA_DOTDOT_SIZE,
756                        EXT2_DIR_REC_LEN(0));
757                 dotdot = ext2fs_le32_to_cpu(dotdot);
758                 de.inode = ext2fs_le32_to_cpu(de.inode);
759                 de.rec_len = ext2fs_le16_to_cpu(de.rec_len);
760                 ext2fs_get_rec_len(ctx->fs, &de, &rec_len2);
761                 if (dotdot >= ctx->fs->super->s_inodes_count ||
762                     (dotdot < EXT2_FIRST_INO(ctx->fs->super) &&
763                      dotdot != EXT2_ROOT_INO) ||
764                     de.inode >= ctx->fs->super->s_inodes_count ||
765                     (de.inode < EXT2_FIRST_INO(ctx->fs->super) &&
766                      de.inode != 0) ||
767                     rec_len2 > EXT4_MIN_INLINE_DATA_SIZE -
768                               EXT4_INLINE_DATA_DOTDOT_SIZE)
769                         return;
770                 /* device files never have a "system.data" entry */
771                 goto isdir;
772         } else if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) {
773                 /* extent mapped */
774                 if  (ext2fs_bmap2(ctx->fs, pctx->ino, inode, 0, 0, 0, 0,
775                                  &blk))
776                         return;
777                 /* device files are never extent mapped */
778                 not_device++;
779         } else {
780                 for (i=0; i < EXT2_N_BLOCKS; i++) {
781                         blk = inode->i_block[i];
782                         if (!blk)
783                                 continue;
784                         if (i >= 4)
785                                 not_device++;
786
787                         if (blk < ctx->fs->super->s_first_data_block ||
788                             blk >= ext2fs_blocks_count(ctx->fs->super) ||
789                             is_blocks_used(ctx, blk, 1))
790                                 return; /* Invalid block, can't be dir */
791                 }
792                 blk = inode->i_block[0];
793         }
794
795         /*
796          * If the mode says this is a device file and the i_links_count field
797          * is sane and we have not ruled it out as a device file previously,
798          * we declare it a device file, not a directory.
799          */
800         if ((LINUX_S_ISCHR(inode->i_mode) || LINUX_S_ISBLK(inode->i_mode)) &&
801             (inode->i_links_count == 1) && !not_device)
802                 return;
803
804         /* read the first block */
805         ehandler_operation(_("reading directory block"));
806         retval = ext2fs_read_dir_block4(ctx->fs, blk, buf, 0, pctx->ino);
807         ehandler_operation(0);
808         if (retval)
809                 return;
810
811         dirent = (struct ext2_dir_entry *) buf;
812         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
813         if (retval)
814                 return;
815         if ((ext2fs_dirent_name_len(dirent) != 1) ||
816             (dirent->name[0] != '.') ||
817             (dirent->inode != pctx->ino) ||
818             (rec_len < 12) ||
819             (rec_len % 4) ||
820             (rec_len >= ctx->fs->blocksize - 12))
821                 return;
822
823         dirent = (struct ext2_dir_entry *) (buf + rec_len);
824         retval = ext2fs_get_rec_len(ctx->fs, dirent, &rec_len);
825         if (retval)
826                 return;
827         if ((ext2fs_dirent_name_len(dirent) != 2) ||
828             (dirent->name[0] != '.') ||
829             (dirent->name[1] != '.') ||
830             (rec_len < 12) ||
831             (rec_len % 4))
832                 return;
833
834 isdir:
835         if (fix_problem(ctx, PR_1_TREAT_AS_DIRECTORY, pctx)) {
836                 inode->i_mode = (inode->i_mode & 07777) | LINUX_S_IFDIR;
837                 e2fsck_write_inode_full(ctx, pctx->ino, inode,
838                                         EXT2_INODE_SIZE(ctx->fs->super),
839                                         "check_is_really_dir");
840         }
841 }
842
843 extern errcode_t e2fsck_setup_icount(e2fsck_t ctx, const char *icount_name,
844                                      int flags, ext2_icount_t hint,
845                                      ext2_icount_t *ret)
846 {
847         unsigned int            threshold;
848         unsigned int            save_type;
849         ext2_ino_t              num_dirs;
850         errcode_t               retval;
851         char                    *tdb_dir;
852         int                     enable;
853
854         *ret = 0;
855
856         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
857                            &tdb_dir);
858         profile_get_uint(ctx->profile, "scratch_files",
859                          "numdirs_threshold", 0, 0, &threshold);
860         profile_get_boolean(ctx->profile, "scratch_files",
861                             "icount", 0, 1, &enable);
862
863         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
864         if (retval)
865                 num_dirs = 1024;        /* Guess */
866
867         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
868             (!threshold || num_dirs > threshold)) {
869                 retval = ext2fs_create_icount_tdb(ctx->fs, tdb_dir,
870                                                   flags, ret);
871                 if (retval == 0)
872                         return 0;
873         }
874         e2fsck_set_bitmap_type(ctx->fs, EXT2FS_BMAP64_RBTREE, icount_name,
875                                &save_type);
876         if (ctx->options & E2F_OPT_ICOUNT_FULLMAP)
877                 flags |= EXT2_ICOUNT_OPT_FULLMAP;
878         retval = ext2fs_create_icount2(ctx->fs, flags, 0, hint, ret);
879         ctx->fs->default_bitmap_type = save_type;
880         return retval;
881 }
882
883 static errcode_t recheck_bad_inode_checksum(ext2_filsys fs, ext2_ino_t ino,
884                                             e2fsck_t ctx,
885                                             struct problem_context *pctx)
886 {
887         errcode_t retval;
888         struct ext2_inode_large inode;
889
890         /*
891          * Reread inode.  If we don't see checksum error, then this inode
892          * has been fixed elsewhere.
893          */
894         ctx->stashed_ino = 0;
895         retval = ext2fs_read_inode_full(fs, ino, (struct ext2_inode *)&inode,
896                                         sizeof(inode));
897         if (retval && retval != EXT2_ET_INODE_CSUM_INVALID)
898                 return retval;
899         if (!retval)
900                 return 0;
901
902         /*
903          * Checksum still doesn't match.  That implies that the inode passes
904          * all the sanity checks, so maybe the checksum is simply corrupt.
905          * See if the user will go for fixing that.
906          */
907         if (!fix_problem(ctx, PR_1_INODE_ONLY_CSUM_INVALID, pctx))
908                 return 0;
909
910
911         e2fsck_pass1_fix_lock(ctx);
912         retval = ext2fs_write_inode_full(fs, ino, (struct ext2_inode *)&inode,
913                                          sizeof(inode));
914         e2fsck_pass1_fix_unlock(ctx);
915         return retval;
916 }
917
918 static void reserve_block_for_root_repair(e2fsck_t ctx)
919 {
920         blk64_t         blk = 0;
921         errcode_t       err;
922         ext2_filsys     fs = ctx->fs;
923
924         ctx->root_repair_block = 0;
925         if (ext2fs_test_inode_bitmap2(ctx->inode_used_map, EXT2_ROOT_INO))
926                 return;
927
928         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
929         if (err)
930                 return;
931         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
932         ctx->root_repair_block = blk;
933 }
934
935 static void reserve_block_for_lnf_repair(e2fsck_t ctx)
936 {
937         blk64_t         blk = 0;
938         errcode_t       err;
939         ext2_filsys     fs = ctx->fs;
940         static const char name[] = "lost+found";
941         ext2_ino_t      ino;
942
943         ctx->lnf_repair_block = 0;
944         if (!ext2fs_lookup(fs, EXT2_ROOT_INO, name, sizeof(name)-1, 0, &ino))
945                 return;
946
947         err = ext2fs_new_block2(fs, 0, ctx->block_found_map, &blk);
948         if (err)
949                 return;
950         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
951         ctx->lnf_repair_block = blk;
952         return;
953 }
954
955 static errcode_t get_inline_data_ea_size(ext2_filsys fs, ext2_ino_t ino,
956                                          struct ext2_inode *inode,
957                                          size_t *sz)
958 {
959         void *p;
960         struct ext2_xattr_handle *handle;
961         errcode_t retval;
962
963         retval = ext2fs_xattrs_open(fs, ino, &handle);
964         if (retval)
965                 return retval;
966
967         retval = ext2fs_xattrs_read_inode(handle,
968                                           (struct ext2_inode_large *)inode);
969         if (retval)
970                 goto err;
971
972         retval = ext2fs_xattr_get(handle, "system.data", &p, sz);
973         if (retval)
974                 goto err;
975         ext2fs_free_mem(&p);
976 err:
977         (void) ext2fs_xattrs_close(&handle);
978         return retval;
979 }
980
981 static void finish_processing_inode(e2fsck_t ctx, ext2_ino_t ino,
982                                     struct problem_context *pctx,
983                                     int failed_csum)
984 {
985         if (!failed_csum)
986                 return;
987
988         /*
989          * If the inode failed the checksum and the user didn't
990          * clear the inode, test the checksum again -- if it still
991          * fails, ask the user if the checksum should be corrected.
992          */
993         pctx->errcode = recheck_bad_inode_checksum(ctx->fs, ino, ctx, pctx);
994         if (pctx->errcode)
995                 ctx->flags |= E2F_FLAG_ABORT;
996 }
/*
 * Run finish_processing_inode() for the current inode and, if
 * E2F_FLAG_ABORT is set on ctx afterwards, call
 * e2fsck_pass1_check_unlock() and return from the ENCLOSING function.
 * Because of that hidden bare "return", the macro is only usable inside
 * functions returning void.
 */
#define FINISH_INODE_LOOP(ctx, ino, pctx, failed_csum) \
	do { \
		finish_processing_inode((ctx), (ino), (pctx), (failed_csum)); \
		if ((ctx)->flags & E2F_FLAG_ABORT) { \
			e2fsck_pass1_check_unlock(ctx); \
			return; \
		} \
	} while (0)
1005
1006 static int could_be_block_map(ext2_filsys fs, struct ext2_inode *inode)
1007 {
1008         __u32 x;
1009         int i;
1010
1011         for (i = 0; i < EXT2_N_BLOCKS; i++) {
1012                 x = inode->i_block[i];
1013 #ifdef WORDS_BIGENDIAN
1014                 x = ext2fs_swab32(x);
1015 #endif
1016                 if (x >= ext2fs_blocks_count(fs->super))
1017                         return 0;
1018         }
1019
1020         return 1;
1021 }
1022
1023 /*
1024  * Figure out what to do with an inode that has both extents and inline data
1025  * inode flags set.  Returns -1 if we decide to erase the inode, 0 otherwise.
1026  */
1027 static int fix_inline_data_extents_file(e2fsck_t ctx,
1028                                         ext2_ino_t ino,
1029                                         struct ext2_inode *inode,
1030                                         int inode_size,
1031                                         struct problem_context *pctx)
1032 {
1033         size_t max_inline_ea_size;
1034         ext2_filsys fs = ctx->fs;
1035         int dirty = 0;
1036
1037         /* Both feature flags not set?  Just run the regular checks */
1038         if (!ext2fs_has_feature_extents(fs->super) &&
1039             !ext2fs_has_feature_inline_data(fs->super))
1040                 return 0;
1041
1042         /* Clear both flags if it's a special file */
1043         if (LINUX_S_ISCHR(inode->i_mode) ||
1044             LINUX_S_ISBLK(inode->i_mode) ||
1045             LINUX_S_ISFIFO(inode->i_mode) ||
1046             LINUX_S_ISSOCK(inode->i_mode)) {
1047                 check_extents_inlinedata(ctx, pctx);
1048                 return 0;
1049         }
1050
1051         /* If it looks like an extent tree, try to clear inlinedata */
1052         if (ext2fs_extent_header_verify(inode->i_block,
1053                                  sizeof(inode->i_block)) == 0 &&
1054             fix_problem(ctx, PR_1_CLEAR_INLINE_DATA_FOR_EXTENT, pctx)) {
1055                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1056                 dirty = 1;
1057                 goto out;
1058         }
1059
1060         /* If it looks short enough to be inline data, try to clear extents */
1061         if (inode_size > EXT2_GOOD_OLD_INODE_SIZE)
1062                 max_inline_ea_size = inode_size -
1063                                      (EXT2_GOOD_OLD_INODE_SIZE +
1064                                       ((struct ext2_inode_large *)inode)->i_extra_isize);
1065         else
1066                 max_inline_ea_size = 0;
1067         if (EXT2_I_SIZE(inode) <
1068             EXT4_MIN_INLINE_DATA_SIZE + max_inline_ea_size &&
1069             fix_problem(ctx, PR_1_CLEAR_EXTENT_FOR_INLINE_DATA, pctx)) {
1070                 inode->i_flags &= ~EXT4_EXTENTS_FL;
1071                 dirty = 1;
1072                 goto out;
1073         }
1074
1075         /*
1076          * Too big for inline data, but no evidence of extent tree -
1077          * maybe it's a block map file?  If the mappings all look valid?
1078          */
1079         if (could_be_block_map(fs, inode) &&
1080             fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_FLAGS, pctx)) {
1081 #ifdef WORDS_BIGENDIAN
1082                 int i;
1083
1084                 for (i = 0; i < EXT2_N_BLOCKS; i++)
1085                         inode->i_block[i] = ext2fs_swab32(inode->i_block[i]);
1086 #endif
1087
1088                 inode->i_flags &= ~(EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL);
1089                 dirty = 1;
1090                 goto out;
1091         }
1092
1093         /* Oh well, just clear the busted inode. */
1094         if (fix_problem(ctx, PR_1_CLEAR_EXTENT_INLINE_DATA_INODE, pctx)) {
1095                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1096                 return -1;
1097         }
1098
1099 out:
1100         if (dirty)
1101                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1102
1103         return 0;
1104 }
1105
1106 static void pass1_readahead(e2fsck_t ctx, dgrp_t *group, ext2_ino_t *next_ino)
1107 {
1108         ext2_ino_t inodes_in_group = 0, inodes_per_block, inodes_per_buffer;
1109         dgrp_t start = *group, grp, grp_end = ctx->fs->group_desc_count;
1110         blk64_t blocks_to_read = 0;
1111         errcode_t err = EXT2_ET_INVALID_ARGUMENT;
1112
1113 #ifdef HAVE_PTHREAD
1114         if (ctx->fs->fs_num_threads > 1)
1115                 grp_end = ctx->thread_info.et_group_end;
1116 #endif
1117         if (ctx->readahead_kb == 0)
1118                 goto out;
1119
1120         /* Keep iterating groups until we have enough to readahead */
1121         inodes_per_block = EXT2_INODES_PER_BLOCK(ctx->fs->super);
1122         for (grp = start; grp < grp_end; grp++) {
1123                 if (ext2fs_bg_flags_test(ctx->fs, grp, EXT2_BG_INODE_UNINIT))
1124                         continue;
1125                 inodes_in_group = ctx->fs->super->s_inodes_per_group -
1126                                         ext2fs_bg_itable_unused(ctx->fs, grp);
1127                 blocks_to_read += (inodes_in_group + inodes_per_block - 1) /
1128                                         inodes_per_block;
1129                 if (blocks_to_read * ctx->fs->blocksize >
1130                     ctx->readahead_kb * 1024)
1131                         break;
1132         }
1133
1134         err = e2fsck_readahead(ctx->fs, E2FSCK_READA_ITABLE, start,
1135                                grp - start + 1);
1136         if (err == EAGAIN) {
1137                 ctx->readahead_kb /= 2;
1138                 err = 0;
1139         }
1140
1141 out:
1142         if (err) {
1143                 /* Error; disable itable readahead */
1144                 *group = ctx->fs->group_desc_count;
1145                 *next_ino = ctx->fs->super->s_inodes_count;
1146         } else {
1147                 /*
1148                  * Don't do more readahead until we've reached the first inode
1149                  * of the last inode scan buffer block for the last group.
1150                  */
1151                 *group = grp + 1;
1152                 inodes_per_buffer = (ctx->inode_buffer_blocks ?
1153                                      ctx->inode_buffer_blocks :
1154                                      EXT2_INODE_SCAN_DEFAULT_BUFFER_BLOCKS) *
1155                                     ctx->fs->blocksize /
1156                                     EXT2_INODE_SIZE(ctx->fs->super);
1157                 inodes_in_group--;
1158                 *next_ino = inodes_in_group -
1159                             (inodes_in_group % inodes_per_buffer) + 1 +
1160                             (grp * ctx->fs->super->s_inodes_per_group);
1161         }
1162 }
1163
1164 /*
1165  * Check if the passed ino is one of the used superblock quota inodes.
1166  *
1167  * Before the quota inodes were journaled, older superblock quota inodes
1168  * were just regular files in the filesystem and not reserved inodes.  This
1169  * checks if the passed ino is one of the s_*_quota_inum superblock fields,
1170  * which may not always be the same as the EXT4_*_QUOTA_INO fields.
1171  */
1172 static int quota_inum_is_super(struct ext2_super_block *sb, ext2_ino_t ino)
1173 {
1174         enum quota_type qtype;
1175
1176         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1177                 if (*quota_sb_inump(sb, qtype) == ino)
1178                         return 1;
1179
1180         return 0;
1181 }
1182
1183 /*
1184  * Check if the passed ino is one of the reserved quota inodes.
1185  * This checks if the inode number is one of the reserved EXT4_*_QUOTA_INO
1186  * inodes.  These inodes may or may not be in use by the quota feature.
1187  */
1188 static int quota_inum_is_reserved(ext2_filsys fs, ext2_ino_t ino)
1189 {
1190         enum quota_type qtype;
1191
1192         for (qtype = 0; qtype < MAXQUOTAS; qtype++)
1193                 if (quota_type2inum(qtype, fs->super) == ino)
1194                         return 1;
1195
1196         return 0;
1197 }
1198
1199 static int e2fsck_should_abort(e2fsck_t ctx)
1200 {
1201         e2fsck_t global_ctx;
1202
1203         if (ctx->flags & E2F_FLAG_SIGNAL_MASK)
1204                 return 1;
1205
1206         if (ctx->global_ctx) {
1207                 global_ctx = ctx->global_ctx;
1208                 if (global_ctx->flags & E2F_FLAG_SIGNAL_MASK)
1209                         return 1;
1210         }
1211         return 0;
1212 }
1213
1214 static void init_ext2_max_sizes()
1215 {
1216         int     i;
1217         __u64   max_sizes;
1218
1219         /*
1220          * Init ext2_max_sizes which will be immutable and shared between
1221          * threads
1222          */
1223 #define EXT2_BPP(bits) (1ULL << ((bits) - 2))
1224
1225         for (i = EXT2_MIN_BLOCK_LOG_SIZE; i <= EXT2_MAX_BLOCK_LOG_SIZE; i++) {
1226                 max_sizes = EXT2_NDIR_BLOCKS + EXT2_BPP(i);
1227                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i);
1228                 max_sizes = max_sizes + EXT2_BPP(i) * EXT2_BPP(i) * EXT2_BPP(i);
1229                 max_sizes = (max_sizes * (1UL << i));
1230                 ext2_max_sizes[i - EXT2_MIN_BLOCK_LOG_SIZE] = max_sizes;
1231         }
1232 #undef EXT2_BPP
1233 }
1234
1235 #ifdef HAVE_PTHREAD
1236 /* TODO: tdb needs to be handled properly for multiple threads*/
1237 static int multiple_threads_supported(e2fsck_t ctx)
1238 {
1239 #ifdef  CONFIG_TDB
1240         unsigned int            threshold;
1241         ext2_ino_t              num_dirs;
1242         errcode_t               retval;
1243         char                    *tdb_dir;
1244         int                     enable;
1245
1246         profile_get_string(ctx->profile, "scratch_files", "directory", 0, 0,
1247                            &tdb_dir);
1248         profile_get_uint(ctx->profile, "scratch_files",
1249                          "numdirs_threshold", 0, 0, &threshold);
1250         profile_get_boolean(ctx->profile, "scratch_files",
1251                             "icount", 0, 1, &enable);
1252
1253         retval = ext2fs_get_num_dirs(ctx->fs, &num_dirs);
1254         if (retval)
1255                 num_dirs = 1024;        /* Guess */
1256
1257         /* tdb is unsupported now */
1258         if (enable && tdb_dir && !access(tdb_dir, W_OK) &&
1259             (!threshold || num_dirs > threshold))
1260                 return 0;
1261 #endif
1262         return 1;
1263 }
1264
1265 /**
1266  * Even though we could specify number of threads,
1267  * but it might be more than the whole filesystem
1268  * block groups, correct it here.
1269  */
1270 static void e2fsck_pass1_set_thread_num(e2fsck_t ctx)
1271 {
1272         unsigned flexbg_size = 1;
1273         ext2_filsys fs = ctx->fs;
1274         int num_threads = ctx->fs_num_threads;
1275         int max_threads;
1276
1277         if (num_threads < 1) {
1278                 num_threads = 1;
1279                 goto out;
1280         }
1281
1282         if (!multiple_threads_supported(ctx)) {
1283                 num_threads = 1;
1284                 fprintf(stderr, "Fall through single thread for pass1 "
1285                         "because tdb could not handle properly\n");
1286                 goto out;
1287         }
1288
1289         if (ext2fs_has_feature_flex_bg(fs->super))
1290                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
1291         max_threads = fs->group_desc_count / flexbg_size;
1292         if (max_threads == 0)
1293                 max_threads = 1;
1294
1295         if (num_threads > max_threads) {
1296                 fprintf(stderr, "Use max possible thread num: %d instead\n",
1297                                 max_threads);
1298                 num_threads = max_threads;
1299         }
1300 out:
1301         ctx->fs_num_threads = num_threads;
1302         ctx->fs->fs_num_threads = num_threads;
1303 }
1304 #endif
1305
1306 /*
1307  * We need call mark_table_blocks() before multiple
1308  * thread start, since all known system blocks should be
1309  * marked and checked later.
1310  */
1311 static errcode_t e2fsck_pass1_prepare(e2fsck_t ctx)
1312 {
1313         struct problem_context pctx;
1314         ext2_filsys fs = ctx->fs;
1315         unsigned long long readahead_kb;
1316
1317         init_ext2_max_sizes();
1318 #ifdef HAVE_PTHREAD
1319         e2fsck_pass1_set_thread_num(ctx);
1320 #endif
1321         /* If we can do readahead, figure out how many groups to pull in. */
1322         if (!e2fsck_can_readahead(ctx->fs))
1323                 ctx->readahead_kb = 0;
1324         else if (ctx->readahead_kb == ~0ULL)
1325                 ctx->readahead_kb = e2fsck_guess_readahead(ctx->fs);
1326
1327 #ifdef HAVE_PTHREAD
1328         /* don't use more than 1/10 of memory for threads checking */
1329         readahead_kb = get_memory_size() / (10 * ctx->fs_num_threads);
1330         /* maybe better disable RA if this is too small? */
1331         if (ctx->readahead_kb > readahead_kb)
1332                 ctx->readahead_kb = readahead_kb;
1333 #endif
1334         clear_problem_context(&pctx);
1335         if (!(ctx->options & E2F_OPT_PREEN))
1336                 fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1337
1338         pctx.errcode = e2fsck_allocate_subcluster_bitmap(ctx->fs,
1339                         _("in-use block map"), EXT2FS_BMAP64_RBTREE,
1340                         "block_found_map", &ctx->block_found_map);
1341         if (pctx.errcode) {
1342                 pctx.num = 1;
1343                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1344                 ctx->flags |= E2F_FLAG_ABORT;
1345                 return pctx.errcode;
1346         }
1347         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
1348                         _("metadata block map"), EXT2FS_BMAP64_RBTREE,
1349                         "block_metadata_map", &ctx->block_metadata_map);
1350         if (pctx.errcode) {
1351                 pctx.num = 1;
1352                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
1353                 ctx->flags |= E2F_FLAG_ABORT;
1354                 return pctx.errcode;
1355         }
1356
1357         mark_table_blocks(ctx);
1358         pctx.errcode = ext2fs_convert_subcluster_bitmap(ctx->fs,
1359                                                 &ctx->block_found_map);
1360         if (pctx.errcode) {
1361                 fix_problem(ctx, PR_1_CONVERT_SUBCLUSTER, &pctx);
1362                 ctx->flags |= E2F_FLAG_ABORT;
1363                 return pctx.errcode;
1364         }
1365
1366         pctx.errcode = e2fsck_allocate_block_bitmap(ctx->fs,
1367                         _("multiply claimed block map"),
1368                         EXT2FS_BMAP64_RBTREE, "block_dup_map",
1369                         &ctx->block_dup_map);
1370         if (pctx.errcode) {
1371                 pctx.num = 3;
1372                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR,
1373                             &pctx);
1374                 /* Should never get here */
1375                 ctx->flags |= E2F_FLAG_ABORT;
1376                 return pctx.errcode;
1377         }
1378
1379         if (ext2fs_has_feature_mmp(fs->super) &&
1380             fs->super->s_mmp_block > fs->super->s_first_data_block &&
1381             fs->super->s_mmp_block < ext2fs_blocks_count(fs->super))
1382                 ext2fs_mark_block_bitmap2(ctx->block_found_map,
1383                                           fs->super->s_mmp_block);
1384 #ifdef  HAVE_PTHREAD
1385         pthread_rwlock_init(&ctx->fs_fix_rwlock, NULL);
1386         pthread_rwlock_init(&ctx->fs_block_map_rwlock, NULL);
1387         if (ctx->fs_num_threads > 1)
1388                 ctx->fs_need_locking = 1;
1389 #endif
1390
1391         return 0;
1392 }
1393
1394 static void e2fsck_pass1_post(e2fsck_t ctx)
1395 {
1396         struct problem_context pctx;
1397         ext2_filsys fs = ctx->fs;
1398         char *block_buf;
1399
1400         if (e2fsck_should_abort(ctx))
1401                 return;
1402
1403         block_buf = (char *)e2fsck_allocate_memory(ctx, ctx->fs->blocksize * 3,
1404                                               "block interate buffer");
1405         reserve_block_for_root_repair(ctx);
1406         reserve_block_for_lnf_repair(ctx);
1407
1408         /*
1409          * If any extended attribute blocks' reference counts need to
1410          * be adjusted, either up (ctx->refcount_extra), or down
1411          * (ctx->refcount), then fix them.
1412          */
1413         if (ctx->refcount) {
1414                 adjust_extattr_refcount(ctx, ctx->refcount, block_buf, -1);
1415                 ea_refcount_free(ctx->refcount);
1416                 ctx->refcount = 0;
1417         }
1418         if (ctx->refcount_extra) {
1419                 adjust_extattr_refcount(ctx, ctx->refcount_extra,
1420                                         block_buf, +1);
1421                 ea_refcount_free(ctx->refcount_extra);
1422                 ctx->refcount_extra = 0;
1423         }
1424
1425         if (ctx->invalid_bitmaps)
1426                 handle_fs_bad_blocks(ctx);
1427
1428         /* We don't need the block_ea_map any more */
1429         if (ctx->block_ea_map) {
1430                 ext2fs_free_block_bitmap(ctx->block_ea_map);
1431                 ctx->block_ea_map = 0;
1432         }
1433
1434         if (ctx->flags & E2F_FLAG_RESIZE_INODE) {
1435                 struct ext2_inode *inode;
1436                 int inode_size = EXT2_INODE_SIZE(fs->super);
1437                 inode = e2fsck_allocate_memory(ctx, inode_size,
1438                                                "scratch inode");
1439
1440                 clear_problem_context(&pctx);
1441                 pctx.errcode = ext2fs_create_resize_inode(fs);
1442                 if (pctx.errcode) {
1443                         if (!fix_problem(ctx, PR_1_RESIZE_INODE_CREATE,
1444                                          &pctx)) {
1445                                 ctx->flags |= E2F_FLAG_ABORT;
1446                                 ext2fs_free_mem(&inode);
1447                                 ext2fs_free_mem(&block_buf);
1448                                 return;
1449                         }
1450                         pctx.errcode = 0;
1451                 }
1452                 if (!pctx.errcode) {
1453                         e2fsck_read_inode(ctx, EXT2_RESIZE_INO, inode,
1454                                           "recreate inode");
1455                         inode->i_mtime = ctx->now;
1456                         e2fsck_write_inode(ctx, EXT2_RESIZE_INO, inode,
1457                                            "recreate inode");
1458                 }
1459                 ctx->flags &= ~E2F_FLAG_RESIZE_INODE;
1460                 ext2fs_free_mem(&inode);
1461         }
1462
1463         if (ctx->flags & E2F_FLAG_RESTART) {
1464                 ext2fs_free_mem(&block_buf);
1465                 return;
1466         }
1467
1468         if (ctx->block_dup_map) {
1469                 if (!(ctx->flags & E2F_FLAG_DUP_BLOCK)) {
1470                         ext2fs_free_mem(&block_buf);
1471                         return;
1472                 }
1473                 if (ctx->options & E2F_OPT_PREEN) {
1474                         clear_problem_context(&pctx);
1475                         fix_problem(ctx, PR_1_DUP_BLOCKS_PREENSTOP, &pctx);
1476                 }
1477                 e2fsck_pass1_dupblocks(ctx, block_buf);
1478                 ext2fs_free_mem(&block_buf);
1479                 ctx->flags &= ~E2F_FLAG_DUP_BLOCK;
1480         }
1481
1482         ctx->flags |= E2F_FLAG_ALLOC_OK;
1483 }
1484
1485
1486 void e2fsck_pass1_run(e2fsck_t ctx)
1487 {
1488         int     i;
1489         ext2_filsys fs = ctx->fs;
1490         ext2_ino_t      ino = 0;
1491         struct ext2_inode *inode = NULL;
1492         ext2_inode_scan scan = NULL;
1493         char            *block_buf = NULL;
1494 #ifdef RESOURCE_TRACK
1495         struct resource_track   rtrack;
1496 #endif
1497         unsigned char   frag, fsize;
1498         struct          problem_context pctx;
1499         struct          scan_callback_struct scan_struct;
1500         struct ext2_super_block *sb = ctx->fs->super;
1501         const char      *old_op;
1502         const char      *eop_next_inode = _("getting next inode from scan");
1503         int             imagic_fs, extent_fs, inlinedata_fs, casefold_fs;
1504         int             low_dtime_check = 1;
1505         unsigned int    inode_size = EXT2_INODE_SIZE(fs->super);
1506         unsigned int    bufsize;
1507         int             failed_csum = 0;
1508         ext2_ino_t      ino_threshold = 0;
1509         dgrp_t          ra_group = 0;
1510         struct ea_quota ea_ibody_quota;
1511         struct process_inode_block *inodes_to_process;
1512         int             process_inode_count;
1513
1514         init_resource_track(&rtrack, ctx->fs->io);
1515         clear_problem_context(&pctx);
1516
1517         pass1_readahead(ctx, &ra_group, &ino_threshold);
1518         if (ext2fs_has_feature_dir_index(fs->super) &&
1519             !(ctx->options & E2F_OPT_NO)) {
1520                 if (ext2fs_u32_list_create(&ctx->dirs_to_hash, 50))
1521                         ctx->dirs_to_hash = 0;
1522         }
1523
1524 #ifdef MTRACE
1525         mtrace_print("Pass 1");
1526 #endif
1527
1528         imagic_fs = ext2fs_has_feature_imagic_inodes(sb);
1529         extent_fs = ext2fs_has_feature_extents(sb);
1530         inlinedata_fs = ext2fs_has_feature_inline_data(sb);
1531         casefold_fs = ext2fs_has_feature_casefold(sb);
1532
1533         /*
1534          * Allocate bitmap structures
1535          */
1536         pctx.errcode = e2fsck_allocate_inode_bitmap(fs, _("in-use inode map"),
1537                                                     EXT2FS_BMAP64_RBTREE,
1538                                                     "inode_used_map",
1539                                                     &ctx->inode_used_map);
1540         if (pctx.errcode) {
1541                 pctx.num = 1;
1542                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1543                 ctx->flags |= E2F_FLAG_ABORT;
1544                 return;
1545         }
1546         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1547                         _("directory inode map"),
1548                         ctx->global_ctx ? EXT2FS_BMAP64_RBTREE :
1549                         EXT2FS_BMAP64_AUTODIR,
1550                         "inode_dir_map", &ctx->inode_dir_map);
1551         if (pctx.errcode) {
1552                 pctx.num = 2;
1553                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1554                 ctx->flags |= E2F_FLAG_ABORT;
1555                 return;
1556         }
1557         pctx.errcode = e2fsck_allocate_inode_bitmap(fs,
1558                         _("regular file inode map"), EXT2FS_BMAP64_RBTREE,
1559                         "inode_reg_map", &ctx->inode_reg_map);
1560         if (pctx.errcode) {
1561                 pctx.num = 6;
1562                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1563                 ctx->flags |= E2F_FLAG_ABORT;
1564                 return;
1565         }
1566         if (casefold_fs) {
1567                 pctx.errcode =
1568                         e2fsck_allocate_inode_bitmap(fs,
1569                                                      _("inode casefold map"),
1570                                                      EXT2FS_BMAP64_RBTREE,
1571                                                      "inode_casefold_map",
1572                                                      &ctx->inode_casefold_map);
1573                 if (pctx.errcode) {
1574                         pctx.num = 1;
1575                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
1576                         ctx->flags |= E2F_FLAG_ABORT;
1577                         return;
1578                 }
1579         }
1580         pctx.errcode = e2fsck_setup_icount(ctx, "inode_link_info", 0, NULL,
1581                                            &ctx->inode_link_info);
1582         if (pctx.errcode) {
1583                 fix_problem(ctx, PR_1_ALLOCATE_ICOUNT, &pctx);
1584                 ctx->flags |= E2F_FLAG_ABORT;
1585                 return;
1586         }
1587         bufsize = inode_size;
1588         if (bufsize < sizeof(struct ext2_inode_large))
1589                 bufsize = sizeof(struct ext2_inode_large);
1590         inode = (struct ext2_inode *)
1591                 e2fsck_allocate_memory(ctx, bufsize, "scratch inode");
1592
1593         inodes_to_process = (struct process_inode_block *)
1594                 e2fsck_allocate_memory(ctx,
1595                                        (ctx->process_inode_size *
1596                                         sizeof(struct process_inode_block)),
1597                                        "array of inodes to process");
1598         process_inode_count = 0;
1599
1600         pctx.errcode = ext2fs_init_dblist(fs, 0);
1601         if (pctx.errcode) {
1602                 fix_problem(ctx, PR_1_ALLOCATE_DBCOUNT, &pctx);
1603                 ctx->flags |= E2F_FLAG_ABORT;
1604                 goto endit;
1605         }
1606
1607         /*
1608          * If the last orphan field is set, clear it, since the pass1
1609          * processing will automatically find and clear the orphans.
1610          * In the future, we may want to try using the last_orphan
1611          * linked list ourselves, but for now, we clear it so that the
1612          * ext3 mount code won't get confused.
1613          */
1614         if (!(ctx->options & E2F_OPT_READONLY)) {
1615                 if (fs->super->s_last_orphan) {
1616                         fs->super->s_last_orphan = 0;
1617                         ext2fs_mark_super_dirty(fs);
1618                 }
1619         }
1620
1621         block_buf = (char *) e2fsck_allocate_memory(ctx, fs->blocksize * 3,
1622                                                     "block iterate buffer");
1623         if (EXT2_INODE_SIZE(fs->super) == EXT2_GOOD_OLD_INODE_SIZE)
1624                 e2fsck_use_inode_shortcuts(ctx, 1);
1625         e2fsck_intercept_block_allocations(ctx);
1626         old_op = ehandler_operation(_("opening inode scan"));
1627         pctx.errcode = ext2fs_open_inode_scan(fs, ctx->inode_buffer_blocks,
1628                                               &scan);
1629         ehandler_operation(old_op);
1630         if (pctx.errcode) {
1631                 fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1632                 ctx->flags |= E2F_FLAG_ABORT;
1633                 goto endit;
1634         }
1635         ext2fs_inode_scan_flags(scan, EXT2_SF_SKIP_MISSING_ITABLE |
1636                                       EXT2_SF_WARN_GARBAGE_INODES, 0);
1637         ctx->stashed_inode = inode;
1638         scan_struct.ctx = ctx;
1639         scan_struct.block_buf = block_buf;
1640         scan_struct.inodes_to_process = inodes_to_process;
1641         scan_struct.process_inode_count = &process_inode_count;
1642         ext2fs_set_inode_callback(scan, scan_callback, &scan_struct);
1643         if (ctx->progress && ((ctx->progress)(ctx, 1, 0,
1644                                               ctx->fs->group_desc_count)))
1645                 goto endit;
1646         if ((fs->super->s_wtime &&
1647              fs->super->s_wtime < fs->super->s_inodes_count) ||
1648             (fs->super->s_mtime &&
1649              fs->super->s_mtime < fs->super->s_inodes_count) ||
1650             (fs->super->s_mkfs_time &&
1651              fs->super->s_mkfs_time < fs->super->s_inodes_count))
1652                 low_dtime_check = 0;
1653
1654         /* Set up ctx->lost_and_found if possible */
1655         (void) e2fsck_get_lost_and_found(ctx, 0);
1656
1657 #ifdef HAVE_PTHREAD
1658         if (ctx->global_ctx) {
1659                 if (ctx->options & E2F_OPT_DEBUG &&
1660                     ctx->options & E2F_OPT_MULTITHREAD)
1661                         fprintf(stderr, "thread %d jumping to group %d\n",
1662                                         ctx->thread_info.et_thread_index,
1663                                         ctx->thread_info.et_group_start);
1664                 pctx.errcode = ext2fs_inode_scan_goto_blockgroup(scan,
1665                                         ctx->thread_info.et_group_start);
1666                 if (pctx.errcode) {
1667                         fix_problem(ctx, PR_1_PASS_HEADER, &pctx);
1668                         ctx->flags |= E2F_FLAG_ABORT;
1669                         goto endit;
1670                 }
1671         }
1672 #endif
1673
1674         while (1) {
1675                 e2fsck_pass1_check_lock(ctx);
1676                 if (ino % (fs->super->s_inodes_per_group * 4) == 1) {
1677                         if (e2fsck_mmp_update(fs))
1678                                 fatal_error(ctx, 0);
1679                 }
1680                 old_op = ehandler_operation(eop_next_inode);
1681                 pctx.errcode = ext2fs_get_next_inode_full(scan, &ino,
1682                                                           inode, inode_size);
1683                 if (ino > ino_threshold)
1684                         pass1_readahead(ctx, &ra_group, &ino_threshold);
1685                 ehandler_operation(old_op);
1686                 if (e2fsck_should_abort(ctx)) {
1687                         e2fsck_pass1_check_unlock(ctx);
1688                         goto endit;
1689                 }
1690                 if (pctx.errcode == EXT2_ET_BAD_BLOCK_IN_INODE_TABLE) {
1691                         /*
1692                          * If badblocks says badblocks is bad, offer to clear
1693                          * the list, update the in-core bb list, and restart
1694                          * the inode scan.
1695                          */
1696                         if (ino == EXT2_BAD_INO &&
1697                             fix_problem(ctx, PR_1_BADBLOCKS_IN_BADBLOCKS,
1698                                         &pctx)) {
1699                                 errcode_t err;
1700
1701                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1702                                 ext2fs_badblocks_list_free(ctx->fs->badblocks);
1703                                 ctx->fs->badblocks = NULL;
1704                                 err = ext2fs_read_bb_inode(ctx->fs,
1705                                                         &ctx->fs->badblocks);
1706                                 if (err) {
1707                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1708                                                     &pctx);
1709                                         ctx->flags |= E2F_FLAG_ABORT;
1710                                         e2fsck_pass1_check_unlock(ctx);
1711                                         goto endit;
1712                                 } else
1713                                         ctx->flags |= E2F_FLAG_RESTART;
1714                                 err = ext2fs_inode_scan_goto_blockgroup(scan,
1715                                                                         0);
1716                                 if (err) {
1717                                         fix_problem(ctx, PR_1_ISCAN_ERROR,
1718                                                     &pctx);
1719                                         ctx->flags |= E2F_FLAG_ABORT;
1720                                         e2fsck_pass1_check_unlock(ctx);
1721                                         goto endit;
1722                                 }
1723                                 e2fsck_pass1_check_unlock(ctx);
1724                                 continue;
1725                         }
1726                         if (!ctx->inode_bb_map)
1727                                 alloc_bb_map(ctx);
1728                         ext2fs_mark_inode_bitmap2(ctx->inode_bb_map, ino);
1729                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
1730                         e2fsck_pass1_check_unlock(ctx);
1731                         continue;
1732                 }
1733                 if (pctx.errcode == EXT2_ET_SCAN_FINISHED) {
1734                         e2fsck_pass1_check_unlock(ctx);
1735                         break;
1736                 }
1737                 if (pctx.errcode &&
1738                     pctx.errcode != EXT2_ET_INODE_CSUM_INVALID &&
1739                     pctx.errcode != EXT2_ET_INODE_IS_GARBAGE) {
1740                         fix_problem(ctx, PR_1_ISCAN_ERROR, &pctx);
1741                         ctx->flags |= E2F_FLAG_ABORT;
1742                         e2fsck_pass1_check_unlock(ctx);
1743                         goto endit;
1744                 }
1745                 if (!ino) {
1746                         e2fsck_pass1_check_unlock(ctx);
1747                         break;
1748                 }
1749 #ifdef HAVE_PTHREAD
1750                 if (ctx->global_ctx)
1751                         ctx->thread_info.et_inode_number++;
1752 #endif
1753                 pctx.ino = ino;
1754                 pctx.inode = inode;
1755                 ctx->stashed_ino = ino;
1756
1757                 /* Clear trashed inode? */
1758                 if (pctx.errcode == EXT2_ET_INODE_IS_GARBAGE &&
1759                     inode->i_links_count > 0 &&
1760                     fix_problem(ctx, PR_1_INODE_IS_GARBAGE, &pctx)) {
1761                         pctx.errcode = 0;
1762                         e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1763                 }
1764                 failed_csum = pctx.errcode != 0;
1765
1766                 /*
1767                  * Check for inodes which might have been part of the
1768                  * orphan inode linked list.  They should have gotten
1769                  * dealt with by now, unless the list had somehow been
1770                  * corrupted.
1771                  *
1772                  * FIXME: In the future, inodes which are still in use
1773                  * (and which are therefore pending truncation) should
1774                  * be handled specially.  Right now we just clear the
1775                  * dtime field, and the normal e2fsck handling of
1776                  * inodes where i_size and the inode blocks are
1777                  * inconsistent is to fix i_size, instead of releasing
1778                  * the extra blocks.  This won't catch the inode that
1779                  * was at the end of the orphan list, but it's better
1780                  * than nothing.  The right answer is that there
1781                  * shouldn't be any bugs in the orphan list handling.  :-)
1782                  */
1783                 if (inode->i_dtime && low_dtime_check &&
1784                     inode->i_dtime < ctx->fs->super->s_inodes_count) {
1785                         if (fix_problem(ctx, PR_1_LOW_DTIME, &pctx)) {
1786                                 inode->i_dtime = inode->i_links_count ?
1787                                         0 : ctx->now;
1788                                 e2fsck_write_inode(ctx, ino, inode,
1789                                                    "pass1");
1790                                 failed_csum = 0;
1791                         }
1792                 }
1793
1794                 if (inode->i_links_count) {
1795                         pctx.errcode = ext2fs_icount_store(ctx->inode_link_info,
1796                                            ino, inode->i_links_count);
1797                         if (pctx.errcode) {
1798                                 pctx.num = inode->i_links_count;
1799                                 fix_problem(ctx, PR_1_ICOUNT_STORE, &pctx);
1800                                 ctx->flags |= E2F_FLAG_ABORT;
1801                                 e2fsck_pass1_check_unlock(ctx);
1802                                 goto endit;
1803                         }
1804                 } else if ((ino >= EXT2_FIRST_INODE(fs->super)) &&
1805                            !quota_inum_is_reserved(fs, ino)) {
1806                         if (!inode->i_dtime && inode->i_mode) {
1807                                 if (fix_problem(ctx,
1808                                             PR_1_ZERO_DTIME, &pctx)) {
1809                                         inode->i_dtime = ctx->now;
1810                                         e2fsck_write_inode(ctx, ino, inode,
1811                                                            "pass1");
1812                                         failed_csum = 0;
1813                                 }
1814                         }
1815                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
1816                         e2fsck_pass1_check_unlock(ctx);
1817                         continue;
1818                 }
1819
1820                 if ((inode->i_flags & EXT4_CASEFOLD_FL) &&
1821                     ((!LINUX_S_ISDIR(inode->i_mode) &&
1822                       fix_problem(ctx, PR_1_CASEFOLD_NONDIR, &pctx)) ||
1823                      (!casefold_fs &&
1824                       fix_problem(ctx, PR_1_CASEFOLD_FEATURE, &pctx)))) {
1825                         inode->i_flags &= ~EXT4_CASEFOLD_FL;
1826                         e2fsck_write_inode(ctx, ino, inode, "pass1");
1827                 }
1828
1829                 /* Conflicting inlinedata/extents inode flags? */
1830                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) &&
1831                     (inode->i_flags & EXT4_EXTENTS_FL)) {
1832                         int res = fix_inline_data_extents_file(ctx, ino, inode,
1833                                                                inode_size,
1834                                                                &pctx);
1835                         if (res < 0) {
1836                                 /* skip FINISH_INODE_LOOP */
1837                                 e2fsck_pass1_check_unlock(ctx);
1838                                 continue;
1839                         }
1840                 }
1841
1842                 /* Test for incorrect inline_data flags settings. */
1843                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && !inlinedata_fs &&
1844                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1845                         size_t size = 0;
1846
1847                         pctx.errcode = get_inline_data_ea_size(fs, ino, inode,
1848                                                                &size);
1849                         if (!pctx.errcode &&
1850                             fix_problem(ctx, PR_1_INLINE_DATA_FEATURE, &pctx)) {
1851                                 e2fsck_pass1_fix_lock(ctx);
1852                                 ext2fs_set_feature_inline_data(sb);
1853                                 ext2fs_mark_super_dirty(fs);
1854                                 e2fsck_pass1_fix_unlock(ctx);
1855                                 inlinedata_fs = 1;
1856                         } else if (fix_problem(ctx, PR_1_INLINE_DATA_SET, &pctx)) {
1857                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1858                                 /* skip FINISH_INODE_LOOP */
1859                                 e2fsck_pass1_check_unlock(ctx);
1860                                 continue;
1861                         }
1862                 }
1863
1864                 /* Test for inline data flag but no attr */
1865                 if ((inode->i_flags & EXT4_INLINE_DATA_FL) && inlinedata_fs &&
1866                     (ino >= EXT2_FIRST_INODE(fs->super))) {
1867                         size_t size = 0;
1868                         errcode_t err;
1869                         int flags;
1870
1871                         flags = fs->flags;
1872                         if (failed_csum)
1873                                 fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
1874                         err = get_inline_data_ea_size(fs, ino, inode, &size);
1875                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
1876                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
1877
1878                         switch (err) {
1879                         case 0:
1880                                 /* Everything is awesome... */
1881                                 break;
1882                         case EXT2_ET_BAD_EA_BLOCK_NUM:
1883                         case EXT2_ET_BAD_EA_HASH:
1884                         case EXT2_ET_BAD_EA_HEADER:
1885                         case EXT2_ET_EA_BAD_NAME_LEN:
1886                         case EXT2_ET_EA_BAD_VALUE_SIZE:
1887                         case EXT2_ET_EA_KEY_NOT_FOUND:
1888                         case EXT2_ET_EA_NO_SPACE:
1889                         case EXT2_ET_MISSING_EA_FEATURE:
1890                         case EXT2_ET_INLINE_DATA_CANT_ITERATE:
1891                         case EXT2_ET_INLINE_DATA_NO_BLOCK:
1892                         case EXT2_ET_INLINE_DATA_NO_SPACE:
1893                         case EXT2_ET_NO_INLINE_DATA:
1894                         case EXT2_ET_EXT_ATTR_CSUM_INVALID:
1895                         case EXT2_ET_EA_BAD_VALUE_OFFSET:
1896                         case EXT2_ET_EA_INODE_CORRUPTED:
1897                                 /* broken EA or no system.data EA; truncate */
1898                                 if (fix_problem(ctx, PR_1_INLINE_DATA_NO_ATTR,
1899                                                 &pctx)) {
1900                                         err = ext2fs_inode_size_set(fs, inode, 0);
1901                                         if (err) {
1902                                                 pctx.errcode = err;
1903                                                 ctx->flags |= E2F_FLAG_ABORT;
1904                                                 e2fsck_pass1_check_unlock(ctx);
1905                                                 goto endit;
1906                                         }
1907                                         inode->i_flags &= ~EXT4_INLINE_DATA_FL;
1908                                         memset(&inode->i_block, 0,
1909                                                sizeof(inode->i_block));
1910                                         e2fsck_write_inode(ctx, ino, inode,
1911                                                            "pass1");
1912                                         failed_csum = 0;
1913                                 }
1914                                 break;
1915                         default:
1916                                 /* Some other kind of non-xattr error? */
1917                                 pctx.errcode = err;
1918                                 ctx->flags |= E2F_FLAG_ABORT;
1919                                 e2fsck_pass1_check_unlock(ctx);
1920                                 goto endit;
1921                         }
1922                 }
1923
1924                 /*
1925                  * Test for incorrect extent flag settings.
1926                  *
1927                  * On big-endian machines we must be careful:
1928                  * When the inode is read, the i_block array is not swapped
1929                  * if the extent flag is set.  Therefore if we are testing
1930                  * for or fixing a wrongly-set flag, we must potentially
1931                  * (un)swap before testing, or after fixing.
1932                  */
1933
1934                 /*
1935                  * In this case the extents flag was set when read, so
1936                  * extent_header_verify is ok.  If the inode is cleared,
1937                  * no need to swap... so no extra swapping here.
1938                  */
1939                 if ((inode->i_flags & EXT4_EXTENTS_FL) && !extent_fs &&
1940                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1941                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO))) {
1942                         if ((ext2fs_extent_header_verify(inode->i_block,
1943                                                  sizeof(inode->i_block)) == 0) &&
1944                             fix_problem(ctx, PR_1_EXTENT_FEATURE, &pctx)) {
1945                                 e2fsck_pass1_fix_lock(ctx);
1946                                 ext2fs_set_feature_extents(sb);
1947                                 ext2fs_mark_super_dirty(fs);
1948                                 extent_fs = 1;
1949                                 e2fsck_pass1_fix_unlock(ctx);
1950                         } else if (fix_problem(ctx, PR_1_EXTENTS_SET, &pctx)) {
1951                         clear_inode:
1952                                 e2fsck_clear_inode(ctx, ino, inode, 0, "pass1");
1953                                 if (ino == EXT2_BAD_INO)
1954                                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map,
1955                                                                  ino);
1956                                 /* skip FINISH_INODE_LOOP */
1957                                 e2fsck_pass1_check_unlock(ctx);
1958                                 continue;
1959                         }
1960                 }
1961
1962                 /*
1963                  * For big-endian machines:
1964                  * If the inode didn't have the extents flag set when it
1965                  * was read, then the i_block array was swapped.  To test
1966                  * as an extents header, we must swap it back first.
1967                  * If we then set the extents flag, the entire i_block
1968                  * array must be un/re-swapped to make it proper extents data.
1969                  */
1970                 if (extent_fs && !(inode->i_flags & EXT4_EXTENTS_FL) &&
1971                     (inode->i_links_count || (ino == EXT2_BAD_INO) ||
1972                      (ino == EXT2_ROOT_INO) || (ino == EXT2_JOURNAL_INO)) &&
1973                     (LINUX_S_ISREG(inode->i_mode) ||
1974                      LINUX_S_ISDIR(inode->i_mode))) {
1975                         void *ehp;
1976 #ifdef WORDS_BIGENDIAN
1977                         __u32 tmp_block[EXT2_N_BLOCKS];
1978
1979                         for (i = 0; i < EXT2_N_BLOCKS; i++)
1980                                 tmp_block[i] = ext2fs_swab32(inode->i_block[i]);
1981                         ehp = tmp_block;
1982 #else
1983                         ehp = inode->i_block;
1984 #endif
1985                         if ((ext2fs_extent_header_verify(ehp,
1986                                          sizeof(inode->i_block)) == 0) &&
1987                             (fix_problem(ctx, PR_1_UNSET_EXTENT_FL, &pctx))) {
1988                                 inode->i_flags |= EXT4_EXTENTS_FL;
1989 #ifdef WORDS_BIGENDIAN
1990                                 memcpy(inode->i_block, tmp_block,
1991                                        sizeof(inode->i_block));
1992 #endif
1993                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
1994                                 failed_csum = 0;
1995                         }
1996                 }
1997
1998                 if (ino == EXT2_BAD_INO) {
1999                         struct process_block_struct pb;
2000
2001                         if ((failed_csum || inode->i_mode || inode->i_uid ||
2002                              inode->i_gid || inode->i_links_count ||
2003                              (inode->i_flags & EXT4_INLINE_DATA_FL) ||
2004                              inode->i_file_acl) &&
2005                             fix_problem(ctx, PR_1_INVALID_BAD_INODE, &pctx)) {
2006                                 memset(inode, 0, sizeof(struct ext2_inode));
2007                                 e2fsck_write_inode(ctx, ino, inode,
2008                                                    "clear bad inode");
2009                                 failed_csum = 0;
2010                         }
2011
2012                         e2fsck_pass1_block_map_r_lock(ctx);
2013                         pctx.errcode = ext2fs_copy_bitmap(ctx->global_ctx ?
2014                                         ctx->global_ctx->block_found_map :
2015                                         ctx->block_found_map, &pb.fs_meta_blocks);
2016                         e2fsck_pass1_block_map_r_unlock(ctx);
2017                         if (pctx.errcode) {
2018                                 pctx.num = 4;
2019                                 fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, &pctx);
2020                                 ctx->flags |= E2F_FLAG_ABORT;
2021                                 e2fsck_pass1_check_unlock(ctx);
2022                                 goto endit;
2023                         }
2024                         pb.ino = EXT2_BAD_INO;
2025                         pb.num_blocks = pb.last_block = 0;
2026                         pb.last_db_block = -1;
2027                         pb.num_illegal_blocks = 0;
2028                         pb.suppress = 0; pb.clear = 0; pb.is_dir = 0;
2029                         pb.is_reg = 0; pb.fragmented = 0; pb.bbcheck = 0;
2030                         pb.inode = inode;
2031                         pb.pctx = &pctx;
2032                         pb.ctx = ctx;
2033                         pctx.errcode = ext2fs_block_iterate3(fs, ino, 0,
2034                                      block_buf, process_bad_block, &pb);
2035                         ext2fs_free_block_bitmap(pb.fs_meta_blocks);
2036                         if (pctx.errcode) {
2037                                 fix_problem(ctx, PR_1_BLOCK_ITERATE, &pctx);
2038                                 ctx->flags |= E2F_FLAG_ABORT;
2039                                 e2fsck_pass1_check_unlock(ctx);
2040                                 goto endit;
2041                         }
2042                         if (pb.bbcheck)
2043                                 if (!fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK_PROMPT, &pctx)) {
2044                                 ctx->flags |= E2F_FLAG_ABORT;
2045                                 e2fsck_pass1_check_unlock(ctx);
2046                                 goto endit;
2047                         }
2048                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2049                         clear_problem_context(&pctx);
2050                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2051                         e2fsck_pass1_check_unlock(ctx);
2052                         continue;
2053                 } else if (ino == EXT2_ROOT_INO) {
2054                         /*
2055                          * Make sure the root inode is a directory; if
2056                          * not, offer to clear it.  It will be
2057                          * regenerated in pass #3.
2058                          */
2059                         if (!LINUX_S_ISDIR(inode->i_mode)) {
2060                                 if (fix_problem(ctx, PR_1_ROOT_NO_DIR, &pctx))
2061                                         goto clear_inode;
2062                         }
2063                         /*
2064                          * If dtime is set, offer to clear it.  mke2fs
2065                          * version 0.2b created filesystems with the
2066                          * dtime field set for the root and lost+found
2067                          * directories.  We won't worry about
2068                          * /lost+found, since that can be regenerated
2069                          * easily.  But we will fix the root directory
2070                          * as a special case.
2071                          */
2072                         if (inode->i_dtime && inode->i_links_count) {
2073                                 if (fix_problem(ctx, PR_1_ROOT_DTIME, &pctx)) {
2074                                         inode->i_dtime = 0;
2075                                         e2fsck_write_inode(ctx, ino, inode,
2076                                                            "pass1");
2077                                         failed_csum = 0;
2078                                 }
2079                         }
2080                 } else if (ino == EXT2_JOURNAL_INO) {
2081                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2082                         if (fs->super->s_journal_inum == EXT2_JOURNAL_INO) {
2083                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2084                                     fix_problem(ctx, PR_1_JOURNAL_BAD_MODE,
2085                                                 &pctx)) {
2086                                         inode->i_mode = LINUX_S_IFREG;
2087                                         e2fsck_write_inode(ctx, ino, inode,
2088                                                            "pass1");
2089                                         failed_csum = 0;
2090                                 }
2091                                 check_blocks(ctx, &pctx, block_buf, NULL);
2092                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2093                                 e2fsck_pass1_check_unlock(ctx);
2094                                 continue;
2095                         }
2096                         if ((inode->i_links_count ||
2097                              inode->i_blocks || inode->i_block[0]) &&
2098                             fix_problem(ctx, PR_1_JOURNAL_INODE_NOT_CLEAR,
2099                                         &pctx)) {
2100                                 memset(inode, 0, inode_size);
2101                                 ext2fs_icount_store(ctx->inode_link_info,
2102                                                     ino, 0);
2103                                 e2fsck_write_inode_full(ctx, ino, inode,
2104                                                         inode_size, "pass1");
2105                                 failed_csum = 0;
2106                         }
2107                 } else if (quota_inum_is_reserved(fs, ino)) {
2108                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2109                         if (ext2fs_has_feature_quota(fs->super) &&
2110                             quota_inum_is_super(fs->super, ino)) {
2111                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2112                                     fix_problem(ctx, PR_1_QUOTA_BAD_MODE,
2113                                                         &pctx)) {
2114                                         inode->i_mode = LINUX_S_IFREG;
2115                                         e2fsck_write_inode(ctx, ino, inode,
2116                                                         "pass1");
2117                                         failed_csum = 0;
2118                                 }
2119                                 check_blocks(ctx, &pctx, block_buf, NULL);
2120                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2121                                 e2fsck_pass1_check_unlock(ctx);
2122                                 continue;
2123                         }
2124                         if ((inode->i_links_count ||
2125                              inode->i_blocks || inode->i_block[0]) &&
2126                             fix_problem(ctx, PR_1_QUOTA_INODE_NOT_CLEAR,
2127                                         &pctx)) {
2128                                 memset(inode, 0, inode_size);
2129                                 ext2fs_icount_store(ctx->inode_link_info,
2130                                                     ino, 0);
2131                                 e2fsck_write_inode_full(ctx, ino, inode,
2132                                                         inode_size, "pass1");
2133                                 failed_csum = 0;
2134                         }
2135                 } else if (ino == fs->super->s_orphan_file_inum) {
2136                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2137                         if (ext2fs_has_feature_orphan_file(fs->super)) {
2138                                 if (!LINUX_S_ISREG(inode->i_mode) &&
2139                                     fix_problem(ctx, PR_1_ORPHAN_FILE_BAD_MODE,
2140                                                 &pctx)) {
2141                                         inode->i_mode = LINUX_S_IFREG;
2142                                         e2fsck_write_inode(ctx, ino, inode,
2143                                                            "pass1");
2144                                         failed_csum = 0;
2145                                 }
2146                                 check_blocks(ctx, &pctx, block_buf, NULL);
2147                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2148                                 continue;
2149                         }
2150                         if ((inode->i_links_count ||
2151                              inode->i_blocks || inode->i_block[0]) &&
2152                             fix_problem(ctx, PR_1_ORPHAN_FILE_NOT_CLEAR,
2153                                         &pctx)) {
2154                                 memset(inode, 0, inode_size);
2155                                 ext2fs_icount_store(ctx->inode_link_info, ino,
2156                                                     0);
2157                                 e2fsck_write_inode_full(ctx, ino, inode,
2158                                                         inode_size, "pass1");
2159                                 failed_csum = 0;
2160                         }
2161                 } else if (ino < EXT2_FIRST_INODE(fs->super)) {
2162                         problem_t problem = 0;
2163
2164                         ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2165                         if (ino == EXT2_BOOT_LOADER_INO) {
2166                                 if (LINUX_S_ISDIR(inode->i_mode))
2167                                         problem = PR_1_RESERVED_BAD_MODE;
2168                         } else if (ino == EXT2_RESIZE_INO) {
2169                                 if (inode->i_mode &&
2170                                     !LINUX_S_ISREG(inode->i_mode))
2171                                         problem = PR_1_RESERVED_BAD_MODE;
2172                         } else {
2173                                 if (inode->i_mode != 0)
2174                                         problem = PR_1_RESERVED_BAD_MODE;
2175                         }
2176                         if (problem) {
2177                                 if (fix_problem(ctx, problem, &pctx)) {
2178                                         inode->i_mode = 0;
2179                                         e2fsck_write_inode(ctx, ino, inode,
2180                                                            "pass1");
2181                                         failed_csum = 0;
2182                                 }
2183                         }
2184                         check_blocks(ctx, &pctx, block_buf, NULL);
2185                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2186                         e2fsck_pass1_check_unlock(ctx);
2187                         continue;
2188                 }
2189
2190                 if (!inode->i_links_count) {
2191                         FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2192                         e2fsck_pass1_check_unlock(ctx);
2193                         continue;
2194                 }
2195                 /*
2196                  * n.b.  0.3c ext2fs code didn't clear i_links_count for
2197                  * deleted files.  Oops.
2198                  *
2199                  * Since all new ext2 implementations get this right,
2200                  * we now assume that the case of non-zero
2201                  * i_links_count and non-zero dtime means that we
2202                  * should keep the file, not delete it.
2203                  *
2204                  */
2205                 if (inode->i_dtime) {
2206                         if (fix_problem(ctx, PR_1_SET_DTIME, &pctx)) {
2207                                 inode->i_dtime = 0;
2208                                 e2fsck_write_inode(ctx, ino, inode, "pass1");
2209                                 failed_csum = 0;
2210                         }
2211                 }
2212
2213                 ext2fs_mark_inode_bitmap2(ctx->inode_used_map, ino);
2214                 switch (fs->super->s_creator_os) {
2215                     case EXT2_OS_HURD:
2216                         frag = inode->osd2.hurd2.h_i_frag;
2217                         fsize = inode->osd2.hurd2.h_i_fsize;
2218                         break;
2219                     default:
2220                         frag = fsize = 0;
2221                 }
2222
2223                 if (inode->i_faddr || frag || fsize ||
2224                     (!ext2fs_has_feature_largedir(fs->super) &&
2225                     (LINUX_S_ISDIR(inode->i_mode) && inode->i_size_high)))
2226                         mark_inode_bad(ctx, ino);
2227                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
2228                     !ext2fs_has_feature_64bit(fs->super) &&
2229                     inode->osd2.linux2.l_i_file_acl_high != 0)
2230                         mark_inode_bad(ctx, ino);
2231                 if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
2232                     !ext2fs_has_feature_huge_file(fs->super) &&
2233                     (inode->osd2.linux2.l_i_blocks_hi != 0))
2234                         mark_inode_bad(ctx, ino);
2235                 if (inode->i_flags & EXT2_IMAGIC_FL) {
2236                         if (imagic_fs) {
2237                                 if (!ctx->inode_imagic_map)
2238                                         alloc_imagic_map(ctx);
2239                                 ext2fs_mark_inode_bitmap2(ctx->inode_imagic_map,
2240                                                          ino);
2241                         } else {
2242                                 if (fix_problem(ctx, PR_1_SET_IMAGIC, &pctx)) {
2243                                         inode->i_flags &= ~EXT2_IMAGIC_FL;
2244                                         e2fsck_write_inode(ctx, ino,
2245                                                            inode, "pass1");
2246                                         failed_csum = 0;
2247                                 }
2248                         }
2249                 }
2250
2251                 check_inode_extra_space(ctx, &pctx, &ea_ibody_quota);
2252                 check_is_really_dir(ctx, &pctx, block_buf);
2253
2254                 /*
2255                  * ext2fs_inode_has_valid_blocks2 does not actually look
2256                  * at i_block[] values, so not endian-sensitive here.
2257                  */
2258                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL) &&
2259                     LINUX_S_ISLNK(inode->i_mode) &&
2260                     !ext2fs_inode_has_valid_blocks2(fs, inode) &&
2261                     fix_problem(ctx, PR_1_FAST_SYMLINK_EXTENT_FL, &pctx)) {
2262                         inode->i_flags &= ~EXT4_EXTENTS_FL;
2263                         e2fsck_write_inode(ctx, ino, inode, "pass1");
2264                         failed_csum = 0;
2265                 }
2266
2267                 if ((inode->i_flags & EXT4_ENCRYPT_FL) &&
2268                     add_encrypted_file(ctx, &pctx) < 0)
2269                         goto clear_inode;
2270
2271                 if (casefold_fs && inode->i_flags & EXT4_CASEFOLD_FL)
2272                         ext2fs_mark_inode_bitmap2(ctx->inode_casefold_map, ino);
2273
2274                 if (LINUX_S_ISDIR(inode->i_mode)) {
2275                         ext2fs_mark_inode_bitmap2(ctx->inode_dir_map, ino);
2276                         e2fsck_add_dir_info(ctx, ino, 0);
2277                         ctx->fs_directory_count++;
2278                         if (inode->i_flags & EXT4_CASEFOLD_FL)
2279                                 add_casefolded_dir(ctx, ino);
2280                 } else if (LINUX_S_ISREG (inode->i_mode)) {
2281                         ext2fs_mark_inode_bitmap2(ctx->inode_reg_map, ino);
2282                         ctx->fs_regular_count++;
2283                 } else if (LINUX_S_ISCHR (inode->i_mode) &&
2284                            e2fsck_pass1_check_device_inode(fs, inode)) {
2285                         check_extents_inlinedata(ctx, &pctx);
2286                         check_immutable(ctx, &pctx);
2287                         check_size(ctx, &pctx);
2288                         ctx->fs_chardev_count++;
2289                 } else if (LINUX_S_ISBLK (inode->i_mode) &&
2290                            e2fsck_pass1_check_device_inode(fs, inode)) {
2291                         check_extents_inlinedata(ctx, &pctx);
2292                         check_immutable(ctx, &pctx);
2293                         check_size(ctx, &pctx);
2294                         ctx->fs_blockdev_count++;
2295                 } else if (LINUX_S_ISLNK (inode->i_mode) &&
2296                            e2fsck_pass1_check_symlink(fs, ino, inode,
2297                                                       block_buf)) {
2298                         check_immutable(ctx, &pctx);
2299                         ctx->fs_symlinks_count++;
2300                         if (inode->i_flags & EXT4_INLINE_DATA_FL) {
2301                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2302                                 e2fsck_pass1_check_unlock(ctx);
2303                                 continue;
2304                         } else if (ext2fs_is_fast_symlink(inode)) {
2305                                 ctx->fs_fast_symlinks_count++;
2306                                 check_blocks(ctx, &pctx, block_buf,
2307                                              &ea_ibody_quota);
2308                                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2309                                 e2fsck_pass1_check_unlock(ctx);
2310                                 continue;
2311                         }
2312                 }
2313                 else if (LINUX_S_ISFIFO (inode->i_mode) &&
2314                          e2fsck_pass1_check_device_inode(fs, inode)) {
2315                         check_extents_inlinedata(ctx, &pctx);
2316                         check_immutable(ctx, &pctx);
2317                         check_size(ctx, &pctx);
2318                         ctx->fs_fifo_count++;
2319                 } else if ((LINUX_S_ISSOCK (inode->i_mode)) &&
2320                            e2fsck_pass1_check_device_inode(fs, inode)) {
2321                         check_extents_inlinedata(ctx, &pctx);
2322                         check_immutable(ctx, &pctx);
2323                         check_size(ctx, &pctx);
2324                         ctx->fs_sockets_count++;
2325                 } else
2326                         mark_inode_bad(ctx, ino);
2327                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
2328                     !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
2329                         if (inode->i_block[EXT2_IND_BLOCK])
2330                                 ctx->fs_ind_count++;
2331                         if (inode->i_block[EXT2_DIND_BLOCK])
2332                                 ctx->fs_dind_count++;
2333                         if (inode->i_block[EXT2_TIND_BLOCK])
2334                                 ctx->fs_tind_count++;
2335                 }
2336                 if (!(inode->i_flags & EXT4_EXTENTS_FL) &&
2337                     !(inode->i_flags & EXT4_INLINE_DATA_FL) &&
2338                     (inode->i_block[EXT2_IND_BLOCK] ||
2339                      inode->i_block[EXT2_DIND_BLOCK] ||
2340                      inode->i_block[EXT2_TIND_BLOCK] ||
2341                      ext2fs_file_acl_block(fs, inode))) {
2342                         struct process_inode_block *itp;
2343
2344                         itp = &inodes_to_process[process_inode_count];
2345                         itp->ino = ino;
2346                         itp->ea_ibody_quota = ea_ibody_quota;
2347                         if (inode_size < sizeof(struct ext2_inode_large))
2348                                 memcpy(&itp->inode, inode, inode_size);
2349                         else
2350                                 memcpy(&itp->inode, inode, sizeof(itp->inode));
2351                         process_inode_count++;
2352                 } else
2353                         check_blocks(ctx, &pctx, block_buf, &ea_ibody_quota);
2354
2355                 FINISH_INODE_LOOP(ctx, ino, &pctx, failed_csum);
2356
2357                 if (e2fsck_should_abort(ctx)) {
2358                         e2fsck_pass1_check_unlock(ctx);
2359                         goto endit;
2360                 }
2361
2362                 if (process_inode_count >= ctx->process_inode_size) {
2363                         process_inodes(ctx, block_buf, inodes_to_process,
2364                                        &process_inode_count);
2365
2366                         if (e2fsck_should_abort(ctx)) {
2367                                 e2fsck_pass1_check_unlock(ctx);
2368                                 goto endit;
2369                         }
2370                 }
2371                 e2fsck_pass1_check_unlock(ctx);
2372         }
2373         process_inodes(ctx, block_buf, inodes_to_process,
2374                        &process_inode_count);
2375         ext2fs_close_inode_scan(scan);
2376         scan = NULL;
2377
2378         if (ctx->ea_block_quota_blocks) {
2379                 ea_refcount_free(ctx->ea_block_quota_blocks);
2380                 ctx->ea_block_quota_blocks = 0;
2381         }
2382
2383         if (ctx->ea_block_quota_inodes) {
2384                 ea_refcount_free(ctx->ea_block_quota_inodes);
2385                 ctx->ea_block_quota_inodes = 0;
2386         }
2387
2388         /* We don't need the encryption policy => ID map any more */
2389         destroy_encryption_policy_map(ctx);
2390
2391         if (ctx->flags & E2F_FLAG_RESTART) {
2392                 /*
2393                  * Only the master copy of the superblock and block
2394                  * group descriptors are going to be written during a
2395                  * restart, so set the superblock to be used to be the
2396                  * master superblock.
2397                  */
2398                 ctx->use_superblock = 0;
2399                 goto endit;
2400         }
2401
2402         if (ctx->large_dirs && !ext2fs_has_feature_largedir(fs->super)) {
2403                 if (fix_problem(ctx, PR_2_FEATURE_LARGE_DIRS, &pctx)) {
2404                         ext2fs_set_feature_largedir(fs->super);
2405                         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
2406                         ext2fs_mark_super_dirty(fs);
2407                 }
2408                 if (fs->super->s_rev_level == EXT2_GOOD_OLD_REV &&
2409                     fix_problem(ctx, PR_1_FS_REV_LEVEL, &pctx)) {
2410                         ext2fs_update_dynamic_rev(fs);
2411                         ext2fs_mark_super_dirty(fs);
2412                 }
2413         }
2414
2415         ctx->flags |= E2F_FLAG_ALLOC_OK;
2416         ext2fs_free_mem(&inodes_to_process);
2417 endit:
2418         e2fsck_use_inode_shortcuts(ctx, 0);
2419         ext2fs_free_mem(&inodes_to_process);
2420         inodes_to_process = 0;
2421
2422         if (scan)
2423                 ext2fs_close_inode_scan(scan);
2424         if (block_buf)
2425                 ext2fs_free_mem(&block_buf);
2426         if (inode)
2427                 ext2fs_free_mem(&inode);
2428
2429         /*
2430          * The l+f inode may have been cleared, so zap it now and
2431          * later passes will recalculate it if necessary
2432          */
2433         ctx->lost_and_found = 0;
2434
2435         if ((ctx->flags & E2F_FLAG_SIGNAL_MASK) == 0)
2436                 print_resource_track(ctx, _("Pass 1"), &rtrack, ctx->fs->io);
2437         else
2438                 ctx->invalid_bitmaps++;
2439 }
2440
2441 #ifdef HAVE_PTHREAD
2442 static errcode_t e2fsck_pass1_copy_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2443                                           ext2fs_generic_bitmap *dest)
2444 {
2445         errcode_t ret;
2446
2447         ret = ext2fs_copy_bitmap(*src, dest);
2448         if (ret)
2449                 return ret;
2450
2451         (*dest)->fs = fs;
2452
2453         return 0;
2454 }
2455
2456 static void e2fsck_pass1_free_bitmap(ext2fs_generic_bitmap *bitmap)
2457 {
2458         if (*bitmap) {
2459                 ext2fs_free_generic_bmap(*bitmap);
2460                 *bitmap = NULL;
2461         }
2462
2463 }
2464
2465 static errcode_t e2fsck_pass1_merge_bitmap(ext2_filsys fs, ext2fs_generic_bitmap *src,
2466                                           ext2fs_generic_bitmap *dest)
2467 {
2468         errcode_t ret = 0;
2469
2470         if (*src) {
2471                 if (*dest == NULL) {
2472                         *dest = *src;
2473                         *src = NULL;
2474                 } else {
2475                         ret = ext2fs_merge_bitmap(*src, *dest, NULL, NULL);
2476                         if (ret)
2477                                 return ret;
2478                 }
2479                 (*dest)->fs = fs;
2480         }
2481
2482         return 0;
2483 }
2484
2485 static errcode_t e2fsck_pass1_copy_fs(ext2_filsys dest, e2fsck_t src_context,
2486                                       ext2_filsys src)
2487 {
2488         errcode_t       retval;
2489
2490         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2491         dest->inode_map = NULL;
2492         dest->block_map = NULL;
2493         dest->badblocks = NULL;
2494         if (dest->dblist)
2495                 dest->dblist->fs = dest;
2496         if (src->block_map) {
2497                 retval = e2fsck_pass1_copy_bitmap(dest, &src->block_map,
2498                                                   &dest->block_map);
2499                 if (retval)
2500                         return retval;
2501         }
2502         if (src->inode_map) {
2503                 retval = e2fsck_pass1_copy_bitmap(dest, &src->inode_map,
2504                                                   &dest->inode_map);
2505                 if (retval)
2506                         return retval;
2507         }
2508
2509         if (src->badblocks) {
2510                 retval = ext2fs_badblocks_copy(src->badblocks,
2511                                                &dest->badblocks);
2512                 if (retval)
2513                         return retval;
2514         }
2515
2516         /* disable it for now */
2517         src_context->openfs_flags &= ~EXT2_FLAG_EXCLUSIVE;
2518         retval = ext2fs_open_channel(dest, src_context->io_options,
2519                                      src_context->io_manager,
2520                                      src_context->openfs_flags,
2521                                      src->io->block_size);
2522         if (retval)
2523                 return retval;
2524
2525         /* Block size might not be default */
2526         io_channel_set_blksize(dest->io, src->io->block_size);
2527         ehandler_init(dest->io);
2528
2529         assert(dest->io->magic == src->io->magic);
2530         assert(dest->io->manager == src->io->manager);
2531         assert(strcmp(dest->io->name, src->io->name) == 0);
2532         assert(dest->io->block_size == src->io->block_size);
2533         assert(dest->io->read_error == src->io->read_error);
2534         assert(dest->io->write_error == src->io->write_error);
2535         assert(dest->io->refcount == src->io->refcount);
2536         assert(dest->io->flags == src->io->flags);
2537         assert(dest->io->app_data == dest);
2538         assert(src->io->app_data == src);
2539         assert(dest->io->align == src->io->align);
2540
2541         /* The data should be written to disk immediately */
2542         dest->io->flags |= CHANNEL_FLAGS_WRITETHROUGH;
2543         /* icache will be rebuilt if needed, so do not copy from @src */
2544         src->icache = NULL;
2545         return 0;
2546 }
2547
2548 static int e2fsck_pass1_merge_fs(ext2_filsys dest, ext2_filsys src)
2549 {
2550         struct ext2_inode_cache *icache = dest->icache;
2551         errcode_t retval = 0;
2552         io_channel dest_io;
2553         io_channel dest_image_io;
2554         ext2fs_inode_bitmap inode_map;
2555         ext2fs_block_bitmap block_map;
2556         ext2_badblocks_list badblocks;
2557         ext2_dblist dblist;
2558         int flags;
2559         e2fsck_t dest_ctx = dest->priv_data;
2560
2561         dest_io = dest->io;
2562         dest_image_io = dest->image_io;
2563         inode_map = dest->inode_map;
2564         block_map = dest->block_map;
2565         badblocks = dest->badblocks;
2566         dblist = dest->dblist;
2567         flags = dest->flags;
2568
2569         memcpy(dest, src, sizeof(struct struct_ext2_filsys));
2570         dest->io = dest_io;
2571         dest->image_io = dest_image_io;
2572         dest->icache = icache;
2573         dest->inode_map = inode_map;
2574         dest->block_map = block_map;
2575         dest->badblocks = badblocks;
2576         dest->dblist = dblist;
2577         dest->priv_data = dest_ctx;
2578         if (dest->dblist)
2579                 dest->dblist->fs = dest;
2580         dest->flags = src->flags | flags;
2581         if (!(src->flags & EXT2_FLAG_VALID) || !(flags & EXT2_FLAG_VALID))
2582                 ext2fs_unmark_valid(dest);
2583
2584         if (src->icache) {
2585                 ext2fs_free_inode_cache(src->icache);
2586                 src->icache = NULL;
2587         }
2588
2589         retval = e2fsck_pass1_merge_bitmap(dest, &src->inode_map,
2590                                            &dest->inode_map);
2591         if (retval)
2592                 goto out;
2593
2594         retval = e2fsck_pass1_merge_bitmap(dest, &src->block_map,
2595                                           &dest->block_map);
2596         if (retval)
2597                 goto out;
2598
2599         if (src->dblist) {
2600                 if (dest->dblist) {
2601                         retval = ext2fs_merge_dblist(src->dblist,
2602                                                      dest->dblist);
2603                         if (retval)
2604                                 goto out;
2605                 } else {
2606                         dest->dblist = src->dblist;
2607                         dest->dblist->fs = dest;
2608                         src->dblist = NULL;
2609                 }
2610         }
2611
2612         if (src->badblocks) {
2613                 if (dest->badblocks == NULL)
2614                         retval = ext2fs_badblocks_copy(src->badblocks,
2615                                                        &dest->badblocks);
2616                 else
2617                         retval = ext2fs_badblocks_merge(src->badblocks,
2618                                                         dest->badblocks);
2619         }
2620 out:
2621         io_channel_close(src->io);
2622         if (src->inode_map)
2623                 ext2fs_free_generic_bmap(src->inode_map);
2624         if (src->block_map)
2625                 ext2fs_free_generic_bmap(src->block_map);
2626         if (src->badblocks)
2627                 ext2fs_badblocks_list_free(src->badblocks);
2628         if (src->dblist)
2629                 ext2fs_free_dblist(src->dblist);
2630
2631         return retval;
2632 }
2633
2634 static void e2fsck_pass1_copy_invalid_bitmaps(e2fsck_t global_ctx,
2635                                               e2fsck_t thread_ctx)
2636 {
2637         dgrp_t i, j;
2638         dgrp_t grp_start = thread_ctx->thread_info.et_group_start;
2639         dgrp_t grp_end = thread_ctx->thread_info.et_group_end;
2640         dgrp_t total = grp_end - grp_start;
2641
2642         thread_ctx->invalid_inode_bitmap_flag =
2643                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2644                                                 "invalid_inode_bitmap");
2645         thread_ctx->invalid_block_bitmap_flag =
2646                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2647                                                "invalid_block_bitmap");
2648         thread_ctx->invalid_inode_table_flag =
2649                         e2fsck_allocate_memory(global_ctx, sizeof(int) * total,
2650                                                "invalid_inode_table");
2651
2652         memcpy(thread_ctx->invalid_block_bitmap_flag,
2653                &global_ctx->invalid_block_bitmap_flag[grp_start],
2654                total * sizeof(int));
2655         memcpy(thread_ctx->invalid_inode_bitmap_flag,
2656                &global_ctx->invalid_inode_bitmap_flag[grp_start],
2657                total * sizeof(int));
2658         memcpy(thread_ctx->invalid_inode_table_flag,
2659                &global_ctx->invalid_inode_table_flag[grp_start],
2660                total * sizeof(int));
2661
2662         thread_ctx->invalid_bitmaps = 0;
2663         for (i = grp_start, j = 0; i < grp_end; i++, j++) {
2664                 if (thread_ctx->invalid_block_bitmap_flag[j])
2665                         thread_ctx->invalid_bitmaps++;
2666                 if (thread_ctx->invalid_inode_bitmap_flag[j])
2667                         thread_ctx->invalid_bitmaps++;
2668                 if (thread_ctx->invalid_inode_table_flag[j])
2669                         thread_ctx->invalid_bitmaps++;
2670         }
2671 }
2672
2673 static void e2fsck_pass1_merge_invalid_bitmaps(e2fsck_t global_ctx,
2674                                                e2fsck_t thread_ctx)
2675 {
2676         dgrp_t grp_start = thread_ctx->thread_info.et_group_start;
2677         dgrp_t grp_end = thread_ctx->thread_info.et_group_end;
2678         dgrp_t total = grp_end - grp_start;
2679
2680         memcpy(&global_ctx->invalid_block_bitmap_flag[grp_start],
2681                thread_ctx->invalid_block_bitmap_flag, total * sizeof(int));
2682         memcpy(&global_ctx->invalid_inode_bitmap_flag[grp_start],
2683                thread_ctx->invalid_inode_bitmap_flag, total * sizeof(int));
2684         memcpy(&global_ctx->invalid_inode_table_flag[grp_start],
2685                thread_ctx->invalid_inode_table_flag, total * sizeof(int));
2686         global_ctx->invalid_bitmaps += thread_ctx->invalid_bitmaps;
2687 }
2688
2689 static errcode_t e2fsck_pass1_thread_prepare(e2fsck_t global_ctx, e2fsck_t *thread_ctx,
2690                                              int thread_index, int num_threads,
2691                                              dgrp_t average_group)
2692 {
2693         errcode_t               retval;
2694         e2fsck_t                thread_context;
2695         ext2_filsys             thread_fs;
2696         ext2_filsys             global_fs = global_ctx->fs;
2697         struct e2fsck_thread    *tinfo;
2698
2699         assert(global_ctx->inode_used_map == NULL);
2700         assert(global_ctx->inode_dir_map == NULL);
2701         assert(global_ctx->inode_bb_map == NULL);
2702         assert(global_ctx->inode_imagic_map == NULL);
2703         assert(global_ctx->inode_reg_map == NULL);
2704         assert(global_ctx->inodes_to_rebuild == NULL);
2705
2706         assert(global_ctx->block_found_map != NULL);
2707         assert(global_ctx->block_metadata_map != NULL);
2708         assert(global_ctx->block_dup_map != NULL);
2709         assert(global_ctx->block_ea_map == NULL);
2710         assert(global_ctx->fs->dblist == NULL);
2711
2712         retval = ext2fs_get_mem(sizeof(struct e2fsck_struct), &thread_context);
2713         if (retval) {
2714                 com_err(global_ctx->program_name, retval, "while allocating memory");
2715                 return retval;
2716         }
2717         memcpy(thread_context, global_ctx, sizeof(struct e2fsck_struct));
2718         thread_context->block_dup_map = NULL;
2719         thread_context->casefolded_dirs = NULL;
2720
2721         retval = e2fsck_allocate_block_bitmap(global_ctx->fs,
2722                                 _("in-use block map"), EXT2FS_BMAP64_RBTREE,
2723                                 "block_found_map", &thread_context->block_found_map);
2724         if (retval)
2725                 goto out_context;
2726
2727         thread_context->global_ctx = global_ctx;
2728         retval = ext2fs_get_mem(sizeof(struct struct_ext2_filsys), &thread_fs);
2729         if (retval) {
2730                 com_err(global_ctx->program_name, retval, "while allocating memory");
2731                 goto out_context;
2732         }
2733
2734         io_channel_flush_cleanup(global_fs->io);
2735         retval = e2fsck_pass1_copy_fs(thread_fs, global_ctx, global_fs);
2736         if (retval) {
2737                 com_err(global_ctx->program_name, retval, "while copying fs");
2738                 goto out_fs;
2739         }
2740         thread_fs->priv_data = thread_context;
2741
2742         thread_context->thread_info.et_thread_index = thread_index;
2743         set_up_logging(thread_context);
2744
2745         tinfo = &thread_context->thread_info;
2746         tinfo->et_group_start = average_group * thread_index;
2747         if (thread_index == global_fs->fs_num_threads - 1)
2748                 tinfo->et_group_end = thread_fs->group_desc_count;
2749         else
2750                 tinfo->et_group_end = average_group * (thread_index + 1);
2751         tinfo->et_group_next = tinfo->et_group_start;
2752         tinfo->et_inode_number = 0;
2753         tinfo->et_log_buf[0] = '\0';
2754         tinfo->et_log_length = 0;
2755         if (thread_context->options & E2F_OPT_MULTITHREAD)
2756                 log_out(thread_context, _("Scan group range [%d, %d)\n"),
2757                         tinfo->et_group_start, tinfo->et_group_end);
2758         thread_context->fs = thread_fs;
2759         retval = quota_init_context(&thread_context->qctx, thread_fs, 0);
2760         if (retval) {
2761                 com_err(global_ctx->program_name, retval,
2762                         "while init quota context");
2763                 goto out_fs;
2764         }
2765         *thread_ctx = thread_context;
2766         e2fsck_pass1_copy_invalid_bitmaps(global_ctx, thread_context);
2767         return 0;
2768 out_fs:
2769         ext2fs_free_mem(&thread_fs);
2770 out_context:
2771         if (thread_context->block_found_map)
2772                 ext2fs_free_mem(&thread_context->block_found_map);
2773         ext2fs_free_mem(&thread_context);
2774         return retval;
2775 }
2776
2777 static void e2fsck_pass1_merge_dir_info(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2778 {
2779         if (thread_ctx->dir_info == NULL)
2780                 return;
2781
2782         if (global_ctx->dir_info == NULL) {
2783                 global_ctx->dir_info = thread_ctx->dir_info;
2784                 thread_ctx->dir_info = NULL;
2785                 return;
2786         }
2787
2788         e2fsck_merge_dir_info(global_ctx, thread_ctx->dir_info,
2789                               global_ctx->dir_info);
2790 }
2791
2792 static void e2fsck_pass1_merge_dx_dir(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2793 {
2794         if (thread_ctx->dx_dir_info == NULL)
2795                 return;
2796
2797         if (global_ctx->dx_dir_info == NULL) {
2798                 global_ctx->dx_dir_info = thread_ctx->dx_dir_info;
2799                 global_ctx->dx_dir_info_size = thread_ctx->dx_dir_info_size;
2800                 global_ctx->dx_dir_info_count = thread_ctx->dx_dir_info_count;
2801                 thread_ctx->dx_dir_info = NULL;
2802                 return;
2803         }
2804
2805         e2fsck_merge_dx_dir(global_ctx, thread_ctx);
2806 }
2807
2808 static inline errcode_t
2809 e2fsck_pass1_merge_icount(ext2_icount_t *dest_icount,
2810                           ext2_icount_t *src_icount)
2811 {
2812         if (*src_icount) {
2813                 if (*dest_icount == NULL) {
2814                         *dest_icount = *src_icount;
2815                         *src_icount = NULL;
2816                 } else {
2817                         errcode_t ret;
2818
2819                         ret = ext2fs_icount_merge(*src_icount,
2820                                                   *dest_icount);
2821                         if (ret)
2822                                 return ret;
2823                 }
2824         }
2825
2826         return 0;
2827 }
2828
2829 static errcode_t e2fsck_pass1_merge_icounts(e2fsck_t global_ctx, e2fsck_t thread_ctx)
2830 {
2831         errcode_t ret;
2832
2833         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_count,
2834                                         &thread_ctx->inode_count);
2835         if (ret)
2836                 return ret;
2837         ret = e2fsck_pass1_merge_icount(&global_ctx->inode_link_info,
2838                                         &thread_ctx->inode_link_info);
2839
2840         return ret;
2841 }
2842
2843 static errcode_t e2fsck_pass1_merge_dirs_to_hash(e2fsck_t global_ctx,
2844                                                  e2fsck_t thread_ctx)
2845 {
2846         errcode_t retval = 0;
2847
2848         if (!thread_ctx->dirs_to_hash)
2849                 return 0;
2850
2851         if (!global_ctx->dirs_to_hash)
2852                 retval = ext2fs_badblocks_copy(thread_ctx->dirs_to_hash,
2853                                                &global_ctx->dirs_to_hash);
2854         else
2855                 retval = ext2fs_badblocks_merge(thread_ctx->dirs_to_hash,
2856                                                 global_ctx->dirs_to_hash);
2857
2858         return retval;
2859 }
2860
2861 static errcode_t e2fsck_pass1_merge_ea_inode_refs(e2fsck_t global_ctx,
2862                                                   e2fsck_t thread_ctx)
2863 {
2864         ea_value_t count;
2865         blk64_t blk;
2866         errcode_t retval;
2867
2868         if (!thread_ctx->ea_inode_refs)
2869                 return 0;
2870
2871         if (!global_ctx->ea_inode_refs) {
2872                 global_ctx->ea_inode_refs = thread_ctx->ea_inode_refs;
2873                 thread_ctx->ea_inode_refs = NULL;
2874                 return 0;
2875         }
2876
2877         ea_refcount_intr_begin(thread_ctx->ea_inode_refs);
2878         while (1) {
2879                 if ((blk = ea_refcount_intr_next(thread_ctx->ea_inode_refs,
2880                                                  &count)) == 0)
2881                         break;
2882                 if (!global_ctx->block_ea_map ||
2883                     !ext2fs_fast_test_block_bitmap2(global_ctx->block_ea_map,
2884                                                     blk)) {
2885                         retval = ea_refcount_store(global_ctx->ea_inode_refs,
2886                                                    blk, count);
2887                         if (retval)
2888                                 return retval;
2889                 }
2890         }
2891
2892         return retval;
2893 }
2894
2895 static ea_value_t ea_refcount_usage(e2fsck_t ctx, blk64_t blk,
2896                                     ea_value_t *orig)
2897 {
2898         ea_value_t count_cur;
2899         ea_value_t count_extra = 0;
2900         ea_value_t count_orig;
2901
2902         ea_refcount_fetch(ctx->refcount_orig, blk, &count_orig);
2903         ea_refcount_fetch(ctx->refcount, blk, &count_cur);
2904         /* most of time this is not needed */
2905         if (ctx->refcount_extra && count_cur == 0)
2906                 ea_refcount_fetch(ctx->refcount_extra, blk, &count_extra);
2907
2908         if (!count_orig)
2909                 count_orig = *orig;
2910         else if (orig)
2911                 *orig = count_orig;
2912
2913         return count_orig + count_extra - count_cur;
2914 }
2915
2916 static errcode_t e2fsck_pass1_merge_ea_refcount(e2fsck_t global_ctx,
2917                                                 e2fsck_t thread_ctx)
2918 {
2919         ea_value_t count;
2920         blk64_t blk;
2921         errcode_t retval = 0;
2922
2923         if (!thread_ctx->refcount)
2924                 return 0;
2925
2926         if (!global_ctx->refcount) {
2927                 global_ctx->refcount = thread_ctx->refcount;
2928                 thread_ctx->refcount = NULL;
2929                 global_ctx->refcount_extra = thread_ctx->refcount;
2930                 thread_ctx->refcount_extra = NULL;
2931                 return 0;
2932         }
2933
2934         ea_refcount_intr_begin(thread_ctx->refcount);
2935         while (1) {
2936                 if ((blk = ea_refcount_intr_next(thread_ctx->refcount,
2937                                                  &count)) == 0)
2938                         break;
2939                 /**
2940                  * this EA has never seen before, so just store its
2941                  * refcount and refcount_extra into global_ctx if needed.
2942                  */
2943                 if (!global_ctx->block_ea_map ||
2944                     !ext2fs_fast_test_block_bitmap2(global_ctx->block_ea_map,
2945                                                     blk)) {
2946                         ea_value_t extra;
2947
2948                         retval = ea_refcount_store(global_ctx->refcount,
2949                                                    blk, count);
2950                         if (retval)
2951                                 return retval;
2952
2953                         if (count > 0 || !thread_ctx->refcount_extra)
2954                                 continue;
2955                         ea_refcount_fetch(thread_ctx->refcount_extra, blk,
2956                                           &extra);
2957                         if (extra == 0)
2958                                 continue;
2959
2960                         if (!global_ctx->refcount_extra) {
2961                                 retval = ea_refcount_create(0,
2962                                                 &global_ctx->refcount_extra);
2963                                 if (retval)
2964                                         return retval;
2965                         }
2966                         retval = ea_refcount_store(global_ctx->refcount_extra,
2967                                                    blk, extra);
2968                         if (retval)
2969                                 return retval;
2970                 } else {
2971                         ea_value_t orig;
2972                         ea_value_t thread_usage;
2973                         ea_value_t global_usage;
2974                         ea_value_t new;
2975
2976                         thread_usage = ea_refcount_usage(thread_ctx,
2977                                                          blk, &orig);
2978                         global_usage = ea_refcount_usage(global_ctx,
2979                                                          blk, &orig);
2980                         if (thread_usage + global_usage <= orig) {
2981                                 new = orig - thread_usage - global_usage;
2982                                 retval = ea_refcount_store(global_ctx->refcount,
2983                                                            blk, new);
2984                                 if (retval)
2985                                         return retval;
2986                                 continue;
2987                         }
2988                         /* update it is as zero */
2989                         retval = ea_refcount_store(global_ctx->refcount,
2990                                                    blk, 0);
2991                         if (retval)
2992                                 return retval;
2993                         /* Ooops, this EA was referenced more than it stated */
2994                         if (!global_ctx->refcount_extra) {
2995                                 retval = ea_refcount_create(0,
2996                                                 &global_ctx->refcount_extra);
2997                                 if (retval)
2998                                         return retval;
2999                         }
3000                         new = global_usage + thread_usage - orig;
3001                         retval = ea_refcount_store(global_ctx->refcount_extra,
3002                                                    blk, new);
3003                         if (retval)
3004                                 return retval;
3005                 }
3006         }
3007
3008         return retval;
3009 }
3010
3011 static errcode_t e2fsck_pass1_merge_casefolded_dirs(e2fsck_t global_ctx,
3012                                                    e2fsck_t thread_ctx)
3013 {
3014         errcode_t retval = 0;
3015
3016         if (!thread_ctx->casefolded_dirs)
3017                 return 0;
3018
3019         if (!global_ctx->casefolded_dirs)
3020                 retval = ext2fs_badblocks_copy(thread_ctx->casefolded_dirs,
3021                                                &global_ctx->casefolded_dirs);
3022         else
3023                 retval = ext2fs_badblocks_merge(thread_ctx->casefolded_dirs,
3024                                                 global_ctx->casefolded_dirs);
3025
3026         return retval;
3027 }
3028
3029 static errcode_t e2fsck_pass1_merge_context(e2fsck_t global_ctx,
3030                                             e2fsck_t thread_ctx)
3031 {
3032         ext2_filsys global_fs = global_ctx->fs;
3033         errcode_t retval;
3034         int i;
3035
3036         global_ctx->fs_directory_count += thread_ctx->fs_directory_count;
3037         global_ctx->fs_regular_count += thread_ctx->fs_regular_count;
3038         global_ctx->fs_blockdev_count += thread_ctx->fs_blockdev_count;
3039         global_ctx->fs_chardev_count += thread_ctx->fs_chardev_count;
3040         global_ctx->fs_links_count += thread_ctx->fs_links_count;
3041         global_ctx->fs_symlinks_count += thread_ctx->fs_symlinks_count;
3042         global_ctx->fs_fast_symlinks_count += thread_ctx->fs_fast_symlinks_count;
3043         global_ctx->fs_fifo_count += thread_ctx->fs_fifo_count;
3044         global_ctx->fs_total_count += thread_ctx->fs_total_count;
3045         global_ctx->fs_badblocks_count += thread_ctx->fs_badblocks_count;
3046         global_ctx->fs_sockets_count += thread_ctx->fs_sockets_count;
3047         global_ctx->fs_ind_count += thread_ctx->fs_ind_count;
3048         global_ctx->fs_dind_count += thread_ctx->fs_dind_count;
3049         global_ctx->fs_tind_count += thread_ctx->fs_tind_count;
3050         global_ctx->fs_fragmented += thread_ctx->fs_fragmented;
3051         global_ctx->fs_fragmented_dir += thread_ctx->fs_fragmented_dir;
3052         global_ctx->large_files += thread_ctx->large_files;
3053         /* threads might enable E2F_OPT_YES */
3054         global_ctx->options |= thread_ctx->options;
3055         global_ctx->flags |= thread_ctx->flags;
3056         /*
3057          * The l+f inode may have been cleared, so zap it now and
3058          * later passes will recalculate it if necessary
3059          */
3060         global_ctx->lost_and_found = 0;
3061         /* merge extent depth count */
3062         for (i = 0; i < MAX_EXTENT_DEPTH_COUNT; i++)
3063                 global_ctx->extent_depth_count[i] +=
3064                         thread_ctx->extent_depth_count[i];
3065
3066         e2fsck_pass1_merge_dir_info(global_ctx, thread_ctx);
3067         e2fsck_pass1_merge_dx_dir(global_ctx, thread_ctx);
3068
3069         retval = e2fsck_pass1_merge_fs(global_ctx->fs, thread_ctx->fs);
3070         if (retval) {
3071                 com_err(global_ctx->program_name, 0, _("while merging fs\n"));
3072                 return retval;
3073         }
3074         retval = e2fsck_pass1_merge_icounts(global_ctx, thread_ctx);
3075         if (retval) {
3076                 com_err(global_ctx->program_name, 0,
3077                         _("while merging icounts\n"));
3078                 return retval;
3079         }
3080
3081         retval = e2fsck_pass1_merge_dirs_to_hash(global_ctx, thread_ctx);
3082         if (retval) {
3083                 com_err(global_ctx->program_name, 0,
3084                         _("while merging dirs to hash\n"));
3085                 return retval;
3086         }
3087
3088         e2fsck_pass1_merge_ea_inode_refs(global_ctx, thread_ctx);
3089         e2fsck_pass1_merge_ea_refcount(global_ctx, thread_ctx);
3090         retval = quota_merge_and_update_usage(global_ctx->qctx,
3091                                               thread_ctx->qctx);
3092         if (retval)
3093                 return retval;
3094
3095         retval = e2fsck_pass1_merge_casefolded_dirs(global_ctx, thread_ctx);
3096         if (retval) {
3097                 com_err(global_ctx->program_name, 0,
3098                         _("while merging casefolded dirs\n"));
3099                 return retval;
3100         }
3101
3102         e2fsck_pass1_merge_invalid_bitmaps(global_ctx, thread_ctx);
3103
3104         retval = e2fsck_pass1_merge_bitmap(global_fs,
3105                                 &thread_ctx->inode_used_map,
3106                                 &global_ctx->inode_used_map);
3107         if (retval)
3108                 return retval;
3109
3110         retval = e2fsck_pass1_merge_bitmap(global_fs,
3111                                 &thread_ctx->inode_bad_map,
3112                                 &global_ctx->inode_bad_map);
3113         if (retval)
3114                 return retval;
3115         retval = e2fsck_pass1_merge_bitmap(global_fs,
3116                                         &thread_ctx->inode_dir_map,
3117                                         &global_ctx->inode_dir_map);
3118         if (retval)
3119                 return retval;
3120         retval = e2fsck_pass1_merge_bitmap(global_fs,
3121                                 &thread_ctx->inode_bb_map,
3122                                 &global_ctx->inode_bb_map);
3123         if (retval)
3124                 return retval;
3125         retval = e2fsck_pass1_merge_bitmap(global_fs,
3126                                 &thread_ctx->inode_imagic_map,
3127                                 &global_ctx->inode_imagic_map);
3128         if (retval)
3129                 return retval;
3130         retval = e2fsck_pass1_merge_bitmap(global_fs,
3131                                 &thread_ctx->inode_reg_map,
3132                                 &global_ctx->inode_reg_map);
3133         if (retval)
3134                 return retval;
3135         retval = e2fsck_pass1_merge_bitmap(global_fs,
3136                                 &thread_ctx->inodes_to_rebuild,
3137                                 &global_ctx->inodes_to_rebuild);
3138         if (retval)
3139                 return retval;
3140         retval = e2fsck_pass1_merge_bitmap(global_fs,
3141                                 &thread_ctx->block_ea_map,
3142                                 &global_ctx->block_ea_map);
3143         if (retval)
3144                 return retval;
3145
3146         if (ext2fs_has_feature_shared_blocks(global_fs->super) &&
3147             !(global_ctx->options & E2F_OPT_UNSHARE_BLOCKS))
3148                 return 0;
3149         /*
3150          * This need be done after merging block_ea_map
3151          * because ea block might be shared, we need exclude
3152          * them from dup blocks.
3153          */
3154         e2fsck_pass1_block_map_w_lock(thread_ctx);
3155         retval = ext2fs_merge_bitmap(thread_ctx->block_found_map,
3156                                      global_ctx->block_found_map,
3157                                      global_ctx->block_dup_map,
3158                                      global_ctx->block_ea_map);
3159         e2fsck_pass1_block_map_w_unlock(thread_ctx);
3160         if (retval == EEXIST)
3161                 global_ctx->flags |= E2F_FLAG_DUP_BLOCK;
3162
3163         return 0;
3164 }
3165
3166 static int e2fsck_pass1_thread_join(e2fsck_t global_ctx, e2fsck_t thread_ctx)
3167 {
3168         errcode_t       retval;
3169
3170         retval = e2fsck_pass1_merge_context(global_ctx, thread_ctx);
3171         ext2fs_free_mem(&thread_ctx->fs);
3172         if (thread_ctx->logf)
3173                 fclose(thread_ctx->logf);
3174         if (thread_ctx->problem_logf) {
3175                 fputs("</problem_log>\n", thread_ctx->problem_logf);
3176                 fclose(thread_ctx->problem_logf);
3177         }
3178
3179         /*
3180          * @block_metadata_map and @block_dup_map are
3181          * shared, so we don't free them.
3182          */
3183         thread_ctx->block_metadata_map = NULL;
3184         thread_ctx->block_dup_map = NULL;
3185         e2fsck_reset_context(thread_ctx);
3186         ext2fs_free_mem(&thread_ctx);
3187
3188         return retval;
3189 }
3190
3191 static int e2fsck_pass1_threads_join(struct e2fsck_thread_info *infos,
3192                                      e2fsck_t global_ctx)
3193 {
3194         errcode_t                        rc;
3195         errcode_t                        ret = 0;
3196         int                              i;
3197         struct e2fsck_thread_info       *pinfo;
3198         int                              num_threads = global_ctx->fs_num_threads;
3199
3200         /* merge invalid bitmaps will recalculate it */
3201         global_ctx->invalid_bitmaps = 0;
3202         for (i = 0; i < num_threads; i++) {
3203                 pinfo = &infos[i];
3204
3205                 if (!pinfo->eti_started)
3206                         continue;
3207
3208                 rc = pthread_join(pinfo->eti_thread_id, NULL);
3209                 if (rc) {
3210                         com_err(global_ctx->program_name, rc,
3211                                 _("while joining thread\n"));
3212                         if (ret == 0)
3213                                 ret = rc;
3214                 }
3215                 rc = e2fsck_pass1_thread_join(global_ctx, infos[i].eti_thread_ctx);
3216                 if (rc) {
3217                         com_err(global_ctx->program_name, rc,
3218                                 _("while joining pass1 thread\n"));
3219                         if (ret == 0)
3220                                 ret = rc;
3221                 }
3222         }
3223         free(infos);
3224
3225         return ret;
3226 }
3227
3228 static void *e2fsck_pass1_thread(void *arg)
3229 {
3230         struct e2fsck_thread_info       *info = arg;
3231         e2fsck_t                         thread_ctx = info->eti_thread_ctx;
3232 #ifdef DEBUG_THREADS
3233         struct e2fsck_thread_debug      *thread_debug = info->eti_debug;
3234 #endif
3235
3236 #ifdef DEBUG_THREADS
3237         pthread_mutex_lock(&thread_debug->etd_mutex);
3238         while (info->eti_thread_index > thread_debug->etd_finished_threads) {
3239                 pthread_cond_wait(&thread_debug->etd_cond,
3240                                   &thread_debug->etd_mutex);
3241         }
3242         pthread_mutex_unlock(&thread_debug->etd_mutex);
3243 #endif
3244
3245 #ifdef HAVE_SETJMP_H
3246         /*
3247          * When fatal_error() happens, jump to here. The thread
3248          * context's flags will be saved, but its abort_loc will
3249          * be overwritten by original jump buffer for the later
3250          * tests.
3251          */
3252         if (setjmp(thread_ctx->abort_loc)) {
3253                 thread_ctx->flags &= ~E2F_FLAG_SETJMP_OK;
3254                 goto out;
3255         }
3256         thread_ctx->flags |= E2F_FLAG_SETJMP_OK;
3257 #endif
3258
3259         e2fsck_pass1_run(thread_ctx);
3260
3261 out:
3262         if (thread_ctx->options & E2F_OPT_MULTITHREAD)
3263                 log_out(thread_ctx,
3264                         _("Scanned group range [%lu, %lu), inodes %lu\n"),
3265                         thread_ctx->thread_info.et_group_start,
3266                         thread_ctx->thread_info.et_group_end,
3267                         thread_ctx->thread_info.et_inode_number);
3268
3269 #ifdef DEBUG_THREADS
3270         pthread_mutex_lock(&thread_debug->etd_mutex);
3271         thread_debug->etd_finished_threads++;
3272         pthread_cond_broadcast(&thread_debug->etd_cond);
3273         pthread_mutex_unlock(&thread_debug->etd_mutex);
3274 #endif
3275
3276         return NULL;
3277 }
3278
3279 static dgrp_t ext2fs_get_avg_group(ext2_filsys fs)
3280 {
3281 #ifdef HAVE_PTHREAD
3282         dgrp_t average_group;
3283         unsigned flexbg_size;
3284
3285         if (fs->fs_num_threads <= 1)
3286                 return fs->group_desc_count;
3287
3288         average_group = fs->group_desc_count / fs->fs_num_threads;
3289         if (average_group <= 1)
3290                 return 1;
3291
3292         if (ext2fs_has_feature_flex_bg(fs->super)) {
3293                 int times = 1;
3294
3295                 flexbg_size = 1 << fs->super->s_log_groups_per_flex;
3296                 if (average_group % flexbg_size) {
3297                         times = average_group / flexbg_size;
3298                         average_group = times * flexbg_size;
3299                 }
3300         }
3301
3302         return average_group;
3303 #else
3304         return fs->group_desc_count;
3305 #endif
3306 }
3307
3308 static int e2fsck_pass1_threads_start(struct e2fsck_thread_info **pinfo,
3309                                       e2fsck_t global_ctx)
3310 {
3311         struct e2fsck_thread_info       *infos;
3312         pthread_attr_t                   attr;
3313         errcode_t                        retval;
3314         errcode_t                        ret;
3315         struct e2fsck_thread_info       *tmp_pinfo;
3316         int                              i;
3317         e2fsck_t                         thread_ctx;
3318         dgrp_t                           average_group;
3319         int                              num_threads = global_ctx->fs_num_threads;
3320 #ifdef DEBUG_THREADS
3321         struct e2fsck_thread_debug       thread_debug =
3322                 {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER, 0};
3323
3324         thread_debug.etd_finished_threads = 0;
3325 #endif
3326
3327         retval = pthread_attr_init(&attr);
3328         if (retval) {
3329                 com_err(global_ctx->program_name, retval,
3330                         _("while setting pthread attribute\n"));
3331                 return retval;
3332         }
3333
3334         infos = calloc(num_threads, sizeof(struct e2fsck_thread_info));
3335         if (infos == NULL) {
3336                 retval = -ENOMEM;
3337                 com_err(global_ctx->program_name, retval,
3338                         _("while allocating memory for threads\n"));
3339                 pthread_attr_destroy(&attr);
3340                 return retval;
3341         }
3342
3343         average_group = ext2fs_get_avg_group(global_ctx->fs);
3344         for (i = 0; i < num_threads; i++) {
3345                 tmp_pinfo = &infos[i];
3346                 tmp_pinfo->eti_thread_index = i;
3347 #ifdef DEBUG_THREADS
3348                 tmp_pinfo->eti_debug = &thread_debug;
3349 #endif
3350                 retval = e2fsck_pass1_thread_prepare(global_ctx, &thread_ctx,
3351                                                      i, num_threads,
3352                                                      average_group);
3353                 if (retval) {
3354                         com_err(global_ctx->program_name, retval,
3355                                 _("while preparing pass1 thread\n"));
3356                         break;
3357                 }
3358                 tmp_pinfo->eti_thread_ctx = thread_ctx;
3359
3360                 retval = pthread_create(&tmp_pinfo->eti_thread_id, &attr,
3361                                         &e2fsck_pass1_thread, tmp_pinfo);
3362                 if (retval) {
3363                         com_err(global_ctx->program_name, retval,
3364                                 _("while creating thread\n"));
3365                         e2fsck_pass1_thread_join(global_ctx, thread_ctx);
3366                         break;
3367                 }
3368
3369                 tmp_pinfo->eti_started = 1;
3370         }
3371
3372         /* destroy the thread attribute object, since it is no longer needed */
3373         ret = pthread_attr_destroy(&attr);
3374         if (ret) {
3375                 com_err(global_ctx->program_name, ret,
3376                         _("while destroying thread attribute\n"));
3377                 if (retval == 0)
3378                         retval = ret;
3379         }
3380
3381         if (retval) {
3382                 e2fsck_pass1_threads_join(infos, global_ctx);
3383                 return retval;
3384         }
3385         *pinfo = infos;
3386         return 0;
3387 }
3388
3389 static void e2fsck_pass1_multithread(e2fsck_t global_ctx)
3390 {
3391         struct e2fsck_thread_info *infos = NULL;
3392         errcode_t retval;
3393
3394         retval = e2fsck_pass1_threads_start(&infos, global_ctx);
3395         if (retval) {
3396                 com_err(global_ctx->program_name, retval,
3397                         _("while starting pass1 threads\n"));
3398                 goto out_abort;
3399         }
3400
3401         retval = e2fsck_pass1_threads_join(infos, global_ctx);
3402         if (retval) {
3403                 com_err(global_ctx->program_name, retval,
3404                         _("while joining pass1 threads\n"));
3405                 goto out_abort;
3406         }
3407         return;
3408 out_abort:
3409         global_ctx->flags |= E2F_FLAG_ABORT;
3410         return;
3411 }
3412 #endif
3413
3414 void e2fsck_pass1(e2fsck_t ctx)
3415 {
3416         errcode_t retval;
3417         int need_single = 1;
3418
3419         retval = e2fsck_pass1_prepare(ctx);
3420         if (retval)
3421                 return;
3422 #ifdef HAVE_PTHREAD
3423         if (ctx->fs_num_threads > 1 ||
3424             ctx->options & E2F_OPT_MULTITHREAD) {
3425                 need_single = 0;
3426                 e2fsck_pass1_multithread(ctx);
3427         }
3428         /* No lock is needed at this time */
3429         ctx->fs_need_locking = 0;
3430 #endif
3431         if (need_single)
3432                 e2fsck_pass1_run(ctx);
3433         e2fsck_pass1_post(ctx);
3434 }
3435
3436 #undef FINISH_INODE_LOOP
3437
3438 /*
3439  * When the inode_scan routines call this callback at the end of the
3440  * glock group, call process_inodes.
3441  */
3442 static errcode_t scan_callback(ext2_filsys fs,
3443                                ext2_inode_scan scan EXT2FS_ATTR((unused)),
3444                                dgrp_t group, void * priv_data)
3445 {
3446         struct scan_callback_struct *scan_struct;
3447         e2fsck_t ctx;
3448         struct e2fsck_thread *tinfo;
3449
3450         scan_struct = (struct scan_callback_struct *) priv_data;
3451         ctx = scan_struct->ctx;
3452
3453         process_inodes((e2fsck_t) fs->priv_data, scan_struct->block_buf,
3454                        scan_struct->inodes_to_process,
3455                        scan_struct->process_inode_count);
3456
3457         if (ctx->progress)
3458                 if ((ctx->progress)(ctx, 1, group+1,
3459                                     ctx->fs->group_desc_count))
3460                         return EXT2_ET_CANCEL_REQUESTED;
3461
3462 #ifdef HAVE_PTHREAD
3463         if (ctx->global_ctx) {
3464                 tinfo = &ctx->thread_info;
3465                 tinfo->et_group_next++;
3466                 if (ctx->options & E2F_OPT_DEBUG &&
3467                     ctx->options & E2F_OPT_MULTITHREAD)
3468                         log_out(ctx, _("group %d finished\n"),
3469                                 tinfo->et_group_next);
3470                 if (tinfo->et_group_next >= tinfo->et_group_end)
3471                         return EXT2_ET_SCAN_FINISHED;
3472         }
3473 #endif
3474
3475         return 0;
3476 }
3477
3478 /*
3479  * Process the inodes in the "inodes to process" list.
3480  */
3481 static void process_inodes(e2fsck_t ctx, char *block_buf,
3482                            struct process_inode_block *inodes_to_process,
3483                            int *process_inode_count)
3484 {
3485         int                     i;
3486         struct ext2_inode       *old_stashed_inode;
3487         ext2_ino_t              old_stashed_ino;
3488         const char              *old_operation;
3489         char                    buf[80];
3490         struct problem_context  pctx;
3491
3492 #if 0
3493         printf("begin process_inodes: ");
3494 #endif
3495         if (*process_inode_count == 0)
3496                 return;
3497         old_operation = ehandler_operation(0);
3498         old_stashed_inode = ctx->stashed_inode;
3499         old_stashed_ino = ctx->stashed_ino;
3500         qsort(inodes_to_process, *process_inode_count,
3501                       sizeof(struct process_inode_block), process_inode_cmp);
3502         clear_problem_context(&pctx);
3503         for (i=0; i < *process_inode_count; i++) {
3504                 pctx.inode = ctx->stashed_inode =
3505                         (struct ext2_inode *) &inodes_to_process[i].inode;
3506                 pctx.ino = ctx->stashed_ino = inodes_to_process[i].ino;
3507
3508 #if 0
3509                 printf("%u ", pctx.ino);
3510 #endif
3511                 sprintf(buf, _("reading indirect blocks of inode %u"),
3512                         pctx.ino);
3513                 ehandler_operation(buf);
3514                 check_blocks(ctx, &pctx, block_buf,
3515                              &inodes_to_process[i].ea_ibody_quota);
3516                 if (e2fsck_should_abort(ctx))
3517                         break;
3518         }
3519         ctx->stashed_inode = old_stashed_inode;
3520         ctx->stashed_ino = old_stashed_ino;
3521         *process_inode_count = 0;
3522 #if 0
3523         printf("end process inodes\n");
3524 #endif
3525         ehandler_operation(old_operation);
3526 }
3527
3528 static EXT2_QSORT_TYPE process_inode_cmp(const void *a, const void *b)
3529 {
3530         const struct process_inode_block *ib_a =
3531                 (const struct process_inode_block *) a;
3532         const struct process_inode_block *ib_b =
3533                 (const struct process_inode_block *) b;
3534         int     ret;
3535
3536         ret = (ib_a->inode.i_block[EXT2_IND_BLOCK] -
3537                ib_b->inode.i_block[EXT2_IND_BLOCK]);
3538         if (ret == 0)
3539                 /*
3540                  * We only call process_inodes() for non-extent
3541                  * inodes, so it's OK to pass NULL to
3542                  * ext2fs_file_acl_block() here.
3543                  */
3544                 ret = ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_a->inode)) -
3545                         ext2fs_file_acl_block(0, ext2fs_const_inode(&ib_b->inode));
3546         if (ret == 0)
3547                 ret = ib_a->ino - ib_b->ino;
3548         return ret;
3549 }
3550
3551 /*
3552  * Mark an inode as being bad in some what
3553  */
3554 static void mark_inode_bad(e2fsck_t ctx, ext2_ino_t ino)
3555 {
3556         struct          problem_context pctx;
3557
3558         if (!ctx->inode_bad_map) {
3559                 clear_problem_context(&pctx);
3560
3561                 pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3562                                 _("bad inode map"), EXT2FS_BMAP64_RBTREE,
3563                                 "inode_bad_map", &ctx->inode_bad_map);
3564                 if (pctx.errcode) {
3565                         pctx.num = 3;
3566                         fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3567                         /* Should never get here */
3568                         ctx->flags |= E2F_FLAG_ABORT;
3569                         return;
3570                 }
3571         }
3572         ext2fs_mark_inode_bitmap2(ctx->inode_bad_map, ino);
3573 }
3574
3575 static void add_casefolded_dir(e2fsck_t ctx, ext2_ino_t ino)
3576 {
3577         struct          problem_context pctx;
3578
3579         if (!ctx->casefolded_dirs) {
3580                 pctx.errcode = ext2fs_u32_list_create(&ctx->casefolded_dirs, 0);
3581                 if (pctx.errcode)
3582                         goto error;
3583         }
3584         pctx.errcode = ext2fs_u32_list_add(ctx->casefolded_dirs, ino);
3585         if (pctx.errcode == 0)
3586                 return;
3587 error:
3588         fix_problem(ctx, PR_1_ALLOCATE_CASEFOLDED_DIRLIST, &pctx);
3589         /* Should never get here */
3590         ctx->flags |= E2F_FLAG_ABORT;
3591 }
3592
3593 /*
3594  * This procedure will allocate the inode "bb" (badblock) map table
3595  */
3596 static void alloc_bb_map(e2fsck_t ctx)
3597 {
3598         struct          problem_context pctx;
3599
3600         clear_problem_context(&pctx);
3601         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3602                         _("inode in bad block map"), EXT2FS_BMAP64_RBTREE,
3603                         "inode_bb_map", &ctx->inode_bb_map);
3604         if (pctx.errcode) {
3605                 pctx.num = 4;
3606                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3607                 /* Should never get here */
3608                 ctx->flags |= E2F_FLAG_ABORT;
3609                 return;
3610         }
3611 }
3612
3613 /*
3614  * This procedure will allocate the inode imagic table
3615  */
3616 static void alloc_imagic_map(e2fsck_t ctx)
3617 {
3618         struct          problem_context pctx;
3619
3620         clear_problem_context(&pctx);
3621         pctx.errcode = e2fsck_allocate_inode_bitmap(ctx->fs,
3622                         _("imagic inode map"), EXT2FS_BMAP64_RBTREE,
3623                         "inode_imagic_map", &ctx->inode_imagic_map);
3624         if (pctx.errcode) {
3625                 pctx.num = 5;
3626                 fix_problem(ctx, PR_1_ALLOCATE_IBITMAP_ERROR, &pctx);
3627                 /* Should never get here */
3628                 ctx->flags |= E2F_FLAG_ABORT;
3629                 return;
3630         }
3631 }
3632
3633 /*
3634  * Marks a block as in use, setting the dup_map if it's been set
3635  * already.  Called by process_block and process_bad_block.
3636  *
3637  * WARNING: Assumes checks have already been done to make sure block
3638  * is valid.  This is true in both process_block and process_bad_block.
3639  */
3640 static _INLINE_ void mark_block_used(e2fsck_t ctx, blk64_t block)
3641 {
3642         struct problem_context pctx;
3643         e2fsck_t global_ctx = ctx->global_ctx ? ctx->global_ctx : ctx;
3644
3645         clear_problem_context(&pctx);
3646
3647         if (is_blocks_used(ctx, block, 1)) {
3648                 if (ext2fs_has_feature_shared_blocks(ctx->fs->super) &&
3649                     !(ctx->options & E2F_OPT_UNSHARE_BLOCKS)) {
3650                         return;
3651                 }
3652                 ctx->flags |= E2F_FLAG_DUP_BLOCK;
3653                 e2fsck_pass1_block_map_w_lock(ctx);
3654                 ext2fs_fast_mark_block_bitmap2(global_ctx->block_dup_map, block);
3655                 e2fsck_pass1_block_map_w_unlock(ctx);
3656         } else {
3657                 ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, block);
3658         }
3659 }
3660
3661 /*
3662  * When cluster size is greater than one block, it is caller's responsibility
3663  * to make sure block parameter starts at a cluster boundary.
3664  */
3665 static _INLINE_ void mark_blocks_used(e2fsck_t ctx, blk64_t block,
3666                                       unsigned int num)
3667 {
3668         if (!is_blocks_used(ctx, block, num)) {
3669                 ext2fs_mark_block_bitmap_range2(ctx->block_found_map, block, num);
3670         } else {
3671                 unsigned int i;
3672
3673                 for (i = 0; i < num; i += EXT2FS_CLUSTER_RATIO(ctx->fs))
3674                         mark_block_used(ctx, block + i);
3675         }
3676 }
3677
3678 static errcode_t _INLINE_ e2fsck_write_ext_attr3(e2fsck_t ctx, blk64_t block,
3679                                                  void *inbuf, ext2_ino_t inum)
3680 {
3681         errcode_t retval;
3682         ext2_filsys fs = ctx->fs;
3683
3684         e2fsck_pass1_fix_lock(ctx);
3685         retval = ext2fs_write_ext_attr3(fs, block, inbuf, inum);
3686         e2fsck_pass1_fix_unlock(ctx);
3687
3688         return retval;
3689 }
3690 /*
3691  * Adjust the extended attribute block's reference counts at the end
3692  * of pass 1, either by subtracting out references for EA blocks that
3693  * are still referenced in ctx->refcount, or by adding references for
3694  * EA blocks that had extra references as accounted for in
3695  * ctx->refcount_extra.
3696  */
3697 static void adjust_extattr_refcount(e2fsck_t ctx, ext2_refcount_t refcount,
3698                                     char *block_buf, int adjust_sign)
3699 {
3700         struct ext2_ext_attr_header     *header;
3701         struct problem_context          pctx;
3702         ext2_filsys                     fs = ctx->fs;
3703         blk64_t                         blk;
3704         __u32                           should_be;
3705         ea_value_t                      count;
3706
3707         clear_problem_context(&pctx);
3708
3709         ea_refcount_intr_begin(refcount);
3710         while (1) {
3711                 if ((blk = ea_refcount_intr_next(refcount, &count)) == 0)
3712                         break;
3713                 pctx.blk = blk;
3714                 pctx.errcode = ext2fs_read_ext_attr3(fs, blk, block_buf,
3715                                                      pctx.ino);
3716                 if (pctx.errcode) {
3717                         fix_problem(ctx, PR_1_EXTATTR_READ_ABORT, &pctx);
3718                         return;
3719                 }
3720                 header = (struct ext2_ext_attr_header *) block_buf;
3721                 pctx.blkcount = header->h_refcount;
3722                 should_be = header->h_refcount + adjust_sign * (int)count;
3723                 pctx.num = should_be;
3724                 if (fix_problem(ctx, PR_1_EXTATTR_REFCOUNT, &pctx)) {
3725                         header->h_refcount = should_be;
3726                         pctx.errcode = e2fsck_write_ext_attr3(ctx, blk,
3727                                                              block_buf,
3728                                                              pctx.ino);
3729                         if (pctx.errcode) {
3730                                 fix_problem(ctx, PR_1_EXTATTR_WRITE_ABORT,
3731                                             &pctx);
3732                                 continue;
3733                         }
3734                 }
3735         }
3736 }
3737
/*
 * Handle processing the extended attribute blocks
 *
 * Looks at the EA block referenced by pctx->inode (if any), validates it
 * the first time it is seen, and maintains the EA reference counts.
 *
 * ctx             - the e2fsck context
 * pctx            - problem context; pctx->ino and pctx->inode identify
 *                   the inode being checked
 * block_buf       - buffer the EA block is read into
 * ea_block_quota  - out: blocks/inodes charged for the EA block; zeroed
 *                   on entry and filled in when the block is accepted
 *
 * Returns 1 when the inode's EA block is accepted (either already seen
 * or newly validated).  Returns 0 when the inode has no EA block, when
 * the inode was marked bad, when the EA block reference was cleared from
 * the inode, or when an error occurred (E2F_FLAG_ABORT is set on the
 * allocation failures).
 */
static int check_ext_attr(e2fsck_t ctx, struct problem_context *pctx,
                           char *block_buf, struct ea_quota *ea_block_quota)
{
        ext2_filsys fs = ctx->fs;
        ext2_ino_t      ino = pctx->ino;
        struct ext2_inode *inode = pctx->inode;
        blk64_t         blk;
        char *          end;
        struct ext2_ext_attr_header *header;
        struct ext2_ext_attr_entry *first, *entry;
        blk64_t         quota_blocks = EXT2FS_C2B(fs, 1);
        __u64           quota_inodes = 0;
        region_t        region = 0;
        int             failed_csum = 0;

        ea_block_quota->blocks = 0;
        ea_block_quota->inodes = 0;

        blk = ext2fs_file_acl_block(fs, inode);
        if (blk == 0)
                return 0;

        /*
         * If the Extended attribute flag isn't set, then a non-zero
         * file acl means that the inode is corrupted.
         *
         * Or if the extended attribute block is an invalid block,
         * then the inode is also corrupted.
         */
        if (!ext2fs_has_feature_xattr(fs->super) ||
            (blk < fs->super->s_first_data_block) ||
            (blk >= ext2fs_blocks_count(fs->super))) {
                mark_inode_bad(ctx, ino);
                return 0;
        }

        /* If ea bitmap hasn't been allocated, create it */
        if (!ctx->block_ea_map) {
                pctx->errcode = e2fsck_allocate_block_bitmap(fs,
                                        _("ext attr block map"),
                                        EXT2FS_BMAP64_RBTREE, "block_ea_map",
                                        &ctx->block_ea_map);
                if (pctx->errcode) {
                        pctx->num = 2;
                        fix_problem(ctx, PR_1_ALLOCATE_BBITMAP_ERROR, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }
        }

        /* Create the EA refcount structure if necessary */
        if (!ctx->refcount) {
                pctx->errcode = ea_refcount_create(0,
                                        &ctx->refcount_orig);
                if (pctx->errcode) {
                        pctx->num = 1;
                        fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }

                pctx->errcode = ea_refcount_create(0, &ctx->refcount);
                if (pctx->errcode) {
                        pctx->num = 1;
                        fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                        ctx->flags |= E2F_FLAG_ABORT;
                        return 0;
                }
        }

#if 0
        /* Debugging text */
        printf("Inode %u has EA block %u\n", ino, blk);
#endif

        /* Have we seen this EA block before? */
        if (ext2fs_fast_test_block_bitmap2(ctx->block_ea_map, blk)) {
                /* Default charge: one cluster's worth of blocks, no inodes */
                ea_block_quota->blocks = EXT2FS_C2B(fs, 1);
                ea_block_quota->inodes = 0;

                /*
                 * If a non-zero block charge was stored for this block
                 * (see the ea_refcount_store() calls further down), use
                 * it instead of the default.
                 */
                if (ctx->ea_block_quota_blocks) {
                        ea_refcount_fetch(ctx->ea_block_quota_blocks, blk,
                                          &quota_blocks);
                        if (quota_blocks)
                                ea_block_quota->blocks = quota_blocks;
                }

                if (ctx->ea_block_quota_inodes)
                        ea_refcount_fetch(ctx->ea_block_quota_inodes, blk,
                                          &ea_block_quota->inodes);

                if (ea_refcount_decrement(ctx->refcount, blk, 0) == 0)
                        return 1;
                /* Ooops, this EA was referenced more than it stated */
                if (!ctx->refcount_extra) {
                        pctx->errcode = ea_refcount_create(0,
                                           &ctx->refcount_extra);
                        if (pctx->errcode) {
                                pctx->num = 2;
                                fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                                ctx->flags |= E2F_FLAG_ABORT;
                                return 0;
                        }
                }
                ea_refcount_increment(ctx->refcount_extra, blk, 0);
                return 1;
        }

        /*
         * OK, we haven't seen this EA block yet.  So we need to
         * validate it
         */
        pctx->blk = blk;
        pctx->errcode = ext2fs_read_ext_attr3(fs, blk, block_buf, pctx->ino);
        /*
         * A checksum failure is only remembered here (it is dealt with
         * after the structural checks), and a bad-header error is
         * dropped so that the checks below can examine the block.
         */
        if (pctx->errcode == EXT2_ET_EXT_ATTR_CSUM_INVALID) {
                pctx->errcode = 0;
                failed_csum = 1;
        } else if (pctx->errcode == EXT2_ET_BAD_EA_HEADER)
                pctx->errcode = 0;

        if (pctx->errcode &&
            fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx)) {
                pctx->errcode = 0;
                goto clear_extattr;
        }
        header = (struct ext2_ext_attr_header *) block_buf;
        pctx->blk = ext2fs_file_acl_block(fs, inode);
        /* The magic number must match the EA version in use */
        if (((ctx->ext_attr_ver == 1) &&
             (header->h_magic != EXT2_EXT_ATTR_MAGIC_v1)) ||
            ((ctx->ext_attr_ver == 2) &&
             (header->h_magic != EXT2_EXT_ATTR_MAGIC))) {
                if (fix_problem(ctx, PR_1_BAD_EA_BLOCK, pctx))
                        goto clear_extattr;
        }

        if (header->h_blocks != 1) {
                if (fix_problem(ctx, PR_1_EA_MULTI_BLOCK, pctx))
                        goto clear_extattr;
        }

        /*
         * NOTE(review): pctx->errcode was already tested against the same
         * problem code above; this second test can only fire if that
         * first prompt was declined.  Confirm the repeat is intentional.
         */
        if (pctx->errcode && fix_problem(ctx, PR_1_READ_EA_BLOCK, pctx))
                goto clear_extattr;

        /*
         * The region covers one block; each piece of the EA block
         * (header, entries, values) is allocated in it, and a non-zero
         * return from region_allocate() is reported as a collision.
         */
        region = region_create(0, fs->blocksize);
        if (!region) {
                fix_problem(ctx, PR_1_EA_ALLOC_REGION_ABORT, pctx);
                ctx->flags |= E2F_FLAG_ABORT;
                return 0;
        }
        if (region_allocate(region, 0, sizeof(struct ext2_ext_attr_header))) {
                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                        goto clear_extattr;
        }

        first = (struct ext2_ext_attr_entry *)(header+1);
        end = block_buf + fs->blocksize;
        entry = first;
        /*
         * Walk the entries that follow the header until a zero 32-bit
         * word or the end of the block is reached.  When a problem is
         * found but not fixed, the walk stops at that entry.
         */
        while ((char *)entry < end && *(__u32 *)entry) {
                __u32 hash;

                if (region_allocate(region, (char *)entry - (char *)header,
                                   EXT2_EXT_ATTR_LEN(entry->e_name_len))) {
                        if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                                goto clear_extattr;
                        break;
                }
                if ((ctx->ext_attr_ver == 1 &&
                     (entry->e_name_len == 0 || entry->e_name_index != 0)) ||
                    (ctx->ext_attr_ver == 2 &&
                     entry->e_name_index == 0)) {
                        if (fix_problem(ctx, PR_1_EA_BAD_NAME, pctx))
                                goto clear_extattr;
                        break;
                }
                if (entry->e_value_inum == 0) {
                        /* The value is stored inside this EA block */
                        if (entry->e_value_size > EXT2_XATTR_SIZE_MAX ||
                            (entry->e_value_offs + entry->e_value_size >
                             fs->blocksize)) {
                                if (fix_problem(ctx, PR_1_EA_BAD_VALUE, pctx))
                                        goto clear_extattr;
                                break;
                        }
                        if (entry->e_value_size &&
                            region_allocate(region, entry->e_value_offs,
                                            EXT2_EXT_ATTR_SIZE(entry->e_value_size))) {
                                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION,
                                                pctx))
                                        goto clear_extattr;
                        }

                        /*
                         * Accept the stored hash if it matches either
                         * ext2fs_ext_attr_hash_entry() or the _signed
                         * variant.
                         */
                        hash = ext2fs_ext_attr_hash_entry(entry, block_buf +
                                                          entry->e_value_offs);
                        if (entry->e_hash != hash)
                                hash = ext2fs_ext_attr_hash_entry_signed(entry,
                                        block_buf + entry->e_value_offs);

                        if (entry->e_hash != hash) {
                                pctx->num = entry->e_hash;
                                if (fix_problem(ctx, PR_1_ATTR_HASH, pctx))
                                        goto clear_extattr;
                                entry->e_hash = hash;
                        }
                } else {
                        /* The value is stored in a separate EA inode */
                        problem_t problem;
                        blk64_t entry_quota_blocks;

                        problem = check_large_ea_inode(ctx, entry, pctx,
                                                       &entry_quota_blocks);
                        if (problem && fix_problem(ctx, problem, pctx))
                                goto clear_extattr;

                        quota_blocks += entry_quota_blocks;
                        quota_inodes++;
                }

                entry = EXT2_EXT_ATTR_NEXT(entry);
        }
        /* Claim the 4 bytes at the position where the walk stopped */
        if (region_allocate(region, (char *)entry - (char *)header, 4)) {
                if (fix_problem(ctx, PR_1_EA_ALLOC_COLLISION, pctx))
                        goto clear_extattr;
        }
        region_free(region);

        /*
         * We only get here if there was no other errors that were fixed.
         * If there was a checksum fail, ask to correct it.
         */
        if (failed_csum &&
            fix_problem(ctx, PR_1_EA_BLOCK_ONLY_CSUM_INVALID, pctx)) {
                pctx->errcode = e2fsck_write_ext_attr3(ctx, blk, block_buf,
                                                       pctx->ino);
                if (pctx->errcode)
                        return 0;
        }

        /*
         * Remember the block charge for this EA block only when it
         * differs from the one-cluster default, so later inodes sharing
         * the block can look it up.
         */
        if (quota_blocks != EXT2FS_C2B(fs, 1U)) {
                if (!ctx->ea_block_quota_blocks) {
                        pctx->errcode = ea_refcount_create(0,
                                                &ctx->ea_block_quota_blocks);
                        if (pctx->errcode) {
                                pctx->num = 3;
                                goto refcount_fail;
                        }
                }
                ea_refcount_store(ctx->ea_block_quota_blocks, blk,
                                  quota_blocks);
        }

        if (quota_inodes) {
                if (!ctx->ea_block_quota_inodes) {
                        pctx->errcode = ea_refcount_create(0,
                                                &ctx->ea_block_quota_inodes);
                        if (pctx->errcode) {
                                pctx->num = 4;
/* Shared failure exit; also reached by goto from the block-quota case above */
refcount_fail:
                                fix_problem(ctx, PR_1_ALLOCATE_REFCOUNT, pctx);
                                ctx->flags |= E2F_FLAG_ABORT;
                                return 0;
                        }
                }

                ea_refcount_store(ctx->ea_block_quota_inodes, blk,
                                  quota_inodes);
        }
        ea_block_quota->blocks = quota_blocks;
        ea_block_quota->inodes = quota_inodes;

        inc_ea_inode_refs(ctx, pctx, first, end);
        /*
         * This inode accounts for one of the references the header
         * claims; ctx->refcount keeps the remainder and
         * ctx->refcount_orig keeps the claimed total.
         */
        ea_refcount_store(ctx->refcount, blk, header->h_refcount - 1);
        ea_refcount_store(ctx->refcount_orig, blk, header->h_refcount);
        /**
         * It might be racy that this block has been merged in the
         * global found map.
         */
        if (!is_blocks_used(ctx, blk, 1))
                ext2fs_fast_mark_block_bitmap2(ctx->block_found_map, blk);
        ext2fs_fast_mark_block_bitmap2(ctx->block_ea_map, blk);
        return 1;

/* Drop the inode's EA block reference and write the inode back */
clear_extattr:
        if (region)
                region_free(region);
        ext2fs_file_acl_block_set(fs, inode, 0);
        e2fsck_write_inode(ctx, ino, inode, "check_ext_attr");
        return 0;
}
4027
/*
 * Sanity-check the htree (indexed directory) root of an inode.
 *
 * The checks run in order: the inode must be a directory and the
 * filesystem must have the dir_index feature; the root block must be
 * mappable, in range and readable; then the dx root info fields
 * (reserved_zero, info_length, hash_version, unused_flags,
 * indirect_levels) are validated.  Each failed check is offered to
 * fix_problem(); the function reports "bad" only when that call returns
 * non-zero.  A directory that passes may also bump ctx->large_dirs.
 *
 * Returns 1 if bad htree, 0 if OK
 */
static int handle_htree(e2fsck_t ctx, struct problem_context *pctx,
                        ext2_ino_t ino, struct ext2_inode *inode,
                        char *block_buf)
{
        struct ext2_dx_root_info        *root;
        ext2_filsys                     fs = ctx->fs;
        errcode_t                       retval;
        blk64_t                         blk;

        if ((!LINUX_S_ISDIR(inode->i_mode) &&
             fix_problem(ctx, PR_1_HTREE_NODIR, pctx)) ||
            (!ext2fs_has_feature_dir_index(fs->super) &&
             fix_problem(ctx, PR_1_HTREE_SET, pctx)))
                return 1;

        /* presumably maps logical block 0 of the directory - TODO confirm */
        pctx->errcode = ext2fs_bmap2(fs, ino, inode, 0, 0, 0, 0, &blk);

        if ((pctx->errcode) ||
            (blk == 0) ||
            (blk < fs->super->s_first_data_block) ||
            (blk >= ext2fs_blocks_count(fs->super))) {
                if (fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                        return 1;
                else
                        return 0;
        }

        /*
         * If the read fails and the problem is not fixed, the checks
         * below still run on whatever block_buf contains.
         */
        retval = io_channel_read_blk64(fs->io, blk, 1, block_buf);
        if (retval && fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                return 1;

        /* XXX should check that beginning matches a directory */
        /* The dx root info is taken from byte offset 24 of the block */
        root = (struct ext2_dx_root_info *) (block_buf + 24);

        if ((root->reserved_zero || root->info_length < 8) &&
            fix_problem(ctx, PR_1_HTREE_BADROOT, pctx))
                return 1;

        /* Only the hash versions listed here are accepted */
        pctx->num = root->hash_version;
        if ((root->hash_version != EXT2_HASH_LEGACY) &&
            (root->hash_version != EXT2_HASH_HALF_MD4) &&
            (root->hash_version != EXT2_HASH_TEA) &&
            (root->hash_version != EXT2_HASH_SIPHASH) &&
            fix_problem(ctx, PR_1_HTREE_HASHV, pctx))
                return 1;

        /*
         * SIPHASH must be used exactly when ext4_hash_in_dirent() is
         * true for this inode.
         */
        if (ext4_hash_in_dirent(inode)) {
                if (root->hash_version != EXT2_HASH_SIPHASH &&
                    fix_problem(ctx, PR_1_HTREE_NEEDS_SIPHASH, pctx))
                        return 1;
        } else {
                if (root->hash_version == EXT2_HASH_SIPHASH &&
                   fix_problem(ctx, PR_1_HTREE_CANNOT_SIPHASH, pctx))
                        return 1;
        }

        if ((root->unused_flags & EXT2_HASH_FLAG_INCOMPAT) &&
            fix_problem(ctx, PR_1_HTREE_INCOMPAT, pctx))
                return 1;

        pctx->num = root->indirect_levels;
        /* if htree level is clearly too high, consider it to be broken */
        if (root->indirect_levels > EXT4_HTREE_LEVEL &&
            fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
                return 1;

        /* if level is only maybe too high, LARGE_DIR feature could be unset */
        if (root->indirect_levels > ext2_dir_htree_level(fs) &&
            !ext2fs_has_feature_largedir(fs->super)) {
                /*
                 * NOTE(review): idx_pb and the two products below are
                 * computed in "unsigned"; confirm that
                 * (idx_pb - 1) * (idx_pb - 2) << blockbits cannot wrap
                 * for the supported block sizes, and that adding 10 to
                 * EXT2_BLOCK_SIZE_BITS() is intended.
                 */
                int blockbits = EXT2_BLOCK_SIZE_BITS(fs->super) + 10;
                unsigned idx_pb = 1 << (blockbits - 3);

                /* compare inode size/blocks vs. max-sized 2-level htree */
                if (EXT2_I_SIZE(pctx->inode) <
                    (idx_pb - 1) * (idx_pb - 2) << blockbits &&
                    pctx->inode->i_blocks <
                    (idx_pb - 1) * (idx_pb - 2) << (blockbits - 9) &&
                    fix_problem(ctx, PR_1_HTREE_DEPTH, pctx))
                        return 1;
        }

        /* Count directories that are deep or large */
        if (root->indirect_levels > EXT4_HTREE_LEVEL_COMPAT ||
            ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
                ctx->large_dirs++;

        return 0;
}
4116
4117 void e2fsck_clear_inode(e2fsck_t ctx, ext2_ino_t ino,
4118                         struct ext2_inode *inode, int restart_flag,
4119                         const char *source)
4120 {
4121         inode->i_flags = 0;
4122         inode->i_links_count = 0;
4123         ext2fs_icount_store(ctx->inode_link_info, ino, 0);
4124         inode->i_dtime = ctx->now;
4125
4126         /*
4127          * If a special inode has such rotten block mappings that we
4128          * want to clear the whole inode, be sure to actually zap
4129          * the block maps because i_links_count isn't checked for
4130          * special inodes, and we'll end up right back here the next
4131          * time we run fsck.
4132          */
4133         if (ino < EXT2_FIRST_INODE(ctx->fs->super))
4134                 memset(inode->i_block, 0, sizeof(inode->i_block));
4135
4136         ext2fs_unmark_inode_bitmap2(ctx->inode_dir_map, ino);
4137         ext2fs_unmark_inode_bitmap2(ctx->inode_used_map, ino);
4138         if (ctx->inode_reg_map)
4139                 ext2fs_unmark_inode_bitmap2(ctx->inode_reg_map, ino);
4140         if (ctx->inode_bad_map)
4141                 ext2fs_unmark_inode_bitmap2(ctx->inode_bad_map, ino);
4142
4143         /*
4144          * If the inode was partially accounted for before processing
4145          * was aborted, we need to restart the pass 1 scan.
4146          */
4147         ctx->flags |= restart_flag;
4148
4149         if (ino == EXT2_BAD_INO)
4150                 memset(inode, 0, sizeof(struct ext2_inode));
4151
4152         e2fsck_write_inode(ctx, ino, inode, source);
4153 }
4154
4155 /*
4156  * Use the multiple-blocks reclamation code to fix alignment problems in
4157  * a bigalloc filesystem.  We want a logical cluster to map to *only* one
4158  * physical cluster, and we want the block offsets within that cluster to
4159  * line up.
4160  */
4161 static int has_unaligned_cluster_map(e2fsck_t ctx,
4162                                      blk64_t last_pblk, blk64_t last_lblk,
4163                                      blk64_t pblk, blk64_t lblk)
4164 {
4165         blk64_t cluster_mask;
4166
4167         if (!ctx->fs->cluster_ratio_bits)
4168                 return 0;
4169         cluster_mask = EXT2FS_CLUSTER_MASK(ctx->fs);
4170
4171         /*
4172          * If the block in the logical cluster doesn't align with the block in
4173          * the physical cluster...
4174          */
4175         if ((lblk & cluster_mask) != (pblk & cluster_mask))
4176                 return 1;
4177
4178         /*
4179          * If we cross a physical cluster boundary within a logical cluster...
4180          */
4181         if (last_pblk && (lblk & cluster_mask) != 0 &&
4182             EXT2FS_B2C(ctx->fs, lblk) == EXT2FS_B2C(ctx->fs, last_lblk) &&
4183             EXT2FS_B2C(ctx->fs, pblk) != EXT2FS_B2C(ctx->fs, last_pblk))
4184                 return 1;
4185
4186         return 0;
4187 }
4188
4189 static void scan_extent_node(e2fsck_t ctx, struct problem_context *pctx,
4190                              struct process_block_struct *pb,
4191                              blk64_t start_block, blk64_t end_block,
4192                              blk64_t eof_block,
4193                              ext2_extent_handle_t ehandle,
4194                              int try_repairs)
4195 {
4196         struct ext2fs_extent    extent;
4197         blk64_t                 blk, last_lblk;
4198         unsigned int            i, n;
4199         int                     is_dir, is_leaf;
4200         problem_t               problem;
4201         struct ext2_extent_info info;
4202         int                     failed_csum = 0;
4203
4204         if (pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID)
4205                 failed_csum = 1;
4206
4207         pctx->errcode = ext2fs_extent_get_info(ehandle, &info);
4208         if (pctx->errcode)
4209                 return;
4210         if (!(ctx->options & E2F_OPT_FIXES_ONLY) &&
4211             !pb->eti.force_rebuild &&
4212             info.curr_level < MAX_EXTENT_DEPTH_COUNT) {
4213                 struct extent_tree_level *etl;
4214
4215                 etl = pb->eti.ext_info + info.curr_level;
4216                 etl->num_extents += info.num_entries;
4217                 etl->max_extents += info.max_entries;
4218                 /*
4219                  * Implementation wart: Splitting extent blocks when appending
4220                  * will leave the old block with one free entry.  Therefore
4221                  * unless the node is totally full, pretend that a non-root
4222                  * extent block can hold one fewer entry than it actually does,
4223                  * so that we don't repeatedly rebuild the extent tree.
4224                  */
4225                 if (info.curr_level && info.num_entries < info.max_entries)
4226                         etl->max_extents--;
4227         }
4228
4229         pctx->errcode = ext2fs_extent_get(ehandle, EXT2_EXTENT_FIRST_SIB,
4230                                           &extent);
4231         while ((pctx->errcode == 0 ||
4232                 pctx->errcode == EXT2_ET_EXTENT_CSUM_INVALID) &&
4233                info.num_entries-- > 0) {
4234                 is_leaf = extent.e_flags & EXT2_EXTENT_FLAGS_LEAF;
4235                 is_dir = LINUX_S_ISDIR(pctx->inode->i_mode);
4236                 last_lblk = extent.e_lblk + extent.e_len - 1;
4237
4238                 problem = 0;
4239                 pctx->blk = extent.e_pblk;
4240                 pctx->blk2 = extent.e_lblk;
4241                 pctx->num = extent.e_len;
4242                 pctx->blkcount = extent.e_lblk + extent.e_len;
4243
4244                 if (extent.e_pblk == 0 ||
4245                     extent.e_pblk < ctx->fs->super->s_first_data_block ||
4246                     extent.e_pblk >= ext2fs_blocks_count(ctx->fs->super))
4247                         problem = PR_1_EXTENT_BAD_START_BLK;
4248                 else if (extent.e_lblk < start_block)
4249                         problem = PR_1_OUT_OF_ORDER_EXTENTS;
4250                 else if ((end_block && last_lblk > end_block) &&
4251                          !(last_lblk > eof_block &&
4252                            ((extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) ||
4253                             (pctx->inode->i_flags & EXT4_VERITY_FL))))
4254                         problem = PR_1_EXTENT_END_OUT_OF_BOUNDS;
4255                 else if (is_leaf && extent.e_len == 0)
4256                         problem = PR_1_EXTENT_LENGTH_ZERO;
4257                 else if (is_leaf &&
4258                          (extent.e_pblk + extent.e_len) >
4259                          ext2fs_blocks_count(ctx->fs->super))
4260                         problem = PR_1_EXTENT_ENDS_BEYOND;
4261                 else if (is_leaf && is_dir && !pctx->inode->i_size_high &&
4262                          !ext2fs_has_feature_largedir(ctx->fs->super) &&
4263                          ((extent.e_lblk + extent.e_len) >
4264                           (1U << (21 - ctx->fs->super->s_log_block_size))))
4265                         problem = PR_1_TOOBIG_DIR;
4266
4267                 if (is_leaf && problem == 0 && extent.e_len > 0) {
4268 #if 0
4269                         printf("extent_region(ino=%u, expect=%llu, "
4270                                "lblk=%llu, len=%u)\n", pb->ino,
4271                                (unsigned long long) pb->next_lblock,
4272                                (unsigned long long) extent.e_lblk,
4273                                extent.e_len);
4274 #endif
4275                         if (extent.e_lblk < pb->next_lblock)
4276                                 problem = PR_1_EXTENT_COLLISION;
4277                         else if (extent.e_lblk + extent.e_len > pb->next_lblock)
4278                                 pb->next_lblock = extent.e_lblk + extent.e_len;
4279                 }
4280
4281                 /*
4282                  * Uninitialized blocks in a directory?  Clear the flag and
4283                  * we'll interpret the blocks later.
4284                  */
4285                 if (try_repairs && is_dir && problem == 0 &&
4286                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
4287                     fix_problem(ctx, PR_1_UNINIT_DBLOCK, pctx)) {
4288                         e2fsck_pass1_fix_lock(ctx);
4289                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
4290                         pb->inode_modified = 1;
4291                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
4292                                                               &extent);
4293                         e2fsck_pass1_fix_unlock(ctx);
4294                         if (pctx->errcode)
4295                                 return;
4296                         failed_csum = 0;
4297                 }
4298 #ifdef CONFIG_DEVELOPER_FEATURES
4299                 if (try_repairs && !is_dir && problem == 0 &&
4300                     (ctx->options & E2F_OPT_CLEAR_UNINIT) &&
4301                     (extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT) &&
4302                     fix_problem(ctx, PR_1_CLEAR_UNINIT_EXTENT, pctx)) {
4303                         extent.e_flags &= ~EXT2_EXTENT_FLAGS_UNINIT;
4304                         pb->inode_modified = 1;
4305                         pctx->errcode = ext2fs_extent_replace(ehandle, 0,
4306                                                               &extent);
4307                         if (pctx->errcode)
4308                                 return;
4309                         failed_csum = 0;
4310                 }
4311 #endif
4312                 if (try_repairs && problem) {
4313 report_problem:
4314                         if (fix_problem(ctx, problem, pctx)) {
4315                                 if (ctx->invalid_bitmaps) {
4316                                         /*
4317                                          * If fsck knows the bitmaps are bad,
4318                                          * skip to the next extent and
4319                                          * try to clear this extent again
4320                                          * after fixing the bitmaps, by
4321                                          * restarting fsck.
4322                                          */
4323                                         pctx->errcode = ext2fs_extent_get(
4324                                                           ehandle,
4325                                                           EXT2_EXTENT_NEXT_SIB,
4326                                                           &extent);
4327                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4328                                         if (pctx->errcode ==
4329                                                     EXT2_ET_NO_CURRENT_NODE) {
4330                                                 pctx->errcode = 0;
4331                                                 break;
4332                                         }
4333                                         continue;
4334                                 }
4335                                 e2fsck_pass1_fix_lock(ctx);
4336                                 e2fsck_read_bitmaps(ctx);
4337                                 pb->inode_modified = 1;
4338                                 pctx->errcode =
4339                                         ext2fs_extent_delete(ehandle, 0);
4340                                 e2fsck_pass1_fix_unlock(ctx);
4341                                 if (pctx->errcode) {
4342                                         pctx->str = "ext2fs_extent_delete";
4343                                         return;
4344                                 }
4345                                 e2fsck_pass1_fix_lock(ctx);
4346                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
4347                                 e2fsck_pass1_fix_unlock(ctx);
4348                                 if (pctx->errcode &&
4349                                     pctx->errcode != EXT2_ET_NO_CURRENT_NODE) {
4350                                         pctx->str = "ext2fs_extent_fix_parents";
4351                                         return;
4352                                 }
4353                                 pctx->errcode = ext2fs_extent_get(ehandle,
4354                                                                   EXT2_EXTENT_CURRENT,
4355                                                                   &extent);
4356                                 if (pctx->errcode == EXT2_ET_NO_CURRENT_NODE) {
4357                                         pctx->errcode = 0;
4358                                         break;
4359                                 }
4360                                 failed_csum = 0;
4361                                 continue;
4362                         }
4363                         goto next;
4364                 }
4365
4366                 if (!is_leaf) {
4367                         blk64_t lblk = extent.e_lblk;
4368                         int next_try_repairs = 1;
4369
4370                         blk = extent.e_pblk;
4371
4372                         /*
4373                          * If this lower extent block collides with critical
4374                          * metadata, don't try to repair the damage.  Pass 1b
4375                          * will reallocate the block; then we can try again.
4376                          */
4377                         if (pb->ino != EXT2_RESIZE_INO &&
4378                             extent.e_pblk < ctx->fs->super->s_blocks_count &&
4379                             ext2fs_test_block_bitmap2(ctx->block_metadata_map,
4380                                                       extent.e_pblk)) {
4381                                 next_try_repairs = 0;
4382                                 pctx->blk = blk;
4383                                 fix_problem(ctx,
4384                                             PR_1_CRITICAL_METADATA_COLLISION,
4385                                             pctx);
4386                                 if ((ctx->options & E2F_OPT_NO) == 0)
4387                                         ctx->flags |= E2F_FLAG_RESTART_LATER;
4388                         }
4389                         pctx->errcode = ext2fs_extent_get(ehandle,
4390                                                   EXT2_EXTENT_DOWN, &extent);
4391                         if (pctx->errcode &&
4392                             pctx->errcode != EXT2_ET_EXTENT_CSUM_INVALID) {
4393                                 pctx->str = "EXT2_EXTENT_DOWN";
4394                                 problem = PR_1_EXTENT_HEADER_INVALID;
4395                                 if (!next_try_repairs)
4396                                         return;
4397                                 if (pctx->errcode == EXT2_ET_EXTENT_HEADER_BAD)
4398                                         goto report_problem;
4399                                 return;
4400                         }
4401                         /* The next extent should match this index's logical start */
4402                         if (extent.e_lblk != lblk) {
4403                                 struct ext2_extent_info e_info;
4404
4405                                 pctx->errcode = ext2fs_extent_get_info(ehandle,
4406                                                                        &e_info);
4407                                 if (pctx->errcode) {
4408                                         pctx->str = "ext2fs_extent_get_info";
4409                                         return;
4410                                 }
4411                                 pctx->blk = lblk;
4412                                 pctx->blk2 = extent.e_lblk;
4413                                 pctx->num = e_info.curr_level - 1;
4414                                 problem = PR_1_EXTENT_INDEX_START_INVALID;
4415                                 if (fix_problem(ctx, problem, pctx)) {
4416                                         e2fsck_pass1_fix_lock(ctx);
4417                                         pb->inode_modified = 1;
4418                                         pctx->errcode =
4419                                                 ext2fs_extent_fix_parents(ehandle);
4420                                         e2fsck_pass1_fix_unlock(ctx);
4421                                         if (pctx->errcode) {
4422                                                 pctx->str = "ext2fs_extent_fix_parents";
4423                                                 return;
4424                                         }
4425                                 }
4426                         }
4427                         scan_extent_node(ctx, pctx, pb, extent.e_lblk,
4428                                          last_lblk, eof_block, ehandle,
4429                                          next_try_repairs);
4430                         if (pctx->errcode)
4431                                 return;
4432                         pctx->errcode = ext2fs_extent_get(ehandle,
4433                                                   EXT2_EXTENT_UP, &extent);
4434                         if (pctx->errcode) {
4435                                 pctx->str = "EXT2_EXTENT_UP";
4436                                 return;
4437                         }
4438                         mark_block_used(ctx, blk);
4439                         pb->num_blocks++;
4440                         goto next;
4441                 }
4442
4443                 if ((pb->previous_block != 0) &&
4444                     (pb->previous_block+1 != extent.e_pblk)) {
4445                         if (ctx->options & E2F_OPT_FRAGCHECK) {
4446                                 char type = '?';
4447
4448                                 if (pb->is_dir)
4449                                         type = 'd';
4450                                 else if (pb->is_reg)
4451                                         type = 'f';
4452
4453                                 printf(("%6lu(%c): expecting %6lu "
4454                                         "actual extent "
4455                                         "phys %6lu log %lu len %lu\n"),
4456                                        (unsigned long) pctx->ino, type,
4457                                        (unsigned long) pb->previous_block+1,
4458                                        (unsigned long) extent.e_pblk,
4459                                        (unsigned long) extent.e_lblk,
4460                                        (unsigned long) extent.e_len);
4461                         }
4462                         pb->fragmented = 1;
4463                 }
4464                 /*
4465                  * If we notice a gap in the logical block mappings of an
4466                  * extent-mapped directory, offer to close the hole by
4467                  * moving the logical block down, otherwise we'll go mad in
4468                  * pass 3 allocating empty directory blocks to fill the hole.
4469                  */
4470                 if (try_repairs && is_dir &&
4471                     pb->last_block + 1 < extent.e_lblk) {
4472                         blk64_t new_lblk;
4473
4474                         new_lblk = pb->last_block + 1;
4475                         if (EXT2FS_CLUSTER_RATIO(ctx->fs) > 1)
4476                                 new_lblk = ((new_lblk +
4477                                              EXT2FS_CLUSTER_RATIO(ctx->fs) - 1) &
4478                                             ~EXT2FS_CLUSTER_MASK(ctx->fs)) |
4479                                            (extent.e_pblk &
4480                                             EXT2FS_CLUSTER_MASK(ctx->fs));
4481                         pctx->blk = extent.e_lblk;
4482                         pctx->blk2 = new_lblk;
4483                         if (fix_problem(ctx, PR_1_COLLAPSE_DBLOCK, pctx)) {
4484                                 e2fsck_pass1_fix_lock(ctx);
4485                                 extent.e_lblk = new_lblk;
4486                                 pb->inode_modified = 1;
4487                                 pctx->errcode = ext2fs_extent_replace(ehandle,
4488                                                                 0, &extent);
4489                                 e2fsck_pass1_fix_unlock(ctx);
4490                                 if (pctx->errcode) {
4491                                         pctx->errcode = 0;
4492                                         goto alloc_later;
4493                                 }
4494                                 e2fsck_pass1_fix_lock(ctx);
4495                                 pctx->errcode = ext2fs_extent_fix_parents(ehandle);
4496                                 e2fsck_pass1_fix_unlock(ctx);
4497                                 if (pctx->errcode)
4498                                         goto failed_add_dir_block;
4499                                 pctx->errcode = ext2fs_extent_goto(ehandle,
4500                                                                 extent.e_lblk);
4501                                 if (pctx->errcode)
4502                                         goto failed_add_dir_block;
4503                                 last_lblk = extent.e_lblk + extent.e_len - 1;
4504                                 failed_csum = 0;
4505                         }
4506                 }
4507 alloc_later:
4508                 if (is_dir) {
4509                         while (++pb->last_db_block <
4510                                (e2_blkcnt_t) extent.e_lblk) {
4511                                 pctx->errcode = ext2fs_add_dir_block2(
4512                                                         ctx->fs->dblist,
4513                                                         pb->ino, 0,
4514                                                         pb->last_db_block);
4515                                 if (pctx->errcode) {
4516                                         pctx->blk = 0;
4517                                         pctx->num = pb->last_db_block;
4518                                         goto failed_add_dir_block;
4519                                 }
4520                         }
4521
4522                         for (i = 0; i < extent.e_len; i++) {
4523                                 pctx->errcode = ext2fs_add_dir_block2(
4524                                                         ctx->fs->dblist,
4525                                                         pctx->ino,
4526                                                         extent.e_pblk + i,
4527                                                         extent.e_lblk + i);
4528                                 if (pctx->errcode) {
4529                                         pctx->blk = extent.e_pblk + i;
4530                                         pctx->num = extent.e_lblk + i;
4531                                 failed_add_dir_block:
4532                                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4533                                         /* Should never get here */
4534                                         ctx->flags |= E2F_FLAG_ABORT;
4535                                         return;
4536                                 }
4537                         }
4538                         if (extent.e_len > 0)
4539                                 pb->last_db_block = extent.e_lblk + extent.e_len - 1;
4540                 }
4541                 if (has_unaligned_cluster_map(ctx, pb->previous_block,
4542                                               pb->last_block,
4543                                               extent.e_pblk,
4544                                               extent.e_lblk)) {
4545                         for (i = 0; i < extent.e_len; i++) {
4546                                 pctx->blk = extent.e_lblk + i;
4547                                 pctx->blk2 = extent.e_pblk + i;
4548                                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
4549                                 mark_block_used(ctx, extent.e_pblk + i);
4550                                 mark_block_used(ctx, extent.e_pblk + i);
4551                         }
4552                 }
4553
4554                 /*
4555                  * Check whether first cluster got marked in previous iteration.
4556                  */
4557                 if (ctx->fs->cluster_ratio_bits &&
4558                     pb->previous_block &&
4559                     (EXT2FS_B2C(ctx->fs, extent.e_pblk) ==
4560                      EXT2FS_B2C(ctx->fs, pb->previous_block)))
4561                         /* Set blk to the beginning of next cluster. */
4562                         blk = EXT2FS_C2B(
4563                                 ctx->fs,
4564                                 EXT2FS_B2C(ctx->fs, extent.e_pblk) + 1);
4565                 else
4566                         /* Set blk to the beginning of current cluster. */
4567                         blk = EXT2FS_C2B(ctx->fs,
4568                                          EXT2FS_B2C(ctx->fs, extent.e_pblk));
4569
4570                 if (blk < extent.e_pblk + extent.e_len) {
4571                         mark_blocks_used(ctx, blk,
4572                                          extent.e_pblk + extent.e_len - blk);
4573                         n = DIV_ROUND_UP(extent.e_pblk + extent.e_len - blk,
4574                                          EXT2FS_CLUSTER_RATIO(ctx->fs));
4575                         pb->num_blocks += n;
4576                 }
4577                 pb->last_block = extent.e_lblk + extent.e_len - 1;
4578                 pb->previous_block = extent.e_pblk + extent.e_len - 1;
4579                 start_block = pb->last_block = last_lblk;
4580                 if (is_leaf && !is_dir &&
4581                     !(extent.e_flags & EXT2_EXTENT_FLAGS_UNINIT))
4582                         pb->last_init_lblock = last_lblk;
4583         next:
4584                 pctx->errcode = ext2fs_extent_get(ehandle,
4585                                                   EXT2_EXTENT_NEXT_SIB,
4586                                                   &extent);
4587         }
4588
4589         /* Failed csum but passes checks?  Ask to fix checksum. */
4590         if (failed_csum &&
4591             fix_problem(ctx, PR_1_EXTENT_ONLY_CSUM_INVALID, pctx)) {
4592                 e2fsck_pass1_fix_lock(ctx);
4593                 pb->inode_modified = 1;
4594                 pctx->errcode = ext2fs_extent_replace(ehandle, 0, &extent);
4595                 e2fsck_pass1_fix_unlock(ctx);
4596                 if (pctx->errcode)
4597                         return;
4598         }
4599
4600         if (pctx->errcode == EXT2_ET_EXTENT_NO_NEXT)
4601                 pctx->errcode = 0;
4602 }
4603
4604 static void check_blocks_extents(e2fsck_t ctx, struct problem_context *pctx,
4605                                  struct process_block_struct *pb)
4606 {
4607         struct ext2_extent_info info;
4608         struct ext2_inode       *inode = pctx->inode;
4609         ext2_extent_handle_t    ehandle;
4610         ext2_filsys             fs = ctx->fs;
4611         ext2_ino_t              ino = pctx->ino;
4612         errcode_t               retval;
4613         blk64_t                 eof_lblk;
4614         struct ext3_extent_header       *eh;
4615
4616         /* Check for a proper extent header... */
4617         eh = (struct ext3_extent_header *) &inode->i_block[0];
4618         retval = ext2fs_extent_header_verify(eh, sizeof(inode->i_block));
4619         if (retval) {
4620                 if (fix_problem(ctx, PR_1_MISSING_EXTENT_HEADER, pctx))
4621                         e2fsck_clear_inode(ctx, ino, inode, 0,
4622                                            "check_blocks_extents");
4623                 pctx->errcode = 0;
4624                 return;
4625         }
4626
4627         /* ...since this function doesn't fail if i_block is zeroed. */
4628         pctx->errcode = ext2fs_extent_open2(fs, ino, inode, &ehandle);
4629         if (pctx->errcode) {
4630                 if (fix_problem(ctx, PR_1_READ_EXTENT, pctx))
4631                         e2fsck_clear_inode(ctx, ino, inode, 0,
4632                                            "check_blocks_extents");
4633                 pctx->errcode = 0;
4634                 return;
4635         }
4636
4637         retval = ext2fs_extent_get_info(ehandle, &info);
4638         if (retval == 0) {
4639                 int max_depth = info.max_depth;
4640
4641                 if (max_depth >= MAX_EXTENT_DEPTH_COUNT)
4642                         max_depth = MAX_EXTENT_DEPTH_COUNT-1;
4643                 ctx->extent_depth_count[max_depth]++;
4644         }
4645
4646         /* Check maximum extent depth */
4647         pctx->blk = info.max_depth;
4648         pctx->blk2 = ext2fs_max_extent_depth(ehandle);
4649         if (pctx->blk2 < pctx->blk &&
4650             fix_problem(ctx, PR_1_EXTENT_BAD_MAX_DEPTH, pctx))
4651                 pb->eti.force_rebuild = 1;
4652
4653         /* Can we collect extent tree level stats? */
4654         pctx->blk = MAX_EXTENT_DEPTH_COUNT;
4655         if (pctx->blk2 > pctx->blk)
4656                 fix_problem(ctx, PR_1E_MAX_EXTENT_TREE_DEPTH, pctx);
4657         memset(pb->eti.ext_info, 0, sizeof(pb->eti.ext_info));
4658         pb->eti.ino = pb->ino;
4659
4660         pb->next_lblock = 0;
4661
4662         eof_lblk = ((EXT2_I_SIZE(inode) + fs->blocksize - 1) >>
4663                 EXT2_BLOCK_SIZE_BITS(fs->super)) - 1;
4664         scan_extent_node(ctx, pctx, pb, 0, 0, eof_lblk, ehandle, 1);
4665         if (pctx->errcode &&
4666             fix_problem(ctx, PR_1_EXTENT_ITERATE_FAILURE, pctx)) {
4667                 pb->num_blocks = 0;
4668                 inode->i_blocks = 0;
4669                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4670                                    "check_blocks_extents");
4671                 pctx->errcode = 0;
4672         }
4673         ext2fs_extent_free(ehandle);
4674
4675         /* Rebuild unless it's a dir and we're rehashing it */
4676         if (LINUX_S_ISDIR(inode->i_mode) &&
4677             e2fsck_dir_will_be_rehashed(ctx, ino))
4678                 return;
4679
4680         if (ctx->options & E2F_OPT_CONVERT_BMAP)
4681                 e2fsck_rebuild_extents_later(ctx, ino);
4682         else
4683                 e2fsck_should_rebuild_extents(ctx, pctx, &pb->eti, &info);
4684 }
4685
4686 /*
4687  * In fact we don't need to check blocks for an inode with inline data
4688  * because this inode doesn't have any blocks.  In this function all
4689  * we need to do is add this inode into dblist when it is a directory.
4690  */
4691 static void check_blocks_inline_data(e2fsck_t ctx, struct problem_context *pctx,
4692                                      struct process_block_struct *pb)
4693 {
4694         int     flags;
4695         size_t  inline_data_size = 0;
4696
4697         if (!pb->is_dir) {
4698                 pctx->errcode = 0;
4699                 return;
4700         }
4701
4702         /* Process the dirents in i_block[] as the "first" block. */
4703         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 0);
4704         if (pctx->errcode)
4705                 goto err;
4706
4707         /* Process the dirents in the EA as a "second" block. */
4708         flags = ctx->fs->flags;
4709         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4710         pctx->errcode = ext2fs_inline_data_size(ctx->fs, pb->ino,
4711                                                 &inline_data_size);
4712         ctx->fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4713                          (ctx->fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4714         if (pctx->errcode) {
4715                 pctx->errcode = 0;
4716                 return;
4717         }
4718
4719         if (inline_data_size <= EXT4_MIN_INLINE_DATA_SIZE)
4720                 return;
4721
4722         pctx->errcode = ext2fs_add_dir_block2(ctx->fs->dblist, pb->ino, 0, 1);
4723         if (pctx->errcode)
4724                 goto err;
4725
4726         return;
4727 err:
4728         pctx->blk = 0;
4729         pctx->num = 0;
4730         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
4731         ctx->flags |= E2F_FLAG_ABORT;
4732 }
4733
4734 /*
4735  * This subroutine is called on each inode to account for all of the
4736  * blocks used by that inode.
4737  */
4738 static void check_blocks(e2fsck_t ctx, struct problem_context *pctx,
4739                          char *block_buf, const struct ea_quota *ea_ibody_quota)
4740 {
4741         ext2_filsys fs = ctx->fs;
4742         struct process_block_struct pb;
4743         ext2_ino_t      ino = pctx->ino;
4744         struct ext2_inode *inode = pctx->inode;
4745         unsigned        bad_size = 0;
4746         int             dirty_inode = 0;
4747         int             extent_fs;
4748         int             inlinedata_fs;
4749         __u64           size;
4750         struct ea_quota ea_block_quota;
4751
4752         pb.ino = ino;
4753         pb.num_blocks = EXT2FS_B2C(ctx->fs,
4754                                    ea_ibody_quota ? ea_ibody_quota->blocks : 0);
4755         pb.last_block = ~0;
4756         pb.last_init_lblock = -1;
4757         pb.last_db_block = -1;
4758         pb.num_illegal_blocks = 0;
4759         pb.suppress = 0; pb.clear = 0;
4760         pb.fragmented = 0;
4761         pb.compressed = 0;
4762         pb.previous_block = 0;
4763         pb.is_dir = LINUX_S_ISDIR(inode->i_mode);
4764         pb.is_reg = LINUX_S_ISREG(inode->i_mode);
4765         pb.max_blocks = 1U << (31 - fs->super->s_log_block_size);
4766         pb.inode = inode;
4767         pb.pctx = pctx;
4768         pb.ctx = ctx;
4769         pb.inode_modified = 0;
4770         pb.eti.force_rebuild = 0;
4771         pctx->ino = ino;
4772         pctx->errcode = 0;
4773
4774         extent_fs = ext2fs_has_feature_extents(ctx->fs->super);
4775         inlinedata_fs = ext2fs_has_feature_inline_data(ctx->fs->super);
4776
4777         if (check_ext_attr(ctx, pctx, block_buf, &ea_block_quota)) {
4778                 if (e2fsck_should_abort(ctx))
4779                         goto out;
4780                 pb.num_blocks += EXT2FS_B2C(ctx->fs, ea_block_quota.blocks);
4781         }
4782
4783         if (inlinedata_fs && (inode->i_flags & EXT4_INLINE_DATA_FL))
4784                 check_blocks_inline_data(ctx, pctx, &pb);
4785         else if (ext2fs_inode_has_valid_blocks2(fs, inode)) {
4786                 if (extent_fs && (inode->i_flags & EXT4_EXTENTS_FL))
4787                         check_blocks_extents(ctx, pctx, &pb);
4788                 else {
4789                         int flags;
4790                         /*
4791                          * If we've modified the inode, write it out before
4792                          * iterate() tries to use it.
4793                          */
4794                         if (dirty_inode) {
4795                                 e2fsck_write_inode(ctx, ino, inode,
4796                                                    "check_blocks");
4797                                 dirty_inode = 0;
4798                         }
4799                         flags = fs->flags;
4800                         fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4801                         pctx->errcode = ext2fs_block_iterate3(fs, ino,
4802                                                 pb.is_dir ? BLOCK_FLAG_HOLE : 0,
4803                                                 block_buf, process_block, &pb);
4804                         /*
4805                          * We do not have uninitialized extents in non extent
4806                          * files.
4807                          */
4808                         pb.last_init_lblock = pb.last_block;
4809                         /*
4810                          * If iterate() changed a block mapping, we have to
4811                          * re-read the inode.  If we decide to clear the
4812                          * inode after clearing some stuff, we'll re-write the
4813                          * bad mappings into the inode!
4814                          */
4815                         if (pb.inode_modified)
4816                                 e2fsck_read_inode(ctx, ino, inode,
4817                                                   "check_blocks");
4818                         fs->flags = (flags & EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4819                                     (fs->flags & ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4820
4821                         if (ctx->options & E2F_OPT_CONVERT_BMAP) {
4822 #ifdef DEBUG
4823                                 printf("bmap rebuild ino=%d\n", ino);
4824 #endif
4825                                 if (!LINUX_S_ISDIR(inode->i_mode) ||
4826                                     !e2fsck_dir_will_be_rehashed(ctx, ino))
4827                                         e2fsck_rebuild_extents_later(ctx, ino);
4828                         }
4829                 }
4830         }
4831         end_problem_latch(ctx, PR_LATCH_BLOCK);
4832         end_problem_latch(ctx, PR_LATCH_TOOBIG);
4833         if (e2fsck_should_abort(ctx))
4834                 goto out;
4835         if (pctx->errcode)
4836                 fix_problem(ctx, PR_1_BLOCK_ITERATE, pctx);
4837
4838         if (pb.fragmented && pb.num_blocks < fs->super->s_blocks_per_group) {
4839                 if (LINUX_S_ISDIR(inode->i_mode))
4840                         ctx->fs_fragmented_dir++;
4841                 else
4842                         ctx->fs_fragmented++;
4843         }
4844
4845         if (pb.clear) {
4846                 e2fsck_clear_inode(ctx, ino, inode, E2F_FLAG_RESTART,
4847                                    "check_blocks");
4848                 return;
4849         }
4850
4851         if (inode->i_flags & EXT2_INDEX_FL) {
4852                 if (handle_htree(ctx, pctx, ino, inode, block_buf)) {
4853                         inode->i_flags &= ~EXT2_INDEX_FL;
4854                         dirty_inode++;
4855                 } else {
4856                         e2fsck_add_dx_dir(ctx, ino, inode, pb.last_block+1);
4857                 }
4858         }
4859
4860         if (!pb.num_blocks && pb.is_dir &&
4861             !(inode->i_flags & EXT4_INLINE_DATA_FL)) {
4862                 if (fix_problem(ctx, PR_1_ZERO_LENGTH_DIR, pctx)) {
4863                         e2fsck_clear_inode(ctx, ino, inode, 0, "check_blocks");
4864                         ctx->fs_directory_count--;
4865                         return;
4866                 }
4867         }
4868
4869         if (ino != quota_type2inum(PRJQUOTA, fs->super) &&
4870             ino != fs->super->s_orphan_file_inum &&
4871             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INODE(ctx->fs->super)) &&
4872             !(inode->i_flags & EXT4_EA_INODE_FL)) {
4873                 quota_data_add(ctx->qctx, (struct ext2_inode_large *) inode,
4874                                ino,
4875                                pb.num_blocks * EXT2_CLUSTER_SIZE(fs->super));
4876                 quota_data_inodes(ctx->qctx, (struct ext2_inode_large *) inode,
4877                                   ino, (ea_ibody_quota ?
4878                                         ea_ibody_quota->inodes : 0) +
4879                                                 ea_block_quota.inodes + 1);
4880         }
4881
4882         if (!ext2fs_has_feature_huge_file(fs->super) ||
4883             !(inode->i_flags & EXT4_HUGE_FILE_FL))
4884                 pb.num_blocks *= (fs->blocksize / 512);
4885         pb.num_blocks *= EXT2FS_CLUSTER_RATIO(fs);
4886 #if 0
4887         printf("inode %u, i_size = %u, last_block = %llu, i_blocks=%llu, num_blocks = %llu\n",
4888                ino, inode->i_size, (unsigned long long) pb.last_block,
4889                (unsigned long long) ext2fs_inode_i_blocks(fs, inode),
4890                (unsigned long long) pb.num_blocks);
4891 #endif
4892         size = EXT2_I_SIZE(inode);
4893         if (pb.is_dir) {
4894                 unsigned nblock = size >> EXT2_BLOCK_SIZE_BITS(fs->super);
4895                 if (inode->i_flags & EXT4_INLINE_DATA_FL) {
4896                         int flags;
4897                         size_t sz = 0;
4898                         errcode_t err;
4899
4900                         flags = ctx->fs->flags;
4901                         ctx->fs->flags |= EXT2_FLAG_IGNORE_CSUM_ERRORS;
4902                         err = ext2fs_inline_data_size(ctx->fs, pctx->ino,
4903                                                       &sz);
4904                         ctx->fs->flags = (flags &
4905                                           EXT2_FLAG_IGNORE_CSUM_ERRORS) |
4906                                          (ctx->fs->flags &
4907                                           ~EXT2_FLAG_IGNORE_CSUM_ERRORS);
4908                         if (err || sz != size) {
4909                                 bad_size = 7;
4910                                 pctx->num = sz;
4911                         }
4912                 } else if (size & (fs->blocksize - 1))
4913                         bad_size = 5;
4914                 else if (nblock > (pb.last_block + 1))
4915                         bad_size = 1;
4916                 else if (nblock < (pb.last_block + 1)) {
4917                         if (((pb.last_block + 1) - nblock) >
4918                             fs->super->s_prealloc_dir_blocks)
4919                                 bad_size = 2;
4920                 }
4921         } else {
4922                 if ((pb.last_init_lblock >= 0) &&
4923                     /* Do not allow initialized allocated blocks past i_size*/
4924                     (size < (__u64)pb.last_init_lblock * fs->blocksize) &&
4925                     !(inode->i_flags & EXT4_VERITY_FL))
4926                         bad_size = 3;
4927                 else if (!(extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4928                          size > ext2_max_sizes[fs->super->s_log_block_size])
4929                         /* too big for a direct/indirect-mapped file */
4930                         bad_size = 4;
4931                 else if ((extent_fs && (inode->i_flags & EXT4_EXTENTS_FL)) &&
4932                          size >
4933                          ((1ULL << (32 + EXT2_BLOCK_SIZE_BITS(fs->super))) - 1))
4934                         /* too big for an extent-based file - 32bit ee_block */
4935                         bad_size = 6;
4936         }
4937         /* i_size for symlinks is checked elsewhere */
4938         if (bad_size && !LINUX_S_ISLNK(inode->i_mode)) {
4939                 /* Did inline_data set pctx->num earlier? */
4940                 if (bad_size != 7)
4941                         pctx->num = (pb.last_block + 1) * fs->blocksize;
4942                 pctx->group = bad_size;
4943                 if (fix_problem(ctx, PR_1_BAD_I_SIZE, pctx)) {
4944                         ext2fs_inode_size_set(fs, inode, pctx->num);
4945                         if (EXT2_I_SIZE(inode) == 0 &&
4946                             (inode->i_flags & EXT4_INLINE_DATA_FL)) {
4947                                 memset(inode->i_block, 0,
4948                                        sizeof(inode->i_block));
4949                                 inode->i_flags &= ~EXT4_INLINE_DATA_FL;
4950                         }
4951                         dirty_inode++;
4952                 }
4953                 pctx->num = 0;
4954         }
4955         if (LINUX_S_ISREG(inode->i_mode) &&
4956             ext2fs_needs_large_file_feature(EXT2_I_SIZE(inode)))
4957                 ctx->large_files++;
4958         if ((fs->super->s_creator_os != EXT2_OS_HURD) &&
4959             ((pb.num_blocks != ext2fs_inode_i_blocks(fs, inode)) ||
4960              (ext2fs_has_feature_huge_file(fs->super) &&
4961               (inode->i_flags & EXT4_HUGE_FILE_FL) &&
4962               (inode->osd2.linux2.l_i_blocks_hi != 0)))) {
4963                 pctx->num = pb.num_blocks;
4964                 if (fix_problem(ctx, PR_1_BAD_I_BLOCKS, pctx)) {
4965                         inode->i_blocks = pb.num_blocks;
4966                         inode->osd2.linux2.l_i_blocks_hi = pb.num_blocks >> 32;
4967                         dirty_inode++;
4968                 }
4969                 pctx->num = 0;
4970         }
4971
4972         /*
4973          * The kernel gets mad if we ask it to allocate bigalloc clusters to
4974          * a block mapped file, so rebuild it as an extent file.  We can skip
4975          * symlinks because they're never rewritten.
4976          */
4977         if (ext2fs_has_feature_bigalloc(fs->super) &&
4978             (LINUX_S_ISREG(inode->i_mode) || LINUX_S_ISDIR(inode->i_mode)) &&
4979             ext2fs_inode_data_blocks2(fs, inode) > 0 &&
4980             (ino == EXT2_ROOT_INO || ino >= EXT2_FIRST_INO(fs->super)) &&
4981             !(inode->i_flags & (EXT4_EXTENTS_FL | EXT4_INLINE_DATA_FL)) &&
4982             fix_problem(ctx, PR_1_NO_BIGALLOC_BLOCKMAP_FILES, pctx)) {
4983                 pctx->errcode = e2fsck_rebuild_extents_later(ctx, ino);
4984                 if (pctx->errcode)
4985                         goto out;
4986         }
4987
4988         if (ctx->dirs_to_hash && pb.is_dir &&
4989             !(ctx->lost_and_found && ctx->lost_and_found == ino) &&
4990             !(inode->i_flags & EXT2_INDEX_FL) &&
4991             ((inode->i_size / fs->blocksize) >= 3))
4992                 e2fsck_rehash_dir_later(ctx, ino);
4993
4994 out:
4995         if (dirty_inode)
4996                 e2fsck_write_inode(ctx, ino, inode, "check_blocks");
4997 }
4998
#if 0
/*
 * Helper function called by process block when an illegal block is
 * found.  It returns a description about why the block is illegal.
 *
 * The returned pointer refers to a function-local static buffer, so the
 * text is overwritten by the next call.  This code is currently compiled
 * out by the surrounding #if 0.
 */
static char *describe_illegal_block(ext2_filsys fs, blk64_t block)
{
	blk64_t	super;
	dgrp_t	i;
	static char	problem[80];

	super = fs->super->s_first_data_block;
	snprintf(problem, sizeof(problem), "%s",
		 "PROGRAMMING ERROR: Unknown reason for illegal block");
	if (block < super) {
		/* blk64_t is 64 bits wide: print it as unsigned long long */
		snprintf(problem, sizeof(problem), "< FIRSTBLOCK (%llu)",
			 (unsigned long long) super);
		return(problem);
	} else if (block >= ext2fs_blocks_count(fs->super)) {
		snprintf(problem, sizeof(problem), "> BLOCKS (%llu)",
			 (unsigned long long) ext2fs_blocks_count(fs->super));
		return(problem);
	}
	/* Walk the groups; "super" tracks the first block of group i. */
	for (i = 0; i < fs->group_desc_count; i++) {
		if (block == super) {
			snprintf(problem, sizeof(problem),
				 "is the superblock in group %u", i);
			break;
		}
		if (block > super &&
		    block <= (super + fs->desc_blocks)) {
			snprintf(problem, sizeof(problem),
				 "is in the group descriptors "
				 "of group %u", i);
			break;
		}
		if (block == ext2fs_block_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the block bitmap of group %u", i);
			break;
		}
		if (block == ext2fs_inode_bitmap_loc(fs, i)) {
			snprintf(problem, sizeof(problem),
				 "is the inode bitmap of group %u", i);
			break;
		}
		if (block >= ext2fs_inode_table_loc(fs, i) &&
		    (block < ext2fs_inode_table_loc(fs, i)
		     + fs->inode_blocks_per_group)) {
			snprintf(problem, sizeof(problem),
				 "is in the inode table of group %u", i);
			break;
		}
		super += fs->super->s_blocks_per_group;
	}
	return(problem);
}
#endif
5050
5051 /*
5052  * This is a helper function for check_blocks().
5053  */
5054 static int process_block(ext2_filsys fs,
5055                   blk64_t       *block_nr,
5056                   e2_blkcnt_t blockcnt,
5057                   blk64_t ref_block EXT2FS_ATTR((unused)),
5058                   int ref_offset EXT2FS_ATTR((unused)),
5059                   void *priv_data)
5060 {
5061         struct process_block_struct *p;
5062         struct problem_context *pctx;
5063         blk64_t blk = *block_nr;
5064         int     ret_code = 0;
5065         problem_t       problem = 0;
5066         e2fsck_t        ctx;
5067
5068         p = (struct process_block_struct *) priv_data;
5069         pctx = p->pctx;
5070         ctx = p->ctx;
5071
5072         /*
5073          * For a directory, add logical block zero for processing even if it's
5074          * not mapped or we'll be perennially stuck with broken "." and ".."
5075          * entries.
5076          */
5077         if (p->is_dir && blockcnt == 0 && blk == 0) {
5078                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino, 0, 0);
5079                 if (pctx->errcode) {
5080                         pctx->blk = blk;
5081                         pctx->num = blockcnt;
5082                         goto failed_add_dir_block;
5083                 }
5084                 p->last_db_block++;
5085         }
5086
5087         if (blk == 0)
5088                 return 0;
5089
5090 #if 0
5091         printf("Process_block, inode %lu, block %u, #%d\n", p->ino, blk,
5092                blockcnt);
5093 #endif
5094
5095         /*
5096          * Simplistic fragmentation check.  We merely require that the
5097          * file be contiguous.  (Which can never be true for really
5098          * big files that are greater than a block group.)
5099          */
5100         if (p->previous_block && p->ino != EXT2_RESIZE_INO) {
5101                 if (p->previous_block+1 != blk) {
5102                         if (ctx->options & E2F_OPT_FRAGCHECK) {
5103                                 char type = '?';
5104
5105                                 if (p->is_dir)
5106                                         type = 'd';
5107                                 else if (p->is_reg)
5108                                         type = 'f';
5109
5110                                 printf(_("%6lu(%c): expecting %6lu "
5111                                          "got phys %6lu (blkcnt %lld)\n"),
5112                                        (unsigned long) pctx->ino, type,
5113                                        (unsigned long) p->previous_block+1,
5114                                        (unsigned long) blk,
5115                                        (long long) blockcnt);
5116                         }
5117                         p->fragmented = 1;
5118                 }
5119         }
5120
5121         if (p->is_dir && !ext2fs_has_feature_largedir(fs->super) &&
5122             !pctx->inode->i_size_high &&
5123             blockcnt > (1 << (21 - fs->super->s_log_block_size)))
5124                 problem = PR_1_TOOBIG_DIR;
5125         if (p->is_dir && p->num_blocks + 1 >= p->max_blocks)
5126                 problem = PR_1_TOOBIG_DIR;
5127         if (p->is_reg && p->num_blocks + 1 >= p->max_blocks)
5128                 problem = PR_1_TOOBIG_REG;
5129         if (!p->is_dir && !p->is_reg && blockcnt > 0)
5130                 problem = PR_1_TOOBIG_SYMLINK;
5131
5132         if (blk < fs->super->s_first_data_block ||
5133             blk >= ext2fs_blocks_count(fs->super))
5134                 problem = PR_1_ILLEGAL_BLOCK_NUM;
5135
5136         /*
5137          * If this IND/DIND/TIND block is squatting atop some critical metadata
5138          * (group descriptors, superblock, bitmap, inode table), any write to
5139          * "fix" mapping problems will destroy the metadata.  We'll let pass 1b
5140          * fix that and restart fsck.
5141          */
5142         if (blockcnt < 0 &&
5143             p->ino != EXT2_RESIZE_INO &&
5144             blk < ctx->fs->super->s_blocks_count &&
5145             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk)) {
5146                 pctx->blk = blk;
5147                 fix_problem(ctx, PR_1_CRITICAL_METADATA_COLLISION, pctx);
5148                 if ((ctx->options & E2F_OPT_NO) == 0)
5149                         ctx->flags |= E2F_FLAG_RESTART_LATER;
5150         }
5151
5152         if (problem) {
5153                 p->num_illegal_blocks++;
5154                 /*
5155                  * A bit of subterfuge here -- we're trying to fix a block
5156                  * mapping, but the IND/DIND/TIND block could have collided
5157                  * with some critical metadata.  So, fix the in-core mapping so
5158                  * iterate won't go insane, but return 0 instead of
5159                  * BLOCK_CHANGED so that it won't write the remapping out to
5160                  * our multiply linked block.
5161                  *
5162                  * Even if we previously determined that an *IND block
5163                  * conflicts with critical metadata, we must still try to
5164                  * iterate the *IND block as if it is an *IND block to find and
5165                  * mark the blocks it points to.  Better to be overly cautious
5166                  * with the used_blocks map so that we don't move the *IND
5167                  * block to a block that's really in use!
5168                  */
5169                 if (p->ino != EXT2_RESIZE_INO &&
5170                     ref_block != 0 &&
5171                     ext2fs_test_block_bitmap2(ctx->block_metadata_map,
5172                                               ref_block)) {
5173                         *block_nr = 0;
5174                         return 0;
5175                 }
5176                 if (!p->suppress && (p->num_illegal_blocks % 12) == 0) {
5177                         if (fix_problem(ctx, PR_1_TOO_MANY_BAD_BLOCKS, pctx)) {
5178                                 p->clear = 1;
5179                                 return BLOCK_ABORT;
5180                         }
5181                         if (fix_problem(ctx, PR_1_SUPPRESS_MESSAGES, pctx)) {
5182                                 p->suppress = 1;
5183                                 set_latch_flags(PR_LATCH_BLOCK,
5184                                                 PRL_SUPPRESS, 0);
5185                         }
5186                 }
5187                 pctx->blk = blk;
5188                 pctx->blkcount = blockcnt;
5189                 if (fix_problem(ctx, problem, pctx)) {
5190                         blk = *block_nr = 0;
5191                         ret_code = BLOCK_CHANGED;
5192                         p->inode_modified = 1;
5193                         /*
5194                          * If the directory block is too big and is beyond the
5195                          * end of the FS, don't bother trying to add it for
5196                          * processing -- the kernel would never have created a
5197                          * directory this large, and we risk an ENOMEM abort.
5198                          * In any case, the toobig handler for extent-based
5199                          * directories also doesn't feed toobig blocks to
5200                          * pass 2.
5201                          */
5202                         if (problem == PR_1_TOOBIG_DIR)
5203                                 return ret_code;
5204                         goto mark_dir;
5205                 } else
5206                         return 0;
5207         }
5208
5209         if (p->ino == EXT2_RESIZE_INO) {
5210                 /*
5211                  * The resize inode has already be sanity checked
5212                  * during pass #0 (the superblock checks).  All we
5213                  * have to do is mark the double indirect block as
5214                  * being in use; all of the other blocks are handled
5215                  * by mark_table_blocks()).
5216                  */
5217                 if (blockcnt == BLOCK_COUNT_DIND)
5218                         mark_block_used(ctx, blk);
5219                 p->num_blocks++;
5220         } else if (!(ctx->fs->cluster_ratio_bits &&
5221                      p->previous_block &&
5222                      (EXT2FS_B2C(ctx->fs, blk) ==
5223                       EXT2FS_B2C(ctx->fs, p->previous_block)) &&
5224                      (blk & EXT2FS_CLUSTER_MASK(ctx->fs)) ==
5225                      ((unsigned) blockcnt & EXT2FS_CLUSTER_MASK(ctx->fs)))) {
5226                 mark_block_used(ctx, blk);
5227                 p->num_blocks++;
5228         } else if (has_unaligned_cluster_map(ctx, p->previous_block,
5229                                              p->last_block, blk, blockcnt)) {
5230                 pctx->blk = blockcnt;
5231                 pctx->blk2 = blk;
5232                 fix_problem(ctx, PR_1_MISALIGNED_CLUSTER, pctx);
5233                 mark_block_used(ctx, blk);
5234                 mark_block_used(ctx, blk);
5235         }
5236         if (blockcnt >= 0)
5237                 p->last_block = blockcnt;
5238         p->previous_block = blk;
5239 mark_dir:
5240         if (p->is_dir && (blockcnt >= 0)) {
5241                 while (++p->last_db_block < blockcnt) {
5242                         pctx->errcode = ext2fs_add_dir_block2(fs->dblist,
5243                                                               p->ino, 0,
5244                                                               p->last_db_block);
5245                         if (pctx->errcode) {
5246                                 pctx->blk = 0;
5247                                 pctx->num = p->last_db_block;
5248                                 goto failed_add_dir_block;
5249                         }
5250                 }
5251                 pctx->errcode = ext2fs_add_dir_block2(fs->dblist, p->ino,
5252                                                       blk, blockcnt);
5253                 if (pctx->errcode) {
5254                         pctx->blk = blk;
5255                         pctx->num = blockcnt;
5256                 failed_add_dir_block:
5257                         fix_problem(ctx, PR_1_ADD_DBLOCK, pctx);
5258                         /* Should never get here */
5259                         ctx->flags |= E2F_FLAG_ABORT;
5260                         return BLOCK_ABORT;
5261                 }
5262         }
5263         return ret_code;
5264 }
5265
5266 static int process_bad_block(ext2_filsys fs,
5267                       blk64_t *block_nr,
5268                       e2_blkcnt_t blockcnt,
5269                       blk64_t ref_block EXT2FS_ATTR((unused)),
5270                       int ref_offset EXT2FS_ATTR((unused)),
5271                       void *priv_data)
5272 {
5273         struct process_block_struct *p;
5274         blk64_t         blk = *block_nr;
5275         blk64_t         first_block;
5276         dgrp_t          i;
5277         struct problem_context *pctx;
5278         e2fsck_t        ctx;
5279
5280         if (!blk)
5281                 return 0;
5282
5283         p = (struct process_block_struct *) priv_data;
5284         ctx = p->ctx;
5285         pctx = p->pctx;
5286
5287         pctx->ino = EXT2_BAD_INO;
5288         pctx->blk = blk;
5289         pctx->blkcount = blockcnt;
5290
5291         if ((blk < fs->super->s_first_data_block) ||
5292             (blk >= ext2fs_blocks_count(fs->super))) {
5293                 if (fix_problem(ctx, PR_1_BB_ILLEGAL_BLOCK_NUM, pctx)) {
5294                         *block_nr = 0;
5295                         return BLOCK_CHANGED;
5296                 } else
5297                         return 0;
5298         }
5299
5300         if (blockcnt < 0) {
5301                 if (ext2fs_test_block_bitmap2(p->fs_meta_blocks, blk)) {
5302                         p->bbcheck = 1;
5303                         if (fix_problem(ctx, PR_1_BB_FS_BLOCK, pctx)) {
5304                                 *block_nr = 0;
5305                                 return BLOCK_CHANGED;
5306                         }
5307                 } else if (is_blocks_used(ctx, blk, 1)) {
5308                         p->bbcheck = 1;
5309                         if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK,
5310                                         pctx)) {
5311                                 *block_nr = 0;
5312                                 return BLOCK_CHANGED;
5313                         }
5314                         if (e2fsck_should_abort(ctx))
5315                                 return BLOCK_ABORT;
5316                 } else {
5317                         mark_block_used(ctx, blk);
5318                 }
5319                 return 0;
5320         }
5321 #if 0
5322         printf ("DEBUG: Marking %u as bad.\n", blk);
5323 #endif
5324         ctx->fs_badblocks_count++;
5325         /*
5326          * If the block is not used, then mark it as used and return.
5327          * If it is already marked as found, this must mean that
5328          * there's an overlap between the filesystem table blocks
5329          * (bitmaps and inode table) and the bad block list.
5330          */
5331         if (!is_blocks_used(ctx, blk, 1)) {
5332                 ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5333                 return 0;
5334         }
5335         /*
5336          * Try to find the where the filesystem block was used...
5337          */
5338         first_block = fs->super->s_first_data_block;
5339
5340         for (i = 0; i < fs->group_desc_count; i++ ) {
5341                 pctx->group = i;
5342                 pctx->blk = blk;
5343                 if (!ext2fs_bg_has_super(fs, i))
5344                         goto skip_super;
5345                 if (blk == first_block) {
5346                         if (i == 0) {
5347                                 if (fix_problem(ctx,
5348                                                 PR_1_BAD_PRIMARY_SUPERBLOCK,
5349                                                 pctx)) {
5350                                         *block_nr = 0;
5351                                         return BLOCK_CHANGED;
5352                                 }
5353                                 return 0;
5354                         }
5355                         fix_problem(ctx, PR_1_BAD_SUPERBLOCK, pctx);
5356                         return 0;
5357                 }
5358                 if ((blk > first_block) &&
5359                     (blk <= first_block + fs->desc_blocks)) {
5360                         if (i == 0) {
5361                                 pctx->blk = *block_nr;
5362                                 if (fix_problem(ctx,
5363                         PR_1_BAD_PRIMARY_GROUP_DESCRIPTOR, pctx)) {
5364                                         *block_nr = 0;
5365                                         return BLOCK_CHANGED;
5366                                 }
5367                                 return 0;
5368                         }
5369                         fix_problem(ctx, PR_1_BAD_GROUP_DESCRIPTORS, pctx);
5370                         return 0;
5371                 }
5372         skip_super:
5373                 if (blk == ext2fs_block_bitmap_loc(fs, i)) {
5374                         if (fix_problem(ctx, PR_1_BB_BAD_BLOCK, pctx)) {
5375                                 ctx->invalid_block_bitmap_flag[i]++;
5376                                 ctx->invalid_bitmaps++;
5377                         }
5378                         return 0;
5379                 }
5380                 if (blk == ext2fs_inode_bitmap_loc(fs, i)) {
5381                         if (fix_problem(ctx, PR_1_IB_BAD_BLOCK, pctx)) {
5382                                 ctx->invalid_inode_bitmap_flag[i]++;
5383                                 ctx->invalid_bitmaps++;
5384                         }
5385                         return 0;
5386                 }
5387                 if ((blk >= ext2fs_inode_table_loc(fs, i)) &&
5388                     (blk < (ext2fs_inode_table_loc(fs, i) +
5389                             fs->inode_blocks_per_group))) {
5390                         /*
5391                          * If there are bad blocks in the inode table,
5392                          * the inode scan code will try to do
5393                          * something reasonable automatically.
5394                          */
5395                         return 0;
5396                 }
5397                 first_block += fs->super->s_blocks_per_group;
5398         }
5399         /*
5400          * If we've gotten to this point, then the only
5401          * possibility is that the bad block inode meta data
5402          * is using a bad block.
5403          */
5404         if ((blk == p->inode->i_block[EXT2_IND_BLOCK]) ||
5405             (blk == p->inode->i_block[EXT2_DIND_BLOCK]) ||
5406             (blk == p->inode->i_block[EXT2_TIND_BLOCK])) {
5407                 p->bbcheck = 1;
5408                 if (fix_problem(ctx, PR_1_BBINODE_BAD_METABLOCK, pctx)) {
5409                         *block_nr = 0;
5410                         return BLOCK_CHANGED;
5411                 }
5412                 if (e2fsck_should_abort(ctx))
5413                         return BLOCK_ABORT;
5414                 return 0;
5415         }
5416
5417         pctx->group = -1;
5418
5419         /* Warn user that the block wasn't claimed */
5420         fix_problem(ctx, PR_1_PROGERR_CLAIMED_BLOCK, pctx);
5421
5422         return 0;
5423 }
5424
5425 static void new_table_block(e2fsck_t ctx, blk64_t first_block, dgrp_t group,
5426                             const char *name, int num, blk64_t *new_block)
5427 {
5428         ext2_filsys fs = ctx->fs;
5429         dgrp_t          last_grp;
5430         blk64_t         old_block = *new_block;
5431         blk64_t         last_block;
5432         dgrp_t          flexbg;
5433         unsigned        flexbg_size;
5434         int             i, is_flexbg;
5435         char            *buf;
5436         struct problem_context  pctx;
5437
5438         clear_problem_context(&pctx);
5439
5440         pctx.group = group;
5441         pctx.blk = old_block;
5442         pctx.str = name;
5443
5444         /*
5445          * For flex_bg filesystems, first try to allocate the metadata
5446          * within the flex_bg, and if that fails then try finding the
5447          * space anywhere in the filesystem.
5448          */
5449         is_flexbg = ext2fs_has_feature_flex_bg(fs->super);
5450         if (is_flexbg) {
5451                 flexbg_size = 1U << fs->super->s_log_groups_per_flex;
5452                 flexbg = group / flexbg_size;
5453                 first_block = ext2fs_group_first_block2(fs,
5454                                                         flexbg_size * flexbg);
5455                 last_grp = group | (flexbg_size - 1);
5456                 if (last_grp >= fs->group_desc_count)
5457                         last_grp = fs->group_desc_count - 1;
5458                 last_block = ext2fs_group_last_block2(fs, last_grp);
5459         } else
5460                 last_block = ext2fs_group_last_block2(fs, group);
5461         pctx.errcode = ext2fs_get_free_blocks2(fs, first_block, last_block,
5462                                                num, ctx->block_found_map,
5463                                                new_block);
5464         if (is_flexbg && (pctx.errcode == EXT2_ET_BLOCK_ALLOC_FAIL))
5465                 pctx.errcode = ext2fs_get_free_blocks2(fs,
5466                                 fs->super->s_first_data_block,
5467                                 ext2fs_blocks_count(fs->super),
5468                                 num, ctx->block_found_map, new_block);
5469         if (pctx.errcode) {
5470                 pctx.num = num;
5471                 fix_problem(ctx, PR_1_RELOC_BLOCK_ALLOCATE, &pctx);
5472                 ext2fs_unmark_valid(fs);
5473                 ctx->flags |= E2F_FLAG_ABORT;
5474                 return;
5475         }
5476         pctx.errcode = ext2fs_get_mem(fs->blocksize, &buf);
5477         if (pctx.errcode) {
5478                 fix_problem(ctx, PR_1_RELOC_MEMORY_ALLOCATE, &pctx);
5479                 ext2fs_unmark_valid(fs);
5480                 ctx->flags |= E2F_FLAG_ABORT;
5481                 return;
5482         }
5483         ext2fs_mark_super_dirty(fs);
5484         fs->flags &= ~EXT2_FLAG_MASTER_SB_ONLY;
5485         pctx.blk2 = *new_block;
5486         fix_problem(ctx, (old_block ? PR_1_RELOC_FROM_TO :
5487                           PR_1_RELOC_TO), &pctx);
5488         pctx.blk2 = 0;
5489         for (i = 0; i < num; i++) {
5490                 pctx.blk = i;
5491                 ext2fs_mark_block_bitmap2(ctx->block_found_map, (*new_block)+i);
5492                 if (old_block) {
5493                         pctx.errcode = io_channel_read_blk64(fs->io,
5494                                    old_block + i, 1, buf);
5495                         if (pctx.errcode)
5496                                 fix_problem(ctx, PR_1_RELOC_READ_ERR, &pctx);
5497                         pctx.blk = (*new_block) + i;
5498                         pctx.errcode = io_channel_write_blk64(fs->io, pctx.blk,
5499                                                               1, buf);
5500                 } else {
5501                         pctx.blk = (*new_block) + i;
5502                         pctx.errcode = ext2fs_zero_blocks2(fs, pctx.blk, 1,
5503                                                            NULL, NULL);
5504                 }
5505
5506                 if (pctx.errcode)
5507                         fix_problem(ctx, PR_1_RELOC_WRITE_ERR, &pctx);
5508         }
5509         ext2fs_free_mem(&buf);
5510 }
5511
5512 /*
5513  * This routine gets called at the end of pass 1 if bad blocks are
5514  * detected in the superblock, group descriptors, inode_bitmaps, or
5515  * block bitmaps.  At this point, all of the blocks have been mapped
5516  * out, so we can try to allocate new block(s) to replace the bad
5517  * blocks.
5518  */
5519 static void handle_fs_bad_blocks(e2fsck_t ctx)
5520 {
5521         ext2_filsys fs = ctx->fs;
5522         dgrp_t          i;
5523         blk64_t         first_block;
5524         blk64_t         new_blk;
5525
5526         for (i = 0; i < fs->group_desc_count; i++) {
5527                 first_block = ext2fs_group_first_block2(fs, i);
5528
5529                 if (ctx->invalid_block_bitmap_flag[i]) {
5530                         new_blk = ext2fs_block_bitmap_loc(fs, i);
5531                         new_table_block(ctx, first_block, i, _("block bitmap"),
5532                                         1, &new_blk);
5533                         ext2fs_block_bitmap_loc_set(fs, i, new_blk);
5534                 }
5535                 if (ctx->invalid_inode_bitmap_flag[i]) {
5536                         new_blk = ext2fs_inode_bitmap_loc(fs, i);
5537                         new_table_block(ctx, first_block, i, _("inode bitmap"),
5538                                         1, &new_blk);
5539                         ext2fs_inode_bitmap_loc_set(fs, i, new_blk);
5540                 }
5541                 if (ctx->invalid_inode_table_flag[i]) {
5542                         new_blk = ext2fs_inode_table_loc(fs, i);
5543                         new_table_block(ctx, first_block, i, _("inode table"),
5544                                         fs->inode_blocks_per_group,
5545                                         &new_blk);
5546                         ext2fs_inode_table_loc_set(fs, i, new_blk);
5547                         ctx->flags |= E2F_FLAG_RESTART;
5548                 }
5549         }
5550         ctx->invalid_bitmaps = 0;
5551 }
5552
5553 /*
5554  * This routine marks all blocks which are used by the superblock,
5555  * group descriptors, inode bitmaps, and block bitmaps.
5556  */
5557 static void mark_table_blocks(e2fsck_t ctx)
5558 {
5559         ext2_filsys fs = ctx->fs;
5560         blk64_t b;
5561         dgrp_t  i;
5562         unsigned int    j;
5563         struct problem_context pctx;
5564
5565         clear_problem_context(&pctx);
5566
5567         for (i = 0; i < fs->group_desc_count; i++) {
5568                 pctx.group = i;
5569
5570                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_found_map);
5571                 ext2fs_reserve_super_and_bgd(fs, i, ctx->block_metadata_map);
5572
5573                 /*
5574                  * Mark the blocks used for the inode table
5575                  */
5576                 if (ext2fs_inode_table_loc(fs, i)) {
5577                         for (j = 0, b = ext2fs_inode_table_loc(fs, i);
5578                              j < fs->inode_blocks_per_group;
5579                              j++, b++) {
5580                                 if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5581                                                              b)) {
5582                                         pctx.blk = b;
5583                                         if (!ctx->invalid_inode_table_flag[i] &&
5584                                             fix_problem(ctx,
5585                                                 PR_1_ITABLE_CONFLICT, &pctx)) {
5586                                                 ctx->invalid_inode_table_flag[i]++;
5587                                                 ctx->invalid_bitmaps++;
5588                                         }
5589                                 } else {
5590                                     ext2fs_mark_block_bitmap2(
5591                                                 ctx->block_found_map, b);
5592                                     ext2fs_mark_block_bitmap2(
5593                                                 ctx->block_metadata_map, b);
5594                                 }
5595                         }
5596                 }
5597
5598                 /*
5599                  * Mark block used for the block bitmap
5600                  */
5601                 if (ext2fs_block_bitmap_loc(fs, i)) {
5602                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5603                                      ext2fs_block_bitmap_loc(fs, i))) {
5604                                 pctx.blk = ext2fs_block_bitmap_loc(fs, i);
5605                                 if (fix_problem(ctx, PR_1_BB_CONFLICT, &pctx)) {
5606                                         ctx->invalid_block_bitmap_flag[i]++;
5607                                         ctx->invalid_bitmaps++;
5608                                 }
5609                         } else {
5610                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5611                                      ext2fs_block_bitmap_loc(fs, i));
5612                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5613                                      ext2fs_block_bitmap_loc(fs, i));
5614                         }
5615                 }
5616                 /*
5617                  * Mark block used for the inode bitmap
5618                  */
5619                 if (ext2fs_inode_bitmap_loc(fs, i)) {
5620                         if (ext2fs_test_block_bitmap2(ctx->block_found_map,
5621                                      ext2fs_inode_bitmap_loc(fs, i))) {
5622                                 pctx.blk = ext2fs_inode_bitmap_loc(fs, i);
5623                                 if (fix_problem(ctx, PR_1_IB_CONFLICT, &pctx)) {
5624                                         ctx->invalid_inode_bitmap_flag[i]++;
5625                                         ctx->invalid_bitmaps++;
5626                                 }
5627                         } else {
5628                             ext2fs_mark_block_bitmap2(ctx->block_metadata_map,
5629                                      ext2fs_inode_bitmap_loc(fs, i));
5630                             ext2fs_mark_block_bitmap2(ctx->block_found_map,
5631                                      ext2fs_inode_bitmap_loc(fs, i));
5632                         }
5633                 }
5634         }
5635 }
5636
/*
 * These subroutines short-circuit ext2fs_get_blocks and
 * ext2fs_check_directory; we use them since we already have the inode
 * structure, so there's no point in letting the ext2fs library read
 * the inode again.
 */
5643 static errcode_t pass1_get_blocks(ext2_filsys fs, ext2_ino_t ino,
5644                                   blk_t *blocks)
5645 {
5646         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5647         int     i;
5648
5649         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5650                 return EXT2_ET_CALLBACK_NOTHANDLED;
5651
5652         for (i=0; i < EXT2_N_BLOCKS; i++)
5653                 blocks[i] = ctx->stashed_inode->i_block[i];
5654         return 0;
5655 }
5656
5657 static errcode_t pass1_read_inode(ext2_filsys fs, ext2_ino_t ino,
5658                                   struct ext2_inode *inode)
5659 {
5660         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5661
5662         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5663                 return EXT2_ET_CALLBACK_NOTHANDLED;
5664         *inode = *ctx->stashed_inode;
5665         return 0;
5666 }
5667
5668 static errcode_t pass1_write_inode(ext2_filsys fs, ext2_ino_t ino,
5669                             struct ext2_inode *inode)
5670 {
5671         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5672
5673         if ((ino == ctx->stashed_ino) && ctx->stashed_inode &&
5674                 (inode != ctx->stashed_inode))
5675                 *ctx->stashed_inode = *inode;
5676         return EXT2_ET_CALLBACK_NOTHANDLED;
5677 }
5678
5679 static errcode_t pass1_check_directory(ext2_filsys fs, ext2_ino_t ino)
5680 {
5681         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5682
5683         if ((ino != ctx->stashed_ino) || !ctx->stashed_inode)
5684                 return EXT2_ET_CALLBACK_NOTHANDLED;
5685
5686         if (!LINUX_S_ISDIR(ctx->stashed_inode->i_mode))
5687                 return EXT2_ET_NO_DIRECTORY;
5688         return 0;
5689 }
5690
5691 static errcode_t e2fsck_get_alloc_block(ext2_filsys fs, blk64_t goal,
5692                                         blk64_t *ret)
5693 {
5694         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5695         errcode_t       retval;
5696         blk64_t         new_block;
5697
5698         if (ctx->block_found_map) {
5699                 retval = ext2fs_new_block2(fs, goal, ctx->block_found_map,
5700                                            &new_block);
5701                 if (retval)
5702                         return retval;
5703                 if (fs->block_map) {
5704                         ext2fs_mark_block_bitmap2(fs->block_map, new_block);
5705                         ext2fs_mark_bb_dirty(fs);
5706                 }
5707         } else {
5708                 if (!fs->block_map) {
5709                         retval = ext2fs_read_block_bitmap(fs);
5710                         if (retval)
5711                                 return retval;
5712                 }
5713
5714                 retval = ext2fs_new_block2(fs, goal, fs->block_map, &new_block);
5715                 if (retval)
5716                         return retval;
5717         }
5718
5719         *ret = new_block;
5720         return (0);
5721 }
5722
5723 static errcode_t e2fsck_new_range(ext2_filsys fs, int flags, blk64_t goal,
5724                                   blk64_t len, blk64_t *pblk, blk64_t *plen)
5725 {
5726         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5727         errcode_t       retval;
5728
5729         if (ctx->block_found_map)
5730                 return ext2fs_new_range(fs, flags, goal, len,
5731                                         ctx->block_found_map, pblk, plen);
5732
5733         if (!fs->block_map) {
5734                 retval = ext2fs_read_block_bitmap(fs);
5735                 if (retval)
5736                         return retval;
5737         }
5738
5739         return ext2fs_new_range(fs, flags, goal, len, fs->block_map,
5740                                 pblk, plen);
5741 }
5742
5743 static void e2fsck_block_alloc_stats(ext2_filsys fs, blk64_t blk, int inuse)
5744 {
5745         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5746
5747         /* Never free a critical metadata block */
5748         if (ctx->block_found_map &&
5749             ctx->block_metadata_map &&
5750             inuse < 0 &&
5751             ext2fs_test_block_bitmap2(ctx->block_metadata_map, blk))
5752                 return;
5753
5754         if (ctx->block_found_map) {
5755                 if (inuse > 0)
5756                         ext2fs_mark_block_bitmap2(ctx->block_found_map, blk);
5757                 else
5758                         ext2fs_unmark_block_bitmap2(ctx->block_found_map, blk);
5759         }
5760 }
5761
5762 static void e2fsck_block_alloc_stats_range(ext2_filsys fs, blk64_t blk,
5763                                            blk_t num, int inuse)
5764 {
5765         e2fsck_t ctx = (e2fsck_t) fs->priv_data;
5766
5767         /* Never free a critical metadata block */
5768         if (ctx->block_found_map &&
5769             ctx->block_metadata_map &&
5770             inuse < 0 &&
5771             ext2fs_test_block_bitmap_range2(ctx->block_metadata_map, blk, num))
5772                 return;
5773
5774         if (ctx->block_found_map) {
5775                 if (inuse > 0)
5776                         ext2fs_mark_block_bitmap_range2(ctx->block_found_map,
5777                                                         blk, num);
5778                 else
5779                         ext2fs_unmark_block_bitmap_range2(ctx->block_found_map,
5780                                                         blk, num);
5781         }
5782 }
5783
5784 void e2fsck_use_inode_shortcuts(e2fsck_t ctx, int use_shortcuts)
5785 {
5786         ext2_filsys fs = ctx->fs;
5787
5788         if (use_shortcuts) {
5789                 fs->get_blocks = pass1_get_blocks;
5790                 fs->check_directory = pass1_check_directory;
5791                 fs->read_inode = pass1_read_inode;
5792                 fs->write_inode = pass1_write_inode;
5793                 ctx->stashed_ino = 0;
5794         } else {
5795                 fs->get_blocks = 0;
5796                 fs->check_directory = 0;
5797                 fs->read_inode = 0;
5798                 fs->write_inode = 0;
5799         }
5800 }
5801
5802 void e2fsck_intercept_block_allocations(e2fsck_t ctx)
5803 {
5804         ext2fs_set_alloc_block_callback(ctx->fs, e2fsck_get_alloc_block, 0);
5805         ext2fs_set_block_alloc_stats_callback(ctx->fs,
5806                                                 e2fsck_block_alloc_stats, 0);
5807         ext2fs_set_new_range_callback(ctx->fs, e2fsck_new_range, NULL);
5808         ext2fs_set_block_alloc_stats_range_callback(ctx->fs,
5809                                         e2fsck_block_alloc_stats_range, NULL);
5810 }