+Add support for the uninit_groups feature to the kernel.
+
Keep a high water mark of used inodes for each group to improve e2fsck time.
Block and inode bitmaps can be uninitialized on disk via a flag in the
group descriptor to avoid reading or scanning them at e2fsck time.
A checksum of each group descriptor is used to ensure that corruption in
the group descriptor's bit flags does not cause incorrect operation.
-Index: linux-stage/fs/ext3/balloc.c
+Index: linux-2.6.9-full/include/linux/ext3_fs.h
===================================================================
---- linux-stage.orig/fs/ext3/balloc.c 2007-03-14 04:44:12.000000000 -0400
-+++ linux-stage/fs/ext3/balloc.c 2007-03-14 16:23:48.000000000 -0400
-@@ -73,6 +73,95 @@ struct ext3_group_desc * ext3_get_group_
- return gdp + desc;
- }
+--- linux-2.6.9-full.orig/include/linux/ext3_fs.h 2007-03-28 18:35:41.000000000 +0400
++++ linux-2.6.9-full/include/linux/ext3_fs.h 2007-03-28 18:36:16.000000000 +0400
+@@ -153,16 +153,22 @@ struct ext3_allocation_request {
+ */
+ struct ext3_group_desc
+ {
+- __le32 bg_block_bitmap; /* Blocks bitmap block */
+- __le32 bg_inode_bitmap; /* Inodes bitmap block */
++ __le32 bg_block_bitmap; /* Blocks bitmap block */
++ __le32 bg_inode_bitmap; /* Inodes bitmap block */
+ __le32 bg_inode_table; /* Inodes table block */
+ __le16 bg_free_blocks_count; /* Free blocks count */
+ __le16 bg_free_inodes_count; /* Free inodes count */
+ __le16 bg_used_dirs_count; /* Directories count */
+- __u16 bg_pad;
+- __le32 bg_reserved[3];
++ __le16 bg_flags; /* EXT3_BG_flags (UNINIT, etc) */
++ __le32 bg_reserved[2]; /* Likely block/inode bitmap checksum */
++ __le16 bg_itable_unused; /* Unused inodes count */
++ __le16 bg_checksum; /* crc16(sb_uuid+group+desc) */
+ };
-+unsigned long ext3_free_blocks_after_init(struct super_block *sb,
-+ int block_group,
-+ struct ext3_group_desc *gdp)
-+{
-+ struct ext3_sb_info *sbi = EXT3_SB(sb);
-+ unsigned long blks;
-+ int has_sb;
++#define EXT3_BG_INODE_UNINIT 0x0001 /* Inode table/bitmap not in use */
++#define EXT3_BG_BLOCK_UNINIT 0x0002 /* Block bitmap not in use */
++#define EXT3_BG_INODE_ZEROED 0x0004 /* On-disk itable initialized to zero */
+
-+ /* Last and first groups are always initialized */
-+ blks = le32_to_cpu(EXT3_BLOCKS_PER_GROUP(sb));
-+ /* Account for for sb, gdt */
-+ has_sb = ext3_bg_has_super(sb, block_group);
-+ if (has_sb)
-+ blks--;
+ /*
+ * Macro-instructions used to manage group descriptors
+ */
+@@ -572,6 +578,7 @@ static inline struct ext3_inode_info *EX
+ #define EXT3_FEATURE_RO_COMPAT_SPARSE_SUPER 0x0001
+ #define EXT3_FEATURE_RO_COMPAT_LARGE_FILE 0x0002
+ #define EXT3_FEATURE_RO_COMPAT_BTREE_DIR 0x0004
++#define EXT4_FEATURE_RO_COMPAT_GDT_CSUM 0x0010
+ #define EXT4_FEATURE_RO_COMPAT_DIR_NLINK 0x0020
+
+ #define EXT3_FEATURE_INCOMPAT_COMPRESSION 0x0001
+@@ -588,6 +595,7 @@ static inline struct ext3_inode_info *EX
+ EXT3_FEATURE_INCOMPAT_EXTENTS)
+ #define EXT3_FEATURE_RO_COMPAT_SUPP (EXT3_FEATURE_RO_COMPAT_SPARSE_SUPER| \
+ EXT3_FEATURE_RO_COMPAT_LARGE_FILE| \
++ EXT4_FEATURE_RO_COMPAT_GDT_CSUM| \
+ EXT4_FEATURE_RO_COMPAT_DIR_NLINK| \
+ EXT3_FEATURE_RO_COMPAT_BTREE_DIR)
+
+Index: linux-2.6.9-full/fs/ext3/resize.c
+===================================================================
+--- linux-2.6.9-full.orig/fs/ext3/resize.c 2006-03-10 18:20:03.000000000 +0300
++++ linux-2.6.9-full/fs/ext3/resize.c 2007-03-28 18:36:16.000000000 +0400
+@@ -19,6 +19,7 @@
+ #include <linux/errno.h>
+ #include <linux/slab.h>
+
++#include "group.h"
+
+ #define outside(b, first, last) ((b) < (first) || (b) >= (last))
+ #define inside(b, first, last) ((b) >= (first) && (b) < (last))
+@@ -807,6 +808,7 @@ int ext3_group_add(struct super_block *s
+ gdp->bg_inode_table = cpu_to_le32(input->inode_table);
+ gdp->bg_free_blocks_count = cpu_to_le16(input->free_blocks_count);
+ gdp->bg_free_inodes_count = cpu_to_le16(EXT3_INODES_PER_GROUP(sb));
++ gdp->bg_checksum = ext3_group_desc_csum(sbi, input->group, gdp);
+
+ /*
+ * Make the new blocks and inodes valid next. We do this before
+Index: linux-2.6.9-full/fs/ext3/super.c
+===================================================================
+--- linux-2.6.9-full.orig/fs/ext3/super.c 2007-03-28 18:35:42.000000000 +0400
++++ linux-2.6.9-full/fs/ext3/super.c 2007-03-28 18:36:16.000000000 +0400
+@@ -38,6 +38,7 @@
+ #include <asm/uaccess.h>
+ #include "xattr.h"
+ #include "acl.h"
++#include "group.h"
+
+ static int ext3_load_journal(struct super_block *, struct ext3_super_block *,
+ unsigned long journal_devnum);
+@@ -1090,6 +1091,90 @@ static int ext3_setup_super(struct super
+ return res;
+ }
+
++#if !defined(CONFIG_CRC16) && !defined(CONFIG_CRC16_MODULE)
++/** CRC table for the CRC-16. The poly is 0x8005 (x^16 + x^15 + x^2 + 1) */
++__u16 const crc16_table[256] = {
++ 0x0000, 0xC0C1, 0xC181, 0x0140, 0xC301, 0x03C0, 0x0280, 0xC241,
++ 0xC601, 0x06C0, 0x0780, 0xC741, 0x0500, 0xC5C1, 0xC481, 0x0440,
++ 0xCC01, 0x0CC0, 0x0D80, 0xCD41, 0x0F00, 0xCFC1, 0xCE81, 0x0E40,
++ 0x0A00, 0xCAC1, 0xCB81, 0x0B40, 0xC901, 0x09C0, 0x0880, 0xC841,
++ 0xD801, 0x18C0, 0x1980, 0xD941, 0x1B00, 0xDBC1, 0xDA81, 0x1A40,
++ 0x1E00, 0xDEC1, 0xDF81, 0x1F40, 0xDD01, 0x1DC0, 0x1C80, 0xDC41,
++ 0x1400, 0xD4C1, 0xD581, 0x1540, 0xD701, 0x17C0, 0x1680, 0xD641,
++ 0xD201, 0x12C0, 0x1380, 0xD341, 0x1100, 0xD1C1, 0xD081, 0x1040,
++ 0xF001, 0x30C0, 0x3180, 0xF141, 0x3300, 0xF3C1, 0xF281, 0x3240,
++ 0x3600, 0xF6C1, 0xF781, 0x3740, 0xF501, 0x35C0, 0x3480, 0xF441,
++ 0x3C00, 0xFCC1, 0xFD81, 0x3D40, 0xFF01, 0x3FC0, 0x3E80, 0xFE41,
++ 0xFA01, 0x3AC0, 0x3B80, 0xFB41, 0x3900, 0xF9C1, 0xF881, 0x3840,
++ 0x2800, 0xE8C1, 0xE981, 0x2940, 0xEB01, 0x2BC0, 0x2A80, 0xEA41,
++ 0xEE01, 0x2EC0, 0x2F80, 0xEF41, 0x2D00, 0xEDC1, 0xEC81, 0x2C40,
++ 0xE401, 0x24C0, 0x2580, 0xE541, 0x2700, 0xE7C1, 0xE681, 0x2640,
++ 0x2200, 0xE2C1, 0xE381, 0x2340, 0xE101, 0x21C0, 0x2080, 0xE041,
++ 0xA001, 0x60C0, 0x6180, 0xA141, 0x6300, 0xA3C1, 0xA281, 0x6240,
++ 0x6600, 0xA6C1, 0xA781, 0x6740, 0xA501, 0x65C0, 0x6480, 0xA441,
++ 0x6C00, 0xACC1, 0xAD81, 0x6D40, 0xAF01, 0x6FC0, 0x6E80, 0xAE41,
++ 0xAA01, 0x6AC0, 0x6B80, 0xAB41, 0x6900, 0xA9C1, 0xA881, 0x6840,
++ 0x7800, 0xB8C1, 0xB981, 0x7940, 0xBB01, 0x7BC0, 0x7A80, 0xBA41,
++ 0xBE01, 0x7EC0, 0x7F80, 0xBF41, 0x7D00, 0xBDC1, 0xBC81, 0x7C40,
++ 0xB401, 0x74C0, 0x7580, 0xB541, 0x7700, 0xB7C1, 0xB681, 0x7640,
++ 0x7200, 0xB2C1, 0xB381, 0x7340, 0xB101, 0x71C0, 0x7080, 0xB041,
++ 0x5000, 0x90C1, 0x9181, 0x5140, 0x9301, 0x53C0, 0x5280, 0x9241,
++ 0x9601, 0x56C0, 0x5780, 0x9741, 0x5500, 0x95C1, 0x9481, 0x5440,
++ 0x9C01, 0x5CC0, 0x5D80, 0x9D41, 0x5F00, 0x9FC1, 0x9E81, 0x5E40,
++ 0x5A00, 0x9AC1, 0x9B81, 0x5B40, 0x9901, 0x59C0, 0x5880, 0x9841,
++ 0x8801, 0x48C0, 0x4980, 0x8941, 0x4B00, 0x8BC1, 0x8A81, 0x4A40,
++ 0x4E00, 0x8EC1, 0x8F81, 0x4F40, 0x8D01, 0x4DC0, 0x4C80, 0x8C41,
++ 0x4400, 0x84C1, 0x8581, 0x4540, 0x8701, 0x47C0, 0x4680, 0x8641,
++ 0x8201, 0x42C0, 0x4380, 0x8341, 0x4100, 0x81C1, 0x8081, 0x4040
++};
+
-+ if (!EXT3_HAS_INCOMPAT_FEATURE(sb, EXT3_FEATURE_INCOMPAT_META_BG) ||
-+ block_group < le32_to_cpu(sbi->s_es->s_first_meta_bg)) {
-+ if (has_sb) {
-+ blks -= le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks);
-+ blks -= ext3_bg_num_gdb(sb, block_group);
-+ }
-+ } else { /* For META_BG BLOCK GROUPS */
-+ int group_rel = (block_group -
-+ le32_to_cpu(sbi->s_es->s_first_meta_bg)) %
-+ EXT3_DESC_PER_BLOCK(sb);
-+ if (group_rel == 0 || group_rel == 1 ||
-+ (group_rel == EXT3_DESC_PER_BLOCK(sb) - 1))
-+ blks--;
-+ }
++static inline __u16 crc16_byte(__u16 crc, const __u8 data)
++{
++ return (crc >> 8) ^ crc16_table[(crc ^ data) & 0xff];
++}
+
-+ /* Account for bitmaps and inode table */
-+ blks -= sbi->s_itb_per_group + 2;
-+ return blks;
++__u16 crc16(__u16 crc, __u8 const *buffer, size_t len)
++{
++ while (len--)
++ crc = crc16_byte(crc, *buffer++);
++ return crc;
+}
++#endif
+
-+/* Initializes an uninitialized block bitmap */
-+void ext3_init_block_bitmap(struct super_block *sb, struct buffer_head *bh,
-+ int block_group, struct ext3_group_desc *gdp)
++__le16 ext3_group_desc_csum(struct ext3_sb_info *sbi, __u32 block_group,
++ struct ext3_group_desc *gdp)
+{
-+ unsigned long startblk;
-+ int bit, bit_max;
-+ struct ext3_sb_info *sbi = EXT3_SB(sb);
++ __u16 crc = 0;
+
-+ J_ASSERT_BH(bh, buffer_locked(bh));
++ if (sbi->s_es->s_feature_ro_compat &
++ cpu_to_le32(EXT4_FEATURE_RO_COMPAT_GDT_CSUM)) {
++ int offset = offsetof(struct ext3_group_desc, bg_checksum);
++ __le32 le_group = cpu_to_le32(block_group);
+
-+ /* If the checksum is bad, then just mark all bits in use for safety */
-+ if (!ext3_group_desc_csum_verify(sbi, block_group, gdp)) {
-+ ext3_error(sb, __FUNCTION__, "Checksum bad for group %u\n",
-+ block_group);
-+ gdp->bg_free_blocks_count = 0;
-+ gdp->bg_free_inodes_count = 0;
-+ memset(bh->b_data, 0xff, sb->s_blocksize);
-+ return;
++ crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
++ crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group));
++ crc = crc16(crc, (__u8 *)gdp, offset);
++ offset += sizeof(gdp->bg_checksum); /* skip checksum */
++ BUG_ON(offset != sizeof(*gdp)); /* XXX handle s_desc_size */
++ /* for checksum of struct ext4_group_desc do the rest...
++ if (offset < sbi->s_es->s_desc_size)
++ crc = crc16(crc, (__u8 *)gdp + offset,
++ sbi->s_es->s_desc_size - offset);
++ */
+ }
-+ memset(bh->b_data, 0, bh->b_size);
+
-+ /* Set bits for sb, gdt */
-+ startblk = block_group * EXT3_BLOCKS_PER_GROUP(sb) +
-+ le32_to_cpu(sbi->s_es->s_first_data_block);
++ return cpu_to_le16(crc);
++}
+
-+ bit = 0;
-+ bit_max = ext3_bg_has_super(sb, block_group);
++int ext3_group_desc_csum_verify(struct ext3_sb_info *sbi, __u32 block_group,
++ struct ext3_group_desc *gdp)
++{
++ if (gdp->bg_checksum != ext3_group_desc_csum(sbi, block_group, gdp))
++ return 0;
+
-+ if (!EXT3_HAS_INCOMPAT_FEATURE(sb, EXT3_FEATURE_INCOMPAT_META_BG) ||
-+ block_group < le32_to_cpu(sbi->s_es->s_first_meta_bg)) {
-+ if (bit_max) {
-+ bit_max += ext3_bg_num_gdb(sb, block_group);
-+ bit_max +=le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks);
-+ }
-+ } else { /* For META_BG_BLOCK_GROUPS */
-+ int group_rel = (block_group -
-+ le32_to_cpu(sbi->s_es->s_first_meta_bg)) %
-+ EXT3_DESC_PER_BLOCK(sb);
-+ if (group_rel == 0 || group_rel == 1 ||
-+ (group_rel == EXT3_DESC_PER_BLOCK(sb) - 1))
-+ bit_max += 1;
-+ }
-+ for (; bit < bit_max; bit++)
-+ ext3_set_bit(bit, bh->b_data);
-+
-+ /* Set bits for bitmaps and inode table */
-+ ext3_set_bit(le32_to_cpu(gdp->bg_block_bitmap) - startblk, bh->b_data);
-+ ext3_set_bit(le32_to_cpu(gdp->bg_inode_bitmap) - startblk, bh->b_data);
-+ bit_max = bit + sbi->s_itb_per_group;
-+ for (bit = le32_to_cpu(gdp->bg_inode_table) - startblk;
-+ bit < bit_max; bit++)
-+ ext3_set_bit(bit, bh->b_data);
++ return 1;
+}
+
- /*
- * Read the bitmap for a given block_group, reading into the specified
- * slot in the superblock's bitmap cache.
-@@ -88,7 +170,19 @@ read_block_bitmap(struct super_block *sb
- desc = ext3_get_group_desc (sb, block_group, NULL);
- if (!desc)
- goto error_out;
-- bh = sb_bread(sb, le32_to_cpu(desc->bg_block_bitmap));
-+ if (desc->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
-+ bh = sb_getblk(sb, le32_to_cpu(desc->bg_block_bitmap));
-+ if (!buffer_uptodate(bh)) {
-+ lock_buffer(bh);
-+ if (!buffer_uptodate(bh)) {
-+ ext3_init_block_bitmap(sb, bh,block_group,desc);
-+ set_buffer_uptodate(bh);
-+ }
-+ unlock_buffer(bh);
-+ }
-+ } else {
-+ bh = sb_bread(sb, le32_to_cpu(desc->bg_block_bitmap));
-+ }
- if (!bh)
- ext3_error (sb, "read_block_bitmap",
- "Cannot read block bitmap - "
-@@ -427,6 +520,7 @@ do_more:
- gdp->bg_free_blocks_count =
- cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count) +
- *pdquot_freed_blocks);
-+ gdp->bg_checksum = ext3_group_desc_csum(sbi, block_group, gdp);
- spin_unlock(sb_bgl_lock(sbi, block_group));
- percpu_counter_mod(&sbi->s_freeblocks_counter, count);
-
-@@ -1175,7 +1270,7 @@ int ext3_new_block_old(handle_t *handle,
-
- goal_group = group_no;
- retry:
-- free_blocks = le16_to_cpu(gdp->bg_free_blocks_count);
-+ free_blocks = EXT3_BG_BLOCKS_FREE(sb, group_no, gdp);
- if (free_blocks > 0) {
- ret_block = ((goal - le32_to_cpu(es->s_first_data_block)) %
- EXT3_BLOCKS_PER_GROUP(sb));
-@@ -1206,7 +1304,7 @@ retry:
- *errp = -EIO;
- goto out;
+ /* Called at mount-time, super-block is locked */
+ static int ext3_check_descriptors (struct super_block * sb)
+ {
+@@ -1139,6 +1224,13 @@ static int ext3_check_descriptors (struc
+ le32_to_cpu(gdp->bg_inode_table));
+ return 0;
}
-- free_blocks = le16_to_cpu(gdp->bg_free_blocks_count);
-+ free_blocks = EXT3_BG_BLOCKS_FREE(sb, group_no, gdp);
- if (free_blocks <= 0)
- continue;
-
-@@ -1306,10 +1407,17 @@ allocated:
- ret_block, goal_hits, goal_attempts);
-
- spin_lock(sb_bgl_lock(sbi, group_no));
-+ free_blocks = 0;
-+ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
-+ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_BLOCK_UNINIT);
-+ free_blocks = ext3_free_blocks_after_init(sb, group_no, gdp);
-+ gdp->bg_free_blocks_count = cpu_to_le16(free_blocks);
-+ }
- gdp->bg_free_blocks_count =
- cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count) - 1);
-+ gdp->bg_checksum = ext3_group_desc_csum(sbi, group_no, gdp);
- spin_unlock(sb_bgl_lock(sbi, group_no));
-- percpu_counter_mod(&sbi->s_freeblocks_counter, -1);
-+ percpu_counter_mod(&sbi->s_freeblocks_counter, free_blocks);
-
- BUFFER_TRACE(gdp_bh, "journal_dirty_metadata for group descriptor");
- err = ext3_journal_dirty_metadata(handle, gdp_bh);
-@@ -1379,7 +1479,7 @@ unsigned long ext3_count_free_blocks(str
- gdp = ext3_get_group_desc(sb, i, NULL);
- if (!gdp)
- continue;
-- desc_count += le16_to_cpu(gdp->bg_free_blocks_count);
-+ desc_count += EXT3_BG_BLOCKS_FREE(sb, i, gdp);
- brelse(bitmap_bh);
- bitmap_bh = read_block_bitmap(sb, i);
- if (bitmap_bh == NULL)
-@@ -1387,7 +1487,7 @@ unsigned long ext3_count_free_blocks(str
-
- x = ext3_count_free(bitmap_bh, sb->s_blocksize);
- printk("group %d: stored = %d, counted = %lu\n",
-- i, le16_to_cpu(gdp->bg_free_blocks_count), x);
-+ i, EXT3_BG_BLOCKS_FREE(sb, i, gdp), x);
- bitmap_count += x;
- }
- brelse(bitmap_bh);
-@@ -1403,7 +1503,7 @@ unsigned long ext3_count_free_blocks(str
- gdp = ext3_get_group_desc(sb, i, NULL);
- if (!gdp)
- continue;
-- desc_count += le16_to_cpu(gdp->bg_free_blocks_count);
-+ desc_count += EXT3_BG_BLOCKS_FREE(sb, i, gdp);
++ if (!ext3_group_desc_csum_verify(sbi, i, gdp)) {
++ ext3_error(sb, __FUNCTION__,
++ "Checksum for group %d failed (%u!=%u)\n", i,
++ le16_to_cpu(ext3_group_desc_csum(sbi,i,gdp)),
++ le16_to_cpu(gdp->bg_checksum));
++ return 0;
++ }
+ block += EXT3_BLOCKS_PER_GROUP(sb);
+ gdp++;
}
+Index: linux-2.6.9-full/fs/ext3/group.h
+===================================================================
+--- linux-2.6.9-full.orig/fs/ext3/group.h 2007-02-13 18:39:59.640066087 +0300
++++ linux-2.6.9-full/fs/ext3/group.h 2007-03-28 18:36:16.000000000 +0400
+@@ -0,0 +1,29 @@
++/*
++ * linux/fs/ext3/group.h
++ *
++ * Copyright (C) 2007 Cluster File Systems, Inc
++ *
++ * Author: Andreas Dilger <adilger@clusterfs.com>
++ */
++
++#ifndef _LINUX_EXT3_GROUP_H
++#define _LINUX_EXT3_GROUP_H
++#if defined(CONFIG_CRC16) || defined(CONFIG_CRC16_MODULE)
++#include <linux/crc16.h>
++#endif
++
++extern __le16 ext3_group_desc_csum(struct ext3_sb_info *sbi, __u32 group,
++ struct ext3_group_desc *gdp);
++extern int ext3_group_desc_csum_verify(struct ext3_sb_info *sbi, __u32 group,
++ struct ext3_group_desc *gdp);
++struct buffer_head *read_block_bitmap(struct super_block *sb,
++ unsigned int block_group);
++extern unsigned ext3_init_block_bitmap(struct super_block *sb,
++ struct buffer_head *bh, int group,
++ struct ext3_group_desc *desc);
++#define ext3_free_blocks_after_init(sb, group, desc) \
++ ext3_init_block_bitmap(sb, NULL, group, desc)
++extern unsigned ext3_init_inode_bitmap(struct super_block *sb,
++ struct buffer_head *bh, int group,
++ struct ext3_group_desc *desc);
++#endif /* _LINUX_EXT3_GROUP_H */
+Index: linux-2.6.9-full/fs/ext3/ialloc.c
+===================================================================
+--- linux-2.6.9-full.orig/fs/ext3/ialloc.c 2007-03-28 18:35:38.000000000 +0400
++++ linux-2.6.9-full/fs/ext3/ialloc.c 2007-03-28 18:36:16.000000000 +0400
+@@ -28,6 +28,7 @@
- return desc_count;
-@@ -1590,7 +1587,7 @@ void ext3_check_blocks_bitmap (struct su
- gdp = ext3_get_group_desc (sb, i, NULL);
- if (!gdp)
- continue;
-- desc_count += le16_to_cpu(gdp->bg_free_blocks_count);
-+ desc_count += EXT3_BG_BLOCKS_FREE(sb, i, gdp);
- brelse(bitmap_bh);
- bitmap_bh = read_block_bitmap(sb, i);
- if (bitmap_bh == NULL)
-@@ -1628,11 +1625,11 @@ void ext3_check_blocks_bitmap (struct su
- "group %d is marked free", j, i);
+ #include "xattr.h"
+ #include "acl.h"
++#include "group.h"
- x = ext3_count_free(bitmap_bh, sb->s_blocksize);
-- if (le16_to_cpu(gdp->bg_free_blocks_count) != x)
-+ if (EXT3_BG_BLOCKS_FREE(sb, i, gdp) != x)
- ext3_error (sb, "ext3_check_blocks_bitmap",
- "Wrong free blocks count for group %d, "
- "stored = %d, counted = %lu", i,
-- le16_to_cpu(gdp->bg_free_blocks_count), x);
-+ EXT3_BG_BLOCKS_FREE(sb, i, gdp), x);
- bitmap_count += x;
- }
- brelse(bitmap_bh);
-Index: linux-stage/fs/ext3/ialloc.c
---- linux-stage.orig/fs/ext3/ialloc.c 2007-03-14 04:44:13.000000000 -0400
-+++ linux-stage/fs/ext3/ialloc.c 2007-03-14 16:13:29.000000000 -0400
-@@ -43,6 +43,47 @@
+ /*
+ * ialloc.c contains the inodes allocation and deallocation routines
+@@ -43,6 +44,52 @@
* the free blocks count in the block.
*/
+}
+
+/* Initializes an uninitialized inode bitmap */
-+void ext3_init_inode_bitmap(struct super_block *sb, struct buffer_head *bh,
-+ int block_group, struct ext3_group_desc *gdp)
++unsigned ext3_init_inode_bitmap(struct super_block *sb,
++ struct buffer_head *bh, int block_group,
++ struct ext3_group_desc *gdp)
+{
+ struct ext3_sb_info *sbi = EXT3_SB(sb);
+
+ J_ASSERT_BH(bh, buffer_locked(bh));
+
-+ /* If the checksum is bad, then just mark all bits in use for safety */
++ /* If checksum is bad, mark all blocks and inodes in use to prevent
++ * allocation, essentially implementing a per-group read-only flag. */
+ if (!ext3_group_desc_csum_verify(sbi, block_group, gdp)) {
+ ext3_error(sb, __FUNCTION__, "Checksum bad for group %u\n",
+ block_group);
-+ memset(bh->b_data, 0xff, sb->s_blocksize);
+ gdp->bg_free_blocks_count = 0;
+ gdp->bg_free_inodes_count = 0;
-+ return;
++ gdp->bg_itable_unused = 0;
++ memset(bh->b_data, 0xff, sb->s_blocksize);
++ return 0;
+ }
+
-+ memset(bh->b_data, 0, EXT3_INODES_PER_GROUP(sb) + 7 / 8);
++ memset(bh->b_data, 0, (EXT3_INODES_PER_GROUP(sb) + 7) / 8);
+ mark_bitmap_end(EXT3_INODES_PER_GROUP(sb), EXT3_BLOCKS_PER_GROUP(sb),
+ bh->b_data);
++
++ return EXT3_INODES_PER_GROUP(sb);
+}
/*
* Read the inode allocation bitmap for a given block_group, reading
-@@ -59,8 +103,15 @@ read_inode_bitmap(struct super_block * s
+@@ -59,8 +106,19 @@ read_inode_bitmap(struct super_block * s
desc = ext3_get_group_desc(sb, block_group, NULL);
if (!desc)
goto error_out;
+ if (desc->bg_flags & cpu_to_le16(EXT3_BG_INODE_UNINIT)) {
+ bh = sb_getblk(sb, le32_to_cpu(desc->bg_inode_bitmap));
+ if (!buffer_uptodate(bh)) {
-+ ext3_init_inode_bitmap(sb, bh, block_group, desc);
-+ set_buffer_uptodate(bh);
++ lock_buffer(bh);
++ if (!buffer_uptodate(bh)) {
++ ext3_init_inode_bitmap(sb, bh,block_group,desc);
++ set_buffer_uptodate(bh);
++ }
++ unlock_buffer(bh);
+ }
+ } else {
+ bh = sb_bread(sb, le32_to_cpu(desc->bg_inode_bitmap));
if (!bh)
ext3_error(sb, "read_inode_bitmap",
"Cannot read inode bitmap - "
-@@ -169,6 +175,8 @@ void ext3_free_inode (handle_t *handle,
+@@ -169,6 +227,8 @@ void ext3_free_inode (handle_t *handle,
if (is_directory)
gdp->bg_used_dirs_count = cpu_to_le16(
le16_to_cpu(gdp->bg_used_dirs_count) - 1);
spin_unlock(sb_bgl_lock(sbi, block_group));
percpu_counter_inc(&sbi->s_freeinodes_counter);
if (is_directory)
-@@ -202,8 +210,8 @@ error_return:
- static int find_group_dir(struct super_block *sb, struct inode *parent)
- {
- int ngroups = EXT3_SB(sb)->s_groups_count;
-- int freei, avefreei;
-- struct ext3_group_desc *desc, *best_desc = NULL;
-+ int freei, avefreei, freeb, best_freeb = 0;
-+ struct ext3_group_desc *desc;
- struct buffer_head *bh;
- int group, best_group = -1;
-
-@@ -212,15 +220,14 @@ static int find_group_dir(struct super_b
-
- for (group = 0; group < ngroups; group++) {
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ if (!desc || (freei = EXT3_BG_INODES_FREE(sb, group, desc)) ==0)
- continue;
-- if (le16_to_cpu(desc->bg_free_inodes_count) < avefreei)
-+ if (freei < avefreei)
- continue;
-- if (!best_desc ||
-- (le16_to_cpu(desc->bg_free_blocks_count) >
-- le16_to_cpu(best_desc->bg_free_blocks_count))) {
-+ freeb = EXT3_BG_BLOCKS_PNLT(sb, group, desc);
-+ if (freeb > best_freeb) {
- best_group = group;
-- best_desc = desc;
-+ best_freeb = freeb;
- }
- }
- return best_group;
-@@ -284,14 +294,15 @@ static int find_group_orlov(struct super
- parent_group = (unsigned)group % ngroups;
- for (i = 0; i < ngroups; i++) {
- group = (parent_group + i) % ngroups;
-- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ desc = ext3_get_group_desc(sb, group, &bh);
-+ if (!desc ||
-+ (freei = EXT3_BG_INODES_FREE(sb, groups, desc)) ==0)
- continue;
- if (le16_to_cpu(desc->bg_used_dirs_count) >= best_ndir)
- continue;
-- if (le16_to_cpu(desc->bg_free_inodes_count) < avefreei)
-+ if (freei < avefreei)
- continue;
-- if (le16_to_cpu(desc->bg_free_blocks_count) < avefreeb)
-+ if (EXT3_BG_BLOCKS_PNLT(sb, group, desc) < avefreeb)
- continue;
- best_group = group;
- best_ndir = le16_to_cpu(desc->bg_used_dirs_count);
-@@ -318,13 +330,13 @@ static int find_group_orlov(struct super
- for (i = 0; i < ngroups; i++) {
- group = (parent_group + i) % ngroups;
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ if (!desc || (freei = EXT3_BG_INODES_FREE(sb, group, desc)) ==0)
- continue;
- if (le16_to_cpu(desc->bg_used_dirs_count) >= max_dirs)
- continue;
-- if (le16_to_cpu(desc->bg_free_inodes_count) < min_inodes)
-+ if (freei < min_inodes)
- continue;
-- if (le16_to_cpu(desc->bg_free_blocks_count) < min_blocks)
-+ if (EXT3_BG_BLOCKS_PNLT(sb, group, desc) < min_blocks)
- continue;
- return group;
- }
-@@ -333,9 +347,9 @@ fallback:
- for (i = 0; i < ngroups; i++) {
- group = (parent_group + i) % ngroups;
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ if (!desc || (freei = EXT3_BG_INODES_FREE(sb, group, desc)) ==0)
- continue;
-- if (le16_to_cpu(desc->bg_free_inodes_count) >= avefreei)
-+ if (freei >= avefreei)
- return group;
- }
-
-@@ -362,6 +377,7 @@ static int find_group_other(struct super
- int group, i;
- int best_group = -1;
- int avefreeb, freeb, best_group_freeb = 0;
-+ int freei;
-
- /*
- * Try to place the inode in its parent directory
-@@ -380,8 +396,8 @@ static int find_group_other(struct super
- */
- group = parent_group;
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (desc && le16_to_cpu(desc->bg_free_inodes_count) &&
-- (!S_ISREG(mode) || le16_to_cpu(desc->bg_free_blocks_count)))
-+ if (desc && EXT3_BG_INODES_FREE(sb, group, desc) &&
-+ (!S_ISREG(mode) || EXT3_BG_BLOCKS_PNLT(sb, group, desc)))
- return group;
- avefreeb = le32_to_cpu(sbi->s_es->s_free_blocks_count) / ngroups;
- /*
-@@ -392,11 +408,11 @@ static int find_group_other(struct super
- if (group >= ngroups)
- group -= ngroups;
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ if (!desc || EXT3_BG_INODES_FREE(sb, group, desc) == 0)
- continue;
- if (!S_ISREG(mode))
- return group;
-- if (le16_to_cpu(desc->bg_free_blocks_count) >= avefreeb)
-+ if (EXT3_BG_BLOCKS_PNLT(sb, group, desc) >= avefreeb)
- return group;
- }
-
-@@ -413,9 +431,10 @@ static int find_group_other(struct super
- if (++group >= ngroups)
- group = 0;
- desc = ext3_get_group_desc (sb, group, &bh);
-- if (!desc || !desc->bg_free_inodes_count)
-+ freei = EXT3_BG_INODES_FREE(sb, group, desc);
-+ if (!desc || !freei)
- continue;
-- freeb = le16_to_cpu(desc->bg_free_blocks_count);
-+ freeb = EXT3_BG_BLOCKS_PNLT(sb, group, desc);
- if (freeb > best_group_freeb) {
- best_group_freeb = freeb;
- best_group = group;
-@@ -453,6 +472,7 @@ struct inode *ext3_new_inode(handle_t *h
+@@ -453,7 +513,7 @@ struct inode *ext3_new_inode(handle_t *h
+ struct ext3_sb_info *sbi;
int err = 0;
struct inode *ret;
- int i;
-+ int unused_flag = 0;
+- int i;
++ int i, free = 0;
/* Cannot create files in a deleted directory */
if (!dir || !dir->i_nlink)
-@@ -581,18 +601,34 @@ got:
+@@ -566,11 +626,13 @@ repeat_in_this_group:
+ goto out;
+
+ got:
+- ino += group * EXT3_INODES_PER_GROUP(sb) + 1;
+- if (ino < EXT3_FIRST_INO(sb) || ino > le32_to_cpu(es->s_inodes_count)) {
+- ext3_error (sb, "ext3_new_inode",
+- "reserved inode or inode > inodes count - "
+- "block_group = %d, inode=%lu", group, ino);
++ ino++;
++ if ((group == 0 && ino < EXT3_FIRST_INO(sb)) ||
++ ino > EXT3_INODES_PER_GROUP(sb)) {
++ ext3_error(sb, __FUNCTION__,
++ "reserved inode or inode > inodes count - "
++ "block_group = %d, inode=%lu", group,
++ ino + group * EXT3_INODES_PER_GROUP(sb));
+ err = -EIO;
+ goto fail;
+ }
+@@ -578,13 +640,65 @@ got:
+ BUFFER_TRACE(bh2, "get_write_access");
err = ext3_journal_get_write_access(handle, bh2);
if (err) goto fail;
++
++ /* We may have to initialize the block bitmap if it isn't already */
++ if (EXT3_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_GDT_CSUM) &&
++ gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
++ struct buffer_head *block_bh = read_block_bitmap(sb, group);
++
++ BUFFER_TRACE(block_bh, "get block bitmap access");
++ err = ext3_journal_get_write_access(handle, block_bh);
++ if (err) {
++ brelse(block_bh);
++ goto fail;
++ }
++
++ free = 0;
++ spin_lock(sb_bgl_lock(sbi, group));
++ /* recheck and clear flag under lock if we still need to */
++ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
++ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_BLOCK_UNINIT);
++ free = ext3_free_blocks_after_init(sb, group, gdp);
++ gdp->bg_free_blocks_count = cpu_to_le16(free);
++ }
++ spin_unlock(sb_bgl_lock(sbi, group));
++
++ /* Don't need to dirty bitmap block if we didn't change it */
++ if (free) {
++ BUFFER_TRACE(block_bh, "dirty block bitmap");
++ err = ext3_journal_dirty_metadata(handle, block_bh);
++ }
++
++ brelse(block_bh);
++ if (err)
++ goto fail;
++ }
++
spin_lock(sb_bgl_lock(sbi, group));
-- gdp->bg_free_inodes_count =
-- cpu_to_le16(le16_to_cpu(gdp->bg_free_inodes_count) - 1);
-+ if (gdp->bg_free_inodes_count == 0) {
++ /* If we didn't allocate from within the initialized part of the inode
++ * table then we need to initialize up to this inode. */
++ if (EXT3_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_GDT_CSUM)) {
+ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_INODE_UNINIT)) {
-+ gdp->bg_itable_unused =
-+ cpu_to_le16(le32_to_cpu(es->s_inodes_per_group));
+ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_INODE_UNINIT);
++ free = EXT3_INODES_PER_GROUP(sb);
++ } else {
++ free = EXT3_INODES_PER_GROUP(sb) -
++ le16_to_cpu(gdp->bg_itable_unused);
++ }
++
++ if (ino > free) {
++ gdp->bg_itable_unused =
++ cpu_to_le16(EXT3_INODES_PER_GROUP(sb) - ino);
+ }
-+ /* If we didn't allocate from free initialized inodes,
-+ * then we allocated from uninitialized inodes. In this
-+ * case initialize one inode. */
-+ gdp->bg_itable_unused =
-+ cpu_to_le16(le16_to_cpu(gdp->bg_itable_unused) - 1);
-+ unused_flag = 1;
-+ } else {
-+ gdp->bg_free_inodes_count =
-+ cpu_to_le16(le16_to_cpu(gdp->bg_free_inodes_count) -1);
+ }
++
+ gdp->bg_free_inodes_count =
+ cpu_to_le16(le16_to_cpu(gdp->bg_free_inodes_count) - 1);
if (S_ISDIR(mode)) {
gdp->bg_used_dirs_count =
cpu_to_le16(le16_to_cpu(gdp->bg_used_dirs_count) + 1);
spin_unlock(sb_bgl_lock(sbi, group));
BUFFER_TRACE(bh2, "call ext3_journal_dirty_metadata");
err = ext3_journal_dirty_metadata(handle, bh2);
- if (err) goto fail;
-
-- percpu_counter_dec(&sbi->s_freeinodes_counter);
-+ if (!unused_flag)
-+ percpu_counter_dec(&sbi->s_freeinodes_counter);
- if (S_ISDIR(mode))
- percpu_counter_inc(&sbi->s_dirs_counter);
- sb->s_dirt = 1;
-Index: linux-stage/fs/ext3/mballoc.c
+@@ -606,7 +720,7 @@ got:
+ inode->i_gid = current->fsgid;
+ inode->i_mode = mode;
+
+- inode->i_ino = ino;
++ inode->i_ino = ino + group * EXT3_INODES_PER_GROUP(sb);
+ /* This is the optimal IO size (for stat), not the fs block size */
+ inode->i_blksize = PAGE_SIZE;
+ inode->i_blocks = 0;
+Index: linux-2.6.9-full/fs/ext3/mballoc.c
===================================================================
---- linux-stage.orig/fs/ext3/mballoc.c 2007-03-14 04:44:12.000000000 -0400
-+++ linux-stage/fs/ext3/mballoc.c 2007-03-14 16:13:29.000000000 -0400
-@@ -107,6 +107,7 @@ struct ext3_group_info {
+--- linux-2.6.9-full.orig/fs/ext3/mballoc.c 2007-03-28 15:42:45.000000000 +0400
++++ linux-2.6.9-full/fs/ext3/mballoc.c 2007-03-28 18:36:16.000000000 +0400
+@@ -36,6 +36,8 @@
+ #include <linux/seq_file.h>
+ #include <linux/version.h>
+
++#include "group.h"
++
+ /*
+ * MUSTDO:
+ * - test ext3_ext_search_left() and ext3_ext_search_right()
+@@ -323,6 +325,7 @@ struct ext3_group_info {
unsigned long bb_state;
- unsigned long bb_tid;
+ unsigned long bb_tid;
struct ext3_free_metadata *bb_md_cur;
+ struct ext3_group_desc *bb_gdp;
unsigned short bb_first_free;
unsigned short bb_free;
unsigned short bb_fragments;
-@@ -511,10 +512,7 @@ static int ext3_mb_init_cache(struct pag
+@@ -928,10 +931,7 @@ static int ext3_mb_init_cache(struct pag
if (first_group + i >= EXT3_SB(sb)->s_groups_count)
break;
err = -ENOMEM;
bh[i] = sb_getblk(sb, le32_to_cpu(desc->bg_block_bitmap));
-@@ -529,7 +530,12 @@ static int ext3_mb_init_cache(struct pag
+@@ -946,7 +946,12 @@ static int ext3_mb_init_cache(struct pag
unlock_buffer(bh[i]);
continue;
}
get_bh(bh[i]);
bh[i]->b_end_io = end_buffer_read_sync;
submit_bh(READ, bh[i]);
-@@ -1246,6 +1244,10 @@ static int ext3_mb_good_group(struct ext
+@@ -1703,6 +1708,10 @@ static int ext3_mb_good_group(struct ext
switch (cr) {
case 0:
- J_ASSERT(ac->ac_2order != 0);
+ BUG_ON(ac->ac_2order == 0);
+ /* If this group is uninitialized, skip it initially */
+ if (grp->bb_gdp->bg_flags &
+ cpu_to_le16(EXT3_BG_BLOCK_UNINIT))
bits = ac->ac_sb->s_blocksize_bits + 1;
for (i = ac->ac_2order; i <= bits; i++)
if (grp->bb_counters[i] > 0)
-@@ -1421,7 +1421,8 @@ repeat:
+@@ -1796,7 +1805,9 @@ repeat:
}
- ac.ac_groups_scanned++;
+ ac->ac_groups_scanned++;
- if (cr == 0)
+ if (cr == 0 || (e3b.bd_info->bb_gdp->bg_flags &
-+ cpu_to_le16(EXT3_BG_BLOCK_UNINIT)))
- ext3_mb_simple_scan_group(&ac, &e3b);
- else if (cr == 1 && *len == sbi->s_stripe)
- ext3_mb_scan_aligned(&ac, &e3b);
-@@ -1500,7 +1499,8 @@ found:
- * bitmap to be journaled */
-
- ext3_debug("using block group %d(%d)\n",
-- ac.ac_b_group.group, gdp->bg_free_blocks_count);
-+ ac.ac_b_group.group,
-+ EXT3_BG_BLOCKS_FREE(sb, ac.ac_b_group.group, gdp));
-
- bitmap_bh = read_block_bitmap(sb, ac.ac_b_ex.fe_group);
- if (!bitmap_bh) {
-@@ -1537,9 +1543,17 @@ found:
- mb_set_bits(bitmap_bh->b_data, ac.ac_b_ex.fe_start, ac.ac_b_ex.fe_len);
-
- spin_lock(sb_bgl_lock(sbi, ac.ac_b_ex.fe_group));
-+ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
-+ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_BLOCK_UNINIT);
-+ gdp->bg_free_blocks_count =
-+ cpu_to_le16(ext3_free_blocks_after_init(sb,
-+ ac.ac_b_ex.fe_group,
-+ gdp));
-+ }
- gdp->bg_free_blocks_count =
- cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count)
- - ac.ac_b_ex.fe_len);
-+ gdp->bg_checksum = ext3_group_desc_csum(sbi, ac.ac_b_ex.fe_group, gdp);
- spin_unlock(sb_bgl_lock(sbi, ac.ac_b_ex.fe_group));
- percpu_counter_mod(&sbi->s_freeblocks_counter, - ac.ac_b_ex.fe_len);
-
-@@ -1992,16 +1991,16 @@ int ext3_mb_init_backend(struct super_bl
++ cpu_to_le16(EXT3_BG_BLOCK_UNINIT) &&
++ ac->ac_2order != 0))
+ ext3_mb_simple_scan_group(ac, &e3b);
+ else if (cr == 1 && ac->ac_g_ex.fe_len == sbi->s_stripe)
+ ext3_mb_scan_aligned(ac, &e3b);
+@@ -2267,12 +2278,13 @@ int ext3_mb_init_backend(struct super_bl
i--;
goto err_freebuddy;
}
- memset(meta_group_info[j], 0, len);
set_bit(EXT3_GROUP_INFO_NEED_INIT_BIT,
&meta_group_info[j]->bb_state);
-- meta_group_info[j]->bb_free =
-- le16_to_cpu(desc->bg_free_blocks_count);
-+ meta_group_info[j]->bb_free = EXT3_BG_BLOCKS_FREE(sb, j, desc);
- }
- return 0;
-@@ -2397,6 +2410,7 @@ do_more:
+@@ -2936,9 +2948,17 @@ int ext3_mb_mark_diskspace_used(struct e
+ mb_set_bits(bitmap_bh->b_data, ac->ac_b_ex.fe_start, ac->ac_b_ex.fe_len);
+
+ spin_lock(sb_bgl_lock(sbi, ac->ac_b_ex.fe_group));
++ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
++ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_BLOCK_UNINIT);
++ gdp->bg_free_blocks_count =
++ cpu_to_le16(ext3_free_blocks_after_init(sb,
++ ac->ac_b_ex.fe_group,
++ gdp));
++ }
+ gdp->bg_free_blocks_count =
+ cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count)
+ - ac->ac_b_ex.fe_len);
++ gdp->bg_checksum = ext3_group_desc_csum(sbi, ac->ac_b_ex.fe_group, gdp);
+ spin_unlock(sb_bgl_lock(sbi, ac->ac_b_ex.fe_group));
+ percpu_counter_mod(&sbi->s_freeblocks_counter, - ac->ac_b_ex.fe_len);
+
+@@ -4303,6 +4323,7 @@ do_more:
spin_lock(sb_bgl_lock(sbi, block_group));
gdp->bg_free_blocks_count =
cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count) + count);
spin_unlock(sb_bgl_lock(sbi, block_group));
percpu_counter_mod(&sbi->s_freeblocks_counter, count);
-Index: linux-stage/fs/ext3/resize.c
+Index: linux-2.6.9-full/fs/ext3/balloc.c
===================================================================
---- linux-stage.orig/fs/ext3/resize.c 2007-03-14 04:44:13.000000000 -0400
-+++ linux-stage/fs/ext3/resize.c 2007-03-14 16:13:29.000000000 -0400
-@@ -807,6 +807,9 @@ int ext3_group_add(struct super_block *s
- gdp->bg_inode_table = cpu_to_le32(input->inode_table);
- gdp->bg_free_blocks_count = cpu_to_le16(input->free_blocks_count);
- gdp->bg_free_inodes_count = cpu_to_le16(EXT3_INODES_PER_GROUP(sb));
-+ spin_lock(sb_bgl_lock(sbi, input->group)); /* not strictly needed */
-+ gdp->bg_checksum = ext3_group_desc_csum(sbi, input->group, gdp);
-+ spin_unlock(sb_bgl_lock(sbi, input->group));
+--- linux-2.6.9-full.orig/fs/ext3/balloc.c 2007-03-28 15:45:41.000000000 +0400
++++ linux-2.6.9-full/fs/ext3/balloc.c 2007-03-28 18:36:16.000000000 +0400
+@@ -20,6 +20,7 @@
+ #include <linux/quotaops.h>
+ #include <linux/buffer_head.h>
- /*
- * Make the new blocks and inodes valid next. We do this before
-Index: linux-stage/fs/ext3/super.c
-===================================================================
---- linux-stage.orig/fs/ext3/super.c 2007-03-14 04:44:13.000000000 -0400
-+++ linux-stage/fs/ext3/super.c 2007-03-14 16:13:29.000000000 -0400
-@@ -1084,6 +1084,56 @@ static int ext3_setup_super(struct super
- return res;
++#include "group.h"
+ /*
+ * balloc.c contains the blocks allocation and deallocation routines
+ */
+@@ -73,6 +74,75 @@ struct ext3_group_desc * ext3_get_group_
+ return gdp + desc;
}
-+static __u16 crc16(__u16 crc, const u8 *buf, size_t len)
++/* Initializes an uninitialized block bitmap if given, and returns the
++ * number of blocks free in the group. */
++unsigned ext3_init_block_bitmap(struct super_block *sb, struct buffer_head *bh,
++ int block_group, struct ext3_group_desc *gdp)
+{
-+ __u16 tmp;
++ unsigned long start;
++ int bit, bit_max;
++ unsigned free_blocks;
++ struct ext3_sb_info *sbi = EXT3_SB(sb);
+
-+ while (len--) {
-+ crc ^= *buf++;
-+ crc ^= (u8)crc >> 4;
-+ tmp = (u8)crc;
-+ crc ^= (tmp ^ (tmp << 1)) << 4;
-+ }
-+ return crc;
-+}
++ if (bh) {
++ J_ASSERT_BH(bh, buffer_locked(bh));
+
-+__u16 ext3_group_desc_csum(struct ext3_sb_info *sbi, __u32 block_group,
-+ struct ext3_group_desc *gdp)
-+{
-+ __u16 crc = 0;
++ /* If checksum is bad mark all blocks used to prevent allocation,
++ * essentially implementing a per-group read-only flag. */
++ if (!ext3_group_desc_csum_verify(sbi, block_group, gdp)) {
++ ext3_error(sb, __FUNCTION__,
++ "Checksum bad for group %u\n", block_group);
++ gdp->bg_free_blocks_count = 0;
++ gdp->bg_free_inodes_count = 0;
++ gdp->bg_itable_unused = 0;
++ memset(bh->b_data, 0xff, sb->s_blocksize);
++ return 0;
++ }
++ memset(bh->b_data, 0, sb->s_blocksize);
++ }
+
-+#ifdef CONFIG_SMP
-+ J_ASSERT(spin_is_locked(sb_bgl_lock(sbi, block_group)));
-+#endif
-+ if (sbi->s_es->s_feature_ro_compat &
-+ cpu_to_le32(EXT4_FEATURE_RO_COMPAT_GDT_CSUM)) {
-+ int offset = offsetof(struct ext3_group_desc, bg_checksum);
++ /* Check for superblock and gdt backups in this group */
++ bit_max = ext3_bg_has_super(sb, block_group);
+
-+ block_group = cpu_to_le32(block_group);
-+ crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
-+ crc = crc16(crc, (__u8 *)&block_group, sizeof(block_group));
-+ crc = crc16(crc, (__u8 *)gdp, offset);
-+ offset += sizeof(gdp->bg_checksum); /* skip checksum */
-+ BUG_ON(offset != sizeof(*gdp)); /* XXX handle s_desc_size */
-+ /* for checksum of struct ext4_group_desc do the rest...
-+ if (offset < sbi->s_es->s_desc_size) {
-+ crc = crc16(crc, (__u8 *)gdp + offset,
-+ sbi->s_es->s_desc_size - offset);
-+ */
++ if (!EXT3_HAS_INCOMPAT_FEATURE(sb, EXT3_FEATURE_INCOMPAT_META_BG) ||
++ block_group < le32_to_cpu(sbi->s_es->s_first_meta_bg) *
++ sbi->s_desc_per_block) {
++ if (bit_max) {
++ bit_max += ext3_bg_num_gdb(sb, block_group);
++ bit_max +=le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks);
++ }
++ } else { /* For META_BG_BLOCK_GROUPS */
++ int group_rel = (block_group -
++ le32_to_cpu(sbi->s_es->s_first_meta_bg)) %
++ EXT3_DESC_PER_BLOCK(sb);
++ if (group_rel == 0 || group_rel == 1 ||
++ (group_rel == EXT3_DESC_PER_BLOCK(sb) - 1))
++ bit_max += 1;
+ }
+
-+ return cpu_to_le16(crc);
-+}
++ /* Last and first groups are always initialized */
++ free_blocks = EXT3_BLOCKS_PER_GROUP(sb) - bit_max;
+
-+int ext3_group_desc_csum_verify(struct ext3_sb_info *sbi, __u32 block_group,
-+ struct ext3_group_desc *gdp)
-+{
-+ if (gdp->bg_checksum != ext3_group_desc_csum(sbi, block_group, gdp))
-+ return 0;
++ if (bh) {
++ for (bit = 0; bit < bit_max; bit++)
++ ext3_set_bit(bit, bh->b_data);
+
-+ return 1;
-+}
++ start = block_group * EXT3_BLOCKS_PER_GROUP(sb) +
++ le32_to_cpu(sbi->s_es->s_first_data_block);
+
- /* Called at mount-time, super-block is locked */
- static int ext3_check_descriptors (struct super_block * sb)
- {
-@@ -1133,6 +1179,13 @@ static int ext3_check_descriptors (struc
- le32_to_cpu(gdp->bg_inode_table));
- return 0;
- }
-+ if (!ext3_group_desc_csum_verify(sbi, i, gdp)) {
-+ ext3_error(sb, __FUNCTION__,
-+ "Checksum for group %d failed (%u != %u)\n",
-+ i, ext3_group_desc_csum(sbi, i, gdp),
-+ gdp->bg_checksum);
-+ return 0;
-+ }
- block += EXT3_BLOCKS_PER_GROUP(sb);
- gdp++;
- }
-Index: linux-stage/include/linux/ext3_fs.h
-===================================================================
---- linux-stage.orig/include/linux/ext3_fs.h 2007-03-14 16:29:47.000000000 -0400
-+++ linux-stage/include/linux/ext3_fs.h 2007-03-14 16:37:23.000000000 -0400
-@@ -118,6 +118,26 @@ struct statfs;
- (s)->s_first_ino)
- #endif
-
-+/* Macro-instructions used to calculate Free inodes and blocks count.
-+ * Value is approximate for the blocks count until it is initialized. */
-+#define EXT3_BG_INODES_FREE(sb,gr,gdp) ((gdp)->bg_flags & \
-+ cpu_to_le16(EXT3_BG_INODE_UNINIT) ? \
-+ EXT3_INODES_PER_GROUP(sb) : \
-+ le16_to_cpu((gdp)->bg_itable_unused) + \
-+ le16_to_cpu((gdp)->bg_free_inodes_count))
-+#define EXT3_BG_BLOCKS_FREE(sb,gr,gdp) ((gdp)->bg_flags & \
-+ cpu_to_le16(EXT3_BG_BLOCK_UNINIT) ? \
-+ ext3_free_blocks_after_init(sb,gr,gdp) :\
-+ le16_to_cpu((gdp)->bg_free_blocks_count))
-+
-+/* When looking for groups to allocate from, we reduce the free blocks count
-+ * to avoid always picking uninitialized groups. Essentially, we don't start
-+ * allocating from uninitialized groups until other groups are 1/2 full. */
-+#define EXT3_BG_BLOCKS_PNLT(sb,gr,gdp) ((gdp)->bg_flags & \
-+ cpu_to_le16(EXT3_BG_BLOCK_UNINIT) ? \
-+ EXT3_BLOCKS_PER_GROUP(sb) / 2 : \
-+ le16_to_cpu((gdp)->bg_free_blocks_count))
++ /* Set bits for block and inode bitmaps, and inode table */
++ ext3_set_bit(le32_to_cpu(gdp->bg_block_bitmap) - start,
++ bh->b_data);
++ ext3_set_bit(le32_to_cpu(gdp->bg_inode_bitmap) - start,
++ bh->b_data);
++ for (bit = le32_to_cpu(gdp->bg_inode_table) - start,
++ bit_max = bit + sbi->s_itb_per_group; bit < bit_max; bit++)
++ ext3_set_bit(bit, bh->b_data);
++ }
+
- /*
- * Macro-instructions used to manage fragments
- */
-@@ -138,16 +148,22 @@ struct statfs;
- */
- struct ext3_group_desc
- {
-- __le32 bg_block_bitmap; /* Blocks bitmap block */
-- __le32 bg_inode_bitmap; /* Inodes bitmap block */
-+ __le32 bg_block_bitmap; /* Blocks bitmap block */
-+ __le32 bg_inode_bitmap; /* Inodes bitmap block */
- __le32 bg_inode_table; /* Inodes table block */
- __le16 bg_free_blocks_count; /* Free blocks count */
- __le16 bg_free_inodes_count; /* Free inodes count */
- __le16 bg_used_dirs_count; /* Directories count */
-- __u16 bg_pad;
-- __le32 bg_reserved[3];
-+ __le16 bg_flags; /* EXT3_BG_flags (UNINIT, etc) */
-+ __le32 bg_reserved[2]; /* Likely block/inode bitmap checksum */
-+ __le16 bg_itable_unused; /* Unused inodes count */
-+ __le16 bg_checksum; /* crc16(sb_uuid+group+desc) */
- };
-
-+#define EXT3_BG_INODE_UNINIT 0x0001 /* Inode table/bitmap not in use */
-+#define EXT3_BG_BLOCK_UNINIT 0x0002 /* Block bitmap not in use */
-+#define EXT3_BG_BLOCK_WRITTEN 0x0004 /* On-disk structures were overwritten */
++ return free_blocks - sbi->s_itb_per_group - 2;
++}
+
/*
- * Macro-instructions used to manage group descriptors
- */
-@@ -564,6 +581,7 @@ static inline struct ext3_inode_info *EX
- #define EXT3_FEATURE_RO_COMPAT_SPARSE_SUPER 0x0001
- #define EXT3_FEATURE_RO_COMPAT_LARGE_FILE 0x0002
- #define EXT3_FEATURE_RO_COMPAT_BTREE_DIR 0x0004
-+#define EXT4_FEATURE_RO_COMPAT_GDT_CSUM 0x0010
- #define EXT4_FEATURE_RO_COMPAT_DIR_NLINK 0x0020
+ * Read the bitmap for a given block_group, reading into the specified
+ * slot in the superblock's bitmap cache.
+@@ -88,7 +158,19 @@ read_block_bitmap(struct super_block *sb
+ desc = ext3_get_group_desc (sb, block_group, NULL);
+ if (!desc)
+ goto error_out;
+- bh = sb_bread(sb, le32_to_cpu(desc->bg_block_bitmap));
++ if (desc->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT)) {
++ bh = sb_getblk(sb, le32_to_cpu(desc->bg_block_bitmap));
++ if (!buffer_uptodate(bh)) {
++ lock_buffer(bh);
++ if (!buffer_uptodate(bh)) {
++ ext3_init_block_bitmap(sb, bh,block_group,desc);
++ set_buffer_uptodate(bh);
++ }
++ unlock_buffer(bh);
++ }
++ } else {
++ bh = sb_bread(sb, le32_to_cpu(desc->bg_block_bitmap));
++ }
+ if (!bh)
+ ext3_error (sb, "read_block_bitmap",
+ "Cannot read block bitmap - "
+@@ -429,6 +511,7 @@ do_more:
+ gdp->bg_free_blocks_count =
+ cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count) +
+ *pdquot_freed_blocks);
++ gdp->bg_checksum = ext3_group_desc_csum(sbi, block_group, gdp);
+ spin_unlock(sb_bgl_lock(sbi, block_group));
+ percpu_counter_mod(&sbi->s_freeblocks_counter, count);
- #define EXT3_FEATURE_INCOMPAT_COMPRESSION 0x0001
-@@ -580,6 +598,7 @@ static inline struct ext3_inode_info *EX
- EXT3_FEATURE_INCOMPAT_EXTENTS)
- #define EXT3_FEATURE_RO_COMPAT_SUPP (EXT3_FEATURE_RO_COMPAT_SPARSE_SUPER| \
- EXT3_FEATURE_RO_COMPAT_LARGE_FILE| \
-+ EXT4_FEATURE_RO_COMPAT_GDT_CSUM| \
- EXT4_FEATURE_RO_COMPAT_DIR_NLINK| \
- EXT3_FEATURE_RO_COMPAT_BTREE_DIR)
+@@ -1330,8 +1413,11 @@ allocated:
+ ret_block, goal_hits, goal_attempts);
-@@ -841,6 +860,16 @@ extern void ext3_unlockfs (struct super_
- extern void ext3_commit_super (struct super_block *, struct ext3_super_block *, int);
- extern int ext3_remount (struct super_block *, int *, char *);
- extern int ext3_statfs (struct super_block *, struct kstatfs *);
-+extern __u16 ext3_group_desc_csum(struct ext3_sb_info *sbi, __u32 group,
-+ struct ext3_group_desc *gdp);
-+extern int ext3_group_desc_csum_verify(struct ext3_sb_info *sbi, __u32 group,
-+ struct ext3_group_desc *gdp);
-+extern unsigned long ext3_free_blocks_after_init(struct super_block *sb,
-+ int block_group,
-+ struct ext3_group_desc *gdp);
-+extern void ext3_init_block_bitmap(struct super_block *sb,
-+ struct buffer_head *bh, int group,
-+ struct ext3_group_desc *desc);
+ spin_lock(sb_bgl_lock(sbi, group_no));
++ if (gdp->bg_flags & cpu_to_le16(EXT3_BG_BLOCK_UNINIT))
++ gdp->bg_flags &= cpu_to_le16(~EXT3_BG_BLOCK_UNINIT);
+ gdp->bg_free_blocks_count =
+ cpu_to_le16(le16_to_cpu(gdp->bg_free_blocks_count) - 1);
++ gdp->bg_checksum = ext3_group_desc_csum(sbi, group_no, gdp);
+ spin_unlock(sb_bgl_lock(sbi, group_no));
+ percpu_counter_mod(&sbi->s_freeblocks_counter, -1);
- #define ext3_std_error(sb, errno) \
- do { \
-
-%diffstat
- fs/ext3/balloc.c | 116 +++++++++++++++++++++++++++++++++++++++++--
- fs/ext3/ialloc.c | 85 ++++++++++++++++++++++---------
- fs/ext3/mballoc.c | 18 +++++-
- fs/ext3/resize.c | 1
- fs/ext3/super.c | 53 +++++++++++++++++++
- include/linux/ext3_fs.h | 36 +++++++++++--
- include/linux/ext3_fs.h.orig | 23 +++++++-
- 7 files changed, 294 insertions(+), 38 deletions(-)
-