ext4: New inode allocation for FLEX_BG meta-data groups. This patch mostly controls the way inodes are allocated in order to make ialloc aware of flex_bg block group grouping. It achieves this by bypassing the Orlov allocator when block group meta-data are packed together through mke2fs. Since the impact on the block allocator is minimal, this patch should have little or no effect on other block allocation algorithms. By controlling the inode allocation, it can basically control where the initial search for new blocks begins and thus indirectly manipulate the block allocator. This allocator favors data and meta-data locality so the disk will gradually be filled from block group zero upward. This helps improve performance by reducing seek time. Since the group of inode tables within one flex_bg are treated as one giant inode table, uninitialized block groups would not need to partially initialize as many inode tables as with Orlov, which would help fsck time as the filesystem usage goes up. Signed-off-by: Jose R. Santos <jrs@us.ibm.com> Signed-off-by: Valerie Clement <valerie.clement@bull.net> Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>

commit: 772cb7c83ba256a11c7bf99a11bef3858d23767c [log] [tgz]
author: Jose R. Santos <jrs@us.ibm.com> Fri Jul 11 19:27:31 2008 -0400
committer: Theodore Ts'o <tytso@mit.edu> Fri Jul 11 19:27:31 2008 -0400
tree: a42b97e5cbd870a76b2646c2dcb658a92c53f637
parent: 736603ab297506f4396cb5af592004499950fcfd [diff] [blame]
diff --git a/fs/ext4/mballoc.c b/fs/ext4/mballoc.c
index b882868..5dcb826 100644
--- a/fs/ext4/mballoc.c
+++ b/fs/ext4/mballoc.c

@@ -2842,6 +2842,14 @@
 	spin_unlock(sb_bgl_lock(sbi, ac->ac_b_ex.fe_group));
 	percpu_counter_sub(&sbi->s_freeblocks_counter, ac->ac_b_ex.fe_len);
 
+	if (sbi->s_log_groups_per_flex) {
+		ext4_group_t flex_group = ext4_flex_group(sbi,
+							  ac->ac_b_ex.fe_group);
+		spin_lock(sb_bgl_lock(sbi, flex_group));
+		sbi->s_flex_groups[flex_group].free_blocks -= ac->ac_b_ex.fe_len;
+		spin_unlock(sb_bgl_lock(sbi, flex_group));
+	}
+
 	err = ext4_journal_dirty_metadata(handle, bitmap_bh);
 	if (err)
 		goto out_err;
@@ -4342,6 +4350,13 @@
 	spin_unlock(sb_bgl_lock(sbi, block_group));
 	percpu_counter_add(&sbi->s_freeblocks_counter, count);
 
+	if (sbi->s_log_groups_per_flex) {
+		ext4_group_t flex_group = ext4_flex_group(sbi, block_group);
+		spin_lock(sb_bgl_lock(sbi, flex_group));
+		sbi->s_flex_groups[flex_group].free_blocks += count;
+		spin_unlock(sb_bgl_lock(sbi, flex_group));
+	}
+
 	ext4_mb_release_desc(&e4b);
 
 	*freed += count;
commit	772cb7c83ba256a11c7bf99a11bef3858d23767c	[log] [tgz]
author	Jose R. Santos <jrs@us.ibm.com>	Fri Jul 11 19:27:31 2008 -0400
committer	Theodore Ts'o <tytso@mit.edu>	Fri Jul 11 19:27:31 2008 -0400
tree	a42b97e5cbd870a76b2646c2dcb658a92c53f637
parent	736603ab297506f4396cb5af592004499950fcfd [diff] [blame]