Commit 6501a85b, authored by Andrew Morton, committed by Linus Torvalds

[PATCH] ext2: inode allocation race fix

ext2's inode allocator will call find_group_orlov(), which will return a
suitable blockgroup in which the inode should be allocated.  But by the time
we actually try to allocate an inode in that blockgroup, other CPUs could have
used up all of its free inodes.

When that happens, ext2 bogusly fails with "ext2_new_inode: Free inodes count
corrupted in group NN".


To fix this, we simply advance to the next blockgroup (wrapping around to
group 0 after the last one) when this rare race occurs.  Once all blockgroups
have been scanned without finding a free inode, we return -ENOSPC.


(This is slightly inaccurate: after we've scanned all blockgroups, there may
still be inodes available, because inodes may have been freed in blockgroups
we had already scanned.  This cannot be fixed without fs-wide locking.  The
effect is a slightly premature ENOSPC on a nearly-full filesystem.)
parent bc75ac4f
...@@ -489,17 +489,18 @@ static int find_group_other(struct super_block *sb, struct inode *parent) ...@@ -489,17 +489,18 @@ static int find_group_other(struct super_block *sb, struct inode *parent)
return group; return group;
} }
struct inode * ext2_new_inode(struct inode * dir, int mode) struct inode *ext2_new_inode(struct inode *dir, int mode)
{ {
struct super_block *sb; struct super_block *sb;
struct buffer_head *bitmap_bh = NULL; struct buffer_head *bitmap_bh = NULL;
struct buffer_head *bh2; struct buffer_head *bh2;
int group, i; int group, i;
ino_t ino; ino_t ino = 0;
struct inode * inode; struct inode * inode;
struct ext2_group_desc * desc; struct ext2_group_desc *gdp;
struct ext2_super_block * es; struct ext2_super_block *es;
struct ext2_inode_info *ei; struct ext2_inode_info *ei;
struct ext2_sb_info *sbi;
int err; int err;
sb = dir->i_sb; sb = dir->i_sb;
...@@ -508,36 +509,62 @@ struct inode * ext2_new_inode(struct inode * dir, int mode) ...@@ -508,36 +509,62 @@ struct inode * ext2_new_inode(struct inode * dir, int mode)
return ERR_PTR(-ENOMEM); return ERR_PTR(-ENOMEM);
ei = EXT2_I(inode); ei = EXT2_I(inode);
es = EXT2_SB(sb)->s_es; sbi = EXT2_SB(sb);
es = sbi->s_es;
repeat: repeat:
if (S_ISDIR(mode)) { if (S_ISDIR(mode)) {
if (test_opt (sb, OLDALLOC)) if (test_opt(sb, OLDALLOC))
group = find_group_dir(sb, dir); group = find_group_dir(sb, dir);
else else
group = find_group_orlov(sb, dir); group = find_group_orlov(sb, dir);
} else } else
group = find_group_other(sb, dir); group = find_group_other(sb, dir);
if (group == -1) {
err = -ENOSPC; err = -ENOSPC;
if (group == -1)
goto fail; goto fail;
}
err = -EIO; for (i = 0; i < sbi->s_groups_count; i++) {
gdp = ext2_get_group_desc(sb, group, &bh2);
brelse(bitmap_bh);
bitmap_bh = read_inode_bitmap(sb, group); bitmap_bh = read_inode_bitmap(sb, group);
if (!bitmap_bh) if (!bitmap_bh) {
err = -EIO;
goto fail2; goto fail2;
}
i = ext2_find_first_zero_bit((unsigned long *)bitmap_bh->b_data, i = ext2_find_first_zero_bit((unsigned long *)bitmap_bh->b_data,
EXT2_INODES_PER_GROUP(sb)); EXT2_INODES_PER_GROUP(sb));
if (i >= EXT2_INODES_PER_GROUP(sb)) if (i >= EXT2_INODES_PER_GROUP(sb)) {
goto bad_count; /*
* Rare race: find_group_xx() decided that there were
* free inodes in this group, but by the time we tried
* to allocate one, they're all gone. This can also
* occur because the counters which find_group_orlov()
* uses are approximate. So just go and search the
* next block group.
*/
if (++group == sbi->s_groups_count)
group = 0;
continue;
}
if (ext2_set_bit_atomic(sb_bgl_lock(EXT2_SB(sb), group), if (ext2_set_bit_atomic(sb_bgl_lock(EXT2_SB(sb), group),
i, (void *) bitmap_bh->b_data)) { i, bitmap_bh->b_data)) {
brelse(bitmap_bh); brelse(bitmap_bh);
bitmap_bh = NULL;
ext2_release_inode(sb, group, S_ISDIR(mode)); ext2_release_inode(sb, group, S_ISDIR(mode));
goto repeat; goto repeat;
} }
goto got;
}
/*
* Scanned all blockgroups.
*/
err = -ENOSPC;
goto fail2;
got:
mark_buffer_dirty(bitmap_bh); mark_buffer_dirty(bitmap_bh);
if (sb->s_flags & MS_SYNCHRONOUS) if (sb->s_flags & MS_SYNCHRONOUS)
sync_dirty_buffer(bitmap_bh); sync_dirty_buffer(bitmap_bh);
...@@ -605,8 +632,9 @@ struct inode * ext2_new_inode(struct inode * dir, int mode) ...@@ -605,8 +632,9 @@ struct inode * ext2_new_inode(struct inode * dir, int mode)
inode->i_generation = EXT2_SB(sb)->s_next_generation++; inode->i_generation = EXT2_SB(sb)->s_next_generation++;
insert_inode_hash(inode); insert_inode_hash(inode);
if(DQUOT_ALLOC_INODE(inode)) { if (DQUOT_ALLOC_INODE(inode)) {
DQUOT_DROP(inode); DQUOT_DROP(inode);
err = -ENOSPC;
goto fail3; goto fail3;
} }
err = ext2_init_acl(inode, dir); err = ext2_init_acl(inode, dir);
...@@ -631,21 +659,6 @@ struct inode * ext2_new_inode(struct inode * dir, int mode) ...@@ -631,21 +659,6 @@ struct inode * ext2_new_inode(struct inode * dir, int mode)
make_bad_inode(inode); make_bad_inode(inode);
iput(inode); iput(inode);
return ERR_PTR(err); return ERR_PTR(err);
bad_count:
brelse(bitmap_bh);
ext2_error (sb, "ext2_new_inode",
"Free inodes count corrupted in group %d",
group);
/* Is it really ENOSPC? */
err = -ENOSPC;
if (sb->s_flags & MS_RDONLY)
goto fail;
desc = ext2_get_group_desc (sb, group, &bh2);
desc->bg_free_inodes_count = 0;
mark_buffer_dirty(bh2);
goto repeat;
} }
unsigned long ext2_count_free_inodes (struct super_block * sb) unsigned long ext2_count_free_inodes (struct super_block * sb)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment