diff options
author | Andreas Gruenbacher <agruen@suse.de> | 2005-01-14 23:35:57 -0800 |
---|---|---|
committer | Linus Torvalds <torvalds@ppc970.osdl.org> | 2005-01-14 23:35:57 -0800 |
commit | fd1ea9abe35beaa2402b90b83a4c47135b086613 (patch) | |
tree | fae65165516b9faed78100cd3e9bb532a01c43d4 /fs/ext3/xattr.c | |
parent | 401494b1615efb1922a380226b0bea3eccb22ff3 (diff) | |
download | history-fd1ea9abe35beaa2402b90b83a4c47135b086613.tar.gz |
[PATCH] ext3/EA: Race in ext[23] xattr sharing code
Andrew Tridgell and Stephen C. Tweedie have reported two different Oopses
caused by a race condition in the mbcache, which is responsible for
extended attribute sharing in ext2 and ext3. Stephen tracked down the bug;
I did the fix.
Explanation:
The mbcache caches the locations and content hashes of xattr blocks. There
are two access strategies: [1] xattr block disposal via
mb_cache_entry_get(), [2] xattr block reuse (sharing) via
mb_cache_entry_find_{first,next}(). There is no locking between the two
methods, so between one mb_cache_entry_find_x and the next, a
mb_cache_entry_get might come in, unhash the cache entry, and change the
journaling state of the xattr buffer. Subsequently, two things can happen:
[a] the next mb_cache_entry_find_x may try to follow the mbcache hash chain
starting from the entry that has become unhashed, which now is a stale
pointer, [b] the block may have become deallocated, and then we try to
reuse it.
Fix this by converting the mbcache into a readers-writer style lock, and
protect all block accesses in ext2/ext3 by the mbcache entry lock. This
ensures that destroying blocks is an exclusive operation that may not
overlap xattr block reuse, while allowing multiple "re-users". Write
access to the xattr block's buffer is protected by the buffer lock.
Signed-off-by: Andreas Gruenbacher <agruen@suse.de>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Diffstat (limited to 'fs/ext3/xattr.c')
-rw-r--r-- | fs/ext3/xattr.c | 54 |
1 files changed, 29 insertions, 25 deletions
diff --git a/fs/ext3/xattr.c b/fs/ext3/xattr.c index 2fbb2336e7c992..bce5e0e0f01274 100644 --- a/fs/ext3/xattr.c +++ b/fs/ext3/xattr.c @@ -97,7 +97,6 @@ static int ext3_xattr_cache_insert(struct buffer_head *); static struct buffer_head *ext3_xattr_cache_find(handle_t *, struct inode *, struct ext3_xattr_header *, int *); -static void ext3_xattr_cache_remove(struct buffer_head *); static void ext3_xattr_rehash(struct ext3_xattr_header *, struct ext3_xattr_entry *); @@ -500,6 +499,7 @@ bad_block: ext3_error(sb, "ext3_xattr_set", /* Here we know that we can set the new attribute. */ if (header) { + struct mb_cache_entry *ce; int credits = 0; /* assert(header == HDR(bh)); */ @@ -511,14 +511,19 @@ bad_block: ext3_error(sb, "ext3_xattr_set", &credits); if (error) goto cleanup; + ce = mb_cache_entry_get(ext3_xattr_cache, bh->b_bdev, + bh->b_blocknr); lock_buffer(bh); if (header->h_refcount == cpu_to_le32(1)) { + if (ce) + mb_cache_entry_free(ce); ea_bdebug(bh, "modifying in-place"); - ext3_xattr_cache_remove(bh); /* keep the buffer locked while modifying it. */ } else { int offset; + if (ce) + mb_cache_entry_release(ce); unlock_buffer(bh); journal_release_buffer(handle, bh, credits); skip_get_write_access: @@ -725,6 +730,8 @@ getblk_failed: error = 0; if (old_bh && old_bh != new_bh) { + struct mb_cache_entry *ce; + /* * If there was an old block, and we are no longer using it, * release the old block. @@ -732,9 +739,13 @@ getblk_failed: error = ext3_journal_get_write_access(handle, old_bh); if (error) goto cleanup; + ce = mb_cache_entry_get(ext3_xattr_cache, old_bh->b_bdev, + old_bh->b_blocknr); lock_buffer(old_bh); if (HDR(old_bh)->h_refcount == cpu_to_le32(1)) { /* Free the old block. */ + if (ce) + mb_cache_entry_free(ce); ea_bdebug(old_bh, "freeing"); ext3_free_blocks(handle, inode, old_bh->b_blocknr, 1); @@ -747,6 +758,8 @@ getblk_failed: /* Decrement the refcount only. */ HDR(old_bh)->h_refcount = cpu_to_le32( le32_to_cpu(HDR(old_bh)->h_refcount) - 1); + if (ce) + mb_cache_entry_release(ce); DQUOT_FREE_BLOCK(inode, 1); ext3_journal_dirty_metadata(handle, old_bh); ea_bdebug(old_bh, "refcount now=%d", @@ -806,6 +819,7 @@ void ext3_xattr_delete_inode(handle_t *handle, struct inode *inode) { struct buffer_head *bh = NULL; + struct mb_cache_entry *ce; down_write(&EXT3_I(inode)->xattr_sem); if (!EXT3_I(inode)->i_file_acl) @@ -826,15 +840,19 @@ ext3_xattr_delete_inode(handle_t *handle, struct inode *inode) } if (ext3_journal_get_write_access(handle, bh) != 0) goto cleanup; + ce = mb_cache_entry_get(ext3_xattr_cache, bh->b_bdev, bh->b_blocknr); lock_buffer(bh); if (HDR(bh)->h_refcount == cpu_to_le32(1)) { - ext3_xattr_cache_remove(bh); + if (ce) + mb_cache_entry_free(ce); ext3_free_blocks(handle, inode, EXT3_I(inode)->i_file_acl, 1); get_bh(bh); ext3_forget(handle, 1, inode, bh, EXT3_I(inode)->i_file_acl); } else { HDR(bh)->h_refcount = cpu_to_le32( le32_to_cpu(HDR(bh)->h_refcount) - 1); + if (ce) + mb_cache_entry_release(ce); ext3_journal_dirty_metadata(handle, bh); if (IS_SYNC(inode)) handle->h_sync = 1; @@ -951,11 +969,18 @@ ext3_xattr_cache_find(handle_t *handle, struct inode *inode, if (!header->h_hash) return NULL; /* never share */ ea_idebug(inode, "looking for cached blocks [%x]", (int)hash); +again: ce = mb_cache_entry_find_first(ext3_xattr_cache, 0, inode->i_sb->s_bdev, hash); while (ce) { - struct buffer_head *bh = sb_bread(inode->i_sb, ce->e_block); + struct buffer_head *bh; + if (IS_ERR(ce)) { + if (PTR_ERR(ce) == -EAGAIN) + goto again; + break; + } + bh = sb_bread(inode->i_sb, ce->e_block); if (!bh) { ext3_error(inode->i_sb, "ext3_xattr_cache_find", "inode %ld: block %ld read error", @@ -986,27 +1011,6 @@ ext3_xattr_cache_find(handle_t *handle, struct inode *inode, return NULL; } -/* - * ext3_xattr_cache_remove() - * - * Remove the cache entry of a block from the cache. Called when a - * block becomes invalid. - */ -static void -ext3_xattr_cache_remove(struct buffer_head *bh) -{ - struct mb_cache_entry *ce; - - ce = mb_cache_entry_get(ext3_xattr_cache, bh->b_bdev, - bh->b_blocknr); - if (ce) { - ea_bdebug(bh, "removing (%d cache entries remaining)", - atomic_read(&ext3_xattr_cache->c_entry_count)-1); - mb_cache_entry_free(ce); - } else - ea_bdebug(bh, "no cache entry"); -} - #define NAME_HASH_SHIFT 5 #define VALUE_HASH_SHIFT 16 |