提交 82e54229 编写于 作者: D Dmitry Monakhov 提交者: Theodore Ts'o

ext4: fix unwritten counter leakage

ext4_set_io_unwritten_flag() increments the i_unwritten counter, so
once we mark an end_io with EXT4_IO_END_UNWRITTEN we have to revert it
on the error path.

 - add missing error checks to prevent counter leakage
 - ext4_end_io_nolock() will clear the EXT4_IO_END_UNWRITTEN flag to
   signal that conversion has finished.
 - add BUG_ON to ext4_free_io_end() to prevent similar leakage in future.

The visible effect of this bug is that unaligned aio_stress may deadlock.
Reviewed-by: Jan Kara <jack@suse.cz>
Signed-off-by: Dmitry Monakhov <dmonakhov@openvz.org>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
上级 e27f41e1
...@@ -3633,6 +3633,8 @@ ext4_ext_handle_uninitialized_extents(handle_t *handle, struct inode *inode, ...@@ -3633,6 +3633,8 @@ ext4_ext_handle_uninitialized_extents(handle_t *handle, struct inode *inode,
if ((flags & EXT4_GET_BLOCKS_PRE_IO)) { if ((flags & EXT4_GET_BLOCKS_PRE_IO)) {
ret = ext4_split_unwritten_extents(handle, inode, map, ret = ext4_split_unwritten_extents(handle, inode, map,
path, flags); path, flags);
if (ret <= 0)
goto out;
/* /*
* Flag the inode(non aio case) or end_io struct (aio case) * Flag the inode(non aio case) or end_io struct (aio case)
* that this IO needs to conversion to written when IO is * that this IO needs to conversion to written when IO is
...@@ -3878,6 +3880,7 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode, ...@@ -3878,6 +3880,7 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode,
struct ext4_allocation_request ar; struct ext4_allocation_request ar;
ext4_io_end_t *io = ext4_inode_aio(inode); ext4_io_end_t *io = ext4_inode_aio(inode);
ext4_lblk_t cluster_offset; ext4_lblk_t cluster_offset;
int set_unwritten = 0;
ext_debug("blocks %u/%u requested for inode %lu\n", ext_debug("blocks %u/%u requested for inode %lu\n",
map->m_lblk, map->m_len, inode->i_ino); map->m_lblk, map->m_len, inode->i_ino);
...@@ -4100,13 +4103,8 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode, ...@@ -4100,13 +4103,8 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode,
* For non asycn direct IO case, flag the inode state * For non asycn direct IO case, flag the inode state
* that we need to perform conversion when IO is done. * that we need to perform conversion when IO is done.
*/ */
if ((flags & EXT4_GET_BLOCKS_PRE_IO)) { if ((flags & EXT4_GET_BLOCKS_PRE_IO))
if (io) set_unwritten = 1;
ext4_set_io_unwritten_flag(inode, io);
else
ext4_set_inode_state(inode,
EXT4_STATE_DIO_UNWRITTEN);
}
if (ext4_should_dioread_nolock(inode)) if (ext4_should_dioread_nolock(inode))
map->m_flags |= EXT4_MAP_UNINIT; map->m_flags |= EXT4_MAP_UNINIT;
} }
...@@ -4118,6 +4116,15 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode, ...@@ -4118,6 +4116,15 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode,
if (!err) if (!err)
err = ext4_ext_insert_extent(handle, inode, path, err = ext4_ext_insert_extent(handle, inode, path,
&newex, flags); &newex, flags);
if (!err && set_unwritten) {
if (io)
ext4_set_io_unwritten_flag(inode, io);
else
ext4_set_inode_state(inode,
EXT4_STATE_DIO_UNWRITTEN);
}
if (err && free_on_err) { if (err && free_on_err) {
int fb_flags = flags & EXT4_GET_BLOCKS_DELALLOC_RESERVE ? int fb_flags = flags & EXT4_GET_BLOCKS_DELALLOC_RESERVE ?
EXT4_FREE_BLOCKS_NO_QUOT_UPDATE : 0; EXT4_FREE_BLOCKS_NO_QUOT_UPDATE : 0;
......
...@@ -71,6 +71,8 @@ void ext4_free_io_end(ext4_io_end_t *io) ...@@ -71,6 +71,8 @@ void ext4_free_io_end(ext4_io_end_t *io)
int i; int i;
BUG_ON(!io); BUG_ON(!io);
BUG_ON(io->flag & EXT4_IO_END_UNWRITTEN);
if (io->page) if (io->page)
put_page(io->page); put_page(io->page);
for (i = 0; i < io->num_io_pages; i++) for (i = 0; i < io->num_io_pages; i++)
...@@ -94,6 +96,8 @@ int ext4_end_io_nolock(ext4_io_end_t *io) ...@@ -94,6 +96,8 @@ int ext4_end_io_nolock(ext4_io_end_t *io)
ssize_t size = io->size; ssize_t size = io->size;
int ret = 0; int ret = 0;
BUG_ON(!(io->flag & EXT4_IO_END_UNWRITTEN));
ext4_debug("ext4_end_io_nolock: io 0x%p from inode %lu,list->next 0x%p," ext4_debug("ext4_end_io_nolock: io 0x%p from inode %lu,list->next 0x%p,"
"list->prev 0x%p\n", "list->prev 0x%p\n",
io, inode->i_ino, io->list.next, io->list.prev); io, inode->i_ino, io->list.next, io->list.prev);
...@@ -106,7 +110,7 @@ int ext4_end_io_nolock(ext4_io_end_t *io) ...@@ -106,7 +110,7 @@ int ext4_end_io_nolock(ext4_io_end_t *io)
"(inode %lu, offset %llu, size %zd, error %d)", "(inode %lu, offset %llu, size %zd, error %d)",
inode->i_ino, offset, size, ret); inode->i_ino, offset, size, ret);
} }
io->flag &= ~EXT4_IO_END_UNWRITTEN;
if (io->iocb) if (io->iocb)
aio_complete(io->iocb, io->result, 0); aio_complete(io->iocb, io->result, 0);
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册