diff options
author | Dmitry Monakhov <dmonakhov@openvz.org> | 2012-09-29 00:58:26 -0400 |
---|---|---|
committer | Theodore Ts'o <tytso@mit.edu> | 2012-09-29 00:58:26 -0400 |
commit | 1f555cfa29e8f787d675e8390f88ce517a37271a (patch) | |
tree | df32d4fd9114f4cbe78fb490a12b21c6b538cf81 | |
parent | 1b65007e9870e0021397b548e8cd6bbc584f9152 (diff) |
ext4: serialize truncate with owerwrite DIO workers
Jan Kara have spotted interesting issue:
There are potential data corruption issue with direct IO overwrites
racing with truncate:
Like:
dio write truncate_task
->ext4_ext_direct_IO
->overwrite == 1
->down_read(&EXT4_I(inode)->i_data_sem);
->mutex_unlock(&inode->i_mutex);
->ext4_setattr()
->inode_dio_wait()
->truncate_setsize()
->ext4_truncate()
->down_write(&EXT4_I(inode)->i_data_sem);
->__blockdev_direct_IO
->ext4_get_block
->submit_io()
->up_read(&EXT4_I(inode)->i_data_sem);
# truncate data blocks, allocate them to
# other inode - bad stuff happens because
# dio is still in flight.
In order to serialize with truncate dio worker should grab extra i_dio_count
reference before drop i_mutex.
Reviewed-by: Jan Kara <jack@suse.cz>
Signed-off-by: Dmitry Monakhov <dmonakhov@openvz.org>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
-rw-r--r-- | fs/ext4/inode.c | 2 |
1 files changed, 2 insertions, 0 deletions
diff --git a/fs/ext4/inode.c b/fs/ext4/inode.c index 05ab70dd5c64..09308ad0f314 100644 --- a/fs/ext4/inode.c +++ b/fs/ext4/inode.c | |||
@@ -3010,6 +3010,7 @@ static ssize_t ext4_ext_direct_IO(int rw, struct kiocb *iocb, | |||
3010 | overwrite = *((int *)iocb->private); | 3010 | overwrite = *((int *)iocb->private); |
3011 | 3011 | ||
3012 | if (overwrite) { | 3012 | if (overwrite) { |
3013 | atomic_inc(&inode->i_dio_count); | ||
3013 | down_read(&EXT4_I(inode)->i_data_sem); | 3014 | down_read(&EXT4_I(inode)->i_data_sem); |
3014 | mutex_unlock(&inode->i_mutex); | 3015 | mutex_unlock(&inode->i_mutex); |
3015 | } | 3016 | } |
@@ -3107,6 +3108,7 @@ static ssize_t ext4_ext_direct_IO(int rw, struct kiocb *iocb, | |||
3107 | retake_lock: | 3108 | retake_lock: |
3108 | /* take i_mutex locking again if we do a ovewrite dio */ | 3109 | /* take i_mutex locking again if we do a ovewrite dio */ |
3109 | if (overwrite) { | 3110 | if (overwrite) { |
3111 | inode_dio_done(inode); | ||
3110 | up_read(&EXT4_I(inode)->i_data_sem); | 3112 | up_read(&EXT4_I(inode)->i_data_sem); |
3111 | mutex_lock(&inode->i_mutex); | 3113 | mutex_lock(&inode->i_mutex); |
3112 | } | 3114 | } |