direct-io: Handle O_(D)SYNC AIO
Call generic_write_sync() from the deferred I/O completion handler if O_DSYNC is set for a write request. Also make sure various callers don't call generic_write_sync() if the direct I/O code returns -EIOCBQUEUED.

Based on an earlier patch from Jan Kara <jack@suse.cz> with updates from Jeff Moyer <jmoyer@redhat.com> and Darrick J. Wong <darrick.wong@oracle.com>.

Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Jan Kara <jack@suse.cz>
Signed-off-by: Al Viro <viro@zeniv.linux.org.uk>
This commit is contained in:
parent
7b7a8665ed
commit
02afc27fae
@ -1519,7 +1519,7 @@ ssize_t blkdev_aio_write(struct kiocb *iocb, const struct iovec *iov,
|
|||||||
|
|
||||||
blk_start_plug(&plug);
|
blk_start_plug(&plug);
|
||||||
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
||||||
if (ret > 0 || ret == -EIOCBQUEUED) {
|
if (ret > 0) {
|
||||||
ssize_t err;
|
ssize_t err;
|
||||||
|
|
||||||
err = generic_write_sync(file, pos, ret);
|
err = generic_write_sync(file, pos, ret);
|
||||||
|
@ -1727,7 +1727,7 @@ static ssize_t btrfs_file_aio_write(struct kiocb *iocb,
|
|||||||
*/
|
*/
|
||||||
BTRFS_I(inode)->last_trans = root->fs_info->generation + 1;
|
BTRFS_I(inode)->last_trans = root->fs_info->generation + 1;
|
||||||
BTRFS_I(inode)->last_sub_trans = root->log_transid;
|
BTRFS_I(inode)->last_sub_trans = root->log_transid;
|
||||||
if (num_written > 0 || num_written == -EIOCBQUEUED) {
|
if (num_written > 0) {
|
||||||
err = generic_write_sync(file, pos, num_written);
|
err = generic_write_sync(file, pos, num_written);
|
||||||
if (err < 0 && num_written > 0)
|
if (err < 0 && num_written > 0)
|
||||||
num_written = err;
|
num_written = err;
|
||||||
|
@ -2553,7 +2553,7 @@ cifs_writev(struct kiocb *iocb, const struct iovec *iov,
|
|||||||
mutex_unlock(&inode->i_mutex);
|
mutex_unlock(&inode->i_mutex);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (rc > 0 || rc == -EIOCBQUEUED) {
|
if (rc > 0) {
|
||||||
ssize_t err;
|
ssize_t err;
|
||||||
|
|
||||||
err = generic_write_sync(file, pos, rc);
|
err = generic_write_sync(file, pos, rc);
|
||||||
|
@ -266,8 +266,18 @@ static ssize_t dio_complete(struct dio *dio, loff_t offset, ssize_t ret,
|
|||||||
dio->end_io(dio->iocb, offset, transferred, dio->private);
|
dio->end_io(dio->iocb, offset, transferred, dio->private);
|
||||||
|
|
||||||
inode_dio_done(dio->inode);
|
inode_dio_done(dio->inode);
|
||||||
if (is_async)
|
if (is_async) {
|
||||||
|
if (dio->rw & WRITE) {
|
||||||
|
int err;
|
||||||
|
|
||||||
|
err = generic_write_sync(dio->iocb->ki_filp, offset,
|
||||||
|
transferred);
|
||||||
|
if (err < 0 && ret > 0)
|
||||||
|
ret = err;
|
||||||
|
}
|
||||||
|
|
||||||
aio_complete(dio->iocb, ret, 0);
|
aio_complete(dio->iocb, ret, 0);
|
||||||
|
}
|
||||||
|
|
||||||
kmem_cache_free(dio_cache, dio);
|
kmem_cache_free(dio_cache, dio);
|
||||||
return ret;
|
return ret;
|
||||||
@ -1182,11 +1192,6 @@ do_blockdev_direct_IO(int rw, struct kiocb *iocb, struct inode *inode,
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
|
||||||
* Will be decremented at I/O completion time.
|
|
||||||
*/
|
|
||||||
atomic_inc(&inode->i_dio_count);
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* For file extending writes updating i_size before data
|
* For file extending writes updating i_size before data
|
||||||
* writeouts complete can expose uninitialized blocks. So
|
* writeouts complete can expose uninitialized blocks. So
|
||||||
@ -1195,11 +1200,33 @@ do_blockdev_direct_IO(int rw, struct kiocb *iocb, struct inode *inode,
|
|||||||
*/
|
*/
|
||||||
dio->is_async = !is_sync_kiocb(iocb) && !((rw & WRITE) &&
|
dio->is_async = !is_sync_kiocb(iocb) && !((rw & WRITE) &&
|
||||||
(end > i_size_read(inode)));
|
(end > i_size_read(inode)));
|
||||||
|
|
||||||
retval = 0;
|
|
||||||
|
|
||||||
dio->inode = inode;
|
dio->inode = inode;
|
||||||
dio->rw = rw;
|
dio->rw = rw;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* For AIO O_(D)SYNC writes we need to defer completions to a workqueue
|
||||||
|
* so that we can call ->fsync.
|
||||||
|
*/
|
||||||
|
if (dio->is_async && (rw & WRITE) &&
|
||||||
|
((iocb->ki_filp->f_flags & O_DSYNC) ||
|
||||||
|
IS_SYNC(iocb->ki_filp->f_mapping->host))) {
|
||||||
|
retval = dio_set_defer_completion(dio);
|
||||||
|
if (retval) {
|
||||||
|
/*
|
||||||
|
* We grab i_mutex only for reads so we don't have
|
||||||
|
* to release it here
|
||||||
|
*/
|
||||||
|
kmem_cache_free(dio_cache, dio);
|
||||||
|
goto out;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Will be decremented at I/O completion time.
|
||||||
|
*/
|
||||||
|
atomic_inc(&inode->i_dio_count);
|
||||||
|
|
||||||
|
retval = 0;
|
||||||
sdio.blkbits = blkbits;
|
sdio.blkbits = blkbits;
|
||||||
sdio.blkfactor = i_blkbits - blkbits;
|
sdio.blkfactor = i_blkbits - blkbits;
|
||||||
sdio.block_in_file = offset >> blkbits;
|
sdio.block_in_file = offset >> blkbits;
|
||||||
|
@ -149,7 +149,7 @@ ext4_file_dio_write(struct kiocb *iocb, const struct iovec *iov,
|
|||||||
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
||||||
mutex_unlock(&inode->i_mutex);
|
mutex_unlock(&inode->i_mutex);
|
||||||
|
|
||||||
if (ret > 0 || ret == -EIOCBQUEUED) {
|
if (ret > 0) {
|
||||||
ssize_t err;
|
ssize_t err;
|
||||||
|
|
||||||
err = generic_write_sync(file, pos, ret);
|
err = generic_write_sync(file, pos, ret);
|
||||||
|
@ -2550,7 +2550,7 @@ ssize_t generic_file_aio_write(struct kiocb *iocb, const struct iovec *iov,
|
|||||||
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
|
||||||
mutex_unlock(&inode->i_mutex);
|
mutex_unlock(&inode->i_mutex);
|
||||||
|
|
||||||
if (ret > 0 || ret == -EIOCBQUEUED) {
|
if (ret > 0) {
|
||||||
ssize_t err;
|
ssize_t err;
|
||||||
|
|
||||||
err = generic_write_sync(file, pos, ret);
|
err = generic_write_sync(file, pos, ret);
|
||||||
|
Loading…
Reference in New Issue
Block a user