GFS2: Split data write & wait in fsync

Now that the data writing is part of fsync proper, we can split
the waiting part out and do it later on. This reduces the
number of waits that we do during fsync on average.

There is also no need to take the i_mutex unless we are flushing
metadata to disk, so we can move that to within the metadata
flushing code.

Signed-off-by: Steven Whitehouse <swhiteho@redhat.com>
This commit is contained in:
Steven Whitehouse 2011-07-27 10:58:48 +01:00
parent 4c28d33803
commit 2f0264d592

View File

@ -551,8 +551,16 @@ static int gfs2_close(struct inode *inode, struct file *file)
* @end: the end position in the file to sync * @end: the end position in the file to sync
* @datasync: set if we can ignore timestamp changes * @datasync: set if we can ignore timestamp changes
* *
* The VFS will flush data for us. We only need to worry * We split the data flushing here so that we don't wait for the data
* about metadata here. * until after we've also sent the metadata to disk. Note that for
* data=ordered, we will write & wait for the data at the log flush
* stage anyway, so this is unlikely to make much of a difference
* except in the data=writeback case.
*
* If the fdatawrite fails due to any reason except -EIO, we will
* continue the remainder of the fsync, although we'll still report
* the error at the end. This is to match filemap_write_and_wait_range()
* behaviour.
* *
* Returns: errno * Returns: errno
*/ */
@ -560,30 +568,36 @@ static int gfs2_close(struct inode *inode, struct file *file)
static int gfs2_fsync(struct file *file, loff_t start, loff_t end, static int gfs2_fsync(struct file *file, loff_t start, loff_t end,
int datasync) int datasync)
{ {
struct inode *inode = file->f_mapping->host; struct address_space *mapping = file->f_mapping;
struct inode *inode = mapping->host;
int sync_state = inode->i_state & (I_DIRTY_SYNC|I_DIRTY_DATASYNC); int sync_state = inode->i_state & (I_DIRTY_SYNC|I_DIRTY_DATASYNC);
struct gfs2_inode *ip = GFS2_I(inode); struct gfs2_inode *ip = GFS2_I(inode);
int ret; int ret, ret1 = 0;
ret = filemap_write_and_wait_range(inode->i_mapping, start, end); if (mapping->nrpages) {
if (ret) ret1 = filemap_fdatawrite_range(mapping, start, end);
return ret; if (ret1 == -EIO)
mutex_lock(&inode->i_mutex); return ret1;
}
if (datasync) if (datasync)
sync_state &= ~I_DIRTY_SYNC; sync_state &= ~I_DIRTY_SYNC;
if (sync_state) { if (sync_state) {
mutex_lock(&inode->i_mutex);
ret = sync_inode_metadata(inode, 1); ret = sync_inode_metadata(inode, 1);
if (ret) { if (ret) {
mutex_unlock(&inode->i_mutex); mutex_unlock(&inode->i_mutex);
return ret; return ret;
} }
gfs2_ail_flush(ip->i_gl); gfs2_ail_flush(ip->i_gl);
mutex_unlock(&inode->i_mutex);
} }
mutex_unlock(&inode->i_mutex); if (mapping->nrpages)
return 0; ret = filemap_fdatawait_range(mapping, start, end);
return ret ? ret : ret1;
} }
/** /**