diff options
Diffstat (limited to 'fs/xfs/linux-2.6/xfs_file.c')
-rw-r--r-- | fs/xfs/linux-2.6/xfs_file.c | 140 |
1 files changed, 117 insertions, 23 deletions
diff --git a/fs/xfs/linux-2.6/xfs_file.c b/fs/xfs/linux-2.6/xfs_file.c index 1eb561a10e26..6c283b7be8ab 100644 --- a/fs/xfs/linux-2.6/xfs_file.c +++ b/fs/xfs/linux-2.6/xfs_file.c | |||
@@ -35,6 +35,7 @@ | |||
35 | #include "xfs_dir2_sf.h" | 35 | #include "xfs_dir2_sf.h" |
36 | #include "xfs_dinode.h" | 36 | #include "xfs_dinode.h" |
37 | #include "xfs_inode.h" | 37 | #include "xfs_inode.h" |
38 | #include "xfs_inode_item.h" | ||
38 | #include "xfs_bmap.h" | 39 | #include "xfs_bmap.h" |
39 | #include "xfs_error.h" | 40 | #include "xfs_error.h" |
40 | #include "xfs_rw.h" | 41 | #include "xfs_rw.h" |
@@ -96,6 +97,120 @@ xfs_iozero( | |||
96 | return (-status); | 97 | return (-status); |
97 | } | 98 | } |
98 | 99 | ||
100 | /* | ||
101 | * We ignore the datasync flag here because a datasync is effectively | ||
102 | * identical to an fsync. That is, datasync implies that we need to write | ||
103 | * only the metadata needed to be able to access the data that is written | ||
104 | * if we crash after the call completes. Hence if we are writing beyond | ||
105 | * EOF we have to log the inode size change as well, which makes it a | ||
106 | * full fsync. If we don't write beyond EOF, the inode core will be | ||
107 | * clean in memory and so we don't need to log the inode, just like | ||
108 | * fsync. | ||
109 | */ | ||
110 | STATIC int | ||
111 | xfs_file_fsync( | ||
112 | struct file *file, | ||
113 | struct dentry *dentry, | ||
114 | int datasync) | ||
115 | { | ||
116 | struct xfs_inode *ip = XFS_I(dentry->d_inode); | ||
117 | struct xfs_trans *tp; | ||
118 | int error = 0; | ||
119 | int log_flushed = 0; | ||
120 | |||
121 | xfs_itrace_entry(ip); | ||
122 | |||
123 | if (XFS_FORCED_SHUTDOWN(ip->i_mount)) | ||
124 | return -XFS_ERROR(EIO); | ||
125 | |||
126 | xfs_iflags_clear(ip, XFS_ITRUNCATED); | ||
127 | |||
128 | /* | ||
129 | * We always need to make sure that the required inode state is safe on | ||
130 | * disk. The inode might be clean but we still might need to force the | ||
131 | * log because of committed transactions that haven't hit the disk yet. | ||
132 | * Likewise, there could be unflushed non-transactional changes to the | ||
133 | * inode core that have to go to disk and this requires us to issue | ||
134 | * a synchronous transaction to capture these changes correctly. | ||
135 | * | ||
136 | * This code relies on the assumption that if the i_update_core field | ||
137 | * of the inode is clear and the inode is unpinned then it is clean | ||
138 | * and no action is required. | ||
139 | */ | ||
140 | xfs_ilock(ip, XFS_ILOCK_SHARED); | ||
141 | |||
142 | if (ip->i_update_core) { | ||
143 | /* | ||
144 | * Kick off a transaction to log the inode core to get the | ||
145 | * updates. The sync transaction will also force the log. | ||
146 | */ | ||
147 | xfs_iunlock(ip, XFS_ILOCK_SHARED); | ||
148 | tp = xfs_trans_alloc(ip->i_mount, XFS_TRANS_FSYNC_TS); | ||
149 | error = xfs_trans_reserve(tp, 0, | ||
150 | XFS_FSYNC_TS_LOG_RES(ip->i_mount), 0, 0, 0); | ||
151 | if (error) { | ||
152 | xfs_trans_cancel(tp, 0); | ||
153 | return -error; | ||
154 | } | ||
155 | xfs_ilock(ip, XFS_ILOCK_EXCL); | ||
156 | |||
157 | /* | ||
158 | * Note - it's possible that we might have pushed ourselves out | ||
159 | * of the way during trans_reserve which would flush the inode. | ||
160 | * But there's no guarantee that the inode buffer has actually | ||
161 | * gone out yet (it's delwri). Plus the buffer could be pinned | ||
162 | * anyway if it's part of an inode in another recent | ||
163 | * transaction. So we play it safe and fire off the | ||
164 | * transaction anyway. | ||
165 | */ | ||
166 | xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL); | ||
167 | xfs_trans_ihold(tp, ip); | ||
168 | xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE); | ||
169 | xfs_trans_set_sync(tp); | ||
170 | error = _xfs_trans_commit(tp, 0, &log_flushed); | ||
171 | |||
172 | xfs_iunlock(ip, XFS_ILOCK_EXCL); | ||
173 | } else { | ||
174 | /* | ||
175 | * Timestamps/size haven't changed since last inode flush or | ||
176 | * inode transaction commit. That means either nothing got | ||
177 | * written or a transaction committed which caught the updates. | ||
178 | * If the latter happened and the transaction hasn't hit the | ||
179 | * disk yet, the inode will be still be pinned. If it is, | ||
180 | * force the log. | ||
181 | */ | ||
182 | xfs_iunlock(ip, XFS_ILOCK_SHARED); | ||
183 | if (xfs_ipincount(ip)) { | ||
184 | if (ip->i_itemp->ili_last_lsn) { | ||
185 | error = _xfs_log_force_lsn(ip->i_mount, | ||
186 | ip->i_itemp->ili_last_lsn, | ||
187 | XFS_LOG_SYNC, &log_flushed); | ||
188 | } else { | ||
189 | error = _xfs_log_force(ip->i_mount, | ||
190 | XFS_LOG_SYNC, &log_flushed); | ||
191 | } | ||
192 | } | ||
193 | } | ||
194 | |||
195 | if (ip->i_mount->m_flags & XFS_MOUNT_BARRIER) { | ||
196 | /* | ||
197 | * If the log write didn't issue an ordered tag we need | ||
198 | * to flush the disk cache for the data device now. | ||
199 | */ | ||
200 | if (!log_flushed) | ||
201 | xfs_blkdev_issue_flush(ip->i_mount->m_ddev_targp); | ||
202 | |||
203 | /* | ||
204 | * If this inode is on the RT dev we need to flush that | ||
205 | * cache as well. | ||
206 | */ | ||
207 | if (XFS_IS_REALTIME_INODE(ip)) | ||
208 | xfs_blkdev_issue_flush(ip->i_mount->m_rtdev_targp); | ||
209 | } | ||
210 | |||
211 | return -error; | ||
212 | } | ||
213 | |||
99 | STATIC ssize_t | 214 | STATIC ssize_t |
100 | xfs_file_aio_read( | 215 | xfs_file_aio_read( |
101 | struct kiocb *iocb, | 216 | struct kiocb *iocb, |
@@ -755,7 +870,8 @@ write_retry: | |||
755 | mutex_lock(&inode->i_mutex); | 870 | mutex_lock(&inode->i_mutex); |
756 | xfs_ilock(ip, iolock); | 871 | xfs_ilock(ip, iolock); |
757 | 872 | ||
758 | error2 = xfs_fsync(ip); | 873 | error2 = -xfs_file_fsync(file, file->f_path.dentry, |
874 | (file->f_flags & __O_SYNC) ? 0 : 1); | ||
759 | if (!error) | 875 | if (!error) |
760 | error = error2; | 876 | error = error2; |
761 | } | 877 | } |
@@ -826,28 +942,6 @@ xfs_file_release( | |||
826 | return -xfs_release(XFS_I(inode)); | 942 | return -xfs_release(XFS_I(inode)); |
827 | } | 943 | } |
828 | 944 | ||
829 | /* | ||
830 | * We ignore the datasync flag here because a datasync is effectively | ||
831 | * identical to an fsync. That is, datasync implies that we need to write | ||
832 | * only the metadata needed to be able to access the data that is written | ||
833 | * if we crash after the call completes. Hence if we are writing beyond | ||
834 | * EOF we have to log the inode size change as well, which makes it a | ||
835 | * full fsync. If we don't write beyond EOF, the inode core will be | ||
836 | * clean in memory and so we don't need to log the inode, just like | ||
837 | * fsync. | ||
838 | */ | ||
839 | STATIC int | ||
840 | xfs_file_fsync( | ||
841 | struct file *file, | ||
842 | struct dentry *dentry, | ||
843 | int datasync) | ||
844 | { | ||
845 | struct xfs_inode *ip = XFS_I(dentry->d_inode); | ||
846 | |||
847 | xfs_iflags_clear(ip, XFS_ITRUNCATED); | ||
848 | return -xfs_fsync(ip); | ||
849 | } | ||
850 | |||
851 | STATIC int | 945 | STATIC int |
852 | xfs_file_readdir( | 946 | xfs_file_readdir( |
853 | struct file *filp, | 947 | struct file *filp, |