aboutsummaryrefslogtreecommitdiffstats
path: root/fs/ocfs2
diff options
context:
space:
mode:
Diffstat (limited to 'fs/ocfs2')
-rw-r--r--fs/ocfs2/move_extents.c46
1 files changed, 26 insertions, 20 deletions
diff --git a/fs/ocfs2/move_extents.c b/fs/ocfs2/move_extents.c
index 800552168d8a..efc509b3af1f 100644
--- a/fs/ocfs2/move_extents.c
+++ b/fs/ocfs2/move_extents.c
@@ -44,6 +44,7 @@ struct ocfs2_move_extents_context {
44 struct inode *inode; 44 struct inode *inode;
45 struct file *file; 45 struct file *file;
46 int auto_defrag; 46 int auto_defrag;
47 int partial;
47 int credits; 48 int credits;
48 u32 new_phys_cpos; 49 u32 new_phys_cpos;
49 u32 clusters_moved; 50 u32 clusters_moved;
@@ -221,9 +222,9 @@ out:
221 * crash happens anywhere. 222 * crash happens anywhere.
222 */ 223 */
223static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context, 224static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
224 u32 cpos, u32 phys_cpos, u32 len, int ext_flags) 225 u32 cpos, u32 phys_cpos, u32 *len, int ext_flags)
225{ 226{
226 int ret, credits = 0, extra_blocks = 0; 227 int ret, credits = 0, extra_blocks = 0, partial = context->partial;
227 handle_t *handle; 228 handle_t *handle;
228 struct inode *inode = context->inode; 229 struct inode *inode = context->inode;
229 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb); 230 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
@@ -232,7 +233,7 @@ static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
232 u32 new_phys_cpos, new_len; 233 u32 new_phys_cpos, new_len;
233 u64 phys_blkno = ocfs2_clusters_to_blocks(inode->i_sb, phys_cpos); 234 u64 phys_blkno = ocfs2_clusters_to_blocks(inode->i_sb, phys_cpos);
234 235
235 if ((ext_flags & OCFS2_EXT_REFCOUNTED) && len) { 236 if ((ext_flags & OCFS2_EXT_REFCOUNTED) && *len) {
236 237
237 BUG_ON(!(OCFS2_I(inode)->ip_dyn_features & 238 BUG_ON(!(OCFS2_I(inode)->ip_dyn_features &
238 OCFS2_HAS_REFCOUNT_FL)); 239 OCFS2_HAS_REFCOUNT_FL));
@@ -249,7 +250,7 @@ static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
249 ret = ocfs2_prepare_refcount_change_for_del(inode, 250 ret = ocfs2_prepare_refcount_change_for_del(inode,
250 context->refcount_loc, 251 context->refcount_loc,
251 phys_blkno, 252 phys_blkno,
252 len, 253 *len,
253 &credits, 254 &credits,
254 &extra_blocks); 255 &extra_blocks);
255 if (ret) { 256 if (ret) {
@@ -258,7 +259,7 @@ static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
258 } 259 }
259 } 260 }
260 261
261 ret = ocfs2_lock_allocators_move_extents(inode, &context->et, len, 1, 262 ret = ocfs2_lock_allocators_move_extents(inode, &context->et, *len, 1,
262 &context->meta_ac, 263 &context->meta_ac,
263 &context->data_ac, 264 &context->data_ac,
264 extra_blocks, &credits); 265 extra_blocks, &credits);
@@ -291,7 +292,7 @@ static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
291 goto out_unlock_mutex; 292 goto out_unlock_mutex;
292 } 293 }
293 294
294 ret = __ocfs2_claim_clusters(handle, context->data_ac, 1, len, 295 ret = __ocfs2_claim_clusters(handle, context->data_ac, 1, *len,
295 &new_phys_cpos, &new_len); 296 &new_phys_cpos, &new_len);
296 if (ret) { 297 if (ret) {
297 mlog_errno(ret); 298 mlog_errno(ret);
@@ -299,33 +300,36 @@ static int ocfs2_defrag_extent(struct ocfs2_move_extents_context *context,
299 } 300 }
300 301
301 /* 302 /*
302 * we're not quite patient here to make multiple attempts for claiming 303 * allowing partial extent moving is kind of 'pros and cons', it makes
303 * enough clusters, failure to claim clusters per-requested is not a 304 * whole defragmentation less likely to fail, on the contrary, the bad
304 * disaster though, it can only mean partial range of defragmentation 305 * thing is it may make the fs even more fragmented after moving, let
305 * or extent movements gets gone, users anyway is able to have another 306 * userspace make a good decision here.
306 * try as they wish anytime, since they're going to be returned a
307 * '-ENOSPC' and completed length of this movement.
308 */ 307 */
309 if (new_len != len) { 308 if (new_len != *len) {
310 mlog(0, "len_claimed: %u, len: %u\n", new_len, len); 309 mlog(0, "len_claimed: %u, len: %u\n", new_len, *len);
311 context->range->me_flags &= ~OCFS2_MOVE_EXT_FL_COMPLETE; 310 if (!partial) {
312 ret = -ENOSPC; 311 context->range->me_flags &= ~OCFS2_MOVE_EXT_FL_COMPLETE;
313 goto out_commit; 312 ret = -ENOSPC;
313 goto out_commit;
314 }
314 } 315 }
315 316
316 mlog(0, "cpos: %u, phys_cpos: %u, new_phys_cpos: %u\n", cpos, 317 mlog(0, "cpos: %u, phys_cpos: %u, new_phys_cpos: %u\n", cpos,
317 phys_cpos, new_phys_cpos); 318 phys_cpos, new_phys_cpos);
318 319
319 ret = __ocfs2_move_extent(handle, context, cpos, len, phys_cpos, 320 ret = __ocfs2_move_extent(handle, context, cpos, new_len, phys_cpos,
320 new_phys_cpos, ext_flags); 321 new_phys_cpos, ext_flags);
321 if (ret) 322 if (ret)
322 mlog_errno(ret); 323 mlog_errno(ret);
323 324
325 if (partial && (new_len != *len))
326 *len = new_len;
327
324 /* 328 /*
325 * Here we should write the new page out first if we are 329 * Here we should write the new page out first if we are
326 * in write-back mode. 330 * in write-back mode.
327 */ 331 */
328 ret = ocfs2_cow_sync_writeback(inode->i_sb, context->inode, cpos, len); 332 ret = ocfs2_cow_sync_writeback(inode->i_sb, context->inode, cpos, *len);
329 if (ret) 333 if (ret)
330 mlog_errno(ret); 334 mlog_errno(ret);
331 335
@@ -926,7 +930,7 @@ static int __ocfs2_move_extents_range(struct buffer_head *di_bh,
926 cpos, phys_cpos, alloc_size, len_defraged); 930 cpos, phys_cpos, alloc_size, len_defraged);
927 931
928 ret = ocfs2_defrag_extent(context, cpos, phys_cpos, 932 ret = ocfs2_defrag_extent(context, cpos, phys_cpos,
929 alloc_size, flags); 933 &alloc_size, flags);
930 } else { 934 } else {
931 ret = ocfs2_move_extent(context, cpos, phys_cpos, 935 ret = ocfs2_move_extent(context, cpos, phys_cpos,
932 &new_phys_cpos, alloc_size, 936 &new_phys_cpos, alloc_size,
@@ -1101,6 +1105,8 @@ int ocfs2_ioctl_move_extents(struct file *filp, void __user *argp)
1101 * any thought? 1105 * any thought?
1102 */ 1106 */
1103 range.me_threshold = 1024 * 1024; 1107 range.me_threshold = 1024 * 1024;
1108 if (range.me_flags & OCFS2_MOVE_EXT_FL_PART_DEFRAG)
1109 context->partial = 1;
1104 } else { 1110 } else {
1105 /* 1111 /*
1106 * first best-effort attempt to validate and adjust the goal 1112 * first best-effort attempt to validate and adjust the goal