diff options
Diffstat (limited to 'fs/btrfs/ctree.c')
-rw-r--r-- | fs/btrfs/ctree.c | 238 |
1 files changed, 178 insertions, 60 deletions
diff --git a/fs/btrfs/ctree.c b/fs/btrfs/ctree.c index 6795a713b205..c3df14ce2cc2 100644 --- a/fs/btrfs/ctree.c +++ b/fs/btrfs/ctree.c | |||
@@ -280,7 +280,8 @@ int btrfs_block_can_be_shared(struct btrfs_root *root, | |||
280 | static noinline int update_ref_for_cow(struct btrfs_trans_handle *trans, | 280 | static noinline int update_ref_for_cow(struct btrfs_trans_handle *trans, |
281 | struct btrfs_root *root, | 281 | struct btrfs_root *root, |
282 | struct extent_buffer *buf, | 282 | struct extent_buffer *buf, |
283 | struct extent_buffer *cow) | 283 | struct extent_buffer *cow, |
284 | int *last_ref) | ||
284 | { | 285 | { |
285 | u64 refs; | 286 | u64 refs; |
286 | u64 owner; | 287 | u64 owner; |
@@ -366,6 +367,7 @@ static noinline int update_ref_for_cow(struct btrfs_trans_handle *trans, | |||
366 | BUG_ON(ret); | 367 | BUG_ON(ret); |
367 | } | 368 | } |
368 | clean_tree_block(trans, root, buf); | 369 | clean_tree_block(trans, root, buf); |
370 | *last_ref = 1; | ||
369 | } | 371 | } |
370 | return 0; | 372 | return 0; |
371 | } | 373 | } |
@@ -392,6 +394,7 @@ static noinline int __btrfs_cow_block(struct btrfs_trans_handle *trans, | |||
392 | struct btrfs_disk_key disk_key; | 394 | struct btrfs_disk_key disk_key; |
393 | struct extent_buffer *cow; | 395 | struct extent_buffer *cow; |
394 | int level; | 396 | int level; |
397 | int last_ref = 0; | ||
395 | int unlock_orig = 0; | 398 | int unlock_orig = 0; |
396 | u64 parent_start; | 399 | u64 parent_start; |
397 | 400 | ||
@@ -442,7 +445,10 @@ static noinline int __btrfs_cow_block(struct btrfs_trans_handle *trans, | |||
442 | (unsigned long)btrfs_header_fsid(cow), | 445 | (unsigned long)btrfs_header_fsid(cow), |
443 | BTRFS_FSID_SIZE); | 446 | BTRFS_FSID_SIZE); |
444 | 447 | ||
445 | update_ref_for_cow(trans, root, buf, cow); | 448 | update_ref_for_cow(trans, root, buf, cow, &last_ref); |
449 | |||
450 | if (root->ref_cows) | ||
451 | btrfs_reloc_cow_block(trans, root, buf, cow); | ||
446 | 452 | ||
447 | if (buf == root->node) { | 453 | if (buf == root->node) { |
448 | WARN_ON(parent && parent != buf); | 454 | WARN_ON(parent && parent != buf); |
@@ -457,8 +463,8 @@ static noinline int __btrfs_cow_block(struct btrfs_trans_handle *trans, | |||
457 | extent_buffer_get(cow); | 463 | extent_buffer_get(cow); |
458 | spin_unlock(&root->node_lock); | 464 | spin_unlock(&root->node_lock); |
459 | 465 | ||
460 | btrfs_free_tree_block(trans, root, buf->start, buf->len, | 466 | btrfs_free_tree_block(trans, root, buf, parent_start, |
461 | parent_start, root->root_key.objectid, level); | 467 | last_ref); |
462 | free_extent_buffer(buf); | 468 | free_extent_buffer(buf); |
463 | add_root_to_dirty_list(root); | 469 | add_root_to_dirty_list(root); |
464 | } else { | 470 | } else { |
@@ -473,8 +479,8 @@ static noinline int __btrfs_cow_block(struct btrfs_trans_handle *trans, | |||
473 | btrfs_set_node_ptr_generation(parent, parent_slot, | 479 | btrfs_set_node_ptr_generation(parent, parent_slot, |
474 | trans->transid); | 480 | trans->transid); |
475 | btrfs_mark_buffer_dirty(parent); | 481 | btrfs_mark_buffer_dirty(parent); |
476 | btrfs_free_tree_block(trans, root, buf->start, buf->len, | 482 | btrfs_free_tree_block(trans, root, buf, parent_start, |
477 | parent_start, root->root_key.objectid, level); | 483 | last_ref); |
478 | } | 484 | } |
479 | if (unlock_orig) | 485 | if (unlock_orig) |
480 | btrfs_tree_unlock(buf); | 486 | btrfs_tree_unlock(buf); |
@@ -949,6 +955,22 @@ int btrfs_bin_search(struct extent_buffer *eb, struct btrfs_key *key, | |||
949 | return bin_search(eb, key, level, slot); | 955 | return bin_search(eb, key, level, slot); |
950 | } | 956 | } |
951 | 957 | ||
958 | static void root_add_used(struct btrfs_root *root, u32 size) | ||
959 | { | ||
960 | spin_lock(&root->accounting_lock); | ||
961 | btrfs_set_root_used(&root->root_item, | ||
962 | btrfs_root_used(&root->root_item) + size); | ||
963 | spin_unlock(&root->accounting_lock); | ||
964 | } | ||
965 | |||
966 | static void root_sub_used(struct btrfs_root *root, u32 size) | ||
967 | { | ||
968 | spin_lock(&root->accounting_lock); | ||
969 | btrfs_set_root_used(&root->root_item, | ||
970 | btrfs_root_used(&root->root_item) - size); | ||
971 | spin_unlock(&root->accounting_lock); | ||
972 | } | ||
973 | |||
952 | /* given a node and slot number, this reads the blocks it points to. The | 974 | /* given a node and slot number, this reads the blocks it points to. The |
953 | * extent buffer is returned with a reference taken (but unlocked). | 975 | * extent buffer is returned with a reference taken (but unlocked). |
954 | * NULL is returned on error. | 976 | * NULL is returned on error. |
@@ -1019,7 +1041,11 @@ static noinline int balance_level(struct btrfs_trans_handle *trans, | |||
1019 | btrfs_tree_lock(child); | 1041 | btrfs_tree_lock(child); |
1020 | btrfs_set_lock_blocking(child); | 1042 | btrfs_set_lock_blocking(child); |
1021 | ret = btrfs_cow_block(trans, root, child, mid, 0, &child); | 1043 | ret = btrfs_cow_block(trans, root, child, mid, 0, &child); |
1022 | BUG_ON(ret); | 1044 | if (ret) { |
1045 | btrfs_tree_unlock(child); | ||
1046 | free_extent_buffer(child); | ||
1047 | goto enospc; | ||
1048 | } | ||
1023 | 1049 | ||
1024 | spin_lock(&root->node_lock); | 1050 | spin_lock(&root->node_lock); |
1025 | root->node = child; | 1051 | root->node = child; |
@@ -1034,11 +1060,12 @@ static noinline int balance_level(struct btrfs_trans_handle *trans, | |||
1034 | btrfs_tree_unlock(mid); | 1060 | btrfs_tree_unlock(mid); |
1035 | /* once for the path */ | 1061 | /* once for the path */ |
1036 | free_extent_buffer(mid); | 1062 | free_extent_buffer(mid); |
1037 | ret = btrfs_free_tree_block(trans, root, mid->start, mid->len, | 1063 | |
1038 | 0, root->root_key.objectid, level); | 1064 | root_sub_used(root, mid->len); |
1065 | btrfs_free_tree_block(trans, root, mid, 0, 1); | ||
1039 | /* once for the root ptr */ | 1066 | /* once for the root ptr */ |
1040 | free_extent_buffer(mid); | 1067 | free_extent_buffer(mid); |
1041 | return ret; | 1068 | return 0; |
1042 | } | 1069 | } |
1043 | if (btrfs_header_nritems(mid) > | 1070 | if (btrfs_header_nritems(mid) > |
1044 | BTRFS_NODEPTRS_PER_BLOCK(root) / 4) | 1071 | BTRFS_NODEPTRS_PER_BLOCK(root) / 4) |
@@ -1088,23 +1115,16 @@ static noinline int balance_level(struct btrfs_trans_handle *trans, | |||
1088 | if (wret < 0 && wret != -ENOSPC) | 1115 | if (wret < 0 && wret != -ENOSPC) |
1089 | ret = wret; | 1116 | ret = wret; |
1090 | if (btrfs_header_nritems(right) == 0) { | 1117 | if (btrfs_header_nritems(right) == 0) { |
1091 | u64 bytenr = right->start; | ||
1092 | u32 blocksize = right->len; | ||
1093 | |||
1094 | clean_tree_block(trans, root, right); | 1118 | clean_tree_block(trans, root, right); |
1095 | btrfs_tree_unlock(right); | 1119 | btrfs_tree_unlock(right); |
1096 | free_extent_buffer(right); | ||
1097 | right = NULL; | ||
1098 | wret = del_ptr(trans, root, path, level + 1, pslot + | 1120 | wret = del_ptr(trans, root, path, level + 1, pslot + |
1099 | 1); | 1121 | 1); |
1100 | if (wret) | 1122 | if (wret) |
1101 | ret = wret; | 1123 | ret = wret; |
1102 | wret = btrfs_free_tree_block(trans, root, | 1124 | root_sub_used(root, right->len); |
1103 | bytenr, blocksize, 0, | 1125 | btrfs_free_tree_block(trans, root, right, 0, 1); |
1104 | root->root_key.objectid, | 1126 | free_extent_buffer(right); |
1105 | level); | 1127 | right = NULL; |
1106 | if (wret) | ||
1107 | ret = wret; | ||
1108 | } else { | 1128 | } else { |
1109 | struct btrfs_disk_key right_key; | 1129 | struct btrfs_disk_key right_key; |
1110 | btrfs_node_key(right, &right_key, 0); | 1130 | btrfs_node_key(right, &right_key, 0); |
@@ -1136,21 +1156,15 @@ static noinline int balance_level(struct btrfs_trans_handle *trans, | |||
1136 | BUG_ON(wret == 1); | 1156 | BUG_ON(wret == 1); |
1137 | } | 1157 | } |
1138 | if (btrfs_header_nritems(mid) == 0) { | 1158 | if (btrfs_header_nritems(mid) == 0) { |
1139 | /* we've managed to empty the middle node, drop it */ | ||
1140 | u64 bytenr = mid->start; | ||
1141 | u32 blocksize = mid->len; | ||
1142 | |||
1143 | clean_tree_block(trans, root, mid); | 1159 | clean_tree_block(trans, root, mid); |
1144 | btrfs_tree_unlock(mid); | 1160 | btrfs_tree_unlock(mid); |
1145 | free_extent_buffer(mid); | ||
1146 | mid = NULL; | ||
1147 | wret = del_ptr(trans, root, path, level + 1, pslot); | 1161 | wret = del_ptr(trans, root, path, level + 1, pslot); |
1148 | if (wret) | 1162 | if (wret) |
1149 | ret = wret; | 1163 | ret = wret; |
1150 | wret = btrfs_free_tree_block(trans, root, bytenr, blocksize, | 1164 | root_sub_used(root, mid->len); |
1151 | 0, root->root_key.objectid, level); | 1165 | btrfs_free_tree_block(trans, root, mid, 0, 1); |
1152 | if (wret) | 1166 | free_extent_buffer(mid); |
1153 | ret = wret; | 1167 | mid = NULL; |
1154 | } else { | 1168 | } else { |
1155 | /* update the parent key to reflect our changes */ | 1169 | /* update the parent key to reflect our changes */ |
1156 | struct btrfs_disk_key mid_key; | 1170 | struct btrfs_disk_key mid_key; |
@@ -1590,7 +1604,7 @@ read_block_for_search(struct btrfs_trans_handle *trans, | |||
1590 | btrfs_release_path(NULL, p); | 1604 | btrfs_release_path(NULL, p); |
1591 | 1605 | ||
1592 | ret = -EAGAIN; | 1606 | ret = -EAGAIN; |
1593 | tmp = read_tree_block(root, blocknr, blocksize, gen); | 1607 | tmp = read_tree_block(root, blocknr, blocksize, 0); |
1594 | if (tmp) { | 1608 | if (tmp) { |
1595 | /* | 1609 | /* |
1596 | * If the read above didn't mark this buffer up to date, | 1610 | * If the read above didn't mark this buffer up to date, |
@@ -1740,7 +1754,6 @@ again: | |||
1740 | p->nodes[level + 1], | 1754 | p->nodes[level + 1], |
1741 | p->slots[level + 1], &b); | 1755 | p->slots[level + 1], &b); |
1742 | if (err) { | 1756 | if (err) { |
1743 | free_extent_buffer(b); | ||
1744 | ret = err; | 1757 | ret = err; |
1745 | goto done; | 1758 | goto done; |
1746 | } | 1759 | } |
@@ -2076,6 +2089,8 @@ static noinline int insert_new_root(struct btrfs_trans_handle *trans, | |||
2076 | if (IS_ERR(c)) | 2089 | if (IS_ERR(c)) |
2077 | return PTR_ERR(c); | 2090 | return PTR_ERR(c); |
2078 | 2091 | ||
2092 | root_add_used(root, root->nodesize); | ||
2093 | |||
2079 | memset_extent_buffer(c, 0, 0, sizeof(struct btrfs_header)); | 2094 | memset_extent_buffer(c, 0, 0, sizeof(struct btrfs_header)); |
2080 | btrfs_set_header_nritems(c, 1); | 2095 | btrfs_set_header_nritems(c, 1); |
2081 | btrfs_set_header_level(c, level); | 2096 | btrfs_set_header_level(c, level); |
@@ -2134,6 +2149,7 @@ static int insert_ptr(struct btrfs_trans_handle *trans, struct btrfs_root | |||
2134 | int nritems; | 2149 | int nritems; |
2135 | 2150 | ||
2136 | BUG_ON(!path->nodes[level]); | 2151 | BUG_ON(!path->nodes[level]); |
2152 | btrfs_assert_tree_locked(path->nodes[level]); | ||
2137 | lower = path->nodes[level]; | 2153 | lower = path->nodes[level]; |
2138 | nritems = btrfs_header_nritems(lower); | 2154 | nritems = btrfs_header_nritems(lower); |
2139 | BUG_ON(slot > nritems); | 2155 | BUG_ON(slot > nritems); |
@@ -2202,6 +2218,8 @@ static noinline int split_node(struct btrfs_trans_handle *trans, | |||
2202 | if (IS_ERR(split)) | 2218 | if (IS_ERR(split)) |
2203 | return PTR_ERR(split); | 2219 | return PTR_ERR(split); |
2204 | 2220 | ||
2221 | root_add_used(root, root->nodesize); | ||
2222 | |||
2205 | memset_extent_buffer(split, 0, 0, sizeof(struct btrfs_header)); | 2223 | memset_extent_buffer(split, 0, 0, sizeof(struct btrfs_header)); |
2206 | btrfs_set_header_level(split, btrfs_header_level(c)); | 2224 | btrfs_set_header_level(split, btrfs_header_level(c)); |
2207 | btrfs_set_header_bytenr(split, split->start); | 2225 | btrfs_set_header_bytenr(split, split->start); |
@@ -2286,12 +2304,17 @@ noinline int btrfs_leaf_free_space(struct btrfs_root *root, | |||
2286 | return ret; | 2304 | return ret; |
2287 | } | 2305 | } |
2288 | 2306 | ||
2307 | /* | ||
2308 | * min slot controls the lowest index we're willing to push to the | ||
2309 | * right. We'll push up to and including min_slot, but no lower | ||
2310 | */ | ||
2289 | static noinline int __push_leaf_right(struct btrfs_trans_handle *trans, | 2311 | static noinline int __push_leaf_right(struct btrfs_trans_handle *trans, |
2290 | struct btrfs_root *root, | 2312 | struct btrfs_root *root, |
2291 | struct btrfs_path *path, | 2313 | struct btrfs_path *path, |
2292 | int data_size, int empty, | 2314 | int data_size, int empty, |
2293 | struct extent_buffer *right, | 2315 | struct extent_buffer *right, |
2294 | int free_space, u32 left_nritems) | 2316 | int free_space, u32 left_nritems, |
2317 | u32 min_slot) | ||
2295 | { | 2318 | { |
2296 | struct extent_buffer *left = path->nodes[0]; | 2319 | struct extent_buffer *left = path->nodes[0]; |
2297 | struct extent_buffer *upper = path->nodes[1]; | 2320 | struct extent_buffer *upper = path->nodes[1]; |
@@ -2309,7 +2332,7 @@ static noinline int __push_leaf_right(struct btrfs_trans_handle *trans, | |||
2309 | if (empty) | 2332 | if (empty) |
2310 | nr = 0; | 2333 | nr = 0; |
2311 | else | 2334 | else |
2312 | nr = 1; | 2335 | nr = max_t(u32, 1, min_slot); |
2313 | 2336 | ||
2314 | if (path->slots[0] >= left_nritems) | 2337 | if (path->slots[0] >= left_nritems) |
2315 | push_space += data_size; | 2338 | push_space += data_size; |
@@ -2415,6 +2438,9 @@ static noinline int __push_leaf_right(struct btrfs_trans_handle *trans, | |||
2415 | 2438 | ||
2416 | if (left_nritems) | 2439 | if (left_nritems) |
2417 | btrfs_mark_buffer_dirty(left); | 2440 | btrfs_mark_buffer_dirty(left); |
2441 | else | ||
2442 | clean_tree_block(trans, root, left); | ||
2443 | |||
2418 | btrfs_mark_buffer_dirty(right); | 2444 | btrfs_mark_buffer_dirty(right); |
2419 | 2445 | ||
2420 | btrfs_item_key(right, &disk_key, 0); | 2446 | btrfs_item_key(right, &disk_key, 0); |
@@ -2448,10 +2474,14 @@ out_unlock: | |||
2448 | * | 2474 | * |
2449 | * returns 1 if the push failed because the other node didn't have enough | 2475 | * returns 1 if the push failed because the other node didn't have enough |
2450 | * room, 0 if everything worked out and < 0 if there were major errors. | 2476 | * room, 0 if everything worked out and < 0 if there were major errors. |
2477 | * | ||
2478 | * this will push starting from min_slot to the end of the leaf. It won't | ||
2479 | * push any slot lower than min_slot | ||
2451 | */ | 2480 | */ |
2452 | static int push_leaf_right(struct btrfs_trans_handle *trans, struct btrfs_root | 2481 | static int push_leaf_right(struct btrfs_trans_handle *trans, struct btrfs_root |
2453 | *root, struct btrfs_path *path, int data_size, | 2482 | *root, struct btrfs_path *path, |
2454 | int empty) | 2483 | int min_data_size, int data_size, |
2484 | int empty, u32 min_slot) | ||
2455 | { | 2485 | { |
2456 | struct extent_buffer *left = path->nodes[0]; | 2486 | struct extent_buffer *left = path->nodes[0]; |
2457 | struct extent_buffer *right; | 2487 | struct extent_buffer *right; |
@@ -2493,8 +2523,8 @@ static int push_leaf_right(struct btrfs_trans_handle *trans, struct btrfs_root | |||
2493 | if (left_nritems == 0) | 2523 | if (left_nritems == 0) |
2494 | goto out_unlock; | 2524 | goto out_unlock; |
2495 | 2525 | ||
2496 | return __push_leaf_right(trans, root, path, data_size, empty, | 2526 | return __push_leaf_right(trans, root, path, min_data_size, empty, |
2497 | right, free_space, left_nritems); | 2527 | right, free_space, left_nritems, min_slot); |
2498 | out_unlock: | 2528 | out_unlock: |
2499 | btrfs_tree_unlock(right); | 2529 | btrfs_tree_unlock(right); |
2500 | free_extent_buffer(right); | 2530 | free_extent_buffer(right); |
@@ -2504,12 +2534,17 @@ out_unlock: | |||
2504 | /* | 2534 | /* |
2505 | * push some data in the path leaf to the left, trying to free up at | 2535 | * push some data in the path leaf to the left, trying to free up at |
2506 | * least data_size bytes. returns zero if the push worked, nonzero otherwise | 2536 | * least data_size bytes. returns zero if the push worked, nonzero otherwise |
2537 | * | ||
2538 | * max_slot can put a limit on how far into the leaf we'll push items. The | ||
2539 | * item at 'max_slot' won't be touched. Use (u32)-1 to make us do all the | ||
2540 | * items | ||
2507 | */ | 2541 | */ |
2508 | static noinline int __push_leaf_left(struct btrfs_trans_handle *trans, | 2542 | static noinline int __push_leaf_left(struct btrfs_trans_handle *trans, |
2509 | struct btrfs_root *root, | 2543 | struct btrfs_root *root, |
2510 | struct btrfs_path *path, int data_size, | 2544 | struct btrfs_path *path, int data_size, |
2511 | int empty, struct extent_buffer *left, | 2545 | int empty, struct extent_buffer *left, |
2512 | int free_space, int right_nritems) | 2546 | int free_space, u32 right_nritems, |
2547 | u32 max_slot) | ||
2513 | { | 2548 | { |
2514 | struct btrfs_disk_key disk_key; | 2549 | struct btrfs_disk_key disk_key; |
2515 | struct extent_buffer *right = path->nodes[0]; | 2550 | struct extent_buffer *right = path->nodes[0]; |
@@ -2528,9 +2563,9 @@ static noinline int __push_leaf_left(struct btrfs_trans_handle *trans, | |||
2528 | slot = path->slots[1]; | 2563 | slot = path->slots[1]; |
2529 | 2564 | ||
2530 | if (empty) | 2565 | if (empty) |
2531 | nr = right_nritems; | 2566 | nr = min(right_nritems, max_slot); |
2532 | else | 2567 | else |
2533 | nr = right_nritems - 1; | 2568 | nr = min(right_nritems - 1, max_slot); |
2534 | 2569 | ||
2535 | for (i = 0; i < nr; i++) { | 2570 | for (i = 0; i < nr; i++) { |
2536 | item = btrfs_item_nr(right, i); | 2571 | item = btrfs_item_nr(right, i); |
@@ -2660,6 +2695,8 @@ static noinline int __push_leaf_left(struct btrfs_trans_handle *trans, | |||
2660 | btrfs_mark_buffer_dirty(left); | 2695 | btrfs_mark_buffer_dirty(left); |
2661 | if (right_nritems) | 2696 | if (right_nritems) |
2662 | btrfs_mark_buffer_dirty(right); | 2697 | btrfs_mark_buffer_dirty(right); |
2698 | else | ||
2699 | clean_tree_block(trans, root, right); | ||
2663 | 2700 | ||
2664 | btrfs_item_key(right, &disk_key, 0); | 2701 | btrfs_item_key(right, &disk_key, 0); |
2665 | wret = fixup_low_keys(trans, root, path, &disk_key, 1); | 2702 | wret = fixup_low_keys(trans, root, path, &disk_key, 1); |
@@ -2669,8 +2706,6 @@ static noinline int __push_leaf_left(struct btrfs_trans_handle *trans, | |||
2669 | /* then fixup the leaf pointer in the path */ | 2706 | /* then fixup the leaf pointer in the path */ |
2670 | if (path->slots[0] < push_items) { | 2707 | if (path->slots[0] < push_items) { |
2671 | path->slots[0] += old_left_nritems; | 2708 | path->slots[0] += old_left_nritems; |
2672 | if (btrfs_header_nritems(path->nodes[0]) == 0) | ||
2673 | clean_tree_block(trans, root, path->nodes[0]); | ||
2674 | btrfs_tree_unlock(path->nodes[0]); | 2709 | btrfs_tree_unlock(path->nodes[0]); |
2675 | free_extent_buffer(path->nodes[0]); | 2710 | free_extent_buffer(path->nodes[0]); |
2676 | path->nodes[0] = left; | 2711 | path->nodes[0] = left; |
@@ -2691,10 +2726,14 @@ out: | |||
2691 | /* | 2726 | /* |
2692 | * push some data in the path leaf to the left, trying to free up at | 2727 | * push some data in the path leaf to the left, trying to free up at |
2693 | * least data_size bytes. returns zero if the push worked, nonzero otherwise | 2728 | * least data_size bytes. returns zero if the push worked, nonzero otherwise |
2729 | * | ||
2730 | * max_slot can put a limit on how far into the leaf we'll push items. The | ||
2731 | * item at 'max_slot' won't be touched. Use (u32)-1 to make us push all the | ||
2732 | * items | ||
2694 | */ | 2733 | */ |
2695 | static int push_leaf_left(struct btrfs_trans_handle *trans, struct btrfs_root | 2734 | static int push_leaf_left(struct btrfs_trans_handle *trans, struct btrfs_root |
2696 | *root, struct btrfs_path *path, int data_size, | 2735 | *root, struct btrfs_path *path, int min_data_size, |
2697 | int empty) | 2736 | int data_size, int empty, u32 max_slot) |
2698 | { | 2737 | { |
2699 | struct extent_buffer *right = path->nodes[0]; | 2738 | struct extent_buffer *right = path->nodes[0]; |
2700 | struct extent_buffer *left; | 2739 | struct extent_buffer *left; |
@@ -2740,8 +2779,9 @@ static int push_leaf_left(struct btrfs_trans_handle *trans, struct btrfs_root | |||
2740 | goto out; | 2779 | goto out; |
2741 | } | 2780 | } |
2742 | 2781 | ||
2743 | return __push_leaf_left(trans, root, path, data_size, | 2782 | return __push_leaf_left(trans, root, path, min_data_size, |
2744 | empty, left, free_space, right_nritems); | 2783 | empty, left, free_space, right_nritems, |
2784 | max_slot); | ||
2745 | out: | 2785 | out: |
2746 | btrfs_tree_unlock(left); | 2786 | btrfs_tree_unlock(left); |
2747 | free_extent_buffer(left); | 2787 | free_extent_buffer(left); |
@@ -2834,6 +2874,64 @@ static noinline int copy_for_split(struct btrfs_trans_handle *trans, | |||
2834 | } | 2874 | } |
2835 | 2875 | ||
2836 | /* | 2876 | /* |
2877 | * double splits happen when we need to insert a big item in the middle | ||
2878 | * of a leaf. A double split can leave us with 3 mostly empty leaves: | ||
2879 | * leaf: [ slots 0 - N] [ our target ] [ N + 1 - total in leaf ] | ||
2880 | * A B C | ||
2881 | * | ||
2882 | * We avoid this by trying to push the items on either side of our target | ||
2883 | * into the adjacent leaves. If all goes well we can avoid the double split | ||
2884 | * completely. | ||
2885 | */ | ||
2886 | static noinline int push_for_double_split(struct btrfs_trans_handle *trans, | ||
2887 | struct btrfs_root *root, | ||
2888 | struct btrfs_path *path, | ||
2889 | int data_size) | ||
2890 | { | ||
2891 | int ret; | ||
2892 | int progress = 0; | ||
2893 | int slot; | ||
2894 | u32 nritems; | ||
2895 | |||
2896 | slot = path->slots[0]; | ||
2897 | |||
2898 | /* | ||
2899 | * try to push all the items after our slot into the | ||
2900 | * right leaf | ||
2901 | */ | ||
2902 | ret = push_leaf_right(trans, root, path, 1, data_size, 0, slot); | ||
2903 | if (ret < 0) | ||
2904 | return ret; | ||
2905 | |||
2906 | if (ret == 0) | ||
2907 | progress++; | ||
2908 | |||
2909 | nritems = btrfs_header_nritems(path->nodes[0]); | ||
2910 | /* | ||
2911 | * our goal is to get our slot at the start or end of a leaf. If | ||
2912 | * we've done so we're done | ||
2913 | */ | ||
2914 | if (path->slots[0] == 0 || path->slots[0] == nritems) | ||
2915 | return 0; | ||
2916 | |||
2917 | if (btrfs_leaf_free_space(root, path->nodes[0]) >= data_size) | ||
2918 | return 0; | ||
2919 | |||
2920 | /* try to push all the items before our slot into the next leaf */ | ||
2921 | slot = path->slots[0]; | ||
2922 | ret = push_leaf_left(trans, root, path, 1, data_size, 0, slot); | ||
2923 | if (ret < 0) | ||
2924 | return ret; | ||
2925 | |||
2926 | if (ret == 0) | ||
2927 | progress++; | ||
2928 | |||
2929 | if (progress) | ||
2930 | return 0; | ||
2931 | return 1; | ||
2932 | } | ||
2933 | |||
2934 | /* | ||
2837 | * split the path's leaf in two, making sure there is at least data_size | 2935 | * split the path's leaf in two, making sure there is at least data_size |
2838 | * available for the resulting leaf level of the path. | 2936 | * available for the resulting leaf level of the path. |
2839 | * | 2937 | * |
@@ -2855,6 +2953,7 @@ static noinline int split_leaf(struct btrfs_trans_handle *trans, | |||
2855 | int wret; | 2953 | int wret; |
2856 | int split; | 2954 | int split; |
2857 | int num_doubles = 0; | 2955 | int num_doubles = 0; |
2956 | int tried_avoid_double = 0; | ||
2858 | 2957 | ||
2859 | l = path->nodes[0]; | 2958 | l = path->nodes[0]; |
2860 | slot = path->slots[0]; | 2959 | slot = path->slots[0]; |
@@ -2863,12 +2962,14 @@ static noinline int split_leaf(struct btrfs_trans_handle *trans, | |||
2863 | return -EOVERFLOW; | 2962 | return -EOVERFLOW; |
2864 | 2963 | ||
2865 | /* first try to make some room by pushing left and right */ | 2964 | /* first try to make some room by pushing left and right */ |
2866 | if (data_size && ins_key->type != BTRFS_DIR_ITEM_KEY) { | 2965 | if (data_size) { |
2867 | wret = push_leaf_right(trans, root, path, data_size, 0); | 2966 | wret = push_leaf_right(trans, root, path, data_size, |
2967 | data_size, 0, 0); | ||
2868 | if (wret < 0) | 2968 | if (wret < 0) |
2869 | return wret; | 2969 | return wret; |
2870 | if (wret) { | 2970 | if (wret) { |
2871 | wret = push_leaf_left(trans, root, path, data_size, 0); | 2971 | wret = push_leaf_left(trans, root, path, data_size, |
2972 | data_size, 0, (u32)-1); | ||
2872 | if (wret < 0) | 2973 | if (wret < 0) |
2873 | return wret; | 2974 | return wret; |
2874 | } | 2975 | } |
@@ -2902,6 +3003,8 @@ again: | |||
2902 | if (mid != nritems && | 3003 | if (mid != nritems && |
2903 | leaf_space_used(l, mid, nritems - mid) + | 3004 | leaf_space_used(l, mid, nritems - mid) + |
2904 | data_size > BTRFS_LEAF_DATA_SIZE(root)) { | 3005 | data_size > BTRFS_LEAF_DATA_SIZE(root)) { |
3006 | if (data_size && !tried_avoid_double) | ||
3007 | goto push_for_double; | ||
2905 | split = 2; | 3008 | split = 2; |
2906 | } | 3009 | } |
2907 | } | 3010 | } |
@@ -2918,6 +3021,8 @@ again: | |||
2918 | if (mid != nritems && | 3021 | if (mid != nritems && |
2919 | leaf_space_used(l, mid, nritems - mid) + | 3022 | leaf_space_used(l, mid, nritems - mid) + |
2920 | data_size > BTRFS_LEAF_DATA_SIZE(root)) { | 3023 | data_size > BTRFS_LEAF_DATA_SIZE(root)) { |
3024 | if (data_size && !tried_avoid_double) | ||
3025 | goto push_for_double; | ||
2921 | split = 2 ; | 3026 | split = 2 ; |
2922 | } | 3027 | } |
2923 | } | 3028 | } |
@@ -2932,10 +3037,10 @@ again: | |||
2932 | right = btrfs_alloc_free_block(trans, root, root->leafsize, 0, | 3037 | right = btrfs_alloc_free_block(trans, root, root->leafsize, 0, |
2933 | root->root_key.objectid, | 3038 | root->root_key.objectid, |
2934 | &disk_key, 0, l->start, 0); | 3039 | &disk_key, 0, l->start, 0); |
2935 | if (IS_ERR(right)) { | 3040 | if (IS_ERR(right)) |
2936 | BUG_ON(1); | ||
2937 | return PTR_ERR(right); | 3041 | return PTR_ERR(right); |
2938 | } | 3042 | |
3043 | root_add_used(root, root->leafsize); | ||
2939 | 3044 | ||
2940 | memset_extent_buffer(right, 0, 0, sizeof(struct btrfs_header)); | 3045 | memset_extent_buffer(right, 0, 0, sizeof(struct btrfs_header)); |
2941 | btrfs_set_header_bytenr(right, right->start); | 3046 | btrfs_set_header_bytenr(right, right->start); |
@@ -2998,6 +3103,13 @@ again: | |||
2998 | } | 3103 | } |
2999 | 3104 | ||
3000 | return ret; | 3105 | return ret; |
3106 | |||
3107 | push_for_double: | ||
3108 | push_for_double_split(trans, root, path, data_size); | ||
3109 | tried_avoid_double = 1; | ||
3110 | if (btrfs_leaf_free_space(root, path->nodes[0]) >= data_size) | ||
3111 | return 0; | ||
3112 | goto again; | ||
3001 | } | 3113 | } |
3002 | 3114 | ||
3003 | static noinline int setup_leaf_for_split(struct btrfs_trans_handle *trans, | 3115 | static noinline int setup_leaf_for_split(struct btrfs_trans_handle *trans, |
@@ -3054,7 +3166,8 @@ static noinline int setup_leaf_for_split(struct btrfs_trans_handle *trans, | |||
3054 | 3166 | ||
3055 | btrfs_set_path_blocking(path); | 3167 | btrfs_set_path_blocking(path); |
3056 | ret = split_leaf(trans, root, &key, path, ins_len, 1); | 3168 | ret = split_leaf(trans, root, &key, path, ins_len, 1); |
3057 | BUG_ON(ret); | 3169 | if (ret) |
3170 | goto err; | ||
3058 | 3171 | ||
3059 | path->keep_locks = 0; | 3172 | path->keep_locks = 0; |
3060 | btrfs_unlock_up_safe(path, 1); | 3173 | btrfs_unlock_up_safe(path, 1); |
@@ -3796,9 +3909,10 @@ static noinline int btrfs_del_leaf(struct btrfs_trans_handle *trans, | |||
3796 | */ | 3909 | */ |
3797 | btrfs_unlock_up_safe(path, 0); | 3910 | btrfs_unlock_up_safe(path, 0); |
3798 | 3911 | ||
3799 | ret = btrfs_free_tree_block(trans, root, leaf->start, leaf->len, | 3912 | root_sub_used(root, leaf->len); |
3800 | 0, root->root_key.objectid, 0); | 3913 | |
3801 | return ret; | 3914 | btrfs_free_tree_block(trans, root, leaf, 0, 1); |
3915 | return 0; | ||
3802 | } | 3916 | } |
3803 | /* | 3917 | /* |
3804 | * delete the item at the leaf level in path. If that empties | 3918 | * delete the item at the leaf level in path. If that empties |
@@ -3865,6 +3979,8 @@ int btrfs_del_items(struct btrfs_trans_handle *trans, struct btrfs_root *root, | |||
3865 | if (leaf == root->node) { | 3979 | if (leaf == root->node) { |
3866 | btrfs_set_header_level(leaf, 0); | 3980 | btrfs_set_header_level(leaf, 0); |
3867 | } else { | 3981 | } else { |
3982 | btrfs_set_path_blocking(path); | ||
3983 | clean_tree_block(trans, root, leaf); | ||
3868 | ret = btrfs_del_leaf(trans, root, path, leaf); | 3984 | ret = btrfs_del_leaf(trans, root, path, leaf); |
3869 | BUG_ON(ret); | 3985 | BUG_ON(ret); |
3870 | } | 3986 | } |
@@ -3890,13 +4006,15 @@ int btrfs_del_items(struct btrfs_trans_handle *trans, struct btrfs_root *root, | |||
3890 | extent_buffer_get(leaf); | 4006 | extent_buffer_get(leaf); |
3891 | 4007 | ||
3892 | btrfs_set_path_blocking(path); | 4008 | btrfs_set_path_blocking(path); |
3893 | wret = push_leaf_left(trans, root, path, 1, 1); | 4009 | wret = push_leaf_left(trans, root, path, 1, 1, |
4010 | 1, (u32)-1); | ||
3894 | if (wret < 0 && wret != -ENOSPC) | 4011 | if (wret < 0 && wret != -ENOSPC) |
3895 | ret = wret; | 4012 | ret = wret; |
3896 | 4013 | ||
3897 | if (path->nodes[0] == leaf && | 4014 | if (path->nodes[0] == leaf && |
3898 | btrfs_header_nritems(leaf)) { | 4015 | btrfs_header_nritems(leaf)) { |
3899 | wret = push_leaf_right(trans, root, path, 1, 1); | 4016 | wret = push_leaf_right(trans, root, path, 1, |
4017 | 1, 1, 0); | ||
3900 | if (wret < 0 && wret != -ENOSPC) | 4018 | if (wret < 0 && wret != -ENOSPC) |
3901 | ret = wret; | 4019 | ret = wret; |
3902 | } | 4020 | } |