aboutsummaryrefslogtreecommitdiffstats
path: root/fs/ext4
diff options
context:
space:
mode:
authorZheng Liu <wenqing.lz@taobao.com>2013-02-18 00:29:59 -0500
committerTheodore Ts'o <tytso@mit.edu>2013-02-18 00:29:59 -0500
commitd100eef2440fea13e4f09e88b1c8bcbca64beb9f (patch)
tree2451dc4582b43a30b414c89108b75148d48c9b57 /fs/ext4
parentf7fec032aa782d3fd7e51fbdf08aa3a296c01500 (diff)
ext4: lookup block mapping in extent status tree
After tracking all extent status, we already have a extent cache in memory. Every time we want to lookup a block mapping, we can first try to lookup it in extent status tree to avoid a potential disk I/O. A new function called ext4_es_lookup_extent is defined to finish this work. When we try to lookup a block mapping, we always call ext4_map_blocks and/or ext4_da_map_blocks. So in these functions we first try to lookup a block mapping in extent status tree. A new flag EXT4_GET_BLOCKS_NO_PUT_HOLE is used in ext4_da_map_blocks in order not to put a hole into extent status tree because this hole will be converted to delayed extent in the tree immediately. Signed-off-by: Zheng Liu <wenqing.lz@taobao.com> Signed-off-by: "Theodore Ts'o" <tytso@mit.edu> Cc: Jan kara <jack@suse.cz>
Diffstat (limited to 'fs/ext4')
-rw-r--r--fs/ext4/ext4.h2
-rw-r--r--fs/ext4/extents.c9
-rw-r--r--fs/ext4/extents_status.c60
-rw-r--r--fs/ext4/extents_status.h2
-rw-r--r--fs/ext4/inode.c66
5 files changed, 136 insertions, 3 deletions
diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h
index 5c31d6ac9500..329e7fba47d6 100644
--- a/fs/ext4/ext4.h
+++ b/fs/ext4/ext4.h
@@ -579,6 +579,8 @@ enum {
579#define EXT4_GET_BLOCKS_KEEP_SIZE 0x0080 579#define EXT4_GET_BLOCKS_KEEP_SIZE 0x0080
580 /* Do not take i_data_sem locking in ext4_map_blocks */ 580 /* Do not take i_data_sem locking in ext4_map_blocks */
581#define EXT4_GET_BLOCKS_NO_LOCK 0x0100 581#define EXT4_GET_BLOCKS_NO_LOCK 0x0100
582 /* Do not put hole in extent cache */
583#define EXT4_GET_BLOCKS_NO_PUT_HOLE 0x0200
582 584
583/* 585/*
584 * Flags used by ext4_free_blocks 586 * Flags used by ext4_free_blocks
diff --git a/fs/ext4/extents.c b/fs/ext4/extents.c
index be0b1b3eed97..b9d7a2363736 100644
--- a/fs/ext4/extents.c
+++ b/fs/ext4/extents.c
@@ -2167,6 +2167,9 @@ ext4_ext_put_gap_in_cache(struct inode *inode, struct ext4_ext_path *path,
2167 block, 2167 block,
2168 le32_to_cpu(ex->ee_block), 2168 le32_to_cpu(ex->ee_block),
2169 ext4_ext_get_actual_len(ex)); 2169 ext4_ext_get_actual_len(ex));
2170 if (!ext4_find_delalloc_range(inode, lblock, lblock + len - 1))
2171 ext4_es_insert_extent(inode, lblock, len, ~0,
2172 EXTENT_STATUS_HOLE);
2170 } else if (block >= le32_to_cpu(ex->ee_block) 2173 } else if (block >= le32_to_cpu(ex->ee_block)
2171 + ext4_ext_get_actual_len(ex)) { 2174 + ext4_ext_get_actual_len(ex)) {
2172 ext4_lblk_t next; 2175 ext4_lblk_t next;
@@ -2180,6 +2183,9 @@ ext4_ext_put_gap_in_cache(struct inode *inode, struct ext4_ext_path *path,
2180 block); 2183 block);
2181 BUG_ON(next == lblock); 2184 BUG_ON(next == lblock);
2182 len = next - lblock; 2185 len = next - lblock;
2186 if (!ext4_find_delalloc_range(inode, lblock, lblock + len - 1))
2187 ext4_es_insert_extent(inode, lblock, len, ~0,
2188 EXTENT_STATUS_HOLE);
2183 } else { 2189 } else {
2184 lblock = len = 0; 2190 lblock = len = 0;
2185 BUG(); 2191 BUG();
@@ -4018,7 +4024,8 @@ int ext4_ext_map_blocks(handle_t *handle, struct inode *inode,
4018 * put just found gap into cache to speed up 4024 * put just found gap into cache to speed up
4019 * subsequent requests 4025 * subsequent requests
4020 */ 4026 */
4021 ext4_ext_put_gap_in_cache(inode, path, map->m_lblk); 4027 if ((flags & EXT4_GET_BLOCKS_NO_PUT_HOLE) == 0)
4028 ext4_ext_put_gap_in_cache(inode, path, map->m_lblk);
4022 goto out2; 4029 goto out2;
4023 } 4030 }
4024 4031
diff --git a/fs/ext4/extents_status.c b/fs/ext4/extents_status.c
index 76f4351ea821..eeb893122d8d 100644
--- a/fs/ext4/extents_status.c
+++ b/fs/ext4/extents_status.c
@@ -461,6 +461,66 @@ error:
461 return err; 461 return err;
462} 462}
463 463
464/*
465 * ext4_es_lookup_extent() looks up an extent in extent status tree.
466 *
467 * ext4_es_lookup_extent is called by ext4_map_blocks/ext4_da_map_blocks.
468 *
469 * Return: 1 on found, 0 on not
470 */
471int ext4_es_lookup_extent(struct inode *inode, ext4_lblk_t lblk,
472 struct extent_status *es)
473{
474 struct ext4_es_tree *tree;
475 struct extent_status *es1 = NULL;
476 struct rb_node *node;
477 int found = 0;
478
479 trace_ext4_es_lookup_extent_enter(inode, lblk);
480 es_debug("lookup extent in block %u\n", lblk);
481
482 tree = &EXT4_I(inode)->i_es_tree;
483 read_lock(&EXT4_I(inode)->i_es_lock);
484
485 /* find extent in cache firstly */
486 es->es_lblk = es->es_len = es->es_pblk = 0;
487 if (tree->cache_es) {
488 es1 = tree->cache_es;
489 if (in_range(lblk, es1->es_lblk, es1->es_len)) {
490 es_debug("%u cached by [%u/%u)\n",
491 lblk, es1->es_lblk, es1->es_len);
492 found = 1;
493 goto out;
494 }
495 }
496
497 node = tree->root.rb_node;
498 while (node) {
499 es1 = rb_entry(node, struct extent_status, rb_node);
500 if (lblk < es1->es_lblk)
501 node = node->rb_left;
502 else if (lblk > ext4_es_end(es1))
503 node = node->rb_right;
504 else {
505 found = 1;
506 break;
507 }
508 }
509
510out:
511 if (found) {
512 BUG_ON(!es1);
513 es->es_lblk = es1->es_lblk;
514 es->es_len = es1->es_len;
515 es->es_pblk = es1->es_pblk;
516 }
517
518 read_unlock(&EXT4_I(inode)->i_es_lock);
519
520 trace_ext4_es_lookup_extent_exit(inode, es, found);
521 return found;
522}
523
464static int __es_remove_extent(struct ext4_es_tree *tree, ext4_lblk_t lblk, 524static int __es_remove_extent(struct ext4_es_tree *tree, ext4_lblk_t lblk,
465 ext4_lblk_t end) 525 ext4_lblk_t end)
466{ 526{
diff --git a/fs/ext4/extents_status.h b/fs/ext4/extents_status.h
index 3f69d097c6e7..8ffc90c784fa 100644
--- a/fs/ext4/extents_status.h
+++ b/fs/ext4/extents_status.h
@@ -53,6 +53,8 @@ extern int ext4_es_remove_extent(struct inode *inode, ext4_lblk_t lblk,
53 ext4_lblk_t len); 53 ext4_lblk_t len);
54extern void ext4_es_find_delayed_extent(struct inode *inode, ext4_lblk_t lblk, 54extern void ext4_es_find_delayed_extent(struct inode *inode, ext4_lblk_t lblk,
55 struct extent_status *es); 55 struct extent_status *es);
56extern int ext4_es_lookup_extent(struct inode *inode, ext4_lblk_t lblk,
57 struct extent_status *es);
56 58
57static inline int ext4_es_is_written(struct extent_status *es) 59static inline int ext4_es_is_written(struct extent_status *es)
58{ 60{
diff --git a/fs/ext4/inode.c b/fs/ext4/inode.c
index 576b586b61aa..95a0c62c5683 100644
--- a/fs/ext4/inode.c
+++ b/fs/ext4/inode.c
@@ -507,12 +507,33 @@ static pgoff_t ext4_num_dirty_pages(struct inode *inode, pgoff_t idx,
507int ext4_map_blocks(handle_t *handle, struct inode *inode, 507int ext4_map_blocks(handle_t *handle, struct inode *inode,
508 struct ext4_map_blocks *map, int flags) 508 struct ext4_map_blocks *map, int flags)
509{ 509{
510 struct extent_status es;
510 int retval; 511 int retval;
511 512
512 map->m_flags = 0; 513 map->m_flags = 0;
513 ext_debug("ext4_map_blocks(): inode %lu, flag %d, max_blocks %u," 514 ext_debug("ext4_map_blocks(): inode %lu, flag %d, max_blocks %u,"
514 "logical block %lu\n", inode->i_ino, flags, map->m_len, 515 "logical block %lu\n", inode->i_ino, flags, map->m_len,
515 (unsigned long) map->m_lblk); 516 (unsigned long) map->m_lblk);
517
518 /* Lookup extent status tree firstly */
519 if (ext4_es_lookup_extent(inode, map->m_lblk, &es)) {
520 if (ext4_es_is_written(&es) || ext4_es_is_unwritten(&es)) {
521 map->m_pblk = ext4_es_pblock(&es) +
522 map->m_lblk - es.es_lblk;
523 map->m_flags |= ext4_es_is_written(&es) ?
524 EXT4_MAP_MAPPED : EXT4_MAP_UNWRITTEN;
525 retval = es.es_len - (map->m_lblk - es.es_lblk);
526 if (retval > map->m_len)
527 retval = map->m_len;
528 map->m_len = retval;
529 } else if (ext4_es_is_delayed(&es) || ext4_es_is_hole(&es)) {
530 retval = 0;
531 } else {
532 BUG_ON(1);
533 }
534 goto found;
535 }
536
516 /* 537 /*
517 * Try to see if we can get the block without requesting a new 538 * Try to see if we can get the block without requesting a new
518 * file system block. 539 * file system block.
@@ -544,6 +565,7 @@ int ext4_map_blocks(handle_t *handle, struct inode *inode,
544 if (!(flags & EXT4_GET_BLOCKS_NO_LOCK)) 565 if (!(flags & EXT4_GET_BLOCKS_NO_LOCK))
545 up_read((&EXT4_I(inode)->i_data_sem)); 566 up_read((&EXT4_I(inode)->i_data_sem));
546 567
568found:
547 if (retval > 0 && map->m_flags & EXT4_MAP_MAPPED) { 569 if (retval > 0 && map->m_flags & EXT4_MAP_MAPPED) {
548 int ret = check_block_validity(inode, map); 570 int ret = check_block_validity(inode, map);
549 if (ret != 0) 571 if (ret != 0)
@@ -1743,6 +1765,7 @@ static int ext4_da_map_blocks(struct inode *inode, sector_t iblock,
1743 struct ext4_map_blocks *map, 1765 struct ext4_map_blocks *map,
1744 struct buffer_head *bh) 1766 struct buffer_head *bh)
1745{ 1767{
1768 struct extent_status es;
1746 int retval; 1769 int retval;
1747 sector_t invalid_block = ~((sector_t) 0xffff); 1770 sector_t invalid_block = ~((sector_t) 0xffff);
1748 1771
@@ -1753,6 +1776,42 @@ static int ext4_da_map_blocks(struct inode *inode, sector_t iblock,
1753 ext_debug("ext4_da_map_blocks(): inode %lu, max_blocks %u," 1776 ext_debug("ext4_da_map_blocks(): inode %lu, max_blocks %u,"
1754 "logical block %lu\n", inode->i_ino, map->m_len, 1777 "logical block %lu\n", inode->i_ino, map->m_len,
1755 (unsigned long) map->m_lblk); 1778 (unsigned long) map->m_lblk);
1779
1780 /* Lookup extent status tree firstly */
1781 if (ext4_es_lookup_extent(inode, iblock, &es)) {
1782
1783 if (ext4_es_is_hole(&es)) {
1784 retval = 0;
1785 down_read((&EXT4_I(inode)->i_data_sem));
1786 goto add_delayed;
1787 }
1788
1789 /*
1790 * Delayed extent could be allocated by fallocate.
1791 * So we need to check it.
1792 */
1793 if (ext4_es_is_delayed(&es) && !ext4_es_is_unwritten(&es)) {
1794 map_bh(bh, inode->i_sb, invalid_block);
1795 set_buffer_new(bh);
1796 set_buffer_delay(bh);
1797 return 0;
1798 }
1799
1800 map->m_pblk = ext4_es_pblock(&es) + iblock - es.es_lblk;
1801 retval = es.es_len - (iblock - es.es_lblk);
1802 if (retval > map->m_len)
1803 retval = map->m_len;
1804 map->m_len = retval;
1805 if (ext4_es_is_written(&es))
1806 map->m_flags |= EXT4_MAP_MAPPED;
1807 else if (ext4_es_is_unwritten(&es))
1808 map->m_flags |= EXT4_MAP_UNWRITTEN;
1809 else
1810 BUG_ON(1);
1811
1812 return retval;
1813 }
1814
1756 /* 1815 /*
1757 * Try to see if we can get the block without requesting a new 1816 * Try to see if we can get the block without requesting a new
1758 * file system block. 1817 * file system block.
@@ -1771,10 +1830,13 @@ static int ext4_da_map_blocks(struct inode *inode, sector_t iblock,
1771 map->m_flags |= EXT4_MAP_FROM_CLUSTER; 1830 map->m_flags |= EXT4_MAP_FROM_CLUSTER;
1772 retval = 0; 1831 retval = 0;
1773 } else if (ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS)) 1832 } else if (ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS))
1774 retval = ext4_ext_map_blocks(NULL, inode, map, 0); 1833 retval = ext4_ext_map_blocks(NULL, inode, map,
1834 EXT4_GET_BLOCKS_NO_PUT_HOLE);
1775 else 1835 else
1776 retval = ext4_ind_map_blocks(NULL, inode, map, 0); 1836 retval = ext4_ind_map_blocks(NULL, inode, map,
1837 EXT4_GET_BLOCKS_NO_PUT_HOLE);
1777 1838
1839add_delayed:
1778 if (retval == 0) { 1840 if (retval == 0) {
1779 int ret; 1841 int ret;
1780 /* 1842 /*