aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorMingming Cao <cmm@us.ibm.com>2009-09-28 15:49:08 -0400
committerTheodore Ts'o <tytso@mit.edu>2009-09-28 15:49:08 -0400
commit0031462b5b392f90d17f1d75abb795883c44e969 (patch)
treee8323861b8dede0f3ddbfc8324d650bf1f4fd74b
parent9f0ccfd8e07d61b413e6536ffa02fbf60d2e20d8 (diff)
ext4: Split uninitialized extents for direct I/O
When writing into an uninitialized extent via direct I/O, and the direct I/O doesn't exactly cover the uninitialized extent, split the extent into uninitialized and initialized extents before submitting the I/O. This avoids needing to deal with an ENOSPC error in the end_io callback that gets used for direct I/O. When the I/O is complete, the written extent will be marked as initialized. Signed-off-by: Mingming Cao <cmm@us.ibm.com> Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
-rw-r--r--fs/ext4/ext4.h22
-rw-r--r--fs/ext4/ext4_extents.h7
-rw-r--r--fs/ext4/extents.c423
-rw-r--r--fs/ext4/inode.c3
-rw-r--r--fs/ext4/migrate.c2
-rw-r--r--fs/ext4/move_extent.c4
6 files changed, 419 insertions, 42 deletions
diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h
index a58438e18d0b..2b4293aac162 100644
--- a/fs/ext4/ext4.h
+++ b/fs/ext4/ext4.h
@@ -128,6 +128,15 @@ struct mpage_da_data {
128 int retval; 128 int retval;
129}; 129};
130 130
131typedef struct ext4_io_end {
132 struct inode *inode; /* file being written to */
133 unsigned int flag; /* sync IO or AIO */
134 int error; /* I/O error code */
135 ext4_lblk_t offset; /* offset in the file */
136 size_t size; /* size of the extent */
137 struct work_struct work; /* data work queue */
138} ext4_io_end_t;
139
131/* 140/*
132 * Special inodes numbers 141 * Special inodes numbers
133 */ 142 */
@@ -347,7 +356,16 @@ struct ext4_new_group_data {
347 /* Call ext4_da_update_reserve_space() after successfully 356 /* Call ext4_da_update_reserve_space() after successfully
348 allocating the blocks */ 357 allocating the blocks */
349#define EXT4_GET_BLOCKS_UPDATE_RESERVE_SPACE 0x0008 358#define EXT4_GET_BLOCKS_UPDATE_RESERVE_SPACE 0x0008
350 359 /* Caller is from the direct IO path: request creation of an
360 uninitialized extent if not allocated, or split the uninitialized
361 extent if blocks have been preallocated already */
362#define EXT4_GET_BLOCKS_DIO 0x0010
363#define EXT4_GET_BLOCKS_CONVERT 0x0020
364#define EXT4_GET_BLOCKS_DIO_CREATE_EXT (EXT4_GET_BLOCKS_DIO|\
365 EXT4_GET_BLOCKS_CREATE_UNINIT_EXT)
366 /* Convert extent to initialized after direct IO complete */
367#define EXT4_GET_BLOCKS_DIO_CONVERT_EXT (EXT4_GET_BLOCKS_CONVERT|\
368 EXT4_GET_BLOCKS_DIO_CREATE_EXT)
351 369
352/* 370/*
353 * ioctl commands 371 * ioctl commands
@@ -1700,6 +1718,8 @@ extern void ext4_ext_init(struct super_block *);
1700extern void ext4_ext_release(struct super_block *); 1718extern void ext4_ext_release(struct super_block *);
1701extern long ext4_fallocate(struct inode *inode, int mode, loff_t offset, 1719extern long ext4_fallocate(struct inode *inode, int mode, loff_t offset,
1702 loff_t len); 1720 loff_t len);
1721extern int ext4_convert_unwritten_extents(struct inode *inode, loff_t offset,
1722 loff_t len);
1703extern int ext4_get_blocks(handle_t *handle, struct inode *inode, 1723extern int ext4_get_blocks(handle_t *handle, struct inode *inode,
1704 sector_t block, unsigned int max_blocks, 1724 sector_t block, unsigned int max_blocks,
1705 struct buffer_head *bh, int flags); 1725 struct buffer_head *bh, int flags);
diff --git a/fs/ext4/ext4_extents.h b/fs/ext4/ext4_extents.h
index 61652f1d15e6..2ca686454e87 100644
--- a/fs/ext4/ext4_extents.h
+++ b/fs/ext4/ext4_extents.h
@@ -220,6 +220,11 @@ static inline int ext4_ext_get_actual_len(struct ext4_extent *ext)
220 (le16_to_cpu(ext->ee_len) - EXT_INIT_MAX_LEN)); 220 (le16_to_cpu(ext->ee_len) - EXT_INIT_MAX_LEN));
221} 221}
222 222
223static inline void ext4_ext_mark_initialized(struct ext4_extent *ext)
224{
225 ext->ee_len = cpu_to_le16(ext4_ext_get_actual_len(ext));
226}
227
223extern int ext4_ext_calc_metadata_amount(struct inode *inode, int blocks); 228extern int ext4_ext_calc_metadata_amount(struct inode *inode, int blocks);
224extern ext4_fsblk_t ext_pblock(struct ext4_extent *ex); 229extern ext4_fsblk_t ext_pblock(struct ext4_extent *ex);
225extern ext4_fsblk_t idx_pblock(struct ext4_extent_idx *); 230extern ext4_fsblk_t idx_pblock(struct ext4_extent_idx *);
@@ -235,7 +240,7 @@ extern int ext4_ext_try_to_merge(struct inode *inode,
235 struct ext4_ext_path *path, 240 struct ext4_ext_path *path,
236 struct ext4_extent *); 241 struct ext4_extent *);
237extern unsigned int ext4_ext_check_overlap(struct inode *, struct ext4_extent *, struct ext4_ext_path *); 242extern unsigned int ext4_ext_check_overlap(struct inode *, struct ext4_extent *, struct ext4_ext_path *);
238extern int ext4_ext_insert_extent(handle_t *, struct inode *, struct ext4_ext_path *, struct ext4_extent *); 243extern int ext4_ext_insert_extent(handle_t *, struct inode *, struct ext4_ext_path *, struct ext4_extent *, int);
239extern int ext4_ext_walk_space(struct inode *, ext4_lblk_t, ext4_lblk_t, 244extern int ext4_ext_walk_space(struct inode *, ext4_lblk_t, ext4_lblk_t,
240 ext_prepare_callback, void *); 245 ext_prepare_callback, void *);
241extern struct ext4_ext_path *ext4_ext_find_extent(struct inode *, ext4_lblk_t, 246extern struct ext4_ext_path *ext4_ext_find_extent(struct inode *, ext4_lblk_t,
diff --git a/fs/ext4/extents.c b/fs/ext4/extents.c
index 7a3832577923..a38e651c004e 100644
--- a/fs/ext4/extents.c
+++ b/fs/ext4/extents.c
@@ -723,7 +723,7 @@ err:
723 * insert new index [@logical;@ptr] into the block at @curp; 723 * insert new index [@logical;@ptr] into the block at @curp;
724 * check where to insert: before @curp or after @curp 724 * check where to insert: before @curp or after @curp
725 */ 725 */
726static int ext4_ext_insert_index(handle_t *handle, struct inode *inode, 726int ext4_ext_insert_index(handle_t *handle, struct inode *inode,
727 struct ext4_ext_path *curp, 727 struct ext4_ext_path *curp,
728 int logical, ext4_fsblk_t ptr) 728 int logical, ext4_fsblk_t ptr)
729{ 729{
@@ -1586,7 +1586,7 @@ out:
1586 */ 1586 */
1587int ext4_ext_insert_extent(handle_t *handle, struct inode *inode, 1587int ext4_ext_insert_extent(handle_t *handle, struct inode *inode,
1588 struct ext4_ext_path *path, 1588 struct ext4_ext_path *path,
1589 struct ext4_extent *newext) 1589 struct ext4_extent *newext, int flag)
1590{ 1590{
1591 struct ext4_extent_header *eh; 1591 struct ext4_extent_header *eh;
1592 struct ext4_extent *ex, *fex; 1592 struct ext4_extent *ex, *fex;
@@ -1602,7 +1602,8 @@ int ext4_ext_insert_extent(handle_t *handle, struct inode *inode,
1602 BUG_ON(path[depth].p_hdr == NULL); 1602 BUG_ON(path[depth].p_hdr == NULL);
1603 1603
1604 /* try to insert block into found extent and return */ 1604 /* try to insert block into found extent and return */
1605 if (ex && ext4_can_extents_be_merged(inode, ex, newext)) { 1605 if (ex && (flag != EXT4_GET_BLOCKS_DIO_CREATE_EXT)
1606 && ext4_can_extents_be_merged(inode, ex, newext)) {
1606 ext_debug("append [%d]%d block to %d:[%d]%d (from %llu)\n", 1607 ext_debug("append [%d]%d block to %d:[%d]%d (from %llu)\n",
1607 ext4_ext_is_uninitialized(newext), 1608 ext4_ext_is_uninitialized(newext),
1608 ext4_ext_get_actual_len(newext), 1609 ext4_ext_get_actual_len(newext),
@@ -1722,7 +1723,8 @@ has_space:
1722 1723
1723merge: 1724merge:
1724 /* try to merge extents to the right */ 1725 /* try to merge extents to the right */
1725 ext4_ext_try_to_merge(inode, path, nearex); 1726 if (flag != EXT4_GET_BLOCKS_DIO_CREATE_EXT)
1727 ext4_ext_try_to_merge(inode, path, nearex);
1726 1728
1727 /* try to merge extents to the left */ 1729 /* try to merge extents to the left */
1728 1730
@@ -2490,7 +2492,6 @@ static int ext4_ext_zeroout(struct inode *inode, struct ext4_extent *ex)
2490} 2492}
2491 2493
2492#define EXT4_EXT_ZERO_LEN 7 2494#define EXT4_EXT_ZERO_LEN 7
2493
2494/* 2495/*
2495 * This function is called by ext4_ext_get_blocks() if someone tries to write 2496 * This function is called by ext4_ext_get_blocks() if someone tries to write
2496 * to an uninitialized extent. It may result in splitting the uninitialized 2497 * to an uninitialized extent. It may result in splitting the uninitialized
@@ -2583,7 +2584,8 @@ static int ext4_ext_convert_to_initialized(handle_t *handle,
2583 ex3->ee_block = cpu_to_le32(iblock); 2584 ex3->ee_block = cpu_to_le32(iblock);
2584 ext4_ext_store_pblock(ex3, newblock); 2585 ext4_ext_store_pblock(ex3, newblock);
2585 ex3->ee_len = cpu_to_le16(allocated); 2586 ex3->ee_len = cpu_to_le16(allocated);
2586 err = ext4_ext_insert_extent(handle, inode, path, ex3); 2587 err = ext4_ext_insert_extent(handle, inode, path,
2588 ex3, 0);
2587 if (err == -ENOSPC) { 2589 if (err == -ENOSPC) {
2588 err = ext4_ext_zeroout(inode, &orig_ex); 2590 err = ext4_ext_zeroout(inode, &orig_ex);
2589 if (err) 2591 if (err)
@@ -2639,7 +2641,7 @@ static int ext4_ext_convert_to_initialized(handle_t *handle,
2639 ext4_ext_store_pblock(ex3, newblock + max_blocks); 2641 ext4_ext_store_pblock(ex3, newblock + max_blocks);
2640 ex3->ee_len = cpu_to_le16(allocated - max_blocks); 2642 ex3->ee_len = cpu_to_le16(allocated - max_blocks);
2641 ext4_ext_mark_uninitialized(ex3); 2643 ext4_ext_mark_uninitialized(ex3);
2642 err = ext4_ext_insert_extent(handle, inode, path, ex3); 2644 err = ext4_ext_insert_extent(handle, inode, path, ex3, 0);
2643 if (err == -ENOSPC) { 2645 if (err == -ENOSPC) {
2644 err = ext4_ext_zeroout(inode, &orig_ex); 2646 err = ext4_ext_zeroout(inode, &orig_ex);
2645 if (err) 2647 if (err)
@@ -2757,7 +2759,7 @@ static int ext4_ext_convert_to_initialized(handle_t *handle,
2757 err = ext4_ext_dirty(handle, inode, path + depth); 2759 err = ext4_ext_dirty(handle, inode, path + depth);
2758 goto out; 2760 goto out;
2759insert: 2761insert:
2760 err = ext4_ext_insert_extent(handle, inode, path, &newex); 2762 err = ext4_ext_insert_extent(handle, inode, path, &newex, 0);
2761 if (err == -ENOSPC) { 2763 if (err == -ENOSPC) {
2762 err = ext4_ext_zeroout(inode, &orig_ex); 2764 err = ext4_ext_zeroout(inode, &orig_ex);
2763 if (err) 2765 if (err)
@@ -2785,6 +2787,320 @@ fix_extent_len:
2785} 2787}
2786 2788
2787/* 2789/*
2790 * This function is called by ext4_ext_get_blocks() from
2791 * ext4_get_blocks_dio_write() when a direct I/O write targets
2792 * an uninitialized extent.
2793 *
2794 * Writing to an uninitialized extent may result in splitting the uninitialized
2795 * extent into multiple initialized/uninitialized extents (up to three).
2796 * There are three possibilities:
2797 * a> There is no split required: Entire extent should be uninitialized
2798 * b> Splits in two extents: Write is happening at either end of the extent
2799 * c> Splits in three extents: Someone is writing in middle of the extent
2800 *
2801 * One or more index blocks may be needed if the extent tree grows after
2802 * the uninitialized extent is split. To prevent ENOSPC from occurring at I/O
2803 * completion, we need to split the uninitialized extent before DIO submits
2804 * the I/O. The uninitialized extent passed in at this time will be split
2805 * into at most three uninitialized extents. After the I/O completes, the part
2806 * being filled will be converted to initialized by the end_io callback function
2807 * via ext4_convert_unwritten_extents().
2808 */
2809static int ext4_split_unwritten_extents(handle_t *handle,
2810 struct inode *inode,
2811 struct ext4_ext_path *path,
2812 ext4_lblk_t iblock,
2813 unsigned int max_blocks,
2814 int flags)
2815{
2816 struct ext4_extent *ex, newex, orig_ex;
2817 struct ext4_extent *ex1 = NULL;
2818 struct ext4_extent *ex2 = NULL;
2819 struct ext4_extent *ex3 = NULL;
2820 struct ext4_extent_header *eh;
2821 ext4_lblk_t ee_block;
2822 unsigned int allocated, ee_len, depth;
2823 ext4_fsblk_t newblock;
2824 int err = 0;
2825 int ret = 0;
2826
2827 ext_debug("ext4_split_unwritten_extents: inode %lu,"
2828 "iblock %llu, max_blocks %u\n", inode->i_ino,
2829 (unsigned long long)iblock, max_blocks);
2830 depth = ext_depth(inode);
2831 eh = path[depth].p_hdr;
2832 ex = path[depth].p_ext;
2833 ee_block = le32_to_cpu(ex->ee_block);
2834 ee_len = ext4_ext_get_actual_len(ex);
2835 allocated = ee_len - (iblock - ee_block);
2836 newblock = iblock - ee_block + ext_pblock(ex);
2837 ex2 = ex;
2838 orig_ex.ee_block = ex->ee_block;
2839 orig_ex.ee_len = cpu_to_le16(ee_len);
2840 ext4_ext_store_pblock(&orig_ex, ext_pblock(ex));
2841
2842 /*
2843 * if the entire uninitialized extent length is less than
2844 * the size of the extent to write, there is no need to split the
2845 * uninitialized extent
2846 */
2847 if (allocated <= max_blocks)
2848 return ret;
2849
2850 err = ext4_ext_get_access(handle, inode, path + depth);
2851 if (err)
2852 goto out;
2853 /* ex1: ee_block to iblock - 1 : uninitialized */
2854 if (iblock > ee_block) {
2855 ex1 = ex;
2856 ex1->ee_len = cpu_to_le16(iblock - ee_block);
2857 ext4_ext_mark_uninitialized(ex1);
2858 ex2 = &newex;
2859 }
2860 /*
2861 * for sanity, update the length of the ex2 extent before
2862 * we insert ex3, if ex1 is NULL. This is to avoid temporary
2863 * overlap of blocks.
2864 */
2865 if (!ex1 && allocated > max_blocks)
2866 ex2->ee_len = cpu_to_le16(max_blocks);
2867 /* ex3: to ee_block + ee_len : uninitialised */
2868 if (allocated > max_blocks) {
2869 unsigned int newdepth;
2870 ex3 = &newex;
2871 ex3->ee_block = cpu_to_le32(iblock + max_blocks);
2872 ext4_ext_store_pblock(ex3, newblock + max_blocks);
2873 ex3->ee_len = cpu_to_le16(allocated - max_blocks);
2874 ext4_ext_mark_uninitialized(ex3);
2875 err = ext4_ext_insert_extent(handle, inode, path, ex3, flags);
2876 if (err == -ENOSPC) {
2877 err = ext4_ext_zeroout(inode, &orig_ex);
2878 if (err)
2879 goto fix_extent_len;
2880 /* update the extent length and mark as initialized */
2881 ex->ee_block = orig_ex.ee_block;
2882 ex->ee_len = orig_ex.ee_len;
2883 ext4_ext_store_pblock(ex, ext_pblock(&orig_ex));
2884 ext4_ext_dirty(handle, inode, path + depth);
2885 /* zeroed the full extent */
2886 /* blocks available from iblock */
2887 return allocated;
2888
2889 } else if (err)
2890 goto fix_extent_len;
2891 /*
2892 * The depth, and hence eh & ex might change
2893 * as part of the insert above.
2894 */
2895 newdepth = ext_depth(inode);
2896 /*
2897 * update the extent length after successful insert of the
2898 * split extent
2899 */
2900 orig_ex.ee_len = cpu_to_le16(ee_len -
2901 ext4_ext_get_actual_len(ex3));
2902 depth = newdepth;
2903 ext4_ext_drop_refs(path);
2904 path = ext4_ext_find_extent(inode, iblock, path);
2905 if (IS_ERR(path)) {
2906 err = PTR_ERR(path);
2907 goto out;
2908 }
2909 eh = path[depth].p_hdr;
2910 ex = path[depth].p_ext;
2911 if (ex2 != &newex)
2912 ex2 = ex;
2913
2914 err = ext4_ext_get_access(handle, inode, path + depth);
2915 if (err)
2916 goto out;
2917
2918 allocated = max_blocks;
2919 }
2920 /*
2921 * If there was a change of depth as part of the
2922 * insertion of ex3 above, we need to update the length
2923 * of the ex1 extent again here
2924 */
2925 if (ex1 && ex1 != ex) {
2926 ex1 = ex;
2927 ex1->ee_len = cpu_to_le16(iblock - ee_block);
2928 ext4_ext_mark_uninitialized(ex1);
2929 ex2 = &newex;
2930 }
2931 /*
2932 * ex2: iblock to iblock + maxblocks-1 : to be direct IO written,
2933 * uninitialised still.
2934 */
2935 ex2->ee_block = cpu_to_le32(iblock);
2936 ext4_ext_store_pblock(ex2, newblock);
2937 ex2->ee_len = cpu_to_le16(allocated);
2938 ext4_ext_mark_uninitialized(ex2);
2939 if (ex2 != ex)
2940 goto insert;
2941 /* Mark modified extent as dirty */
2942 err = ext4_ext_dirty(handle, inode, path + depth);
2943 ext_debug("out here\n");
2944 goto out;
2945insert:
2946 err = ext4_ext_insert_extent(handle, inode, path, &newex, flags);
2947 if (err == -ENOSPC) {
2948 err = ext4_ext_zeroout(inode, &orig_ex);
2949 if (err)
2950 goto fix_extent_len;
2951 /* update the extent length and mark as initialized */
2952 ex->ee_block = orig_ex.ee_block;
2953 ex->ee_len = orig_ex.ee_len;
2954 ext4_ext_store_pblock(ex, ext_pblock(&orig_ex));
2955 ext4_ext_dirty(handle, inode, path + depth);
2956 /* zero out the first half */
2957 return allocated;
2958 } else if (err)
2959 goto fix_extent_len;
2960out:
2961 ext4_ext_show_leaf(inode, path);
2962 return err ? err : allocated;
2963
2964fix_extent_len:
2965 ex->ee_block = orig_ex.ee_block;
2966 ex->ee_len = orig_ex.ee_len;
2967 ext4_ext_store_pblock(ex, ext_pblock(&orig_ex));
2968 ext4_ext_mark_uninitialized(ex);
2969 ext4_ext_dirty(handle, inode, path + depth);
2970 return err;
2971}
2972static int ext4_convert_unwritten_extents_dio(handle_t *handle,
2973 struct inode *inode,
2974 struct ext4_ext_path *path)
2975{
2976 struct ext4_extent *ex;
2977 struct ext4_extent_header *eh;
2978 int depth;
2979 int err = 0;
2980 int ret = 0;
2981
2982 depth = ext_depth(inode);
2983 eh = path[depth].p_hdr;
2984 ex = path[depth].p_ext;
2985
2986 err = ext4_ext_get_access(handle, inode, path + depth);
2987 if (err)
2988 goto out;
2989 /* first mark the extent as initialized */
2990 ext4_ext_mark_initialized(ex);
2991
2992 /*
2993 * We have to see if it can be merged with the extent
2994 * on the left.
2995 */
2996 if (ex > EXT_FIRST_EXTENT(eh)) {
2997 /*
2998 * To merge left, pass "ex - 1" to try_to_merge(),
2999 * since it merges towards right _only_.
3000 */
3001 ret = ext4_ext_try_to_merge(inode, path, ex - 1);
3002 if (ret) {
3003 err = ext4_ext_correct_indexes(handle, inode, path);
3004 if (err)
3005 goto out;
3006 depth = ext_depth(inode);
3007 ex--;
3008 }
3009 }
3010 /*
3011 * Try to Merge towards right.
3012 */
3013 ret = ext4_ext_try_to_merge(inode, path, ex);
3014 if (ret) {
3015 err = ext4_ext_correct_indexes(handle, inode, path);
3016 if (err)
3017 goto out;
3018 depth = ext_depth(inode);
3019 }
3020 /* Mark modified extent as dirty */
3021 err = ext4_ext_dirty(handle, inode, path + depth);
3022out:
3023 ext4_ext_show_leaf(inode, path);
3024 return err;
3025}
3026
3027static int
3028ext4_ext_handle_uninitialized_extents(handle_t *handle, struct inode *inode,
3029 ext4_lblk_t iblock, unsigned int max_blocks,
3030 struct ext4_ext_path *path, int flags,
3031 unsigned int allocated, struct buffer_head *bh_result,
3032 ext4_fsblk_t newblock)
3033{
3034 int ret = 0;
3035 int err = 0;
3036
3037 ext_debug("ext4_ext_handle_uninitialized_extents: inode %lu, logical"
3038 "block %llu, max_blocks %u, flags %d, allocated %u",
3039 inode->i_ino, (unsigned long long)iblock, max_blocks,
3040 flags, allocated);
3041 ext4_ext_show_leaf(inode, path);
3042
3043 /* DIO get_block() before submit the IO, split the extent */
3044 if (flags == EXT4_GET_BLOCKS_DIO_CREATE_EXT) {
3045 ret = ext4_split_unwritten_extents(handle,
3046 inode, path, iblock,
3047 max_blocks, flags);
3048 goto out;
3049 }
3050 /* DIO end_io complete, convert the filled extent to written */
3051 if (flags == EXT4_GET_BLOCKS_DIO_CONVERT_EXT) {
3052 ret = ext4_convert_unwritten_extents_dio(handle, inode,
3053 path);
3054 goto out2;
3055 }
3056 /* buffered IO case */
3057 /*
3058 * repeat fallocate creation request
3059 * we already have an unwritten extent
3060 */
3061 if (flags & EXT4_GET_BLOCKS_UNINIT_EXT)
3062 goto map_out;
3063
3064 /* buffered READ or buffered write_begin() lookup */
3065 if ((flags & EXT4_GET_BLOCKS_CREATE) == 0) {
3066 /*
3067 * We have blocks reserved already. We
3068 * return allocated blocks so that delalloc
3069 * won't do block reservation for us. But
3070 * the buffer head will be unmapped so that
3071 * a read from the block returns 0s.
3072 */
3073 set_buffer_unwritten(bh_result);
3074 goto out1;
3075 }
3076
3077 /* buffered write, writepage time, convert*/
3078 ret = ext4_ext_convert_to_initialized(handle, inode,
3079 path, iblock,
3080 max_blocks);
3081out:
3082 if (ret <= 0) {
3083 err = ret;
3084 goto out2;
3085 } else
3086 allocated = ret;
3087 set_buffer_new(bh_result);
3088map_out:
3089 set_buffer_mapped(bh_result);
3090out1:
3091 if (allocated > max_blocks)
3092 allocated = max_blocks;
3093 ext4_ext_show_leaf(inode, path);
3094 bh_result->b_bdev = inode->i_sb->s_bdev;
3095 bh_result->b_blocknr = newblock;
3096out2:
3097 if (path) {
3098 ext4_ext_drop_refs(path);
3099 kfree(path);
3100 }
3101 return err ? err : allocated;
3102}
3103/*
2788 * Block allocation/map/preallocation routine for extents based files 3104 * Block allocation/map/preallocation routine for extents based files
2789 * 3105 *
2790 * 3106 *
@@ -2889,33 +3205,10 @@ int ext4_ext_get_blocks(handle_t *handle, struct inode *inode,
2889 EXT4_EXT_CACHE_EXTENT); 3205 EXT4_EXT_CACHE_EXTENT);
2890 goto out; 3206 goto out;
2891 } 3207 }
2892 if (flags & EXT4_GET_BLOCKS_UNINIT_EXT) 3208 ret = ext4_ext_handle_uninitialized_extents(handle,
2893 goto out; 3209 inode, iblock, max_blocks, path,
2894 if ((flags & EXT4_GET_BLOCKS_CREATE) == 0) { 3210 flags, allocated, bh_result, newblock);
2895 if (allocated > max_blocks) 3211 return ret;
2896 allocated = max_blocks;
2897 /*
2898 * We have blocks reserved already. We
2899 * return allocated blocks so that delalloc
2900 * won't do block reservation for us. But
2901 * the buffer head will be unmapped so that
2902 * a read from the block returns 0s.
2903 */
2904 set_buffer_unwritten(bh_result);
2905 bh_result->b_bdev = inode->i_sb->s_bdev;
2906 bh_result->b_blocknr = newblock;
2907 goto out2;
2908 }
2909
2910 ret = ext4_ext_convert_to_initialized(handle, inode,
2911 path, iblock,
2912 max_blocks);
2913 if (ret <= 0) {
2914 err = ret;
2915 goto out2;
2916 } else
2917 allocated = ret;
2918 goto outnew;
2919 } 3212 }
2920 } 3213 }
2921 3214
@@ -2988,7 +3281,7 @@ int ext4_ext_get_blocks(handle_t *handle, struct inode *inode,
2988 newex.ee_len = cpu_to_le16(ar.len); 3281 newex.ee_len = cpu_to_le16(ar.len);
2989 if (flags & EXT4_GET_BLOCKS_UNINIT_EXT) /* Mark uninitialized */ 3282 if (flags & EXT4_GET_BLOCKS_UNINIT_EXT) /* Mark uninitialized */
2990 ext4_ext_mark_uninitialized(&newex); 3283 ext4_ext_mark_uninitialized(&newex);
2991 err = ext4_ext_insert_extent(handle, inode, path, &newex); 3284 err = ext4_ext_insert_extent(handle, inode, path, &newex, flags);
2992 if (err) { 3285 if (err) {
2993 /* free data blocks we just allocated */ 3286 /* free data blocks we just allocated */
2994 /* not a good idea to call discard here directly, 3287 /* not a good idea to call discard here directly,
@@ -3002,7 +3295,6 @@ int ext4_ext_get_blocks(handle_t *handle, struct inode *inode,
3002 /* previous routine could use block we allocated */ 3295 /* previous routine could use block we allocated */
3003 newblock = ext_pblock(&newex); 3296 newblock = ext_pblock(&newex);
3004 allocated = ext4_ext_get_actual_len(&newex); 3297 allocated = ext4_ext_get_actual_len(&newex);
3005outnew:
3006 set_buffer_new(bh_result); 3298 set_buffer_new(bh_result);
3007 3299
3008 /* Cache only when it is _not_ an uninitialized extent */ 3300 /* Cache only when it is _not_ an uninitialized extent */
@@ -3201,6 +3493,63 @@ retry:
3201} 3493}
3202 3494
3203/* 3495/*
3496 * This function converts a range of blocks to written extents.
3497 * The caller of this function will pass the start offset and the size;
3498 * all unwritten extents within this range will be converted to
3499 * written extents.
3500 *
3501 * This function is called from the direct IO end_io callback
3502 * function, to convert the fallocated extents after IO is completed.
3503 */
3504int ext4_convert_unwritten_extents(struct inode *inode, loff_t offset,
3505 loff_t len)
3506{
3507 handle_t *handle;
3508 ext4_lblk_t block;
3509 unsigned int max_blocks;
3510 int ret = 0;
3511 int ret2 = 0;
3512 struct buffer_head map_bh;
3513 unsigned int credits, blkbits = inode->i_blkbits;
3514
3515 block = offset >> blkbits;
3516 /*
3517 * We can't just convert len to max_blocks: with blocksize = 4096,
3518 * offset = 3072 and len = 2048 the range spans two blocks, not one.
3519 */
3520 max_blocks = (EXT4_BLOCK_ALIGN(len + offset, blkbits) >> blkbits)
3521 - block;
3522 /*
3523 * credits to insert 1 extent into extent tree
3524 */
3525 credits = ext4_chunk_trans_blocks(inode, max_blocks);
3526 while (ret >= 0 && ret < max_blocks) {
3527 block = block + ret;
3528 max_blocks = max_blocks - ret;
3529 handle = ext4_journal_start(inode, credits);
3530 if (IS_ERR(handle)) {
3531 ret = PTR_ERR(handle);
3532 break;
3533 }
3534 map_bh.b_state = 0;
3535 ret = ext4_get_blocks(handle, inode, block,
3536 max_blocks, &map_bh,
3537 EXT4_GET_BLOCKS_DIO_CONVERT_EXT);
3538 if (ret <= 0) {
3539 WARN_ON(ret <= 0);
3540 printk(KERN_ERR "%s: ext4_ext_get_blocks "
3541 "returned error inode#%lu, block=%u, "
3542 "max_blocks=%u", __func__,
3543 inode->i_ino, block, max_blocks);
3544 }
3545 ext4_mark_inode_dirty(handle, inode);
3546 ret2 = ext4_journal_stop(handle);
3547 if (ret <= 0 || ret2 )
3548 break;
3549 }
3550 return ret > 0 ? ret2 : ret;
3551}
3552/*
3204 * Callback function called for each extent to gather FIEMAP information. 3553 * Callback function called for each extent to gather FIEMAP information.
3205 */ 3554 */
3206static int ext4_ext_fiemap_cb(struct inode *inode, struct ext4_ext_path *path, 3555static int ext4_ext_fiemap_cb(struct inode *inode, struct ext4_ext_path *path,
diff --git a/fs/ext4/inode.c b/fs/ext4/inode.c
index 219067ce09d9..da4f2ecb5447 100644
--- a/fs/ext4/inode.c
+++ b/fs/ext4/inode.c
@@ -1233,6 +1233,9 @@ int ext4_get_blocks(handle_t *handle, struct inode *inode, sector_t block,
1233 clear_buffer_mapped(bh); 1233 clear_buffer_mapped(bh);
1234 clear_buffer_unwritten(bh); 1234 clear_buffer_unwritten(bh);
1235 1235
1236 ext_debug("ext4_get_blocks(): inode %lu, flag %d, max_blocks %u,"
1237 "logical block %lu\n", inode->i_ino, flags, max_blocks,
1238 (unsigned long)block);
1236 /* 1239 /*
1237 * Try to see if we can get the block without requesting a new 1240 * Try to see if we can get the block without requesting a new
1238 * file system block. 1241 * file system block.
diff --git a/fs/ext4/migrate.c b/fs/ext4/migrate.c
index bf519f239ae6..a93d5b80f3e2 100644
--- a/fs/ext4/migrate.c
+++ b/fs/ext4/migrate.c
@@ -75,7 +75,7 @@ static int finish_range(handle_t *handle, struct inode *inode,
75 goto err_out; 75 goto err_out;
76 } 76 }
77 } 77 }
78 retval = ext4_ext_insert_extent(handle, inode, path, &newext); 78 retval = ext4_ext_insert_extent(handle, inode, path, &newext, 0);
79err_out: 79err_out:
80 if (path) { 80 if (path) {
81 ext4_ext_drop_refs(path); 81 ext4_ext_drop_refs(path);
diff --git a/fs/ext4/move_extent.c b/fs/ext4/move_extent.c
index c07a2915e40b..5332fd4c4028 100644
--- a/fs/ext4/move_extent.c
+++ b/fs/ext4/move_extent.c
@@ -322,7 +322,7 @@ mext_insert_across_blocks(handle_t *handle, struct inode *orig_inode,
322 goto out; 322 goto out;
323 323
324 if (ext4_ext_insert_extent(handle, orig_inode, 324 if (ext4_ext_insert_extent(handle, orig_inode,
325 orig_path, new_ext)) 325 orig_path, new_ext, 0))
326 goto out; 326 goto out;
327 } 327 }
328 328
@@ -333,7 +333,7 @@ mext_insert_across_blocks(handle_t *handle, struct inode *orig_inode,
333 goto out; 333 goto out;
334 334
335 if (ext4_ext_insert_extent(handle, orig_inode, 335 if (ext4_ext_insert_extent(handle, orig_inode,
336 orig_path, end_ext)) 336 orig_path, end_ext, 0))
337 goto out; 337 goto out;
338 } 338 }
339out: 339out: