8 files changed, 1525 insertions, 159 deletions
diff --git a/fs/ntfs/ChangeLog b/fs/ntfs/ChangeLog
index de58579a1d0e..9f4674a026f2 100644
--- a/fs/ntfs/ChangeLog
+++ b/fs/ntfs/ChangeLog
@@ -3,16 +3,14 @@ ToDo/Notes:
        - In between ntfs_prepare/commit_write, need exclusion between
          simultaneous file extensions.  This is given to us by holding i_sem
          on the inode.  The only places in the kernel when a file is resized
-          are prepare/commit write and truncate for both of which i_sem is
+          are prepare/commit write and ntfs_truncate() for both of which i_sem
-          held.  Just have to be careful in readpage/writepage and all other
+          is held.  Just have to be careful in read-/writepage and other helpers
-          helpers not running under i_sem that we play nice...
+          not running under i_sem that we play nice...  Also need to be careful
-          Also need to be careful with initialized_size extention in
+          with initialized_size extension in ntfs_prepare_write and writepage.
-          ntfs_prepare_write. Basically, just be _very_ careful in this code...
+          UPDATE: The only things that need to be checked are
-          UPDATE: The only things that need to be checked are read/writepage
+          prepare/commit_write as well as the compressed write and the other
-          which do not hold i_sem.  Note writepage cannot change i_size but it
+          attribute resize/write cases like index attributes, etc.  For now
-          needs to cope with a concurrent i_size change, just like readpage.
+          none of these are implemented so are safe.
-          Also both need to cope with concurrent changes to the other sizes,
-          i.e. initialized/allocated/compressed size, as well.
        - Implement mft.c::sync_mft_mirror_umount().  We currently will just
          leave the volume dirty on umount if the final iput(vol->mft_ino)
          causes a write of any mirrored mft records due to the mft mirror
@@ -22,6 +20,44 @@ ToDo/Notes:
        - Enable the code for setting the NT4 compatibility flag when we start
          making NTFS 1.2 specific modifications.
+2.1.25-WIP
+        - Change ntfs_map_runlist_nolock(), ntfs_attr_find_vcn_nolock() and
+          {__,}ntfs_cluster_free() to also take an optional attribute search
+          context as argument.  This allows calling these functions with the
+          mft record mapped.  Update all callers.
+        - Fix potential deadlock in ntfs_mft_data_extend_allocation_nolock()
+          error handling by passing in the active search context when calling
+          ntfs_cluster_free().
+        - Change ntfs_cluster_alloc() to take an extra boolean parameter
+          specifying whether the clusters are being allocated to extend an
+          attribute or to fill a hole.
+        - Change ntfs_attr_make_non_resident() to call ntfs_cluster_alloc()
+          with @is_extension set to TRUE and remove the runlist terminator
+          fixup code as this is now done by ntfs_cluster_alloc().
+        - Change ntfs_attr_make_non_resident to take the attribute value size
+          as an extra parameter.  This is needed since we need to know the size
+          before we can map the mft record and our callers always know it.  The
+          reason we cannot simply read the size from the vfs inode i_size is
+          that this is not necessarily uptodate.  This happens when
+          ntfs_attr_make_non_resident() is called in the ->truncate call path.
+        - Fix ntfs_attr_make_non_resident() to update the vfs inode i_blocks
+          which is zero for a resident attribute but should no longer be zero
+          once the attribute is non-resident as it then has real clusters
+          allocated.
+        - Add fs/ntfs/attrib.[hc]::ntfs_attr_extend_allocation(), a function to
+          extend the allocation of an attribute.  Optionally, the data size,
+          but not the initialized size can be extended, too.
+        - Implement fs/ntfs/inode.[hc]::ntfs_truncate().  It only supports
+          uncompressed and unencrypted files.
+        - Enable ATTR_SIZE attribute changes in ntfs_setattr().  This completes
+          the initial implementation of file truncation.  Now both open(2)ing
+          a file with the O_TRUNC flag and the {,f}truncate(2) system calls
+          will resize a file appropriately.  The limitations are that only
+          uncompressed and unencrypted files are supported.  Also, there is
+          only very limited support for highly fragmented files (the ones whose
+          $DATA attribute is split into multiple attribute extents).
 2.1.24 - Lots of bug fixes and support more clean journal states.
        - Support journals ($LogFile) which have been modified by chkdsk.  This
diff --git a/fs/ntfs/Makefile b/fs/ntfs/Makefile
index 894b2b876d35..a3ce2c0e7dd9 100644
--- a/fs/ntfs/Makefile
+++ b/fs/ntfs/Makefile
@@ -6,7 +6,7 @@ ntfs-objs := aops.o attrib.o collate.o compress.o debug.o dir.o file.o \
             index.o inode.o mft.o mst.o namei.o runlist.o super.o sysctl.o \
             unistr.o upcase.o
-EXTRA_CFLAGS = -DNTFS_VERSION=\"2.1.24\"
+EXTRA_CFLAGS = -DNTFS_VERSION=\"2.1.25-WIP\"
 ifeq ($(CONFIG_NTFS_DEBUG),y)
 EXTRA_CFLAGS += -DDEBUG
diff --git a/fs/ntfs/attrib.c b/fs/ntfs/attrib.c
index 3f9a4ff42ee5..bc25e88ad468 100644
--- a/fs/ntfs/attrib.c
+++ b/fs/ntfs/attrib.c
@@ -36,9 +36,27 @@
 * ntfs_map_runlist_nolock - map (a part of) a runlist of an ntfs inode
 * @ni:         ntfs inode for which to map (part of) a runlist
 * @vcn:        map runlist part containing this vcn
+ * @ctx:        active attribute search context if present or NULL if not
 *
 * Map the part of a runlist containing the @vcn of the ntfs inode @ni.
 *
+ * If @ctx is specified, it is an active search context of @ni and its base mft
+ * record.  This is needed when ntfs_map_runlist_nolock() encounters unmapped
+ * runlist fragments and allows their mapping.  If you do not have the mft
+ * record mapped, you can specify @ctx as NULL and ntfs_map_runlist_nolock()
+ * will perform the necessary mapping and unmapping.
+ *
+ * Note, ntfs_map_runlist_nolock() saves the state of @ctx on entry and
+ * restores it before returning.  Thus, @ctx will be left pointing to the same
+ * attribute on return as on entry.  However, the actual pointers in @ctx may
+ * point to different memory locations on return, so you must remember to reset
+ * any cached pointers from the @ctx, i.e. after the call to
+ * ntfs_map_runlist_nolock(), you will probably want to do:
+ *      m = ctx->mrec;
+ *      a = ctx->attr;
+ * Assuming you cache ctx->attr in a variable @a of type ATTR_RECORD * and that
+ * you cache ctx->mrec in a variable @m of type MFT_RECORD *.
+ *
 * Return 0 on success and -errno on error.  There is one special error code
 * which is not an error as such.  This is -ENOENT.  It means that @vcn is out
 * of bounds of the runlist.
@@ -46,19 +64,32 @@
 * Note the runlist can be NULL after this function returns if @vcn is zero and
 * the attribute has zero allocated size, i.e. there simply is no runlist.
 *
- * Locking: - The runlist must be locked for writing.
+ * WARNING: If @ctx is supplied, regardless of whether success or failure is
- *          - This function modifies the runlist.
+ *          returned, you need to check IS_ERR(@ctx->mrec) and if TRUE the @ctx
+ *          is no longer valid, i.e. you need to either call
+ *          ntfs_attr_reinit_search_ctx() or ntfs_attr_put_search_ctx() on it.
+ *          In that case PTR_ERR(@ctx->mrec) will give you the error code for
+ *          why the mapping of the old inode failed.
+ *
+ * Locking: - The runlist described by @ni must be locked for writing on entry
+ *            and is locked on return.  Note the runlist will be modified.
+ *          - If @ctx is NULL, the base mft record of @ni must not be mapped on
+ *            entry and it will be left unmapped on return.
+ *          - If @ctx is not NULL, the base mft record must be mapped on entry
+ *            and it will be left mapped on return.
 */
-int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn)
+int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn, ntfs_attr_search_ctx *ctx)
 {
        VCN end_vcn;
+        unsigned long flags;
        ntfs_inode *base_ni;
        MFT_RECORD *m;
        ATTR_RECORD *a;
-        ntfs_attr_search_ctx *ctx;
        runlist_element *rl;
-        unsigned long flags;
+        struct page *put_this_page = NULL;
        int err = 0;
+        BOOL ctx_is_temporary, ctx_needs_reset;
+        ntfs_attr_search_ctx old_ctx;
        ntfs_debug("Mapping runlist part containing vcn 0x%llx.",
                        (unsigned long long)vcn);
@@ -66,20 +97,77 @@ int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn)
                base_ni = ni;
        else
                base_ni = ni->ext.base_ntfs_ino;
-        m = map_mft_record(base_ni);
+        if (!ctx) {
-        if (IS_ERR(m))
+                ctx_is_temporary = ctx_needs_reset = TRUE;
-                return PTR_ERR(m);
+                m = map_mft_record(base_ni);
-        ctx = ntfs_attr_get_search_ctx(base_ni, m);
+                if (IS_ERR(m))
-        if (unlikely(!ctx)) {
+                        return PTR_ERR(m);
-                err = -ENOMEM;
+                ctx = ntfs_attr_get_search_ctx(base_ni, m);
-                goto err_out;
+                if (unlikely(!ctx)) {
+                        err = -ENOMEM;
+                        goto err_out;
+                }
+        } else {
+                VCN allocated_size_vcn;
+                BUG_ON(IS_ERR(ctx->mrec));
+                a = ctx->attr;
+                BUG_ON(!a->non_resident);
+                ctx_is_temporary = FALSE;
+                end_vcn = sle64_to_cpu(a->data.non_resident.highest_vcn);
+                read_lock_irqsave(&ni->size_lock, flags);
+                allocated_size_vcn = ni->allocated_size >>
+                                ni->vol->cluster_size_bits;
+                read_unlock_irqrestore(&ni->size_lock, flags);
+                if (!a->data.non_resident.lowest_vcn && end_vcn <= 0)
+                        end_vcn = allocated_size_vcn - 1;
+                /*
+                 * If we already have the attribute extent containing @vcn in
+                 * @ctx, no need to look it up again.  We slightly cheat in
+                 * that if vcn exceeds the allocated size, we will refuse to
+                 * map the runlist below, so there is definitely no need to get
+                 * the right attribute extent.
+                 */
+                if (vcn >= allocated_size_vcn || (a->type == ni->type &&
+                                a->name_length == ni->name_len &&
+                                !memcmp((u8*)a + le16_to_cpu(a->name_offset),
+                                ni->name, ni->name_len) &&
+                                sle64_to_cpu(a->data.non_resident.lowest_vcn)
+                                <= vcn && end_vcn >= vcn))
+                        ctx_needs_reset = FALSE;
+                else {
+                        /* Save the old search context. */
+                        old_ctx = *ctx;
+                        /*
+                         * If the currently mapped (extent) inode is not the
+                         * base inode we will unmap it when we reinitialize the
+                         * search context which means we need to get a
+                         * reference to the page containing the mapped mft
+                         * record so we do not accidentally drop changes to the
+                         * mft record when it has not been marked dirty yet.
+                         */
+                        if (old_ctx.base_ntfs_ino && old_ctx.ntfs_ino !=
+                                        old_ctx.base_ntfs_ino) {
+                                put_this_page = old_ctx.ntfs_ino->page;
+                                page_cache_get(put_this_page);
+                        }
+                        /*
+                         * Reinitialize the search context so we can lookup the
+                         * needed attribute extent.
+                         */
+                        ntfs_attr_reinit_search_ctx(ctx);
+                        ctx_needs_reset = TRUE;
+                }
        }
-        err = ntfs_attr_lookup(ni->type, ni->name, ni->name_len,
+        if (ctx_needs_reset) {
-                        CASE_SENSITIVE, vcn, NULL, 0, ctx);
+                err = ntfs_attr_lookup(ni->type, ni->name, ni->name_len,
-        if (unlikely(err)) {
+                                CASE_SENSITIVE, vcn, NULL, 0, ctx);
-                if (err == -ENOENT)
+                if (unlikely(err)) {
-                        err = -EIO;
+                        if (err == -ENOENT)
-                goto err_out;
+                                err = -EIO;
+                        goto err_out;
+                }
+                BUG_ON(!ctx->attr->non_resident);
        }
        a = ctx->attr;
        /*
@@ -89,11 +177,9 @@ int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn)
         * ntfs_mapping_pairs_decompress() fails.
         */
        end_vcn = sle64_to_cpu(a->data.non_resident.highest_vcn) + 1;
-        if (unlikely(!a->data.non_resident.lowest_vcn && end_vcn <= 1)) {
+        if (!a->data.non_resident.lowest_vcn && end_vcn == 1)
-                read_lock_irqsave(&ni->size_lock, flags);
+                end_vcn = sle64_to_cpu(a->data.non_resident.allocated_size) >>
-                end_vcn = ni->allocated_size >> ni->vol->cluster_size_bits;
+                                ni->vol->cluster_size_bits;
-                read_unlock_irqrestore(&ni->size_lock, flags);
-        }
        if (unlikely(vcn >= end_vcn)) {
                err = -ENOENT;
                goto err_out;
@@ -104,9 +190,93 @@ int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn)
        else
                ni->runlist.rl = rl;
 err_out:
-        if (likely(ctx))
+        if (ctx_is_temporary) {
-                ntfs_attr_put_search_ctx(ctx);
+                if (likely(ctx))
-        unmap_mft_record(base_ni);
+                        ntfs_attr_put_search_ctx(ctx);
+                unmap_mft_record(base_ni);
+        } else if (ctx_needs_reset) {
+                /*
+                 * If there is no attribute list, restoring the search context
+                 * is accomplished simply by copying the saved context back over
+                 * the caller supplied context.  If there is an attribute list,
+                 * things are more complicated as we need to deal with mapping
+                 * of mft records and resulting potential changes in pointers.
+                 */
+                if (NInoAttrList(base_ni)) {
+                        /*
+                         * If the currently mapped (extent) inode is not the
+                         * one we had before, we need to unmap it and map the
+                         * old one.
+                         */
+                        if (ctx->ntfs_ino != old_ctx.ntfs_ino) {
+                                /*
+                                 * If the currently mapped inode is not the
+                                 * base inode, unmap it.
+                                 */
+                                if (ctx->base_ntfs_ino && ctx->ntfs_ino !=
+                                                ctx->base_ntfs_ino) {
+                                        unmap_extent_mft_record(ctx->ntfs_ino);
+                                        ctx->mrec = ctx->base_mrec;
+                                        BUG_ON(!ctx->mrec);
+                                }
+                                /*
+                                 * If the old mapped inode is not the base
+                                 * inode, map it.
+                                 */
+                                if (old_ctx.base_ntfs_ino &&
+                                                old_ctx.ntfs_ino !=
+                                                old_ctx.base_ntfs_ino) {
+retry_map:
+                                        ctx->mrec = map_mft_record(
+                                                        old_ctx.ntfs_ino);
+                                        /*
+                                         * Something bad has happened.  If out
+                                         * of memory retry till it succeeds.
+                                         * Any other errors are fatal and we
+                                         * return the error code in ctx->mrec.
+                                         * Let the caller deal with it...  We
+                                         * just need to fudge things so the
+                                         * caller can reinit and/or put the
+                                         * search context safely.
+                                         */
+                                        if (IS_ERR(ctx->mrec)) {
+                                                if (PTR_ERR(ctx->mrec) ==
+                                                                -ENOMEM) {
+                                                        schedule();
+                                                        goto retry_map;
+                                                } else
+                                                        old_ctx.ntfs_ino =
+                                                                old_ctx.
+                                                                base_ntfs_ino;
+                                        }
+                                }
+                        }
+                        /* Update the changed pointers in the saved context. */
+                        if (ctx->mrec != old_ctx.mrec) {
+                                if (!IS_ERR(ctx->mrec))
+                                        old_ctx.attr = (ATTR_RECORD*)(
+                                                        (u8*)ctx->mrec +
+                                                        ((u8*)old_ctx.attr -
+                                                        (u8*)old_ctx.mrec));
+                                old_ctx.mrec = ctx->mrec;
+                        }
+                }
+                /* Restore the search context to the saved one. */
+                *ctx = old_ctx;
+                /*
+                 * We drop the reference on the page we took earlier.  In the
+                 * case that IS_ERR(ctx->mrec) is true this means we might lose
+                 * some changes to the mft record that had been made between
+                 * the last time it was marked dirty/written out and now.  This
+                 * at this stage is not a problem as the mapping error is fatal
+                 * enough that the mft record cannot be written out anyway and
+                 * the caller is very likely to shutdown the whole inode
+                 * immediately and mark the volume dirty for chkdsk to pick up
+                 * the pieces anyway.
+                 */
+                if (put_this_page)
+                        page_cache_release(put_this_page);
+        }
        return err;
 }
@@ -122,8 +292,8 @@ err_out:
 * of bounds of the runlist.
 *
 * Locking: - The runlist must be unlocked on entry and is unlocked on return.
- *          - This function takes the runlist lock for writing and modifies the
+ *          - This function takes the runlist lock for writing and may modify
- *            runlist.
+ *            the runlist.
 */
 int ntfs_map_runlist(ntfs_inode *ni, VCN vcn)
 {
@@ -133,7 +303,7 @@ int ntfs_map_runlist(ntfs_inode *ni, VCN vcn)
        /* Make sure someone else didn't do the work while we were sleeping. */
        if (likely(ntfs_rl_vcn_to_lcn(ni->runlist.rl, vcn) <=
                        LCN_RL_NOT_MAPPED))
-                err = ntfs_map_runlist_nolock(ni, vcn);
+                err = ntfs_map_runlist_nolock(ni, vcn, NULL);
        up_write(&ni->runlist.lock);
        return err;
 }
@@ -212,7 +382,7 @@ retry_remap:
                                goto retry_remap;
                        }
                }
-                err = ntfs_map_runlist_nolock(ni, vcn);
+                err = ntfs_map_runlist_nolock(ni, vcn, NULL);
                if (!write_locked) {
                        up_write(&ni->runlist.lock);
                        down_read(&ni->runlist.lock);
@@ -236,9 +406,9 @@ retry_remap:
 /**
 * ntfs_attr_find_vcn_nolock - find a vcn in the runlist of an ntfs inode
- * @ni:                 ntfs inode describing the runlist to search
+ * @ni:         ntfs inode describing the runlist to search
- * @vcn:                vcn to find
+ * @vcn:        vcn to find
- * @write_locked:       true if the runlist is locked for writing
+ * @ctx:        active attribute search context if present or NULL if not
 *
 * Find the virtual cluster number @vcn in the runlist described by the ntfs
 * inode @ni and return the address of the runlist element containing the @vcn.
@@ -246,9 +416,22 @@ retry_remap:
 * If the @vcn is not mapped yet, the attempt is made to map the attribute
 * extent containing the @vcn and the vcn to lcn conversion is retried.
 *
- * If @write_locked is true the caller has locked the runlist for writing and
+ * If @ctx is specified, it is an active search context of @ni and its base mft
- * if false for reading.
+ * record.  This is needed when ntfs_attr_find_vcn_nolock() encounters unmapped
- *
+ * runlist fragments and allows their mapping.  If you do not have the mft
+ * record mapped, you can specify @ctx as NULL and ntfs_attr_find_vcn_nolock()
+ * will perform the necessary mapping and unmapping.
+ *
+ * Note, ntfs_attr_find_vcn_nolock() saves the state of @ctx on entry and
+ * restores it before returning.  Thus, @ctx will be left pointing to the same
+ * attribute on return as on entry.  However, the actual pointers in @ctx may
+ * point to different memory locations on return, so you must remember to reset
+ * any cached pointers from the @ctx, i.e. after the call to
+ * ntfs_attr_find_vcn_nolock(), you will probably want to do:
+ *      m = ctx->mrec;
+ *      a = ctx->attr;
+ * Assuming you cache ctx->attr in a variable @a of type ATTR_RECORD * and that
+ * you cache ctx->mrec in a variable @m of type MFT_RECORD *.
 * Note you need to distinguish between the lcn of the returned runlist element
 * being >= 0 and LCN_HOLE.  In the later case you have to return zeroes on
 * read and allocate clusters on write.
@@ -263,22 +446,31 @@ retry_remap:
 *      -ENOMEM - Not enough memory to map runlist.
 *      -EIO    - Critical error (runlist/file is corrupt, i/o error, etc).
 *
- * Locking: - The runlist must be locked on entry and is left locked on return.
+ * WARNING: If @ctx is supplied, regardless of whether success or failure is
- *          - If @write_locked is FALSE, i.e. the runlist is locked for reading,
+ *          returned, you need to check IS_ERR(@ctx->mrec) and if TRUE the @ctx
- *            the lock may be dropped inside the function so you cannot rely on
+ *          is no longer valid, i.e. you need to either call
- *            the runlist still being the same when this function returns.
+ *          ntfs_attr_reinit_search_ctx() or ntfs_attr_put_search_ctx() on it.
+ *          In that case PTR_ERR(@ctx->mrec) will give you the error code for
+ *          why the mapping of the old inode failed.
+ *
+ * Locking: - The runlist described by @ni must be locked for writing on entry
+ *            and is locked on return.  Note the runlist may be modified when
+ *            needed runlist fragments need to be mapped.
+ *          - If @ctx is NULL, the base mft record of @ni must not be mapped on
+ *            entry and it will be left unmapped on return.
+ *          - If @ctx is not NULL, the base mft record must be mapped on entry
+ *            and it will be left mapped on return.
 */
 runlist_element *ntfs_attr_find_vcn_nolock(ntfs_inode *ni, const VCN vcn,
-                const BOOL write_locked)
+                ntfs_attr_search_ctx *ctx)
 {
        unsigned long flags;
        runlist_element *rl;
        int err = 0;
        BOOL is_retry = FALSE;
-        ntfs_debug("Entering for i_ino 0x%lx, vcn 0x%llx, %s_locked.",
+        ntfs_debug("Entering for i_ino 0x%lx, vcn 0x%llx, with%s ctx.",
-                        ni->mft_no, (unsigned long long)vcn,
+                        ni->mft_no, (unsigned long long)vcn, ctx ? "" : "out");
-                        write_locked ? "write" : "read");
        BUG_ON(!ni);
        BUG_ON(!NInoNonResident(ni));
        BUG_ON(vcn < 0);
@@ -312,33 +504,22 @@ retry_remap:
        }
        if (!err && !is_retry) {
                /*
-                 * The @vcn is in an unmapped region, map the runlist and
+                 * If the search context is invalid we cannot map the unmapped
-                 * retry.
+                 * region.
                 */
-                if (!write_locked) {
+                if (IS_ERR(ctx->mrec))
-                        up_read(&ni->runlist.lock);
+                        err = PTR_ERR(ctx->mrec);
-                        down_write(&ni->runlist.lock);
+                else {
-                        if (unlikely(ntfs_rl_vcn_to_lcn(ni->runlist.rl, vcn) !=
+                        /*
-                                        LCN_RL_NOT_MAPPED)) {
+                         * The @vcn is in an unmapped region, map the runlist
-                                up_write(&ni->runlist.lock);
+                         * and retry.
-                                down_read(&ni->runlist.lock);
+                         */
+                        err = ntfs_map_runlist_nolock(ni, vcn, ctx);
+                        if (likely(!err)) {
+                                is_retry = TRUE;
                                goto retry_remap;
                        }
                }
-                err = ntfs_map_runlist_nolock(ni, vcn);
-                if (!write_locked) {
-                        up_write(&ni->runlist.lock);
-                        down_read(&ni->runlist.lock);
-                }
-                if (likely(!err)) {
-                        is_retry = TRUE;
-                        goto retry_remap;
-                }
-                /*
-                 * -EINVAL coming from a failed mapping attempt is equivalent
-                 * to i/o error for us as it should not happen in our code
-                 * paths.
-                 */
                if (err == -EINVAL)
                        err = -EIO;
        } else if (!err)
@@ -1011,6 +1192,7 @@ int ntfs_attr_lookup(const ATTR_TYPE type, const ntfschar *name,
        ntfs_inode *base_ni;
        ntfs_debug("Entering.");
+        BUG_ON(IS_ERR(ctx->mrec));
        if (ctx->base_ntfs_ino)
                base_ni = ctx->base_ntfs_ino;
        else
@@ -1319,10 +1501,17 @@ int ntfs_resident_attr_value_resize(MFT_RECORD *m, ATTR_RECORD *a,
 /**
 * ntfs_attr_make_non_resident - convert a resident to a non-resident attribute
 * @ni:         ntfs inode describing the attribute to convert
+ * @data_size:  size of the resident data to copy to the non-resident attribute
 *
 * Convert the resident ntfs attribute described by the ntfs inode @ni to a
 * non-resident one.
 *
+ * @data_size must be equal to the attribute value size.  This is needed since
+ * we need to know the size before we can map the mft record and our callers
+ * always know it.  The reason we cannot simply read the size from the vfs
+ * inode i_size is that this is not necessarily uptodate.  This happens when
+ * ntfs_attr_make_non_resident() is called in the ->truncate call path(s).
+ *
 * Return 0 on success and -errno on error.  The following error return codes
 * are defined:
 *      -EPERM  - The attribute is not allowed to be non-resident.
@@ -1343,7 +1532,7 @@ int ntfs_resident_attr_value_resize(MFT_RECORD *m, ATTR_RECORD *a,
 *
 * Locking: - The caller must hold i_sem on the inode.
 */
-int ntfs_attr_make_non_resident(ntfs_inode *ni)
+int ntfs_attr_make_non_resident(ntfs_inode *ni, const u32 data_size)
 {
        s64 new_size;
        struct inode *vi = VFS_I(ni);
@@ -1381,11 +1570,9 @@ int ntfs_attr_make_non_resident(ntfs_inode *ni)
         * The size needs to be aligned to a cluster boundary for allocation
         * purposes.
         */
-        new_size = (i_size_read(vi) + vol->cluster_size - 1) &
+        new_size = (data_size + vol->cluster_size - 1) &
                        ~(vol->cluster_size - 1);
        if (new_size > 0) {
-                runlist_element *rl2;
                /*
                 * Will need the page later and since the page lock nests
                 * outside all ntfs locks, we need to get the page now.
@@ -1396,7 +1583,7 @@ int ntfs_attr_make_non_resident(ntfs_inode *ni)
                        return -ENOMEM;
                /* Start by allocating clusters to hold the attribute value. */
                rl = ntfs_cluster_alloc(vol, 0, new_size >>
-                                vol->cluster_size_bits, -1, DATA_ZONE);
+                                vol->cluster_size_bits, -1, DATA_ZONE, TRUE);
                if (IS_ERR(rl)) {
                        err = PTR_ERR(rl);
                        ntfs_debug("Failed to allocate cluster%s, error code "
@@ -1405,12 +1592,6 @@ int ntfs_attr_make_non_resident(ntfs_inode *ni)
                                        err);
                        goto page_err_out;
                }
-                /* Change the runlist terminator to LCN_ENOENT. */
-                rl2 = rl;
-                while (rl2->length)
-                        rl2++;
-                BUG_ON(rl2->lcn != LCN_RL_NOT_MAPPED);
-                rl2->lcn = LCN_ENOENT;
        } else {
                rl = NULL;
                page = NULL;
@@ -1473,7 +1654,7 @@ int ntfs_attr_make_non_resident(ntfs_inode *ni)
         * attribute value.
         */
        attr_size = le32_to_cpu(a->data.resident.value_length);
-        BUG_ON(attr_size != i_size_read(vi));
+        BUG_ON(attr_size != data_size);
        if (page && !PageUptodate(page)) {
                kaddr = kmap_atomic(page, KM_USER0);
                memcpy(kaddr, (u8*)a +
@@ -1538,7 +1719,9 @@ int ntfs_attr_make_non_resident(ntfs_inode *ni)
                                ffs(ni->itype.compressed.block_size) - 1;
                ni->itype.compressed.block_clusters = 1U <<
                                a->data.non_resident.compression_unit;
-        }
+                vi->i_blocks = ni->itype.compressed.size >> 9;
+        } else
+                vi->i_blocks = ni->allocated_size >> 9;
        write_unlock_irqrestore(&ni->size_lock, flags);
        /*
         * This needs to be last since the address space operations ->readpage
@@ -1652,6 +1835,640 @@ page_err_out:
 }
 /**
+ * ntfs_attr_extend_allocation - extend the allocated space of an attribute
+ * @ni:                 ntfs inode of the attribute whose allocation to extend
+ * @new_alloc_size:     new size in bytes to which to extend the allocation to
+ * @new_data_size:      new size in bytes to which to extend the data to
+ * @data_start:         beginning of region which is required to be non-sparse
+ *
+ * Extend the allocated space of an attribute described by the ntfs inode @ni
+ * to @new_alloc_size bytes.  If @data_start is -1, the whole extension may be
+ * implemented as a hole in the file (as long as both the volume and the ntfs
+ * inode @ni have sparse support enabled).  If @data_start is >= 0, then the
+ * region between the old allocated size and @data_start - 1 may be made sparse
+ * but the regions between @data_start and @new_alloc_size must be backed by
+ * actual clusters.
+ *
+ * If @new_data_size is -1, it is ignored.  If it is >= 0, then the data size
+ * of the attribute is extended to @new_data_size.  Note that the i_size of the
+ * vfs inode is not updated.  Only the data size in the base attribute record
+ * is updated.  The caller has to update i_size separately if this is required.
+ * WARNING: It is a BUG() for @new_data_size to be smaller than the old data
+ * size as well as for @new_data_size to be greater than @new_alloc_size.
+ *
+ * For resident attributes this involves resizing the attribute record and if
+ * necessary moving it and/or other attributes into extent mft records and/or
+ * converting the attribute to a non-resident attribute which in turn involves
+ * extending the allocation of a non-resident attribute as described below.
+ *
+ * For non-resident attributes this involves allocating clusters in the data
+ * zone on the volume (except for regions that are being made sparse) and
+ * extending the run list to describe the allocated clusters as well as
+ * updating the mapping pairs array of the attribute.  This in turn involves
+ * resizing the attribute record and if necessary moving it and/or other
+ * attributes into extent mft records and/or splitting the attribute record
+ * into multiple extent attribute records.
+ *
+ * Also, the attribute list attribute is updated if present and in some of the
+ * above cases (the ones where extent mft records/attributes come into play),
+ * an attribute list attribute is created if not already present.
+ *
+ * Return the new allocated size on success and -errno on error.  In the case
+ * that an error is encountered but a partial extension at least up to
+ * @data_start (if present) is possible, the allocation is partially extended
+ * and this is returned.  This means the caller must check the returned size to
+ * determine if the extension was partial.  If @data_start is -1 then partial
+ * allocations are not performed.
+ *
+ * WARNING: Do not call ntfs_attr_extend_allocation() for $MFT/$DATA.
+ *
+ * Locking: This function takes the runlist lock of @ni for writing as well as
+ * locking the mft record of the base ntfs inode.  These locks are maintained
+ * throughout execution of the function.  These locks are required so that the
+ * attribute can be resized safely and so that it can for example be converted
+ * from resident to non-resident safely.
+ *
+ * TODO: At present attribute list attribute handling is not implemented.
+ *
+ * TODO: At present it is not safe to call this function for anything other
+ * than the $DATA attribute(s) of an uncompressed and unencrypted file.
+ */
+s64 ntfs_attr_extend_allocation(ntfs_inode *ni, s64 new_alloc_size,
+                const s64 new_data_size, const s64 data_start)
+{
+        VCN vcn;
+        s64 ll, allocated_size, start = data_start;
+        struct inode *vi = VFS_I(ni);
+        ntfs_volume *vol = ni->vol;
+        ntfs_inode *base_ni;
+        MFT_RECORD *m;
+        ATTR_RECORD *a;
+        ntfs_attr_search_ctx *ctx;
+        runlist_element *rl, *rl2;
+        unsigned long flags;
+        int err, mp_size;
+        u32 attr_len = 0; /* Silence stupid gcc warning. */
+        BOOL mp_rebuilt;
+#ifdef NTFS_DEBUG
+        read_lock_irqsave(&ni->size_lock, flags);
+        allocated_size = ni->allocated_size;
+        read_unlock_irqrestore(&ni->size_lock, flags);
+        ntfs_debug("Entering for i_ino 0x%lx, attribute type 0x%x, "
+                        "old_allocated_size 0x%llx, "
+                        "new_allocated_size 0x%llx, new_data_size 0x%llx, "
+                        "data_start 0x%llx.", vi->i_ino,
+                        (unsigned)le32_to_cpu(ni->type),
+                        (unsigned long long)allocated_size,
+                        (unsigned long long)new_alloc_size,
+                        (unsigned long long)new_data_size,
+                        (unsigned long long)start);
+#endif
+retry_extend:
+        /*
+         * For non-resident attributes, @start and @new_alloc_size need to be
+         * aligned to cluster boundaries for allocation purposes.
+         */
+        if (NInoNonResident(ni)) {
+                if (start > 0)
+                        start &= ~(s64)vol->cluster_size_mask;
+                new_alloc_size = (new_alloc_size + vol->cluster_size - 1) &
+                                ~(s64)vol->cluster_size_mask;
+        }
+        BUG_ON(new_data_size >= 0 && new_data_size > new_alloc_size);
+        /* Check if new size is allowed in $AttrDef. */
+        err = ntfs_attr_size_bounds_check(vol, ni->type, new_alloc_size);
+        if (unlikely(err)) {
+                /* Only emit errors when the write will fail completely. */
+                read_lock_irqsave(&ni->size_lock, flags);
+                allocated_size = ni->allocated_size;
+                read_unlock_irqrestore(&ni->size_lock, flags);
+                if (start < 0 || start >= allocated_size) {
+                        if (err == -ERANGE) {
+                                ntfs_error(vol->sb, "Cannot extend allocation "
+                                                "of inode 0x%lx, attribute "
+                                                "type 0x%x, because the new "
+                                                "allocation would exceed the "
+                                                "maximum allowed size for "
+                                                "this attribute type.",
+                                                vi->i_ino, (unsigned)
+                                                le32_to_cpu(ni->type));
+                        } else {
+                                ntfs_error(vol->sb, "Cannot extend allocation "
+                                                "of inode 0x%lx, attribute "
+                                                "type 0x%x, because this "
+                                                "attribute type is not "
+                                                "defined on the NTFS volume.  "
+                                                "Possible corruption!  You "
+                                                "should run chkdsk!",
+                                                vi->i_ino, (unsigned)
+                                                le32_to_cpu(ni->type));
+                        }
+                }
+                /* Translate error code to be POSIX conformant for write(2). */
+                if (err == -ERANGE)
+                        err = -EFBIG;
+                else
+                        err = -EIO;
+                return err;
+        }
+        if (!NInoAttr(ni))
+                base_ni = ni;
+        else
+                base_ni = ni->ext.base_ntfs_ino;
+        /*
+         * We will be modifying both the runlist (if non-resident) and the mft
+         * record so lock them both down.
+         */
+        down_write(&ni->runlist.lock);
+        m = map_mft_record(base_ni);
+        if (IS_ERR(m)) {
+                err = PTR_ERR(m);
+                m = NULL;
+                ctx = NULL;
+                goto err_out;
+        }
+        ctx = ntfs_attr_get_search_ctx(base_ni, m);
+        if (unlikely(!ctx)) {
+                err = -ENOMEM;
+                goto err_out;
+        }
+        read_lock_irqsave(&ni->size_lock, flags);
+        allocated_size = ni->allocated_size;
+        read_unlock_irqrestore(&ni->size_lock, flags);
+        /*
+         * If non-resident, seek to the last extent.  If resident, there is
+         * only one extent, so seek to that.
+         */
+        vcn = NInoNonResident(ni) ? allocated_size >> vol->cluster_size_bits :
+                        0;
+        /*
+         * Abort if someone did the work whilst we waited for the locks.  If we
+         * just converted the attribute from resident to non-resident it is
+         * likely that exactly this has happened already.  We cannot quite
+         * abort if we need to update the data size.
+         */
+        if (unlikely(new_alloc_size <= allocated_size)) {
+                ntfs_debug("Allocated size already exceeds requested size.");
+                new_alloc_size = allocated_size;
+                if (new_data_size < 0)
+                        goto done;
+                /*
+                 * We want the first attribute extent so that we can update the
+                 * data size.
+                 */
+                vcn = 0;
+        }
+        err = ntfs_attr_lookup(ni->type, ni->name, ni->name_len,
+                        CASE_SENSITIVE, vcn, NULL, 0, ctx);
+        if (unlikely(err)) {
+                if (err == -ENOENT)
+                        err = -EIO;
+                goto err_out;
+        }
+        m = ctx->mrec;
+        a = ctx->attr;
+        /* Use goto to reduce indentation. */
+        if (a->non_resident)
+                goto do_non_resident_extend;
+        BUG_ON(NInoNonResident(ni));
+        /* The total length of the attribute value. */
+        attr_len = le32_to_cpu(a->data.resident.value_length);
+        /*
+         * Extend the attribute record to be able to store the new attribute
+         * size.  ntfs_attr_record_resize() will not do anything if the size is
+         * not changing.
+         */
+        if (new_alloc_size < vol->mft_record_size &&
+                        !ntfs_attr_record_resize(m, a,
+                        le16_to_cpu(a->data.resident.value_offset) +
+                        new_alloc_size)) {
+                /* The resize succeeded! */
+                write_lock_irqsave(&ni->size_lock, flags);
+                ni->allocated_size = le32_to_cpu(a->length) -
+                                le16_to_cpu(a->data.resident.value_offset);
+                write_unlock_irqrestore(&ni->size_lock, flags);
+                if (new_data_size >= 0) {
+                        BUG_ON(new_data_size < attr_len);
+                        a->data.resident.value_length =
+                                        cpu_to_le32((u32)new_data_size);
+                }
+                goto flush_done;
+        }
+        /*
+         * We have to drop all the locks so we can call
+         * ntfs_attr_make_non_resident().  This could be optimised by try-
+         * locking the first page cache page and only if that fails dropping
+         * the locks, locking the page, and redoing all the locking and
+         * lookups.  While this would be a huge optimisation, it is not worth
+         * it as this is definitely a slow code path.
+         */
+        ntfs_attr_put_search_ctx(ctx);
+        unmap_mft_record(base_ni);
+        up_write(&ni->runlist.lock);
+        /*
+         * Not enough space in the mft record, try to make the attribute
+         * non-resident and if successful restart the extension process.
+         */
+        err = ntfs_attr_make_non_resident(ni, attr_len);
+        if (likely(!err))
+                goto retry_extend;
+        /*
+         * Could not make non-resident.  If this is due to this not being
+         * permitted for this attribute type or there not being enough space,
+         * try to make other attributes non-resident.  Otherwise fail.
+         */
+        if (unlikely(err != -EPERM && err != -ENOSPC)) {
+                /* Only emit errors when the write will fail completely. */
+                read_lock_irqsave(&ni->size_lock, flags);
+                allocated_size = ni->allocated_size;
+                read_unlock_irqrestore(&ni->size_lock, flags);
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Cannot extend allocation of "
+                                        "inode 0x%lx, attribute type 0x%x, "
+                                        "because the conversion from resident "
+                                        "to non-resident attribute failed "
+                                        "with error code %i.", vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type), err);
+                if (err != -ENOMEM)
+                        err = -EIO;
+                goto conv_err_out;
+        }
+        /* TODO: Not implemented from here, abort. */
+        read_lock_irqsave(&ni->size_lock, flags);
+        allocated_size = ni->allocated_size;
+        read_unlock_irqrestore(&ni->size_lock, flags);
+        if (start < 0 || start >= allocated_size) {
+                if (err == -ENOSPC)
+                        ntfs_error(vol->sb, "Not enough space in the mft "
+                                        "record/on disk for the non-resident "
+                                        "attribute value.  This case is not "
+                                        "implemented yet.");
+                else /* if (err == -EPERM) */
+                        ntfs_error(vol->sb, "This attribute type may not be "
+                                        "non-resident.  This case is not "
+                                        "implemented yet.");
+        }
+        err = -EOPNOTSUPP;
+        goto conv_err_out;
+#if 0
+        // TODO: Attempt to make other attributes non-resident.
+        if (!err)
+                goto do_resident_extend;
+        /*
+         * Both the attribute list attribute and the standard information
+         * attribute must remain in the base inode.  Thus, if this is one of
+         * these attributes, we have to try to move other attributes out into
+         * extent mft records instead.
+         */
+        if (ni->type == AT_ATTRIBUTE_LIST ||
+                        ni->type == AT_STANDARD_INFORMATION) {
+                // TODO: Attempt to move other attributes into extent mft
+                // records.
+                err = -EOPNOTSUPP;
+                if (!err)
+                        goto do_resident_extend;
+                goto err_out;
+        }
+        // TODO: Attempt to move this attribute to an extent mft record, but
+        // only if it is not already the only attribute in an mft record in
+        // which case there would be nothing to gain.
+        err = -EOPNOTSUPP;
+        if (!err)
+                goto do_resident_extend;
+        /* There is nothing we can do to make enough space. )-: */
+        goto err_out;
+#endif
+do_non_resident_extend:
+        BUG_ON(!NInoNonResident(ni));
+        if (new_alloc_size == allocated_size) {
+                BUG_ON(vcn);
+                goto alloc_done;
+        }
+        /*
+         * If the data starts after the end of the old allocation, this is a
+         * $DATA attribute and sparse attributes are enabled on the volume and
+         * for this inode, then create a sparse region between the old
+         * allocated size and the start of the data.  Otherwise simply proceed
+         * with filling the whole space between the old allocated size and the
+         * new allocated size with clusters.
+         */
+        if ((start >= 0 && start <= allocated_size) || ni->type != AT_DATA ||
+                        !NVolSparseEnabled(vol) || NInoSparseDisabled(ni))
+                goto skip_sparse;
+        // TODO: This is not implemented yet.  We just fill in with real
+        // clusters for now...
+        ntfs_debug("Inserting holes is not-implemented yet.  Falling back to "
+                        "allocating real clusters instead.");
+skip_sparse:
+        rl = ni->runlist.rl;
+        if (likely(rl)) {
+                /* Seek to the end of the runlist. */
+                while (rl->length)
+                        rl++;
+        }
+        /* If this attribute extent is not mapped, map it now. */
+        if (unlikely(!rl || rl->lcn == LCN_RL_NOT_MAPPED ||
+                        (rl->lcn == LCN_ENOENT && rl > ni->runlist.rl &&
+                        (rl-1)->lcn == LCN_RL_NOT_MAPPED))) {
+                if (!rl && !allocated_size)
+                        goto first_alloc;
+                rl = ntfs_mapping_pairs_decompress(vol, a, ni->runlist.rl);
+                if (IS_ERR(rl)) {
+                        err = PTR_ERR(rl);
+                        if (start < 0 || start >= allocated_size)
+                                ntfs_error(vol->sb, "Cannot extend allocation "
+                                                "of inode 0x%lx, attribute "
+                                                "type 0x%x, because the "
+                                                "mapping of a runlist "
+                                                "fragment failed with error "
+                                                "code %i.", vi->i_ino,
+                                                (unsigned)le32_to_cpu(ni->type),
+                                                err);
+                        if (err != -ENOMEM)
+                                err = -EIO;
+                        goto err_out;
+                }
+                ni->runlist.rl = rl;
+                /* Seek to the end of the runlist. */
+                while (rl->length)
+                        rl++;
+        }
+        /*
+         * We now know the runlist of the last extent is mapped and @rl is at
+         * the end of the runlist.  We want to begin allocating clusters
+         * starting at the last allocated cluster to reduce fragmentation.  If
+         * there are no valid LCNs in the attribute we let the cluster
+         * allocator choose the starting cluster.
+         */
+        /* If the last LCN is a hole or similar seek back to last real LCN. */
+        while (rl->lcn < 0 && rl > ni->runlist.rl)
+                rl--;
+first_alloc:
+        // FIXME: Need to implement partial allocations so at least part of the
+        // write can be performed when start >= 0.  (Needed for POSIX write(2)
+        // conformance.)
+        rl2 = ntfs_cluster_alloc(vol, allocated_size >> vol->cluster_size_bits,
+                        (new_alloc_size - allocated_size) >>
+                        vol->cluster_size_bits, (rl && (rl->lcn >= 0)) ?
+                        rl->lcn + rl->length : -1, DATA_ZONE, TRUE);
+        if (IS_ERR(rl2)) {
+                err = PTR_ERR(rl2);
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Cannot extend allocation of "
+                                        "inode 0x%lx, attribute type 0x%x, "
+                                        "because the allocation of clusters "
+                                        "failed with error code %i.", vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type), err);
+                if (err != -ENOMEM && err != -ENOSPC)
+                        err = -EIO;
+                goto err_out;
+        }
+        rl = ntfs_runlists_merge(ni->runlist.rl, rl2);
+        if (IS_ERR(rl)) {
+                err = PTR_ERR(rl);
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Cannot extend allocation of "
+                                        "inode 0x%lx, attribute type 0x%x, "
+                                        "because the runlist merge failed "
+                                        "with error code %i.", vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type), err);
+                if (err != -ENOMEM)
+                        err = -EIO;
+                if (ntfs_cluster_free_from_rl(vol, rl2)) {
+                        ntfs_error(vol->sb, "Failed to release allocated "
+                                        "cluster(s) in error code path.  Run "
+                                        "chkdsk to recover the lost "
+                                        "cluster(s).");
+                        NVolSetErrors(vol);
+                }
+                ntfs_free(rl2);
+                goto err_out;
+        }
+        ni->runlist.rl = rl;
+        ntfs_debug("Allocated 0x%llx clusters.", (long long)(new_alloc_size -
+                        allocated_size) >> vol->cluster_size_bits);
+        /* Find the runlist element with which the attribute extent starts. */
+        ll = sle64_to_cpu(a->data.non_resident.lowest_vcn);
+        rl2 = ntfs_rl_find_vcn_nolock(rl, ll);
+        BUG_ON(!rl2);
+        BUG_ON(!rl2->length);
+        BUG_ON(rl2->lcn < LCN_HOLE);
+        mp_rebuilt = FALSE;
+        /* Get the size for the new mapping pairs array for this extent. */
+        mp_size = ntfs_get_size_for_mapping_pairs(vol, rl2, ll, -1);
+        if (unlikely(mp_size <= 0)) {
+                err = mp_size;
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Cannot extend allocation of "
+                                        "inode 0x%lx, attribute type 0x%x, "
+                                        "because determining the size for the "
+                                        "mapping pairs failed with error code "
+                                        "%i.", vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type), err);
+                err = -EIO;
+                goto undo_alloc;
+        }
+        /* Extend the attribute record to fit the bigger mapping pairs array. */
+        attr_len = le32_to_cpu(a->length);
+        err = ntfs_attr_record_resize(m, a, mp_size +
+                        le16_to_cpu(a->data.non_resident.mapping_pairs_offset));
+        if (unlikely(err)) {
+                BUG_ON(err != -ENOSPC);
+                // TODO: Deal with this by moving this extent to a new mft
+                // record or by starting a new extent in a new mft record,
+                // possibly by extending this extent partially and filling it
+                // and creating a new extent for the remainder, or by making
+                // other attributes non-resident and/or by moving other
+                // attributes out of this mft record.
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Not enough space in the mft "
+                                        "record for the extended attribute "
+                                        "record.  This case is not "
+                                        "implemented yet.");
+                err = -EOPNOTSUPP;
+                goto undo_alloc;
+        }
+        mp_rebuilt = TRUE;
+        /* Generate the mapping pairs array directly into the attr record. */
+        err = ntfs_mapping_pairs_build(vol, (u8*)a +
+                        le16_to_cpu(a->data.non_resident.mapping_pairs_offset),
+                        mp_size, rl2, ll, -1, NULL);
+        if (unlikely(err)) {
+                if (start < 0 || start >= allocated_size)
+                        ntfs_error(vol->sb, "Cannot extend allocation of "
+                                        "inode 0x%lx, attribute type 0x%x, "
+                                        "because building the mapping pairs "
+                                        "failed with error code %i.", vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type), err);
+                err = -EIO;
+                goto undo_alloc;
+        }
+        /* Update the highest_vcn. */
+        a->data.non_resident.highest_vcn = cpu_to_sle64((new_alloc_size >>
+                        vol->cluster_size_bits) - 1);
+        /*
+         * We now have extended the allocated size of the attribute.  Reflect
+         * this in the ntfs_inode structure and the attribute record.
+         */
+        if (a->data.non_resident.lowest_vcn) {
+                /*
+                 * We are not in the first attribute extent, switch to it, but
+                 * first ensure the changes will make it to disk later.
+                 */
+                flush_dcache_mft_record_page(ctx->ntfs_ino);
+                mark_mft_record_dirty(ctx->ntfs_ino);
+                ntfs_attr_reinit_search_ctx(ctx);
+                err = ntfs_attr_lookup(ni->type, ni->name, ni->name_len,
+                                CASE_SENSITIVE, 0, NULL, 0, ctx);
+                if (unlikely(err))
+                        goto restore_undo_alloc;
+                /* @m is not used any more so no need to set it. */
+                a = ctx->attr;
+        }
+        write_lock_irqsave(&ni->size_lock, flags);
+        ni->allocated_size = new_alloc_size;
+        a->data.non_resident.allocated_size = cpu_to_sle64(new_alloc_size);
+        /*
+         * FIXME: This would fail if @ni is a directory, $MFT, or an index,
+         * since those can have sparse/compressed set.  E.g. a directory can be
+         * set compressed even though it is not compressed itself and in that
+         * case the bit means that files are to be created compressed in the
+         * directory...  At present this is ok as this code is only called for
+         * regular files, and only for their $DATA attribute(s).
+         * FIXME: The calculation is wrong if we created a hole above.  For now
+         * it does not matter as we never create holes.
+         */
+        if (NInoSparse(ni) || NInoCompressed(ni)) {
+                ni->itype.compressed.size += new_alloc_size - allocated_size;
+                a->data.non_resident.compressed_size =
+                                cpu_to_sle64(ni->itype.compressed.size);
+                vi->i_blocks = ni->itype.compressed.size >> 9;
+        } else
+                vi->i_blocks = new_alloc_size >> 9;
+        write_unlock_irqrestore(&ni->size_lock, flags);
+alloc_done:
+        if (new_data_size >= 0) {
+                BUG_ON(new_data_size <
+                                sle64_to_cpu(a->data.non_resident.data_size));
+                a->data.non_resident.data_size = cpu_to_sle64(new_data_size);
+        }
+flush_done:
+        /* Ensure the changes make it to disk. */
+        flush_dcache_mft_record_page(ctx->ntfs_ino);
+        mark_mft_record_dirty(ctx->ntfs_ino);
+done:
+        ntfs_attr_put_search_ctx(ctx);
+        unmap_mft_record(base_ni);
+        up_write(&ni->runlist.lock);
+        ntfs_debug("Done, new_allocated_size 0x%llx.",
+                        (unsigned long long)new_alloc_size);
+        return new_alloc_size;
+restore_undo_alloc:
+        if (start < 0 || start >= allocated_size)
+                ntfs_error(vol->sb, "Cannot complete extension of allocation "
+                                "of inode 0x%lx, attribute type 0x%x, because "
+                                "lookup of first attribute extent failed with "
+                                "error code %i.", vi->i_ino,
+                                (unsigned)le32_to_cpu(ni->type), err);
+        if (err == -ENOENT)
+                err = -EIO;
+        ntfs_attr_reinit_search_ctx(ctx);
+        if (ntfs_attr_lookup(ni->type, ni->name, ni->name_len, CASE_SENSITIVE,
+                        allocated_size >> vol->cluster_size_bits, NULL, 0,
+                        ctx)) {
+                ntfs_error(vol->sb, "Failed to find last attribute extent of "
+                                "attribute in error code path.  Run chkdsk to "
+                                "recover.");
+                write_lock_irqsave(&ni->size_lock, flags);
+                ni->allocated_size = new_alloc_size;
+                /*
+                 * FIXME: This would fail if @ni is a directory...  See above.
+                 * FIXME: The calculation is wrong if we created a hole above.
+                 * For now it does not matter as we never create holes.
+                 */
+                if (NInoSparse(ni) || NInoCompressed(ni)) {
+                        ni->itype.compressed.size += new_alloc_size -
+                                        allocated_size;
+                        vi->i_blocks = ni->itype.compressed.size >> 9;
+                } else
+                        vi->i_blocks = new_alloc_size >> 9;
+                write_unlock_irqrestore(&ni->size_lock, flags);
+                ntfs_attr_put_search_ctx(ctx);
+                unmap_mft_record(base_ni);
+                up_write(&ni->runlist.lock);
+                /*
+                 * The only thing that is now wrong is the allocated size of the
+                 * base attribute extent which chkdsk should be able to fix.
+                 */
+                NVolSetErrors(vol);
+                return err;
+        }
+        ctx->attr->data.non_resident.highest_vcn = cpu_to_sle64(
+                        (allocated_size >> vol->cluster_size_bits) - 1);
+undo_alloc:
+        ll = allocated_size >> vol->cluster_size_bits;
+        if (ntfs_cluster_free(ni, ll, -1, ctx) < 0) {
+                ntfs_error(vol->sb, "Failed to release allocated cluster(s) "
+                                "in error code path.  Run chkdsk to recover "
+                                "the lost cluster(s).");
+                NVolSetErrors(vol);
+        }
+        m = ctx->mrec;
+        a = ctx->attr;
+        /*
+         * If the runlist truncation fails and/or the search context is no
+         * longer valid, we cannot resize the attribute record or build the
+         * mapping pairs array thus we mark the inode bad so that no access to
+         * the freed clusters can happen.
+         */
+        if (ntfs_rl_truncate_nolock(vol, &ni->runlist, ll) || IS_ERR(m)) {
+                ntfs_error(vol->sb, "Failed to %s in error code path.  Run "
+                                "chkdsk to recover.", IS_ERR(m) ?
+                                "restore attribute search context" :
+                                "truncate attribute runlist");
+                make_bad_inode(vi);
+                make_bad_inode(VFS_I(base_ni));
+                NVolSetErrors(vol);
+        } else if (mp_rebuilt) {
+                if (ntfs_attr_record_resize(m, a, attr_len)) {
+                        ntfs_error(vol->sb, "Failed to restore attribute "
+                                        "record in error code path.  Run "
+                                        "chkdsk to recover.");
+                        make_bad_inode(vi);
+                        make_bad_inode(VFS_I(base_ni));
+                        NVolSetErrors(vol);
+                } else /* if (success) */ {
+                        if (ntfs_mapping_pairs_build(vol, (u8*)a + le16_to_cpu(
+                                        a->data.non_resident.
+                                        mapping_pairs_offset), attr_len -
+                                        le16_to_cpu(a->data.non_resident.
+                                        mapping_pairs_offset), rl2, ll, -1,
+                                        NULL)) {
+                                ntfs_error(vol->sb, "Failed to restore "
+                                                "mapping pairs array in error "
+                                                "code path.  Run chkdsk to "
+                                                "recover.");
+                                make_bad_inode(vi);
+                                make_bad_inode(VFS_I(base_ni));
+                                NVolSetErrors(vol);
+                        }
+                        flush_dcache_mft_record_page(ctx->ntfs_ino);
+                        mark_mft_record_dirty(ctx->ntfs_ino);
+                }
+        }
+err_out:
+        if (ctx)
+                ntfs_attr_put_search_ctx(ctx);
+        if (m)
+                unmap_mft_record(base_ni);
+        up_write(&ni->runlist.lock);
+conv_err_out:
+        ntfs_debug("Failed.  Returning error code %i.", err);
+        return err;
+}
+/**
 * ntfs_attr_set - fill (a part of) an attribute with a byte
 * @ni:         ntfs inode describing the attribute to fill
 * @ofs:        offset inside the attribute at which to start to fill
diff --git a/fs/ntfs/attrib.h b/fs/ntfs/attrib.h
index 0618ed6fd7b3..9074886b44ba 100644
--- a/fs/ntfs/attrib.h
+++ b/fs/ntfs/attrib.h
@@ -60,14 +60,15 @@ typedef struct {
        ATTR_RECORD *base_attr;
 } ntfs_attr_search_ctx;
-extern int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn);
+extern int ntfs_map_runlist_nolock(ntfs_inode *ni, VCN vcn,
+                ntfs_attr_search_ctx *ctx);
 extern int ntfs_map_runlist(ntfs_inode *ni, VCN vcn);
 extern LCN ntfs_attr_vcn_to_lcn_nolock(ntfs_inode *ni, const VCN vcn,
                const BOOL write_locked);
 extern runlist_element *ntfs_attr_find_vcn_nolock(ntfs_inode *ni,
-                const VCN vcn, const BOOL write_locked);
+                const VCN vcn, ntfs_attr_search_ctx *ctx);
 int ntfs_attr_lookup(const ATTR_TYPE type, const ntfschar *name,
                const u32 name_len, const IGNORE_CASE_BOOL ic,
@@ -102,7 +103,10 @@ extern int ntfs_attr_record_resize(MFT_RECORD *m, ATTR_RECORD *a, u32 new_size);
 extern int ntfs_resident_attr_value_resize(MFT_RECORD *m, ATTR_RECORD *a,
                const u32 new_size);
-extern int ntfs_attr_make_non_resident(ntfs_inode *ni);
+extern int ntfs_attr_make_non_resident(ntfs_inode *ni, const u32 data_size);
+extern s64 ntfs_attr_extend_allocation(ntfs_inode *ni, s64 new_alloc_size,
+                const s64 new_data_size, const s64 data_start);
 extern int ntfs_attr_set(ntfs_inode *ni, const s64 ofs, const s64 cnt,
                const u8 val);
diff --git a/fs/ntfs/inode.c b/fs/ntfs/inode.c
index 7ec045131808..b24f4c4b2c5c 100644
--- a/fs/ntfs/inode.c
+++ b/fs/ntfs/inode.c
@@ -30,6 +30,7 @@
 #include "debug.h"
 #include "inode.h"
 #include "attrib.h"
+#include "lcnalloc.h"
 #include "malloc.h"
 #include "mft.h"
 #include "time.h"
@@ -2291,11 +2292,16 @@ int ntfs_show_options(struct seq_file *sf, struct vfsmount *mnt)
 #ifdef NTFS_RW
+static const char *es = "  Leaving inconsistent metadata.  Unmount and run "
+                "chkdsk.";
 /**
 * ntfs_truncate - called when the i_size of an ntfs inode is changed
 * @vi:         inode for which the i_size was changed
 *
- * We do not support i_size changes yet.
+ * We only support i_size changes for normal files at present, i.e. not
+ * compressed and not encrypted.  This is enforced in ntfs_setattr(), see
+ * below.
 *
 * The kernel guarantees that @vi is a regular file (S_ISREG() is true) and
 * that the change is allowed.
@@ -2306,80 +2312,499 @@ int ntfs_show_options(struct seq_file *sf, struct vfsmount *mnt)
 * Returns 0 on success or -errno on error.
 *
 * Called with ->i_sem held.  In all but one case ->i_alloc_sem is held for
- * writing.  The only case where ->i_alloc_sem is not held is
+ * writing.  The only case in the kernel where ->i_alloc_sem is not held is
 * mm/filemap.c::generic_file_buffered_write() where vmtruncate() is called
- * with the current i_size as the offset which means that it is a noop as far
+ * with the current i_size as the offset.  The analogous place in NTFS is in
- * as ntfs_truncate() is concerned.
+ * fs/ntfs/file.c::ntfs_file_buffered_write() where we call vmtruncate() again
+ * without holding ->i_alloc_sem.
 */
 int ntfs_truncate(struct inode *vi)
 {
-        ntfs_inode *ni = NTFS_I(vi);
+        s64 new_size, old_size, nr_freed, new_alloc_size, old_alloc_size;
+        VCN highest_vcn;
+        unsigned long flags;
+        ntfs_inode *base_ni, *ni = NTFS_I(vi);
        ntfs_volume *vol = ni->vol;
        ntfs_attr_search_ctx *ctx;
        MFT_RECORD *m;
        ATTR_RECORD *a;
        const char *te = "  Leaving file length out of sync with i_size.";
-        int err;
+        int err, mp_size, size_change, alloc_change;
+        u32 attr_len;
        ntfs_debug("Entering for inode 0x%lx.", vi->i_ino);
        BUG_ON(NInoAttr(ni));
+        BUG_ON(S_ISDIR(vi->i_mode));
+        BUG_ON(NInoMstProtected(ni));
        BUG_ON(ni->nr_extents < 0);
-        m = map_mft_record(ni);
+retry_truncate:
+        /*
+         * Lock the runlist for writing and map the mft record to ensure it is
+         * safe to mess with the attribute runlist and sizes.
+         */
+        down_write(&ni->runlist.lock);
+        if (!NInoAttr(ni))
+                base_ni = ni;
+        else
+                base_ni = ni->ext.base_ntfs_ino;
+        m = map_mft_record(base_ni);
        if (IS_ERR(m)) {
                err = PTR_ERR(m);
                ntfs_error(vi->i_sb, "Failed to map mft record for inode 0x%lx "
                                "(error code %d).%s", vi->i_ino, err, te);
                ctx = NULL;
                m = NULL;
-                goto err_out;
+                goto old_bad_out;
        }
-        ctx = ntfs_attr_get_search_ctx(ni, m);
+        ctx = ntfs_attr_get_search_ctx(base_ni, m);
        if (unlikely(!ctx)) {
                ntfs_error(vi->i_sb, "Failed to allocate a search context for "
                                "inode 0x%lx (not enough memory).%s",
                                vi->i_ino, te);
                err = -ENOMEM;
-                goto err_out;
+                goto old_bad_out;
        }
        err = ntfs_attr_lookup(ni->type, ni->name, ni->name_len,
                        CASE_SENSITIVE, 0, NULL, 0, ctx);
        if (unlikely(err)) {
-                if (err == -ENOENT)
+                if (err == -ENOENT) {
                        ntfs_error(vi->i_sb, "Open attribute is missing from "
                                        "mft record.  Inode 0x%lx is corrupt.  "
-                                        "Run chkdsk.", vi->i_ino);
+                                        "Run chkdsk.%s", vi->i_ino, te);
-                else
+                        err = -EIO;
+                } else
                        ntfs_error(vi->i_sb, "Failed to lookup attribute in "
-                                        "inode 0x%lx (error code %d).",
+                                        "inode 0x%lx (error code %d).%s",
-                                        vi->i_ino, err);
+                                        vi->i_ino, err, te);
-                goto err_out;
+                goto old_bad_out;
        }
+        m = ctx->mrec;
        a = ctx->attr;
-        /* If the size has not changed there is nothing to do. */
+        /*
-        if (ntfs_attr_size(a) == i_size_read(vi))
+         * The i_size of the vfs inode is the new size for the attribute value.
-                goto done;
+         */
-        // TODO: Implement the truncate...
+        new_size = i_size_read(vi);
-        ntfs_error(vi->i_sb, "Inode size has changed but this is not "
+        /* The current size of the attribute value is the old size. */
-                        "implemented yet.  Resetting inode size to old value. "
+        old_size = ntfs_attr_size(a);
-                        " This is most likely a bug in the ntfs driver!");
+        /* Calculate the new allocated size. */
-        i_size_write(vi, ntfs_attr_size(a)); 
+        if (NInoNonResident(ni))
-done:
+                new_alloc_size = (new_size + vol->cluster_size - 1) &
+                                ~(s64)vol->cluster_size_mask;
+        else
+                new_alloc_size = (new_size + 7) & ~7;
+        /* The current allocated size is the old allocated size. */
+        read_lock_irqsave(&ni->size_lock, flags);
+        old_alloc_size = ni->allocated_size;
+        read_unlock_irqrestore(&ni->size_lock, flags);
+        /*
+         * The change in the file size.  This will be 0 if no change, >0 if the
+         * size is growing, and <0 if the size is shrinking.
+         */
+        size_change = -1;
+        if (new_size - old_size >= 0) {
+                size_change = 1;
+                if (new_size == old_size)
+                        size_change = 0;
+        }
+        /* As above for the allocated size. */
+        alloc_change = -1;
+        if (new_alloc_size - old_alloc_size >= 0) {
+                alloc_change = 1;
+                if (new_alloc_size == old_alloc_size)
+                        alloc_change = 0;
+        }
+        /*
+         * If neither the size nor the allocation is being changed there is
+         * nothing to do.
+         */
+        if (!size_change && !alloc_change)
+                goto unm_done;
+        /* If the size is changing, check if new size is allowed in $AttrDef. */
+        if (size_change) {
+                err = ntfs_attr_size_bounds_check(vol, ni->type, new_size);
+                if (unlikely(err)) {
+                        if (err == -ERANGE) {
+                                ntfs_error(vol->sb, "Truncate would cause the "
+                                                "inode 0x%lx to %simum size "
+                                                "for its attribute type "
+                                                "(0x%x).  Aborting truncate.",
+                                                vi->i_ino,
+                                                new_size > old_size ? "exceed "
+                                                "the max" : "go under the min",
+                                                le32_to_cpu(ni->type));
+                                err = -EFBIG;
+                        } else {
+                                ntfs_error(vol->sb, "Inode 0x%lx has unknown "
+                                                "attribute type 0x%x.  "
+                                                "Aborting truncate.",
+                                                vi->i_ino,
+                                                le32_to_cpu(ni->type));
+                                err = -EIO;
+                        }
+                        /* Reset the vfs inode size to the old size. */
+                        i_size_write(vi, old_size);
+                        goto err_out;
+                }
+        }
+        if (NInoCompressed(ni) || NInoEncrypted(ni)) {
+                ntfs_warning(vi->i_sb, "Changes in inode size are not "
+                                "supported yet for %s files, ignoring.",
+                                NInoCompressed(ni) ? "compressed" :
+                                "encrypted");
+                err = -EOPNOTSUPP;
+                goto bad_out;
+        }
+        if (a->non_resident)
+                goto do_non_resident_truncate;
+        BUG_ON(NInoNonResident(ni));
+        /* Resize the attribute record to best fit the new attribute size. */
+        if (new_size < vol->mft_record_size &&
+                        !ntfs_resident_attr_value_resize(m, a, new_size)) {
+                unsigned long flags;
+                /* The resize succeeded! */
+                flush_dcache_mft_record_page(ctx->ntfs_ino);
+                mark_mft_record_dirty(ctx->ntfs_ino);
+                write_lock_irqsave(&ni->size_lock, flags);
+                /* Update the sizes in the ntfs inode and all is done. */
+                ni->allocated_size = le32_to_cpu(a->length) -
+                                le16_to_cpu(a->data.resident.value_offset);
+                /*
+                 * Note ntfs_resident_attr_value_resize() has already done any
+                 * necessary data clearing in the attribute record.  When the
+                 * file is being shrunk vmtruncate() will already have cleared
+                 * the top part of the last partial page, i.e. since this is
+                 * the resident case this is the page with index 0.  However,
+                 * when the file is being expanded, the page cache page data
+                 * between the old data_size, i.e. old_size, and the new_size
+                 * has not been zeroed.  Fortunately, we do not need to zero it
+                 * either: on the one hand it will already be zero due to both
+                 * readpage and writepage clearing partial page data beyond
+                 * i_size, in which case there is nothing to do; on the other
+                 * hand, if the file is mmap()ped at the same time, POSIX
+                 * specifies that the behaviour is unspecified, thus we do not
+                 * have to do anything.  This means that in our implementation
+                 * in the rare case that the file is mmap()ped and a write
+                 * occurred into the mmap()ped region just beyond the file size
+                 * and writepage has not yet been called to write out the page
+                 * (which would clear the area beyond the file size) and we now
+                 * extend the file size to incorporate this dirty region
+                 * outside the file size, a write of the page would result in
+                 * this data being written to disk instead of being cleared.
+                 * Given both POSIX and the Linux mmap(2) man page specify that
+                 * this corner case is undefined, we choose to leave it like
+                 * that as this is much simpler for us as we cannot lock the
+                 * relevant page now since we are holding too many ntfs locks
+                 * which would result in a lock reversal deadlock.
+                 */
+                ni->initialized_size = new_size;
+                write_unlock_irqrestore(&ni->size_lock, flags);
+                goto unm_done;
+        }
+        /* If the above resize failed, this must be an attribute extension. */
+        BUG_ON(size_change < 0);
+        /*
+         * We have to drop all the locks so we can call
+         * ntfs_attr_make_non_resident().  This could be optimised by try-
+         * locking the first page cache page and only if that fails dropping
+         * the locks, locking the page, and redoing all the locking and
+         * lookups.  While this would be a huge optimisation, it is not worth
+         * it as this is definitely a slow code path as it only ever can happen
+         * once for any given file.
+         */
        ntfs_attr_put_search_ctx(ctx);
-        unmap_mft_record(ni);
+        unmap_mft_record(base_ni);
-        NInoClearTruncateFailed(ni);
+        up_write(&ni->runlist.lock);
-        ntfs_debug("Done.");
+        /*
-        return 0;
+         * Not enough space in the mft record, try to make the attribute
-err_out:
+         * non-resident and if successful restart the truncation process.
-        if (err != -ENOMEM) {
+         */
+        err = ntfs_attr_make_non_resident(ni, old_size);
+        if (likely(!err))
+                goto retry_truncate;
+        /*
+         * Could not make non-resident.  If this is due to this not being
+         * permitted for this attribute type or there not being enough space,
+         * try to make other attributes non-resident.  Otherwise fail.
+         */
+        if (unlikely(err != -EPERM && err != -ENOSPC)) {
+                ntfs_error(vol->sb, "Cannot truncate inode 0x%lx, attribute "
+                                "type 0x%x, because the conversion from "
+                                "resident to non-resident attribute failed "
+                                "with error code %i.", vi->i_ino,
+                                (unsigned)le32_to_cpu(ni->type), err);
+                if (err != -ENOMEM)
+                        err = -EIO;
+                goto conv_err_out;
+        }
+        /* TODO: Not implemented from here, abort. */
+        if (err == -ENOSPC)
+                ntfs_error(vol->sb, "Not enough space in the mft record/on "
+                                "disk for the non-resident attribute value.  "
+                                "This case is not implemented yet.");
+        else /* if (err == -EPERM) */
+                ntfs_error(vol->sb, "This attribute type may not be "
+                                "non-resident.  This case is not implemented "
+                                "yet.");
+        err = -EOPNOTSUPP;
+        goto conv_err_out;
+#if 0
+        // TODO: Attempt to make other attributes non-resident.
+        if (!err)
+                goto do_resident_extend;
+        /*
+         * Both the attribute list attribute and the standard information
+         * attribute must remain in the base inode.  Thus, if this is one of
+         * these attributes, we have to try to move other attributes out into
+         * extent mft records instead.
+         */
+        if (ni->type == AT_ATTRIBUTE_LIST ||
+                        ni->type == AT_STANDARD_INFORMATION) {
+                // TODO: Attempt to move other attributes into extent mft
+                // records.
+                err = -EOPNOTSUPP;
+                if (!err)
+                        goto do_resident_extend;
+                goto err_out;
+        }
+        // TODO: Attempt to move this attribute to an extent mft record, but
+        // only if it is not already the only attribute in an mft record in
+        // which case there would be nothing to gain.
+        err = -EOPNOTSUPP;
+        if (!err)
+                goto do_resident_extend;
+        /* There is nothing we can do to make enough space. )-: */
+        goto err_out;
+#endif
+do_non_resident_truncate:
+        BUG_ON(!NInoNonResident(ni));
+        if (alloc_change < 0) {
+                highest_vcn = sle64_to_cpu(a->data.non_resident.highest_vcn);
+                if (highest_vcn > 0 &&
+                                old_alloc_size >> vol->cluster_size_bits >
+                                highest_vcn + 1) {
+                        /*
+                         * This attribute has multiple extents.  Not yet
+                         * supported.
+                         */
+                        ntfs_error(vol->sb, "Cannot truncate inode 0x%lx, "
+                                        "attribute type 0x%x, because the "
+                                        "attribute is highly fragmented (it "
+                                        "consists of multiple extents) and "
+                                        "this case is not implemented yet.",
+                                        vi->i_ino,
+                                        (unsigned)le32_to_cpu(ni->type));
+                        err = -EOPNOTSUPP;
+                        goto bad_out;
+                }
+        }
+        /*
+         * If the size is shrinking, need to reduce the initialized_size and
+         * the data_size before reducing the allocation.
+         */
+        if (size_change < 0) {
+                /*
+                 * Make the valid size smaller (i_size is already up-to-date).
+                 */
+                write_lock_irqsave(&ni->size_lock, flags);
+                if (new_size < ni->initialized_size) {
+                        ni->initialized_size = new_size;
+                        a->data.non_resident.initialized_size =
+                                        cpu_to_sle64(new_size);
+                }
+                a->data.non_resident.data_size = cpu_to_sle64(new_size);
+                write_unlock_irqrestore(&ni->size_lock, flags);
+                flush_dcache_mft_record_page(ctx->ntfs_ino);
+                mark_mft_record_dirty(ctx->ntfs_ino);
+                /* If the allocated size is not changing, we are done. */
+                if (!alloc_change)
+                        goto unm_done;
+                /*
+                 * If the size is shrinking it makes no sense for the
+                 * allocation to be growing.
+                 */
+                BUG_ON(alloc_change > 0);
+        } else /* if (size_change >= 0) */ {
+                /*
+                 * The file size is growing or staying the same but the
+                 * allocation can be shrinking, growing or staying the same.
+                 */
+                if (alloc_change > 0) {
+                        /*
+                         * We need to extend the allocation and possibly update
+                         * the data size.  If we are updating the data size,
+                         * since we are not touching the initialized_size we do
+                         * not need to worry about the actual data on disk.
+                         * And as far as the page cache is concerned, there
+                         * will be no pages beyond the old data size and any
+                         * partial region in the last page between the old and
+                         * new data size (or the end of the page if the new
+                         * data size is outside the page) does not need to be
+                         * modified as explained above for the resident
+                         * attribute truncate case.  To do this, we simply drop
+                         * the locks we hold and leave all the work to our
+                         * friendly helper ntfs_attr_extend_allocation().
+                         */
+                        ntfs_attr_put_search_ctx(ctx);
+                        unmap_mft_record(base_ni);
+                        up_write(&ni->runlist.lock);
+                        err = ntfs_attr_extend_allocation(ni, new_size,
+                                        size_change > 0 ? new_size : -1, -1);
+                        /*
+                         * ntfs_attr_extend_allocation() will have done error
+                         * output already.  NOTE(review): it is declared as
+                         * returning s64 while @err is an int and is returned
+                         * as is at done; confirm the success value is 0.
+                         */
+                        goto done;
+                }
+                if (!alloc_change)
+                        goto alloc_done;
+        }
+        /* alloc_change < 0 */
+        /* Free the clusters. */
+        nr_freed = ntfs_cluster_free(ni, new_alloc_size >>
+                        vol->cluster_size_bits, -1, ctx);
+        m = ctx->mrec;
+        a = ctx->attr;
+        if (unlikely(nr_freed < 0)) {
+                ntfs_error(vol->sb, "Failed to release cluster(s) (error code "
+                                "%lli).  Unmount and run chkdsk to recover "
+                                "the lost cluster(s).", (long long)nr_freed);
                NVolSetErrors(vol);
+                nr_freed = 0;
+        }
+        /* Truncate the runlist. */
+        err = ntfs_rl_truncate_nolock(vol, &ni->runlist,
+                        new_alloc_size >> vol->cluster_size_bits);
+        /*
+         * If the runlist truncation failed and/or the search context is no
+         * longer valid, we cannot resize the attribute record or build the
+         * mapping pairs array thus we mark the inode bad so that no access to
+         * the freed clusters can happen.
+         * NOTE(review): with IS_ERR(m) the err_out path still sees a non-NULL
+         * @m and calls unmap_mft_record(); confirm that is intended.
+         */
+        if (unlikely(err || IS_ERR(m))) {
+                ntfs_error(vol->sb, "Failed to %s (error code %li).%s",
+                                IS_ERR(m) ?
+                                "restore attribute search context" :
+                                "truncate attribute runlist",
+                                IS_ERR(m) ? PTR_ERR(m) : err, es);
+                err = -EIO;
+                goto bad_out;
+        }
+        /* Get the size for the shrunk mapping pairs array for the runlist. */
+        mp_size = ntfs_get_size_for_mapping_pairs(vol, ni->runlist.rl, 0, -1);
+        if (unlikely(mp_size <= 0)) {
+                ntfs_error(vol->sb, "Cannot shrink allocation of inode 0x%lx, "
+                                "attribute type 0x%x, because determining the "
+                                "size for the mapping pairs failed with error "
+                                "code %i.%s", vi->i_ino,
+                                (unsigned)le32_to_cpu(ni->type), mp_size, es);
+                err = -EIO;
+                goto bad_out;
+        }
+        /*
+         * Shrink the attribute record for the new mapping pairs array.  Note,
+         * this cannot fail since we are making the attribute smaller thus by
+         * definition there is enough space to do so.
+         */
+        attr_len = le32_to_cpu(a->length);
+        err = ntfs_attr_record_resize(m, a, mp_size +
+                        le16_to_cpu(a->data.non_resident.mapping_pairs_offset));
+        BUG_ON(err);
+        /*
+         * Generate the mapping pairs array directly into the attribute record.
+         */
+        err = ntfs_mapping_pairs_build(vol, (u8*)a +
+                        le16_to_cpu(a->data.non_resident.mapping_pairs_offset),
+                        mp_size, ni->runlist.rl, 0, -1, NULL);
+        if (unlikely(err)) {
+                ntfs_error(vol->sb, "Cannot shrink allocation of inode 0x%lx, "
+                                "attribute type 0x%x, because building the "
+                                "mapping pairs failed with error code %i.%s",
+                                vi->i_ino, (unsigned)le32_to_cpu(ni->type),
+                                err, es);
+                err = -EIO;
+                goto bad_out;
+        }
+        /* Update the allocated/compressed size as well as the highest vcn. */
+        a->data.non_resident.highest_vcn = cpu_to_sle64((new_alloc_size >>
+                        vol->cluster_size_bits) - 1);
+        write_lock_irqsave(&ni->size_lock, flags);
+        ni->allocated_size = new_alloc_size;
+        a->data.non_resident.allocated_size = cpu_to_sle64(new_alloc_size);
+        if (NInoSparse(ni) || NInoCompressed(ni)) {
+                if (nr_freed) {
+                        ni->itype.compressed.size -= nr_freed <<
+                                        vol->cluster_size_bits;
+                        BUG_ON(ni->itype.compressed.size < 0);
+                        a->data.non_resident.compressed_size = cpu_to_sle64(
+                                        ni->itype.compressed.size);
+                        vi->i_blocks = ni->itype.compressed.size >> 9;
+                }
+        } else
+                vi->i_blocks = new_alloc_size >> 9;
+        write_unlock_irqrestore(&ni->size_lock, flags);
+        /*
+         * We have shrunk the allocation.  If this is a shrinking truncate we
+         * have already dealt with the initialized_size and the data_size above
+         * and we are done.  If the truncate is only changing the allocation
+         * and not the data_size, we are also done.  If this is an extending
+         * truncate, need to extend the data_size now which is ensured by the
+         * fact that @size_change is positive.
+         */
+alloc_done:
+        /*
+         * If the size is growing, need to update it now.  If it is shrinking,
+         * we have already updated it above (before the allocation change).
+         */
+        if (size_change > 0)
+                a->data.non_resident.data_size = cpu_to_sle64(new_size);
+        /* Ensure the modified mft record is written out. */
+        flush_dcache_mft_record_page(ctx->ntfs_ino);
+        mark_mft_record_dirty(ctx->ntfs_ino);
+unm_done:
+        ntfs_attr_put_search_ctx(ctx);
+        unmap_mft_record(base_ni);
+        up_write(&ni->runlist.lock);
+done:
+        /* Update the mtime and ctime on the base inode. */
+        inode_update_time(VFS_I(base_ni), 1);
+        if (likely(!err)) {
+                NInoClearTruncateFailed(ni);
+                ntfs_debug("Done.");
+        }
+        return err;
+old_bad_out:
+        old_size = -1;
+bad_out:
+        if (err != -ENOMEM && err != -EOPNOTSUPP) {
                make_bad_inode(vi);
+                make_bad_inode(VFS_I(base_ni));
+                NVolSetErrors(vol);
        }
+        if (err != -EOPNOTSUPP)
+                NInoSetTruncateFailed(ni);
+        else if (old_size >= 0)
+                i_size_write(vi, old_size);
+err_out:
        if (ctx)
                ntfs_attr_put_search_ctx(ctx);
        if (m)
-                unmap_mft_record(ni);
+                unmap_mft_record(base_ni);
-        NInoSetTruncateFailed(ni);
+        up_write(&ni->runlist.lock);
+out:
+        ntfs_debug("Failed.  Returning error code %i.", err);
        return err;
+conv_err_out:
+        if (err != -ENOMEM && err != -EOPNOTSUPP) {
+                make_bad_inode(vi);
+                make_bad_inode(VFS_I(base_ni));
+                NVolSetErrors(vol);
+        }
+        if (err != -EOPNOTSUPP)
+                NInoSetTruncateFailed(ni);
+        else
+                i_size_write(vi, old_size);
+        goto out;
 }
 /**
@@ -2420,8 +2845,7 @@ int ntfs_setattr(struct dentry *dentry, struct iattr *attr)
        err = inode_change_ok(vi, attr);
        if (err)
-                return err;
+                goto out;
        /* We do not support NTFS ACLs yet. */
        if (ia_valid & (ATTR_UID | ATTR_GID | ATTR_MODE)) {
                ntfs_warning(vi->i_sb, "Changes in user/group/mode are not "
@@ -2429,14 +2853,22 @@ int ntfs_setattr(struct dentry *dentry, struct iattr *attr)
                err = -EOPNOTSUPP;
                goto out;
        }
        if (ia_valid & ATTR_SIZE) {
                if (attr->ia_size != i_size_read(vi)) {
-                        ntfs_warning(vi->i_sb, "Changes in inode size are not "
+                        ntfs_inode *ni = NTFS_I(vi);
-                                        "supported yet, ignoring.");
+                        /*
-                        err = -EOPNOTSUPP;
+                         * FIXME: For now we do not support resizing of
-                        // TODO: Implement...
+                         * compressed or encrypted files.
-                        // err = vmtruncate(vi, attr->ia_size);
+                         */
+                        if (NInoCompressed(ni) || NInoEncrypted(ni)) {
+                                ntfs_warning(vi->i_sb, "Changes in inode size "
+                                                "are not supported yet for "
+                                                "%s files, ignoring.",
+                                                NInoCompressed(ni) ?
+                                                "compressed" : "encrypted");
+                                err = -EOPNOTSUPP;
+                        } else
+                                err = vmtruncate(vi, attr->ia_size);
                        if (err || ia_valid == ATTR_SIZE)
                                goto out;
                } else {
diff --git a/fs/ntfs/lcnalloc.c b/fs/ntfs/lcnalloc.c
index 5af3bf0b7eee..29cabf93d2d2 100644
--- a/fs/ntfs/lcnalloc.c
+++ b/fs/ntfs/lcnalloc.c
@@ -76,6 +76,7 @@ int ntfs_cluster_free_from_rl_nolock(ntfs_volume *vol,
 * @count:      number of clusters to allocate
 * @start_lcn:  starting lcn at which to allocate the clusters (or -1 if none)
 * @zone:       zone from which to allocate the clusters
+ * @is_extension:       if TRUE, this is an attribute extension
 *
 * Allocate @count clusters preferably starting at cluster @start_lcn or at the
 * current allocator position if @start_lcn is -1, on the mounted ntfs volume
@@ -86,6 +87,13 @@ int ntfs_cluster_free_from_rl_nolock(ntfs_volume *vol,
 * @start_vcn specifies the vcn of the first allocated cluster.  This makes
 * merging the resulting runlist with the old runlist easier.
 *
+ * If @is_extension is TRUE, the caller is allocating clusters to extend an
+ * attribute and if it is FALSE, the caller is allocating clusters to fill a
+ * hole in an attribute.  Practically the difference is that if @is_extension
+ * is TRUE the returned runlist will be terminated with LCN_ENOENT and if
+ * @is_extension is FALSE the runlist will be terminated with
+ * LCN_RL_NOT_MAPPED.
+ *
 * You need to check the return value with IS_ERR().  If this is false, the
 * function was successful and the return value is a runlist describing the
 * allocated cluster(s).  If IS_ERR() is true, the function failed and
@@ -137,7 +145,8 @@ int ntfs_cluster_free_from_rl_nolock(ntfs_volume *vol,
 */
 runlist_element *ntfs_cluster_alloc(ntfs_volume *vol, const VCN start_vcn,
                const s64 count, const LCN start_lcn,
-                const NTFS_CLUSTER_ALLOCATION_ZONES zone)
+                const NTFS_CLUSTER_ALLOCATION_ZONES zone,
+                const BOOL is_extension)
 {
        LCN zone_start, zone_end, bmp_pos, bmp_initial_pos, last_read_pos, lcn;
        LCN prev_lcn = 0, prev_run_len = 0, mft_zone_size;
@@ -310,7 +319,7 @@ runlist_element *ntfs_cluster_alloc(ntfs_volume *vol, const VCN start_vcn,
                                continue;
                        }
                        bit = 1 << (lcn & 7);
-                        ntfs_debug("bit %i.", bit);
+                        ntfs_debug("bit 0x%x.", bit);
                        /* If the bit is already set, go onto the next one. */
                        if (*byte & bit) {
                                lcn++;
@@ -729,7 +738,7 @@ out:
        /* Add runlist terminator element. */
        if (likely(rl)) {
                rl[rlpos].vcn = rl[rlpos - 1].vcn + rl[rlpos - 1].length;
-                rl[rlpos].lcn = LCN_RL_NOT_MAPPED;
+                rl[rlpos].lcn = is_extension ? LCN_ENOENT : LCN_RL_NOT_MAPPED;
                rl[rlpos].length = 0;
        }
        if (likely(page && !IS_ERR(page))) {
@@ -782,6 +791,7 @@ out:
 * @ni:         ntfs inode whose runlist describes the clusters to free
 * @start_vcn:  vcn in the runlist of @ni at which to start freeing clusters
 * @count:      number of clusters to free or -1 for all clusters
+ * @ctx:        active attribute search context if present or NULL if not
 * @is_rollback:        true if this is a rollback operation
 *
 * Free @count clusters starting at the cluster @start_vcn in the runlist
@@ -791,15 +801,39 @@ out:
 * deallocated.  Thus, to completely free all clusters in a runlist, use
 * @start_vcn = 0 and @count = -1.
 *
+ * If @ctx is specified, it is an active search context of @ni and its base mft
+ * record.  This is needed when __ntfs_cluster_free() encounters unmapped
+ * runlist fragments and allows their mapping.  If you do not have the mft
+ * record mapped, you can specify @ctx as NULL and __ntfs_cluster_free() will
+ * perform the necessary mapping and unmapping.
+ *
+ * Note, __ntfs_cluster_free() saves the state of @ctx on entry and restores it
+ * before returning.  Thus, @ctx will be left pointing to the same attribute on
+ * return as on entry.  However, the actual pointers in @ctx may point to
+ * different memory locations on return, so you must remember to reset any
+ * cached pointers from the @ctx, i.e. after the call to __ntfs_cluster_free(),
+ * you will probably want to do:
+ *      m = ctx->mrec;
+ *      a = ctx->attr;
+ * Assuming you cache ctx->attr in a variable @a of type ATTR_RECORD * and that
+ * you cache ctx->mrec in a variable @m of type MFT_RECORD *.
+ *
 * @is_rollback should always be FALSE, it is for internal use to rollback
 * errors.  You probably want to use ntfs_cluster_free() instead.
 *
- * Note, ntfs_cluster_free() does not modify the runlist at all, so the caller
+ * Note, __ntfs_cluster_free() does not modify the runlist, so you have to
- * has to deal with it later.
+ * remove the freed runs from the runlist or mark them sparse later.
 *
 * Return the number of deallocated clusters (not counting sparse ones) on
 * success and -errno on error.
 *
+ * WARNING: If @ctx is supplied, regardless of whether success or failure is
+ *          returned, you need to check IS_ERR(@ctx->mrec) and if TRUE the @ctx
+ *          is no longer valid, i.e. you need to either call
+ *          ntfs_attr_reinit_search_ctx() or ntfs_attr_put_search_ctx() on it.
+ *          In that case PTR_ERR(@ctx->mrec) will give you the error code for
+ *          why the mapping of the old inode failed.
+ *
 * Locking: - The runlist described by @ni must be locked for writing on entry
 *            and is locked on return.  Note the runlist may be modified when
 *            needed runlist fragments need to be mapped.
@@ -807,9 +841,13 @@ out:
 *            on return.
 *          - This function takes the volume lcn bitmap lock for writing and
 *            modifies the bitmap contents.
+ *          - If @ctx is NULL, the base mft record of @ni must not be mapped on
+ *            entry and it will be left unmapped on return.
+ *          - If @ctx is not NULL, the base mft record must be mapped on entry
+ *            and it will be left mapped on return.
 */
 s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn, s64 count,
-                const BOOL is_rollback)
+                ntfs_attr_search_ctx *ctx, const BOOL is_rollback)
 {
        s64 delta, to_free, total_freed, real_freed;
        ntfs_volume *vol;
@@ -839,7 +877,7 @@ s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn, s64 count,
        total_freed = real_freed = 0;
-        rl = ntfs_attr_find_vcn_nolock(ni, start_vcn, TRUE);
+        rl = ntfs_attr_find_vcn_nolock(ni, start_vcn, ctx);
        if (IS_ERR(rl)) {
                if (!is_rollback)
                        ntfs_error(vol->sb, "Failed to find first runlist "
@@ -893,7 +931,7 @@ s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn, s64 count,
                        /* Attempt to map runlist. */
                        vcn = rl->vcn;
-                        rl = ntfs_attr_find_vcn_nolock(ni, vcn, TRUE);
+                        rl = ntfs_attr_find_vcn_nolock(ni, vcn, ctx);
                        if (IS_ERR(rl)) {
                                err = PTR_ERR(rl);
                                if (!is_rollback)
@@ -961,7 +999,7 @@ err_out:
         * If rollback fails, set the volume errors flag, emit an error
         * message, and return the error code.
         */
-        delta = __ntfs_cluster_free(ni, start_vcn, total_freed, TRUE);
+        delta = __ntfs_cluster_free(ni, start_vcn, total_freed, ctx, TRUE);
        if (delta < 0) {
                ntfs_error(vol->sb, "Failed to rollback (error %i).  Leaving "
                                "inconsistent metadata!  Unmount and run "
diff --git a/fs/ntfs/lcnalloc.h b/fs/ntfs/lcnalloc.h
index a6a8827882e7..72cbca7003b2 100644
--- a/fs/ntfs/lcnalloc.h
+++ b/fs/ntfs/lcnalloc.h
@@ -27,6 +27,7 @@
 #include <linux/fs.h>
+#include "attrib.h"
 #include "types.h"
 #include "inode.h"
 #include "runlist.h"
@@ -41,16 +42,18 @@ typedef enum {
 extern runlist_element *ntfs_cluster_alloc(ntfs_volume *vol,
                const VCN start_vcn, const s64 count, const LCN start_lcn,
-                const NTFS_CLUSTER_ALLOCATION_ZONES zone);
+                const NTFS_CLUSTER_ALLOCATION_ZONES zone,
+                const BOOL is_extension);
 extern s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn,
-                s64 count, const BOOL is_rollback);
+                s64 count, ntfs_attr_search_ctx *ctx, const BOOL is_rollback);
 /**
 * ntfs_cluster_free - free clusters on an ntfs volume
 * @ni:         ntfs inode whose runlist describes the clusters to free
 * @start_vcn:  vcn in the runlist of @ni at which to start freeing clusters
 * @count:      number of clusters to free or -1 for all clusters
+ * @ctx:        active attribute search context if present or NULL if not
 *
 * Free @count clusters starting at the cluster @start_vcn in the runlist
 * described by the ntfs inode @ni.
@@ -59,12 +62,36 @@ extern s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn,
 * deallocated.  Thus, to completely free all clusters in a runlist, use
 * @start_vcn = 0 and @count = -1.
 *
- * Note, ntfs_cluster_free() does not modify the runlist at all, so the caller
+ * If @ctx is specified, it is an active search context of @ni and its base mft
- * has to deal with it later.
+ * record.  This is needed when ntfs_cluster_free() encounters unmapped runlist
+ * fragments and allows their mapping.  If you do not have the mft record
+ * mapped, you can specify @ctx as NULL and ntfs_cluster_free() will perform
+ * the necessary mapping and unmapping.
+ *
+ * Note, ntfs_cluster_free() saves the state of @ctx on entry and restores it
+ * before returning.  Thus, @ctx will be left pointing to the same attribute on
+ * return as on entry.  However, the actual pointers in @ctx may point to
+ * different memory locations on return, so you must remember to reset any
+ * cached pointers from the @ctx, i.e. after the call to ntfs_cluster_free(),
+ * you will probably want to do:
+ *      m = ctx->mrec;
+ *      a = ctx->attr;
+ * Assuming you cache ctx->attr in a variable @a of type ATTR_RECORD * and that
+ * you cache ctx->mrec in a variable @m of type MFT_RECORD *.
+ *
+ * Note, ntfs_cluster_free() does not modify the runlist, so you have to remove
+ * the freed runs from the runlist or mark them sparse later.
 *
 * Return the number of deallocated clusters (not counting sparse ones) on
 * success and -errno on error.
 *
+ * WARNING: If @ctx is supplied, regardless of whether success or failure is
+ *          returned, you need to check IS_ERR(@ctx->mrec) and if TRUE the @ctx
+ *          is no longer valid, i.e. you need to either call
+ *          ntfs_attr_reinit_search_ctx() or ntfs_attr_put_search_ctx() on it.
+ *          In that case PTR_ERR(@ctx->mrec) will give you the error code for
+ *          why the mapping of the old inode failed.
+ *
 * Locking: - The runlist described by @ni must be locked for writing on entry
 *            and is locked on return.  Note the runlist may be modified when
 *            needed runlist fragments need to be mapped.
@@ -72,11 +99,15 @@ extern s64 __ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn,
 *            on return.
 *          - This function takes the volume lcn bitmap lock for writing and
 *            modifies the bitmap contents.
+ *          - If @ctx is NULL, the base mft record of @ni must not be mapped on
+ *            entry and it will be left unmapped on return.
+ *          - If @ctx is not NULL, the base mft record must be mapped on entry
+ *            and it will be left mapped on return.
 */
 static inline s64 ntfs_cluster_free(ntfs_inode *ni, const VCN start_vcn,
-                s64 count)
+                s64 count, ntfs_attr_search_ctx *ctx)
 {
-        return __ntfs_cluster_free(ni, start_vcn, count, FALSE);
+        return __ntfs_cluster_free(ni, start_vcn, count, ctx, FALSE);
 }
 extern int ntfs_cluster_free_from_rl_nolock(ntfs_volume *vol,
diff --git a/fs/ntfs/mft.c b/fs/ntfs/mft.c
index b011369b5956..0c65cbb8c5cf 100644
--- a/fs/ntfs/mft.c
+++ b/fs/ntfs/mft.c
@@ -49,7 +49,8 @@ static inline MFT_RECORD *map_mft_record_page(ntfs_inode *ni)
        ntfs_volume *vol = ni->vol;
        struct inode *mft_vi = vol->mft_ino;
        struct page *page;
-        unsigned long index, ofs, end_index;
+        unsigned long index, end_index;
+        unsigned ofs;
        BUG_ON(ni->page);
        /*
@@ -1308,7 +1309,7 @@ static int ntfs_mft_bitmap_extend_allocation_nolock(ntfs_volume *vol)
        ll = mftbmp_ni->allocated_size;
        read_unlock_irqrestore(&mftbmp_ni->size_lock, flags);
        rl = ntfs_attr_find_vcn_nolock(mftbmp_ni,
-                        (ll - 1) >> vol->cluster_size_bits, TRUE);
+                        (ll - 1) >> vol->cluster_size_bits, NULL);
        if (unlikely(IS_ERR(rl) || !rl->length || rl->lcn < 0)) {
                up_write(&mftbmp_ni->runlist.lock);
                ntfs_error(vol->sb, "Failed to determine last allocated "
@@ -1354,7 +1355,8 @@ static int ntfs_mft_bitmap_extend_allocation_nolock(ntfs_volume *vol)
                up_write(&vol->lcnbmp_lock);
                ntfs_unmap_page(page);
                /* Allocate a cluster from the DATA_ZONE. */
-                rl2 = ntfs_cluster_alloc(vol, rl[1].vcn, 1, lcn, DATA_ZONE);
+                rl2 = ntfs_cluster_alloc(vol, rl[1].vcn, 1, lcn, DATA_ZONE,
+                                TRUE);
                if (IS_ERR(rl2)) {
                        up_write(&mftbmp_ni->runlist.lock);
                        ntfs_error(vol->sb, "Failed to allocate a cluster for "
@@ -1738,7 +1740,7 @@ static int ntfs_mft_data_extend_allocation_nolock(ntfs_volume *vol)
        ll = mft_ni->allocated_size;
        read_unlock_irqrestore(&mft_ni->size_lock, flags);
        rl = ntfs_attr_find_vcn_nolock(mft_ni,
-                        (ll - 1) >> vol->cluster_size_bits, TRUE);
+                        (ll - 1) >> vol->cluster_size_bits, NULL);
        if (unlikely(IS_ERR(rl) || !rl->length || rl->lcn < 0)) {
                up_write(&mft_ni->runlist.lock);
                ntfs_error(vol->sb, "Failed to determine last allocated "
@@ -1779,7 +1781,8 @@ static int ntfs_mft_data_extend_allocation_nolock(ntfs_volume *vol)
                        nr > min_nr ? "default" : "minimal", (long long)nr);
        old_last_vcn = rl[1].vcn;
        do {
-                rl2 = ntfs_cluster_alloc(vol, old_last_vcn, nr, lcn, MFT_ZONE);
+                rl2 = ntfs_cluster_alloc(vol, old_last_vcn, nr, lcn, MFT_ZONE,
+                                TRUE);
                if (likely(!IS_ERR(rl2)))
                        break;
                if (PTR_ERR(rl2) != -ENOSPC || nr == min_nr) {
@@ -1951,20 +1954,21 @@ restore_undo_alloc:
                NVolSetErrors(vol);
                return ret;
        }
-        a = ctx->attr;
+        ctx->attr->data.non_resident.highest_vcn =
-        a->data.non_resident.highest_vcn = cpu_to_sle64(old_last_vcn - 1);
+                        cpu_to_sle64(old_last_vcn - 1);
 undo_alloc:
-        if (ntfs_cluster_free(mft_ni, old_last_vcn, -1) < 0) {
+        if (ntfs_cluster_free(mft_ni, old_last_vcn, -1, ctx) < 0) {
                ntfs_error(vol->sb, "Failed to free clusters from mft data "
                                "attribute.%s", es);
                NVolSetErrors(vol);
        }
+        a = ctx->attr;
        if (ntfs_rl_truncate_nolock(vol, &mft_ni->runlist, old_last_vcn)) {
                ntfs_error(vol->sb, "Failed to truncate mft data attribute "
                                "runlist.%s", es);
                NVolSetErrors(vol);
        }
-        if (mp_rebuilt) {
+        if (mp_rebuilt && !IS_ERR(ctx->mrec)) {
                if (ntfs_mapping_pairs_build(vol, (u8*)a + le16_to_cpu(
                                a->data.non_resident.mapping_pairs_offset),
                                old_alen - le16_to_cpu(
@@ -1981,6 +1985,10 @@ undo_alloc:
                }
                flush_dcache_mft_record_page(ctx->ntfs_ino);
                mark_mft_record_dirty(ctx->ntfs_ino);
+        } else if (IS_ERR(ctx->mrec)) {
+                ntfs_error(vol->sb, "Failed to restore attribute search "
+                                "context.%s", es);
+                NVolSetErrors(vol);
        }
        if (ctx)
                ntfs_attr_put_search_ctx(ctx);