139 files changed, 2651 insertions, 1780 deletions
diff --git a/fs/Kconfig.binfmt b/fs/Kconfig.binfmt
index 0efd1524b977..370b24cee4d8 100644
--- a/fs/Kconfig.binfmt
+++ b/fs/Kconfig.binfmt
@@ -65,6 +65,20 @@ config CORE_DUMP_DEFAULT_ELF_HEADERS
          This config option changes the default setting of coredump_filter
          seen at boot time.  If unsure, say Y.
+config BINFMT_SCRIPT
+        tristate "Kernel support for scripts starting with #!"
+        default y
+        help
+          Say Y here if you want to execute interpreted scripts starting with
+          #! followed by the path to an interpreter.
+          You can build this support as a module; however, until that module
+          gets loaded, you cannot run scripts.  Thus, if you want to load this
+          module from an initramfs, the portion of the initramfs before loading
+          this module must consist of compiled binaries only.
+          Most systems will not boot if you say M or N here.  If unsure, say Y.
 config BINFMT_FLAT
        bool "Kernel support for flat binaries"
        depends on !MMU && (!FRV || BROKEN)
diff --git a/fs/Makefile b/fs/Makefile
index 9d53192236fc..5e67e57b59dc 100644
--- a/fs/Makefile
+++ b/fs/Makefile
@@ -10,7 +10,7 @@ obj-y :=	open.o read_write.o file_table.o super.o \
                ioctl.o readdir.o select.o fifo.o dcache.o inode.o \
                attr.o bad_inode.o file.o filesystems.o namespace.o \
                seq_file.o xattr.o libfs.o fs-writeback.o \
-                pnode.o drop_caches.o splice.o sync.o utimes.o \
+                pnode.o splice.o sync.o utimes.o \
                stack.o fs_struct.o statfs.o
 ifeq ($(CONFIG_BLOCK),y)
@@ -34,10 +34,7 @@ obj-$(CONFIG_COMPAT)		+= compat.o compat_ioctl.o
 obj-$(CONFIG_BINFMT_AOUT)       += binfmt_aout.o
 obj-$(CONFIG_BINFMT_EM86)       += binfmt_em86.o
 obj-$(CONFIG_BINFMT_MISC)       += binfmt_misc.o
+obj-$(CONFIG_BINFMT_SCRIPT)     += binfmt_script.o
-# binfmt_script is always there
-obj-y                           += binfmt_script.o
 obj-$(CONFIG_BINFMT_ELF)        += binfmt_elf.o
 obj-$(CONFIG_COMPAT_BINFMT_ELF) += compat_binfmt_elf.o
 obj-$(CONFIG_BINFMT_ELF_FDPIC)  += binfmt_elf_fdpic.o
@@ -49,6 +46,7 @@ obj-$(CONFIG_FS_POSIX_ACL)	+= posix_acl.o xattr_acl.o
 obj-$(CONFIG_NFS_COMMON)        += nfs_common/
 obj-$(CONFIG_GENERIC_ACL)       += generic_acl.o
 obj-$(CONFIG_COREDUMP)          += coredump.o
+obj-$(CONFIG_SYSCTL)            += drop_caches.o
 obj-$(CONFIG_FHANDLE)           += fhandle.o
diff --git a/fs/aio.c b/fs/aio.c
index 3f941f2a3059..6db8745c2edd 100644
--- a/fs/aio.c
+++ b/fs/aio.c
@@ -1029,9 +1029,9 @@ static int aio_read_evt(struct kioctx *ioctx, struct io_event *ent)
        spin_unlock(&info->ring_lock);
 out:
-        kunmap_atomic(ring);
        dprintk("leaving aio_read_evt: %d  h%lu t%lu\n", ret,
                 (unsigned long)ring->head, (unsigned long)ring->tail);
+        kunmap_atomic(ring);
        return ret;
 }
@@ -1790,7 +1790,5 @@ SYSCALL_DEFINE5(io_getevents, aio_context_t, ctx_id,
                        ret = read_events(ioctx, min_nr, nr, events, timeout);
                put_ioctx(ioctx);
        }
-        asmlinkage_protect(5, ret, ctx_id, min_nr, nr, events, timeout);
        return ret;
 }
diff --git a/fs/befs/btree.c b/fs/befs/btree.c
index a66c9b1136e0..74e397db0b8b 100644
--- a/fs/befs/btree.c
+++ b/fs/befs/btree.c
@@ -436,8 +436,7 @@ befs_btree_read(struct super_block *sb, befs_data_stream * ds,
                goto error;
        }
-        if ((this_node = (befs_btree_node *)
+        if ((this_node = kmalloc(sizeof (befs_btree_node), GFP_NOFS)) == NULL) {
-             kmalloc(sizeof (befs_btree_node), GFP_NOFS)) == NULL) {
                befs_error(sb, "befs_btree_read() failed to allocate %u "
                           "bytes of memory", sizeof (befs_btree_node));
                goto error;
diff --git a/fs/binfmt_aout.c b/fs/binfmt_aout.c
index bbc8f8827eac..02fe378fc506 100644
--- a/fs/binfmt_aout.c
+++ b/fs/binfmt_aout.c
@@ -62,7 +62,6 @@ static int aout_core_dump(struct coredump_params *cprm)
        fs = get_fs();
        set_fs(KERNEL_DS);
        has_dumped = 1;
-        current->flags |= PF_DUMPCORE;
        strncpy(dump.u_comm, current->comm, sizeof(dump.u_comm));
        dump.u_ar0 = offsetof(struct user, regs);
        dump.signal = cprm->siginfo->si_signo;
diff --git a/fs/binfmt_elf.c b/fs/binfmt_elf.c
index 3939829f6c5c..34a9771eaa6c 100644
--- a/fs/binfmt_elf.c
+++ b/fs/binfmt_elf.c
@@ -803,7 +803,8 @@ static int load_elf_binary(struct linux_binprm *bprm)
                         * follow the loader, and is not movable.  */
 #ifdef CONFIG_ARCH_BINFMT_ELF_RANDOMIZE_PIE
                        /* Memory randomization might have been switched off
-                         * in runtime via sysctl.
+                         * in runtime via sysctl or explicit setting of
+                         * personality flags.
                         * If that is the case, retain the original non-zero
                         * load_bias value in order to establish proper
                         * non-randomized mappings.
@@ -1137,6 +1138,7 @@ static unsigned long vma_dump_size(struct vm_area_struct *vma,
                        goto whole;
                if (!(vma->vm_flags & VM_SHARED) && FILTER(HUGETLB_PRIVATE))
                        goto whole;
+                return 0;
        }
        /* Do not dump I/O mapped devices or special mappings */
@@ -2090,8 +2092,7 @@ static int elf_core_dump(struct coredump_params *cprm)
                goto cleanup;
        has_dumped = 1;
-        current->flags |= PF_DUMPCORE;
-  
        fs = get_fs();
        set_fs(KERNEL_DS);
diff --git a/fs/binfmt_elf_fdpic.c b/fs/binfmt_elf_fdpic.c
index 9c13e023e2b7..c1cc06aed601 100644
--- a/fs/binfmt_elf_fdpic.c
+++ b/fs/binfmt_elf_fdpic.c
@@ -1687,8 +1687,6 @@ static int elf_fdpic_core_dump(struct coredump_params *cprm)
        fill_elf_fdpic_header(elf, e_phnum);
        has_dumped = 1;
-        current->flags |= PF_DUMPCORE;
        /*
         * Set up the notes in similar form to SVR4 core dumps made
         * with info from their /proc.
diff --git a/fs/binfmt_misc.c b/fs/binfmt_misc.c
index 751df5e4f61a..1c740e152f38 100644
--- a/fs/binfmt_misc.c
+++ b/fs/binfmt_misc.c
@@ -23,6 +23,7 @@
 #include <linux/binfmts.h>
 #include <linux/slab.h>
 #include <linux/ctype.h>
+#include <linux/string_helpers.h>
 #include <linux/file.h>
 #include <linux/pagemap.h>
 #include <linux/namei.h>
@@ -234,24 +235,6 @@ static char *scanarg(char *s, char del)
        return s;
 }
-static int unquote(char *from)
-{
-        char c = 0, *s = from, *p = from;
-        while ((c = *s++) != '\0') {
-                if (c == '\\' && *s == 'x') {
-                        s++;
-                        c = toupper(*s++);
-                        *p = (c - (isdigit(c) ? '0' : 'A' - 10)) << 4;
-                        c = toupper(*s++);
-                        *p++ |= c - (isdigit(c) ? '0' : 'A' - 10);
-                        continue;
-                }
-                *p++ = c;
-        }
-        return p - from;
-}
 static char * check_special_flags (char * sfs, Node * e)
 {
        char * p = sfs;
@@ -354,8 +337,9 @@ static Node *create_entry(const char __user *buffer, size_t count)
                p[-1] = '\0';
                if (!e->mask[0])
                        e->mask = NULL;
-                e->size = unquote(e->magic);
+                e->size = string_unescape_inplace(e->magic, UNESCAPE_HEX);
-                if (e->mask && unquote(e->mask) != e->size)
+                if (e->mask &&
+                    string_unescape_inplace(e->mask, UNESCAPE_HEX) != e->size)
                        goto Einval;
                if (e->size + e->offset > BINPRM_BUF_SIZE)
                        goto Einval;
diff --git a/fs/bio.c b/fs/bio.c
index bb5768f59b32..b96fc6ce4855 100644
--- a/fs/bio.c
+++ b/fs/bio.c
@@ -1428,8 +1428,6 @@ void bio_endio(struct bio *bio, int error)
        else if (!test_bit(BIO_UPTODATE, &bio->bi_flags))
                error = -EIO;
-        trace_block_bio_complete(bio, error);
        if (bio->bi_end_io)
                bio->bi_end_io(bio, error);
 }
diff --git a/fs/block_dev.c b/fs/block_dev.c
index aea605c98ba6..ce08de7467a3 100644
--- a/fs/block_dev.c
+++ b/fs/block_dev.c
@@ -551,6 +551,7 @@ struct block_device *bdgrab(struct block_device *bdev)
        ihold(bdev->bd_inode);
        return bdev;
 }
+EXPORT_SYMBOL(bdgrab);
 long nr_blockdev_pages(void)
 {
@@ -616,11 +617,9 @@ void bd_forget(struct inode *inode)
        struct block_device *bdev = NULL;
        spin_lock(&bdev_lock);
-        if (inode->i_bdev) {
+        if (!sb_is_blkdev_sb(inode->i_sb))
-                if (!sb_is_blkdev_sb(inode->i_sb))
+                bdev = inode->i_bdev;
-                        bdev = inode->i_bdev;
+        __bd_forget(inode);
-                __bd_forget(inode);
-        }
        spin_unlock(&bdev_lock);
        if (bdev)
diff --git a/fs/btrfs/tree-log.c b/fs/btrfs/tree-log.c
index 451fad96ecd1..ef96381569a4 100644
--- a/fs/btrfs/tree-log.c
+++ b/fs/btrfs/tree-log.c
@@ -317,6 +317,7 @@ static noinline int overwrite_item(struct btrfs_trans_handle *trans,
        unsigned long src_ptr;
        unsigned long dst_ptr;
        int overwrite_root = 0;
+        bool inode_item = key->type == BTRFS_INODE_ITEM_KEY;
        if (root->root_key.objectid != BTRFS_TREE_LOG_OBJECTID)
                overwrite_root = 1;
@@ -326,6 +327,9 @@ static noinline int overwrite_item(struct btrfs_trans_handle *trans,
        /* look for the key in the destination tree */
        ret = btrfs_search_slot(NULL, root, key, path, 0, 0);
+        if (ret < 0)
+                return ret;
        if (ret == 0) {
                char *src_copy;
                char *dst_copy;
@@ -367,6 +371,30 @@ static noinline int overwrite_item(struct btrfs_trans_handle *trans,
                        return 0;
                }
+                /*
+                 * We need to load the old nbytes into the inode so when we
+                 * replay the extents we've logged we get the right nbytes.
+                 */
+                if (inode_item) {
+                        struct btrfs_inode_item *item;
+                        u64 nbytes;
+                        item = btrfs_item_ptr(path->nodes[0], path->slots[0],
+                                              struct btrfs_inode_item);
+                        nbytes = btrfs_inode_nbytes(path->nodes[0], item);
+                        item = btrfs_item_ptr(eb, slot,
+                                              struct btrfs_inode_item);
+                        btrfs_set_inode_nbytes(eb, item, nbytes);
+                }
+        } else if (inode_item) {
+                struct btrfs_inode_item *item;
+                /*
+                 * New inode, set nbytes to 0 so that the nbytes comes out
+                 * properly when we replay the extents.
+                 */
+                item = btrfs_item_ptr(eb, slot, struct btrfs_inode_item);
+                btrfs_set_inode_nbytes(eb, item, 0);
        }
 insert:
        btrfs_release_path(path);
@@ -486,7 +514,7 @@ static noinline int replay_one_extent(struct btrfs_trans_handle *trans,
        int found_type;
        u64 extent_end;
        u64 start = key->offset;
-        u64 saved_nbytes;
+        u64 nbytes = 0;
        struct btrfs_file_extent_item *item;
        struct inode *inode = NULL;
        unsigned long size;
@@ -496,10 +524,19 @@ static noinline int replay_one_extent(struct btrfs_trans_handle *trans,
        found_type = btrfs_file_extent_type(eb, item);
        if (found_type == BTRFS_FILE_EXTENT_REG ||
-            found_type == BTRFS_FILE_EXTENT_PREALLOC)
+            found_type == BTRFS_FILE_EXTENT_PREALLOC) {
-                extent_end = start + btrfs_file_extent_num_bytes(eb, item);
+                nbytes = btrfs_file_extent_num_bytes(eb, item);
-        else if (found_type == BTRFS_FILE_EXTENT_INLINE) {
+                extent_end = start + nbytes;
+                /*
+                 * We don't add to the inodes nbytes if we are prealloc or a
+                 * hole.
+                 */
+                if (btrfs_file_extent_disk_bytenr(eb, item) == 0)
+                        nbytes = 0;
+        } else if (found_type == BTRFS_FILE_EXTENT_INLINE) {
                size = btrfs_file_extent_inline_len(eb, item);
+                nbytes = btrfs_file_extent_ram_bytes(eb, item);
                extent_end = ALIGN(start + size, root->sectorsize);
        } else {
                ret = 0;
@@ -548,7 +585,6 @@ static noinline int replay_one_extent(struct btrfs_trans_handle *trans,
        }
        btrfs_release_path(path);
-        saved_nbytes = inode_get_bytes(inode);
        /* drop any overlapping extents */
        ret = btrfs_drop_extents(trans, root, inode, start, extent_end, 1);
        BUG_ON(ret);
@@ -635,7 +671,7 @@ static noinline int replay_one_extent(struct btrfs_trans_handle *trans,
                BUG_ON(ret);
        }
-        inode_set_bytes(inode, saved_nbytes);
+        inode_add_bytes(inode, nbytes);
        ret = btrfs_update_inode(trans, root, inode);
 out:
        if (inode)
diff --git a/fs/buffer.c b/fs/buffer.c
index a15575c0b9ee..bc1fe14aaa3e 100644
--- a/fs/buffer.c
+++ b/fs/buffer.c
@@ -865,8 +865,6 @@ try_again:
                /* Link the buffer to its page */
                set_bh_page(bh, page, offset);
-                init_buffer(bh, NULL, NULL);
        }
        return head;
 /*
@@ -2949,7 +2947,7 @@ static void guard_bh_eod(int rw, struct bio *bio, struct buffer_head *bh)
        }
 }
-int submit_bh(int rw, struct buffer_head * bh)
+int _submit_bh(int rw, struct buffer_head *bh, unsigned long bio_flags)
 {
        struct bio *bio;
        int ret = 0;
@@ -2984,6 +2982,7 @@ int submit_bh(int rw, struct buffer_head * bh)
        bio->bi_end_io = end_bio_bh_io_sync;
        bio->bi_private = bh;
+        bio->bi_flags |= bio_flags;
        /* Take care of bh's that straddle the end of the device */
        guard_bh_eod(rw, bio, bh);
@@ -3002,6 +3001,12 @@ int submit_bh(int rw, struct buffer_head * bh)
        bio_put(bio);
        return ret;
 }
+EXPORT_SYMBOL_GPL(_submit_bh);
+int submit_bh(int rw, struct buffer_head *bh)
+{
+        return _submit_bh(rw, bh, 0);
+}
 EXPORT_SYMBOL(submit_bh);
 /**
diff --git a/fs/cifs/connect.c b/fs/cifs/connect.c
index 991c63c6bdd0..21b3a291c327 100644
--- a/fs/cifs/connect.c
+++ b/fs/cifs/connect.c
@@ -1575,14 +1575,24 @@ cifs_parse_mount_options(const char *mountdata, const char *devname,
                        }
                        break;
                case Opt_blank_pass:
-                        vol->password = NULL;
-                        break;
-                case Opt_pass:
                        /* passwords have to be handled differently
                         * to allow the character used for deliminator
                         * to be passed within them
                         */
+                        /*
+                         * Check if this is a case where the password
+                         * starts with a delimiter
+                         */
+                        tmp_end = strchr(data, '=');
+                        tmp_end++;
+                        if (!(tmp_end < end && tmp_end[1] == delim)) {
+                                /* No it is not. Set the password to NULL */
+                                vol->password = NULL;
+                                break;
+                        }
+                        /* Yes it is. Drop down to Opt_pass below.*/
+                case Opt_pass:
                        /* Obtain the value string */
                        value = strchr(data, '=');
                        value++;
diff --git a/fs/compat.c b/fs/compat.c
index d487985dd0ea..5f83ffa42115 100644
--- a/fs/compat.c
+++ b/fs/compat.c
@@ -44,7 +44,6 @@
 #include <linux/signal.h>
 #include <linux/poll.h>
 #include <linux/mm.h>
-#include <linux/eventpoll.h>
 #include <linux/fs_struct.h>
 #include <linux/slab.h>
 #include <linux/pagemap.h>
@@ -1253,26 +1252,6 @@ compat_sys_pwritev(unsigned long fd, const struct compat_iovec __user *vec,
        return compat_sys_pwritev64(fd, vec, vlen, pos);
 }
-asmlinkage long
-compat_sys_vmsplice(int fd, const struct compat_iovec __user *iov32,
-                    unsigned int nr_segs, unsigned int flags)
-{
-        unsigned i;
-        struct iovec __user *iov;
-        if (nr_segs > UIO_MAXIOV)
-                return -EINVAL;
-        iov = compat_alloc_user_space(nr_segs * sizeof(struct iovec));
-        for (i = 0; i < nr_segs; i++) {
-                struct compat_iovec v;
-                if (get_user(v.iov_base, &iov32[i].iov_base) ||
-                    get_user(v.iov_len, &iov32[i].iov_len) ||
-                    put_user(compat_ptr(v.iov_base), &iov[i].iov_base) ||
-                    put_user(v.iov_len, &iov[i].iov_len))
-                        return -EFAULT;
-        }
-        return sys_vmsplice(fd, iov, nr_segs, flags);
-}
 /*
 * Exactly like fs/open.c:sys_open(), except that it doesn't set the
 * O_LARGEFILE flag.
@@ -1658,84 +1637,6 @@ asmlinkage long compat_sys_ppoll(struct pollfd __user *ufds,
        return ret;
 }
-#ifdef CONFIG_EPOLL
-asmlinkage long compat_sys_epoll_pwait(int epfd,
-                        struct compat_epoll_event __user *events,
-                        int maxevents, int timeout,
-                        const compat_sigset_t __user *sigmask,
-                        compat_size_t sigsetsize)
-{
-        long err;
-        compat_sigset_t csigmask;
-        sigset_t ksigmask, sigsaved;
-        /*
-         * If the caller wants a certain signal mask to be set during the wait,
-         * we apply it here.
-         */
-        if (sigmask) {
-                if (sigsetsize != sizeof(compat_sigset_t))
-                        return -EINVAL;
-                if (copy_from_user(&csigmask, sigmask, sizeof(csigmask)))
-                        return -EFAULT;
-                sigset_from_compat(&ksigmask, &csigmask);
-                sigdelsetmask(&ksigmask, sigmask(SIGKILL) | sigmask(SIGSTOP));
-                sigprocmask(SIG_SETMASK, &ksigmask, &sigsaved);
-        }
-        err = sys_epoll_wait(epfd, events, maxevents, timeout);
-        /*
-         * If we changed the signal mask, we need to restore the original one.
-         * In case we've got a signal while waiting, we do not restore the
-         * signal mask yet, and we allow do_signal() to deliver the signal on
-         * the way back to userspace, before the signal mask is restored.
-         */
-        if (sigmask) {
-                if (err == -EINTR) {
-                        memcpy(&current->saved_sigmask, &sigsaved,
-                               sizeof(sigsaved));
-                        set_restore_sigmask();
-                } else
-                        sigprocmask(SIG_SETMASK, &sigsaved, NULL);
-        }
-        return err;
-}
-#endif /* CONFIG_EPOLL */
-#ifdef CONFIG_SIGNALFD
-asmlinkage long compat_sys_signalfd4(int ufd,
-                                     const compat_sigset_t __user *sigmask,
-                                     compat_size_t sigsetsize, int flags)
-{
-        compat_sigset_t ss32;
-        sigset_t tmp;
-        sigset_t __user *ksigmask;
-        if (sigsetsize != sizeof(compat_sigset_t))
-                return -EINVAL;
-        if (copy_from_user(&ss32, sigmask, sizeof(ss32)))
-                return -EFAULT;
-        sigset_from_compat(&tmp, &ss32);
-        ksigmask = compat_alloc_user_space(sizeof(sigset_t));
-        if (copy_to_user(ksigmask, &tmp, sizeof(sigset_t)))
-                return -EFAULT;
-        return sys_signalfd4(ufd, ksigmask, sizeof(sigset_t), flags);
-}
-asmlinkage long compat_sys_signalfd(int ufd,
-                                    const compat_sigset_t __user *sigmask,
-                                    compat_size_t sigsetsize)
-{
-        return compat_sys_signalfd4(ufd, sigmask, sigsetsize, 0);
-}
-#endif /* CONFIG_SIGNALFD */
 #ifdef CONFIG_FHANDLE
 /*
 * Exactly like fs/open.c:sys_open_by_handle_at(), except that it
@@ -1747,25 +1648,3 @@ COMPAT_SYSCALL_DEFINE3(open_by_handle_at, int, mountdirfd,
        return do_handle_open(mountdirfd, handle, flags);
 }
 #endif
-#ifdef __ARCH_WANT_COMPAT_SYS_SENDFILE
-asmlinkage long compat_sys_sendfile(int out_fd, int in_fd,
-                                    compat_off_t __user *offset, compat_size_t count)
-{
-        loff_t pos;
-        off_t off;
-        ssize_t ret;
-        if (offset) {
-                if (unlikely(get_user(off, offset)))
-                        return -EFAULT;
-                pos = off;
-                ret = do_sendfile(out_fd, in_fd, &pos, count, MAX_NON_LFS);
-                if (unlikely(put_user(pos, offset)))
-                        return -EFAULT;
-                return ret;
-        }
-        return do_sendfile(out_fd, in_fd, NULL, count, 0);
-}
-#endif /* __ARCH_WANT_COMPAT_SYS_SENDFILE */
diff --git a/fs/coredump.c b/fs/coredump.c
index c6479658d487..ec306cc9a28a 100644
--- a/fs/coredump.c
+++ b/fs/coredump.c
@@ -263,7 +263,6 @@ static int zap_process(struct task_struct *start, int exit_code)
        struct task_struct *t;
        int nr = 0;
-        start->signal->flags = SIGNAL_GROUP_EXIT;
        start->signal->group_exit_code = exit_code;
        start->signal->group_stop_count = 0;
@@ -280,8 +279,8 @@ static int zap_process(struct task_struct *start, int exit_code)
        return nr;
 }
-static inline int zap_threads(struct task_struct *tsk, struct mm_struct *mm,
+static int zap_threads(struct task_struct *tsk, struct mm_struct *mm,
-                                struct core_state *core_state, int exit_code)
+                        struct core_state *core_state, int exit_code)
 {
        struct task_struct *g, *p;
        unsigned long flags;
@@ -291,11 +290,16 @@ static inline int zap_threads(struct task_struct *tsk, struct mm_struct *mm,
        if (!signal_group_exit(tsk->signal)) {
                mm->core_state = core_state;
                nr = zap_process(tsk, exit_code);
+                tsk->signal->group_exit_task = tsk;
+                /* ignore all signals except SIGKILL, see prepare_signal() */
+                tsk->signal->flags = SIGNAL_GROUP_COREDUMP;
+                clear_tsk_thread_flag(tsk, TIF_SIGPENDING);
        }
        spin_unlock_irq(&tsk->sighand->siglock);
        if (unlikely(nr < 0))
                return nr;
+        /*
+         * OR the bit in, as the per-binfmt core_dump() code removed by this
+         * patch did: a plain assignment would wipe every other PF_* bit
+         * already set in the dumping task's flags word.
+         */
+        tsk->flags |= PF_DUMPCORE;
        if (atomic_read(&mm->mm_users) == nr + 1)
                goto done;
        /*
@@ -340,6 +344,7 @@ static inline int zap_threads(struct task_struct *tsk, struct mm_struct *mm,
                                if (unlikely(p->mm == mm)) {
                                        lock_task_sighand(p, &flags);
                                        nr += zap_process(p, exit_code);
+                                        p->signal->flags = SIGNAL_GROUP_EXIT;
                                        unlock_task_sighand(p, &flags);
                                }
                                break;
@@ -386,11 +391,18 @@ static int coredump_wait(int exit_code, struct core_state *core_state)
        return core_waiters;
 }
-static void coredump_finish(struct mm_struct *mm)
+static void coredump_finish(struct mm_struct *mm, bool core_dumped)
 {
        struct core_thread *curr, *next;
        struct task_struct *task;
+        spin_lock_irq(&current->sighand->siglock);
+        if (core_dumped && !__fatal_signal_pending(current))
+                current->signal->group_exit_code |= 0x80;
+        current->signal->group_exit_task = NULL;
+        current->signal->flags = SIGNAL_GROUP_EXIT;
+        spin_unlock_irq(&current->sighand->siglock);
        next = mm->core_state->dumper.next;
        while ((curr = next) != NULL) {
                next = curr->next;
@@ -407,6 +419,17 @@ static void coredump_finish(struct mm_struct *mm)
        mm->core_state = NULL;
 }
+static bool dump_interrupted(void)
+{
+        /*
+         * SIGKILL or freezing() interrupt the coredumping. Perhaps we
+         * can do try_to_freeze() and check __fatal_signal_pending(),
+         * but then we need to teach dump_write() to restart and clear
+         * TIF_SIGPENDING.
+         *
+         * Until then any pending signal on current counts as an
+         * interruption: the result is simply signal_pending(current).
+         */
+        return signal_pending(current);
+}
 static void wait_for_dump_helpers(struct file *file)
 {
        struct pipe_inode_info *pipe;
@@ -416,17 +439,20 @@ static void wait_for_dump_helpers(struct file *file)
        pipe_lock(pipe);
        pipe->readers++;
        pipe->writers--;
+        wake_up_interruptible_sync(&pipe->wait);
+        kill_fasync(&pipe->fasync_readers, SIGIO, POLL_IN);
+        pipe_unlock(pipe);
-        while ((pipe->readers > 1) && (!signal_pending(current))) {
+        /*
-                wake_up_interruptible_sync(&pipe->wait);
+         * We actually want wait_event_freezable() but then we need
-                kill_fasync(&pipe->fasync_readers, SIGIO, POLL_IN);
+         * to clear TIF_SIGPENDING and improve dump_interrupted().
-                pipe_wait(pipe);
+         */
-        }
+        wait_event_interruptible(pipe->wait, pipe->readers == 1);
+        pipe_lock(pipe);
        pipe->readers--;
        pipe->writers++;
        pipe_unlock(pipe);
 }
 /*
@@ -471,6 +497,7 @@ void do_coredump(siginfo_t *siginfo)
        int ispipe;
        struct files_struct *displaced;
        bool need_nonrelative = false;
+        bool core_dumped = false;
        static atomic_t core_dump_count = ATOMIC_INIT(0);
        struct coredump_params cprm = {
                .siginfo = siginfo,
@@ -514,17 +541,12 @@ void do_coredump(siginfo_t *siginfo)
        old_cred = override_creds(cred);
-        /*
-         * Clear any false indication of pending signals that might
-         * be seen by the filesystem code called to write the core file.
-         */
-        clear_thread_flag(TIF_SIGPENDING);
        ispipe = format_corename(&cn, &cprm);
-        if (ispipe) {
+        if (ispipe) {
                int dump_count;
                char **helper_argv;
+                struct subprocess_info *sub_info;
                if (ispipe < 0) {
                        printk(KERN_WARNING "format_corename failed\n");
@@ -571,15 +593,20 @@ void do_coredump(siginfo_t *siginfo)
                        goto fail_dropcount;
                }
-                retval = call_usermodehelper_fns(helper_argv[0], helper_argv,
+                retval = -ENOMEM;
-                                        NULL, UMH_WAIT_EXEC, umh_pipe_setup,
+                sub_info = call_usermodehelper_setup(helper_argv[0],
-                                        NULL, &cprm);
+                                                helper_argv, NULL, GFP_KERNEL,
+                                                umh_pipe_setup, NULL, &cprm);
+                if (sub_info)
+                        retval = call_usermodehelper_exec(sub_info,
+                                                          UMH_WAIT_EXEC);
                argv_free(helper_argv);
                if (retval) {
-                        printk(KERN_INFO "Core dump to %s pipe failed\n",
+                        printk(KERN_INFO "Core dump to %s pipe failed\n",
                               cn.corename);
                        goto close_fail;
-                }
+                }
        } else {
                struct inode *inode;
@@ -629,9 +656,7 @@ void do_coredump(siginfo_t *siginfo)
                goto close_fail;
        if (displaced)
                put_files_struct(displaced);
-        retval = binfmt->core_dump(&cprm);
+        core_dumped = !dump_interrupted() && binfmt->core_dump(&cprm);
-        if (retval)
-                current->signal->group_exit_code |= 0x80;
        if (ispipe && core_pipe_limit)
                wait_for_dump_helpers(cprm.file);
@@ -644,7 +669,7 @@ fail_dropcount:
 fail_unlock:
        kfree(cn.corename);
 fail_corename:
-        coredump_finish(mm);
+        coredump_finish(mm, core_dumped);
        revert_creds(old_cred);
 fail_creds:
        put_cred(cred);
@@ -659,7 +684,9 @@ fail:
 */
 int dump_write(struct file *file, const void *addr, int nr)
 {
-        return access_ok(VERIFY_READ, addr, nr) && file->f_op->write(file, addr, nr, &file->f_pos) == nr;
+        return !dump_interrupted() &&
+                access_ok(VERIFY_READ, addr, nr) &&
+                file->f_op->write(file, addr, nr, &file->f_pos) == nr;
 }
 EXPORT_SYMBOL(dump_write);
@@ -668,7 +695,8 @@ int dump_seek(struct file *file, loff_t off)
        int ret = 1;
        if (file->f_op->llseek && file->f_op->llseek != no_llseek) {
-                if (file->f_op->llseek(file, off, SEEK_CUR) < 0)
+                if (dump_interrupted() ||
+                    file->f_op->llseek(file, off, SEEK_CUR) < 0)
                        return 0;
        } else {
                char *buf = (char *)get_zeroed_page(GFP_KERNEL);
diff --git a/fs/dcache.c b/fs/dcache.c
index e8bc3420d63e..e689268046c3 100644
--- a/fs/dcache.c
+++ b/fs/dcache.c
@@ -1230,8 +1230,10 @@ void shrink_dcache_parent(struct dentry * parent)
        LIST_HEAD(dispose);
        int found;
-        while ((found = select_parent(parent, &dispose)) != 0)
+        while ((found = select_parent(parent, &dispose)) != 0) {
                shrink_dentry_list(&dispose);
+                cond_resched();
+        }
 }
 EXPORT_SYMBOL(shrink_dcache_parent);
diff --git a/fs/dcookies.c b/fs/dcookies.c
index 17c779967828..ab5954b50267 100644
--- a/fs/dcookies.c
+++ b/fs/dcookies.c
@@ -25,6 +25,7 @@
 #include <linux/dcookies.h>
 #include <linux/mutex.h>
 #include <linux/path.h>
+#include <linux/compat.h>
 #include <asm/uaccess.h>
 /* The dcookies are allocated from a kmem_cache and
@@ -145,7 +146,7 @@ out:
 /* And here is where the userspace process can look up the cookie value
 * to retrieve the path.
 */
-SYSCALL_DEFINE(lookup_dcookie)(u64 cookie64, char __user * buf, size_t len)
+SYSCALL_DEFINE3(lookup_dcookie, u64, cookie64, char __user *, buf, size_t, len)
 {
        unsigned long cookie = (unsigned long)cookie64;
        int err = -EINVAL;
@@ -201,12 +202,16 @@ out:
        mutex_unlock(&dcookie_mutex);
        return err;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_lookup_dcookie(u64 cookie64, long buf, long len)
+#ifdef CONFIG_COMPAT
+COMPAT_SYSCALL_DEFINE4(lookup_dcookie, u32, w0, u32, w1, char __user *, buf, size_t, len)
 {
-        return SYSC_lookup_dcookie(cookie64, (char __user *) buf, (size_t) len);
+#ifdef __BIG_ENDIAN
+        return sys_lookup_dcookie(((u64)w0 << 32) | w1, buf, len);
+#else
+        return sys_lookup_dcookie(((u64)w1 << 32) | w0, buf, len);
+#endif
 }
-SYSCALL_ALIAS(sys_lookup_dcookie, SyS_lookup_dcookie);
 #endif
 static int dcookie_init(void)
diff --git a/fs/direct-io.c b/fs/direct-io.c
index f853263cf74f..cfb816dc6d9f 100644
--- a/fs/direct-io.c
+++ b/fs/direct-io.c
@@ -672,12 +672,6 @@ static inline int dio_send_cur_page(struct dio *dio, struct dio_submit *sdio,
                if (sdio->final_block_in_bio != sdio->cur_page_block ||
                    cur_offset != bio_next_offset)
                        dio_bio_submit(dio, sdio);
-                /*
-                 * Submit now if the underlying fs is about to perform a
-                 * metadata read
-                 */
-                else if (sdio->boundary)
-                        dio_bio_submit(dio, sdio);
        }
        if (sdio->bio == NULL) {
@@ -737,16 +731,6 @@ submit_page_section(struct dio *dio, struct dio_submit *sdio, struct page *page,
            sdio->cur_page_block +
            (sdio->cur_page_len >> sdio->blkbits) == blocknr) {
                sdio->cur_page_len += len;
-                /*
-                 * If sdio->boundary then we want to schedule the IO now to
-                 * avoid metadata seeks.
-                 */
-                if (sdio->boundary) {
-                        ret = dio_send_cur_page(dio, sdio, map_bh);
-                        page_cache_release(sdio->cur_page);
-                        sdio->cur_page = NULL;
-                }
                goto out;
        }
@@ -758,7 +742,7 @@ submit_page_section(struct dio *dio, struct dio_submit *sdio, struct page *page,
                page_cache_release(sdio->cur_page);
                sdio->cur_page = NULL;
                if (ret)
-                        goto out;
+                        return ret;
        }
        page_cache_get(page);           /* It is in dio */
@@ -768,6 +752,16 @@ submit_page_section(struct dio *dio, struct dio_submit *sdio, struct page *page,
        sdio->cur_page_block = blocknr;
        sdio->cur_page_fs_offset = sdio->block_in_file << sdio->blkbits;
 out:
+        /*
+         * If sdio->boundary then we want to schedule the IO now to
+         * avoid metadata seeks.
+         */
+        if (sdio->boundary) {
+                ret = dio_send_cur_page(dio, sdio, map_bh);
+                dio_bio_submit(dio, sdio);
+                page_cache_release(sdio->cur_page);
+                sdio->cur_page = NULL;
+        }
        return ret;
 }
@@ -969,7 +963,8 @@ do_holes:
                        this_chunk_bytes = this_chunk_blocks << blkbits;
                        BUG_ON(this_chunk_bytes == 0);
-                        sdio->boundary = buffer_boundary(map_bh);
+                        if (this_chunk_blocks == sdio->blocks_available)
+                                sdio->boundary = buffer_boundary(map_bh);
                        ret = submit_page_section(dio, sdio, page,
                                                  offset_in_page,
                                                  this_chunk_bytes,
diff --git a/fs/dlm/plock.c b/fs/dlm/plock.c
index 01fd5c11a7fb..f704458ea5f5 100644
--- a/fs/dlm/plock.c
+++ b/fs/dlm/plock.c
@@ -247,6 +247,7 @@ int dlm_posix_unlock(dlm_lockspace_t *lockspace, u64 number, struct file *file,
        struct dlm_ls *ls;
        struct plock_op *op;
        int rv;
+        unsigned char fl_flags = fl->fl_flags;
        ls = dlm_find_lockspace_local(lockspace);
        if (!ls)
@@ -258,9 +259,18 @@ int dlm_posix_unlock(dlm_lockspace_t *lockspace, u64 number, struct file *file,
                goto out;
        }
-        if (posix_lock_file_wait(file, fl) < 0)
+        /* cause the vfs unlock to return ENOENT if lock is not found */
-                log_error(ls, "dlm_posix_unlock: vfs unlock error %llx",
+        fl->fl_flags |= FL_EXISTS;
-                          (unsigned long long)number);
+        rv = posix_lock_file_wait(file, fl);
+        if (rv == -ENOENT) {
+                rv = 0;
+                goto out_free;
+        }
+        if (rv < 0) {
+                log_error(ls, "dlm_posix_unlock: vfs unlock error %d %llx",
+                          rv, (unsigned long long)number);
+        }
        op->info.optype         = DLM_PLOCK_OP_UNLOCK;
        op->info.pid            = fl->fl_pid;
@@ -296,9 +306,11 @@ int dlm_posix_unlock(dlm_lockspace_t *lockspace, u64 number, struct file *file,
        if (rv == -ENOENT)
                rv = 0;
+out_free:
        kfree(op);
 out:
        dlm_put_lockspace(ls);
+        fl->fl_flags = fl_flags;
        return rv;
 }
 EXPORT_SYMBOL_GPL(dlm_posix_unlock);
diff --git a/fs/ecryptfs/miscdev.c b/fs/ecryptfs/miscdev.c
index 412e6eda25f8..e4141f257495 100644
--- a/fs/ecryptfs/miscdev.c
+++ b/fs/ecryptfs/miscdev.c
@@ -80,13 +80,6 @@ ecryptfs_miscdev_open(struct inode *inode, struct file *file)
        int rc;
        mutex_lock(&ecryptfs_daemon_hash_mux);
-        rc = try_module_get(THIS_MODULE);
-        if (rc == 0) {
-                rc = -EIO;
-                printk(KERN_ERR "%s: Error attempting to increment module use "
-                       "count; rc = [%d]\n", __func__, rc);
-                goto out_unlock_daemon_list;
-        }
        rc = ecryptfs_find_daemon_by_euid(&daemon);
        if (!rc) {
                rc = -EINVAL;
@@ -96,7 +89,7 @@ ecryptfs_miscdev_open(struct inode *inode, struct file *file)
        if (rc) {
                printk(KERN_ERR "%s: Error attempting to spawn daemon; "
                       "rc = [%d]\n", __func__, rc);
-                goto out_module_put_unlock_daemon_list;
+                goto out_unlock_daemon_list;
        }
        mutex_lock(&daemon->mux);
        if (daemon->flags & ECRYPTFS_DAEMON_MISCDEV_OPEN) {
@@ -108,9 +101,6 @@ ecryptfs_miscdev_open(struct inode *inode, struct file *file)
        atomic_inc(&ecryptfs_num_miscdev_opens);
 out_unlock_daemon:
        mutex_unlock(&daemon->mux);
-out_module_put_unlock_daemon_list:
-        if (rc)
-                module_put(THIS_MODULE);
 out_unlock_daemon_list:
        mutex_unlock(&ecryptfs_daemon_hash_mux);
        return rc;
@@ -147,7 +137,6 @@ ecryptfs_miscdev_release(struct inode *inode, struct file *file)
                       "bug.\n", __func__, rc);
                BUG();
        }
-        module_put(THIS_MODULE);
        return rc;
 }
@@ -471,6 +460,7 @@ out_free:
 static const struct file_operations ecryptfs_miscdev_fops = {
+        .owner   = THIS_MODULE,
        .open    = ecryptfs_miscdev_open,
        .poll    = ecryptfs_miscdev_poll,
        .read    = ecryptfs_miscdev_read,
diff --git a/fs/eventpoll.c b/fs/eventpoll.c
index 9fec1836057a..deecc7294a67 100644
--- a/fs/eventpoll.c
+++ b/fs/eventpoll.c
@@ -40,6 +40,7 @@
 #include <linux/atomic.h>
 #include <linux/proc_fs.h>
 #include <linux/seq_file.h>
+#include <linux/compat.h>
 /*
 * LOCKING:
@@ -104,7 +105,7 @@
+/*
+ * Packed so that no padding is added after the int member.
+ * NOTE(review): presumably this helps keep struct epitem within the size
+ * limit asserted by the BUILD_BUG_ON() in eventpoll_init() - confirm that
+ * epitem embeds this struct.
+ */
 struct epoll_filefd {
         struct file *file;
         int fd;
-};
+} __packed;
 /*
 * Structure used to track possible nested calls, for too deep recursions
@@ -128,6 +129,8 @@ struct nested_calls {
 /*
 * Each file descriptor added to the eventpoll interface will
 * have an entry of this type linked to the "rbr" RB tree.
+ * Avoid increasing the size of this struct, there can be many thousands
+ * of these on a server and we do not want this to take another cache line.
 */
 struct epitem {
        /* RB tree node used to link this structure to the eventpoll RB tree */
@@ -158,7 +161,7 @@ struct epitem {
        struct list_head fllink;
        /* wakeup_source used when EPOLLWAKEUP is set */
-        struct wakeup_source *ws;
+        struct wakeup_source __rcu *ws;
        /* The structure that describe the interested events and the source fd */
        struct epoll_event event;
@@ -536,6 +539,38 @@ static void ep_unregister_pollwait(struct eventpoll *ep, struct epitem *epi)
        }
 }
+/*
+ * Return the wakeup source attached to @epi; callers in this file treat a
+ * NULL result as "no wakeup source".
+ *
+ * call only when ep->mtx is held: the dereference is checked against
+ * lockdep_is_held(&epi->ep->mtx).
+ */
+static inline struct wakeup_source *ep_wakeup_source(struct epitem *epi)
+{
+        return rcu_dereference_check(epi->ws, lockdep_is_held(&epi->ep->mtx));
+}
+/*
+ * Call __pm_stay_awake() on @epi's wakeup source, if it has one; does
+ * nothing when the pointer is NULL.
+ *
+ * call only when ep->mtx is held
+ */
+static inline void ep_pm_stay_awake(struct epitem *epi)
+{
+        struct wakeup_source *ws = ep_wakeup_source(epi);
+        if (ws)
+                __pm_stay_awake(ws);
+}
+/*
+ * Report whether @epi currently has a wakeup source set.  The pointer is
+ * only tested for NULL here, never dereferenced.
+ */
+static inline bool ep_has_wakeup_source(struct epitem *epi)
+{
+        return rcu_access_pointer(epi->ws) ? true : false;
+}
+/*
+ * Variant of ep_pm_stay_awake() that brackets the epi->ws dereference and
+ * the __pm_stay_awake() call with rcu_read_lock()/rcu_read_unlock().
+ *
+ * call when ep->mtx cannot be held (ep_poll_callback)
+ */
+static inline void ep_pm_stay_awake_rcu(struct epitem *epi)
+{
+        struct wakeup_source *ws;
+        rcu_read_lock();
+        ws = rcu_dereference(epi->ws);
+        if (ws)
+                __pm_stay_awake(ws);
+        rcu_read_unlock();
+}
 /**
 * ep_scan_ready_list - Scans the ready list in a way that makes possible for
 *                      the scan code, to call f_op->poll(). Also allows for
@@ -599,7 +634,7 @@ static int ep_scan_ready_list(struct eventpoll *ep,
                 */
                if (!ep_is_linked(&epi->rdllink)) {
                        list_add_tail(&epi->rdllink, &ep->rdllist);
-                        __pm_stay_awake(epi->ws);
+                        ep_pm_stay_awake(epi);
                }
        }
        /*
@@ -668,7 +703,7 @@ static int ep_remove(struct eventpoll *ep, struct epitem *epi)
                list_del_init(&epi->rdllink);
        spin_unlock_irqrestore(&ep->lock, flags);
-        wakeup_source_unregister(epi->ws);
+        wakeup_source_unregister(ep_wakeup_source(epi));
        /* At this point it is safe to free the eventpoll item */
        kmem_cache_free(epi_cache, epi);
@@ -711,11 +746,15 @@ static void ep_free(struct eventpoll *ep)
         * point we are sure no poll callbacks will be lingering around, and also by
         * holding "epmutex" we can be sure that no file cleanup code will hit
         * us during this operation. So we can avoid the lock on "ep->lock".
+         * We do not need to lock ep->mtx, either, we only do it to prevent
+         * a lockdep warning.
         */
+        mutex_lock(&ep->mtx);
        while ((rbp = rb_first(&ep->rbr)) != NULL) {
                epi = rb_entry(rbp, struct epitem, rbn);
                ep_remove(ep, epi);
        }
+        mutex_unlock(&ep->mtx);
        mutex_unlock(&epmutex);
        mutex_destroy(&ep->mtx);
@@ -734,6 +773,13 @@ static int ep_eventpoll_release(struct inode *inode, struct file *file)
        return 0;
 }
+/*
+ * Poll the file behind @epi.  Stores the item's requested event mask in
+ * pt->_key, invokes the file's ->poll() method with @pt, and returns only
+ * those reported bits that are also set in epi->event.events.
+ */
+static inline unsigned int ep_item_poll(struct epitem *epi, poll_table *pt)
+{
+        pt->_key = epi->event.events;
+        return epi->ffd.file->f_op->poll(epi->ffd.file, pt) & epi->event.events;
+}
 static int ep_read_events_proc(struct eventpoll *ep, struct list_head *head,
                               void *priv)
 {
@@ -741,10 +787,9 @@ static int ep_read_events_proc(struct eventpoll *ep, struct list_head *head,
        poll_table pt;
        init_poll_funcptr(&pt, NULL);
        list_for_each_entry_safe(epi, tmp, head, rdllink) {
-                pt._key = epi->event.events;
+                if (ep_item_poll(epi, &pt))
-                if (epi->ffd.file->f_op->poll(epi->ffd.file, &pt) &
-                    epi->event.events)
                        return POLLIN | POLLRDNORM;
                else {
                        /*
@@ -752,7 +797,7 @@ static int ep_read_events_proc(struct eventpoll *ep, struct list_head *head,
                         * callback, but it's not actually ready, as far as
                         * caller requested events goes. We can remove it here.
                         */
-                        __pm_relax(epi->ws);
+                        __pm_relax(ep_wakeup_source(epi));
                        list_del_init(&epi->rdllink);
                }
        }
@@ -984,7 +1029,7 @@ static int ep_poll_callback(wait_queue_t *wait, unsigned mode, int sync, void *k
        /* If this file is already in the ready list we exit soon */
        if (!ep_is_linked(&epi->rdllink)) {
                list_add_tail(&epi->rdllink, &ep->rdllist);
-                __pm_stay_awake(epi->ws);
+                ep_pm_stay_awake_rcu(epi);
        }
        /*
@@ -1146,6 +1191,7 @@ static int reverse_path_check(void)
 static int ep_create_wakeup_source(struct epitem *epi)
 {
        const char *name;
+        struct wakeup_source *ws;
        if (!epi->ep->ws) {
                epi->ep->ws = wakeup_source_register("eventpoll");
@@ -1154,17 +1200,29 @@ static int ep_create_wakeup_source(struct epitem *epi)
        }
        name = epi->ffd.file->f_path.dentry->d_name.name;
-        epi->ws = wakeup_source_register(name);
+        ws = wakeup_source_register(name);
-        if (!epi->ws)
+        if (!ws)
                return -ENOMEM;
+        rcu_assign_pointer(epi->ws, ws);
        return 0;
 }
-static void ep_destroy_wakeup_source(struct epitem *epi)
+/*
+ * Detach @epi's wakeup source and unregister it: epi->ws is set to NULL
+ * first, then synchronize_rcu() runs before wakeup_source_unregister().
+ *
+ * rare code path, only used when EPOLL_CTL_MOD removes a wakeup source
+ */
+static noinline void ep_destroy_wakeup_source(struct epitem *epi)
 {
-        wakeup_source_unregister(epi->ws);
+        struct wakeup_source *ws = ep_wakeup_source(epi);
-        epi->ws = NULL;
+        RCU_INIT_POINTER(epi->ws, NULL);
+        /*
+         * wait for ep_pm_stay_awake_rcu to finish, synchronize_rcu is
+         * used internally by wakeup_source_remove, too (called by
+         * wakeup_source_unregister), so we cannot use call_rcu
+         */
+        synchronize_rcu();
+        wakeup_source_unregister(ws);
 }
 /*
@@ -1199,13 +1257,12 @@ static int ep_insert(struct eventpoll *ep, struct epoll_event *event,
                if (error)
                        goto error_create_wakeup_source;
        } else {
-                epi->ws = NULL;
+                RCU_INIT_POINTER(epi->ws, NULL);
        }
        /* Initialize the poll table using the queue callback */
        epq.epi = epi;
        init_poll_funcptr(&epq.pt, ep_ptable_queue_proc);
-        epq.pt._key = event->events;
        /*
         * Attach the item to the poll hooks and get current event bits.
@@ -1214,7 +1271,7 @@ static int ep_insert(struct eventpoll *ep, struct epoll_event *event,
         * this operation completes, the poll callback can start hitting
         * the new item.
         */
-        revents = tfile->f_op->poll(tfile, &epq.pt);
+        revents = ep_item_poll(epi, &epq.pt);
        /*
         * We have to check if something went wrong during the poll wait queue
@@ -1247,7 +1304,7 @@ static int ep_insert(struct eventpoll *ep, struct epoll_event *event,
        /* If the file is already "ready" we drop it inside the ready list */
        if ((revents & event->events) && !ep_is_linked(&epi->rdllink)) {
                list_add_tail(&epi->rdllink, &ep->rdllist);
-                __pm_stay_awake(epi->ws);
+                ep_pm_stay_awake(epi);
                /* Notify waiting tasks that events are available */
                if (waitqueue_active(&ep->wq))
@@ -1288,7 +1345,7 @@ error_unregister:
                list_del_init(&epi->rdllink);
        spin_unlock_irqrestore(&ep->lock, flags);
-        wakeup_source_unregister(epi->ws);
+        wakeup_source_unregister(ep_wakeup_source(epi));
 error_create_wakeup_source:
        kmem_cache_free(epi_cache, epi);
@@ -1314,12 +1371,11 @@ static int ep_modify(struct eventpoll *ep, struct epitem *epi, struct epoll_even
         * f_op->poll() call and the new event set registering.
         */
        epi->event.events = event->events; /* need barrier below */
-        pt._key = event->events;
        epi->event.data = event->data; /* protected by mtx */
        if (epi->event.events & EPOLLWAKEUP) {
-                if (!epi->ws)
+                if (!ep_has_wakeup_source(epi))
                        ep_create_wakeup_source(epi);
-        } else if (epi->ws) {
+        } else if (ep_has_wakeup_source(epi)) {
                ep_destroy_wakeup_source(epi);
        }
@@ -1347,7 +1403,7 @@ static int ep_modify(struct eventpoll *ep, struct epitem *epi, struct epoll_even
         * Get current event bits. We can safely use the file* here because
         * its usage count has been increased by the caller of this function.
         */
-        revents = epi->ffd.file->f_op->poll(epi->ffd.file, &pt);
+        revents = ep_item_poll(epi, &pt);
        /*
         * If the item is "hot" and it is not registered inside the ready
@@ -1357,7 +1413,7 @@ static int ep_modify(struct eventpoll *ep, struct epitem *epi, struct epoll_even
                spin_lock_irq(&ep->lock);
                if (!ep_is_linked(&epi->rdllink)) {
                        list_add_tail(&epi->rdllink, &ep->rdllist);
-                        __pm_stay_awake(epi->ws);
+                        ep_pm_stay_awake(epi);
                        /* Notify waiting tasks that events are available */
                        if (waitqueue_active(&ep->wq))
@@ -1383,6 +1439,7 @@ static int ep_send_events_proc(struct eventpoll *ep, struct list_head *head,
        unsigned int revents;
        struct epitem *epi;
        struct epoll_event __user *uevent;
+        struct wakeup_source *ws;
        poll_table pt;
        init_poll_funcptr(&pt, NULL);
@@ -1405,14 +1462,16 @@ static int ep_send_events_proc(struct eventpoll *ep, struct list_head *head,
                 * instead, but then epi->ws would temporarily be out of sync
                 * with ep_is_linked().
                 */
-                if (epi->ws && epi->ws->active)
+                ws = ep_wakeup_source(epi);
-                        __pm_stay_awake(ep->ws);
+                if (ws) {
-                __pm_relax(epi->ws);
+                        if (ws->active)
+                                __pm_stay_awake(ep->ws);
+                        __pm_relax(ws);
+                }
                list_del_init(&epi->rdllink);
-                pt._key = epi->event.events;
+                revents = ep_item_poll(epi, &pt);
-                revents = epi->ffd.file->f_op->poll(epi->ffd.file, &pt) &
-                        epi->event.events;
                /*
                 * If the event mask intersect the caller-requested one,
@@ -1424,7 +1483,7 @@ static int ep_send_events_proc(struct eventpoll *ep, struct list_head *head,
                        if (__put_user(revents, &uevent->events) ||
                            __put_user(epi->event.data, &uevent->data)) {
                                list_add(&epi->rdllink, head);
-                                __pm_stay_awake(epi->ws);
+                                ep_pm_stay_awake(epi);
                                return eventcnt ? eventcnt : -EFAULT;
                        }
                        eventcnt++;
@@ -1444,7 +1503,7 @@ static int ep_send_events_proc(struct eventpoll *ep, struct list_head *head,
                                 * poll callback will queue them in ep->ovflist.
                                 */
                                list_add_tail(&epi->rdllink, &ep->rdllist);
-                                __pm_stay_awake(epi->ws);
+                                ep_pm_stay_awake(epi);
                        }
                }
        }
@@ -1940,6 +1999,52 @@ SYSCALL_DEFINE6(epoll_pwait, int, epfd, struct epoll_event __user *, events,
        return error;
 }
+#ifdef CONFIG_COMPAT
+/*
+ * Compat entry point for epoll_pwait.  The optional signal mask is passed
+ * as a compat_sigset_t: it is copied from user space, converted with
+ * sigset_from_compat(), stripped of SIGKILL and SIGSTOP, and installed for
+ * the duration of the wait, which is performed by sys_epoll_wait().
+ *
+ * Returns the result of sys_epoll_wait(), or -EINVAL when a mask is given
+ * and sigsetsize != sizeof(compat_sigset_t), or -EFAULT when the mask
+ * cannot be copied from user space.
+ */
+COMPAT_SYSCALL_DEFINE6(epoll_pwait, int, epfd,
+                        struct epoll_event __user *, events,
+                        int, maxevents, int, timeout,
+                        const compat_sigset_t __user *, sigmask,
+                        compat_size_t, sigsetsize)
+{
+        long err;
+        compat_sigset_t csigmask;
+        sigset_t ksigmask, sigsaved;
+        /*
+         * If the caller wants a certain signal mask to be set during the wait,
+         * we apply it here.
+         */
+        if (sigmask) {
+                if (sigsetsize != sizeof(compat_sigset_t))
+                        return -EINVAL;
+                if (copy_from_user(&csigmask, sigmask, sizeof(csigmask)))
+                        return -EFAULT;
+                sigset_from_compat(&ksigmask, &csigmask);
+                sigdelsetmask(&ksigmask, sigmask(SIGKILL) | sigmask(SIGSTOP));
+                sigprocmask(SIG_SETMASK, &ksigmask, &sigsaved);
+        }
+        err = sys_epoll_wait(epfd, events, maxevents, timeout);
+        /*
+         * If we changed the signal mask, we need to restore the original one.
+         * In case we've got a signal while waiting, we do not restore the
+         * signal mask yet, and we allow do_signal() to deliver the signal on
+         * the way back to userspace, before the signal mask is restored.
+         */
+        if (sigmask) {
+                if (err == -EINTR) {
+                        memcpy(&current->saved_sigmask, &sigsaved,
+                               sizeof(sigsaved));
+                        set_restore_sigmask();
+                } else
+                        sigprocmask(SIG_SETMASK, &sigsaved, NULL);
+        }
+        return err;
+}
+#endif
 static int __init eventpoll_init(void)
 {
        struct sysinfo si;
@@ -1964,6 +2069,12 @@ static int __init eventpoll_init(void)
        /* Initialize the structure used to perform file's f_op->poll() calls */
        ep_nested_calls_init(&poll_readywalk_ncalls);
+        /*
+         * We can have many thousands of epitems, so prevent this from
+         * using an extra cache line on 64-bit (and smaller) CPUs
+         */
+        BUILD_BUG_ON(sizeof(void *) <= 8 && sizeof(struct epitem) > 128);
        /* Allocates slab cache used to allocate "struct epitem" items */
        epi_cache = kmem_cache_create("eventpoll_epi", sizeof(struct epitem),
                        0, SLAB_HWCACHE_ALIGN | SLAB_PANIC, NULL);
diff --git a/fs/exec.c b/fs/exec.c
index a96a4885bbbf..963f510a25ab 100644
--- a/fs/exec.c
+++ b/fs/exec.c
@@ -613,7 +613,7 @@ static int shift_arg_pages(struct vm_area_struct *vma, unsigned long shift)
                 * when the old and new regions overlap clear from new_end.
                 */
                free_pgd_range(&tlb, new_end, old_end, new_end,
-                        vma->vm_next ? vma->vm_next->vm_start : 0);
+                        vma->vm_next ? vma->vm_next->vm_start : USER_PGTABLES_CEILING);
        } else {
                /*
                 * otherwise, clean from old_start; this is done to not touch
@@ -622,7 +622,7 @@ static int shift_arg_pages(struct vm_area_struct *vma, unsigned long shift)
                 * for the others its just a little faster.
                 */
                free_pgd_range(&tlb, old_start, old_end, new_end,
-                        vma->vm_next ? vma->vm_next->vm_start : 0);
+                        vma->vm_next ? vma->vm_next->vm_start : USER_PGTABLES_CEILING);
        }
        tlb_finish_mmu(&tlb, new_end, old_end);
@@ -898,11 +898,13 @@ static int de_thread(struct task_struct *tsk)
                sig->notify_count = -1; /* for exit_notify() */
                for (;;) {
+                        threadgroup_change_begin(tsk);
                        write_lock_irq(&tasklist_lock);
                        if (likely(leader->exit_state))
                                break;
                        __set_current_state(TASK_KILLABLE);
                        write_unlock_irq(&tasklist_lock);
+                        threadgroup_change_end(tsk);
                        schedule();
                        if (unlikely(__fatal_signal_pending(tsk)))
                                goto killed;
@@ -960,6 +962,7 @@ static int de_thread(struct task_struct *tsk)
                if (unlikely(leader->ptrace))
                        __wake_up_parent(leader, leader->parent);
                write_unlock_irq(&tasklist_lock);
+                threadgroup_change_end(tsk);
                release_task(leader);
        }
@@ -1027,17 +1030,7 @@ EXPORT_SYMBOL_GPL(get_task_comm);
 void set_task_comm(struct task_struct *tsk, char *buf)
 {
        task_lock(tsk);
        trace_task_rename(tsk, buf);
-        /*
-         * Threads may access current->comm without holding
-         * the task lock, so write the string carefully.
-         * Readers without a lock may see incomplete new
-         * names but are safe from non-terminating string reads.
-         */
-        memset(tsk->comm, 0, TASK_COMM_LEN);
-        wmb();
        strlcpy(tsk->comm, buf, sizeof(tsk->comm));
        task_unlock(tsk);
        perf_event_comm(tsk);
diff --git a/fs/ext3/super.c b/fs/ext3/super.c
index fb5120a5505c..3dc48cc8b6eb 100644
--- a/fs/ext3/super.c
+++ b/fs/ext3/super.c
@@ -2067,7 +2067,6 @@ static int ext3_fill_super (struct super_block *sb, void *data, int silent)
                test_opt(sb,DATA_FLAGS) == EXT3_MOUNT_JOURNAL_DATA ? "journal":
                test_opt(sb,DATA_FLAGS) == EXT3_MOUNT_ORDERED_DATA ? "ordered":
                "writeback");
-        sb->s_flags |= MS_SNAP_STABLE;
        return 0;
diff --git a/fs/f2fs/f2fs.h b/fs/f2fs/f2fs.h
index cc2213afdcc7..201c8d3b0f86 100644
--- a/fs/f2fs/f2fs.h
+++ b/fs/f2fs/f2fs.h
@@ -137,7 +137,7 @@ struct extent_info {
        rwlock_t ext_lock;      /* rwlock for consistency */
        unsigned int fofs;      /* start offset in a file */
        u32 blk_addr;           /* start block address of the extent */
-        unsigned int len;       /* lenth of the extent */
+        unsigned int len;       /* length of the extent */
 };
 /*
diff --git a/fs/f2fs/gc.c b/fs/f2fs/gc.c
index 94b8a0c48453..2e3eb2d4fc30 100644
--- a/fs/f2fs/gc.c
+++ b/fs/f2fs/gc.c
@@ -222,7 +222,7 @@ static unsigned int get_gc_cost(struct f2fs_sb_info *sbi, unsigned int segno,
 }
 /*
- * This function is called from two pathes.
+ * This function is called from two paths.
 * One is garbage collection and the other is SSR segment selection.
 * When it is called during GC, it just gets a victim segment
 * and it does not remove it from dirty seglist.
diff --git a/fs/f2fs/super.c b/fs/f2fs/super.c
index fea6e582a2ed..62e017743af6 100644
--- a/fs/f2fs/super.c
+++ b/fs/f2fs/super.c
@@ -82,7 +82,7 @@ static struct inode *f2fs_alloc_inode(struct super_block *sb)
        init_once((void *) fi);
-        /* Initilize f2fs-specific inode info */
+        /* Initialize f2fs-specific inode info */
        fi->vfs_inode.i_version = 1;
        atomic_set(&fi->dirty_dents, 0);
        fi->i_current_depth = 1;
diff --git a/fs/fat/dir.c b/fs/fat/dir.c
index 165012ef363a..7a6f02caf286 100644
--- a/fs/fat/dir.c
+++ b/fs/fat/dir.c
@@ -964,6 +964,29 @@ int fat_scan(struct inode *dir, const unsigned char *name,
 }
 EXPORT_SYMBOL_GPL(fat_scan);
+/*
+ * Scans a directory for a given logstart.
+ *
+ * Iterates over @dir with fat_get_short_entry() until an entry is found
+ * whose fat_get_start() value equals @i_logstart.  On a match, @sinfo is
+ * completed: slot_off is moved back by the size of one directory entry,
+ * nr_slots is set to 1 and i_pos is computed with fat_make_i_pos(); bh and
+ * de are left as fat_get_short_entry() set them.
+ *
+ * Returns zero on a match, or -ENOENT once fat_get_short_entry() reports
+ * a negative value without any entry having matched.
+ */
+int fat_scan_logstart(struct inode *dir, int i_logstart,
+                      struct fat_slot_info *sinfo)
+{
+        struct super_block *sb = dir->i_sb;
+        sinfo->slot_off = 0;
+        sinfo->bh = NULL;
+        while (fat_get_short_entry(dir, &sinfo->slot_off, &sinfo->bh,
+                                   &sinfo->de) >= 0) {
+                if (fat_get_start(MSDOS_SB(sb), sinfo->de) == i_logstart) {
+                        sinfo->slot_off -= sizeof(*sinfo->de);
+                        sinfo->nr_slots = 1;
+                        sinfo->i_pos = fat_make_i_pos(sb, sinfo->bh, sinfo->de);
+                        return 0;
+                }
+        }
+        return -ENOENT;
+}
 static int __fat_remove_entries(struct inode *dir, loff_t pos, int nr_slots)
 {
        struct super_block *sb = dir->i_sb;
diff --git a/fs/fat/fat.h b/fs/fat/fat.h
index e9cc3f0d58e2..21664fcf3616 100644
--- a/fs/fat/fat.h
+++ b/fs/fat/fat.h
@@ -23,6 +23,9 @@
 #define FAT_ERRORS_PANIC        2      /* panic on error */
 #define FAT_ERRORS_RO           3      /* remount r/o on error */
+#define FAT_NFS_STALE_RW        1      /* NFS RW support, can cause ESTALE */
+#define FAT_NFS_NOSTALE_RO      2      /* NFS RO support, no ESTALE issue */
 struct fat_mount_options {
        kuid_t fs_uid;
        kgid_t fs_gid;
@@ -34,6 +37,7 @@ struct fat_mount_options {
        unsigned short shortname;  /* flags for shortname display/create rule */
        unsigned char name_check;  /* r = relaxed, n = normal, s = strict */
        unsigned char errors;      /* On error: continue, panic, remount-ro */
+        unsigned char nfs;        /* NFS support: nostale_ro, stale_rw */
        unsigned short allow_utime;/* permission for setting the [am]time */
        unsigned quiet:1,          /* set = fake successful chmods and chowns */
                 showexec:1,       /* set = only set x bit for com/exe/bat */
@@ -48,8 +52,7 @@ struct fat_mount_options {
                 usefree:1,        /* Use free_clusters for FAT32 */
                 tz_set:1,         /* Filesystem timestamps' offset set */
                 rodir:1,          /* allow ATTR_RO for directory */
-                 discard:1,        /* Issue discard requests on deletions */
+                 discard:1;        /* Issue discard requests on deletions */
-                 nfs:1;            /* Do extra work needed for NFS export */
 };
 #define FAT_HASH_BITS   8
@@ -72,6 +75,7 @@ struct msdos_sb_info {
        unsigned long root_cluster;   /* first cluster of the root directory */
        unsigned long fsinfo_sector;  /* sector number of FAT32 fsinfo */
        struct mutex fat_lock;
+        struct mutex nfs_build_inode_lock;
        struct mutex s_lock;
        unsigned int prev_free;      /* previously allocated cluster number */
        unsigned int free_clusters;  /* -1 if undefined */
@@ -215,6 +219,27 @@ static inline sector_t fat_clus_to_blknr(struct msdos_sb_info *sbi, int clus)
                + sbi->data_start;
 }
+/*
+ * Split @i_pos into two parts: *blknr receives i_pos shifted right by
+ * sbi->dir_per_block_bits, *offset receives the low bits selected by
+ * (sbi->dir_per_block - 1).
+ * NOTE(review): the mask form assumes dir_per_block is a power of two
+ * matching dir_per_block_bits - confirm where those fields are set.
+ */
+static inline void fat_get_blknr_offset(struct msdos_sb_info *sbi,
+                                loff_t i_pos, sector_t *blknr, int *offset)
+{
+        *blknr = i_pos >> sbi->dir_per_block_bits;
+        *offset = i_pos & (sbi->dir_per_block - 1);
+}
+/*
+ * Return MSDOS_I(inode)->i_pos.  When BITS_PER_LONG == 32 the read is done
+ * with sbi->inode_hash_lock held; otherwise it is a plain load.
+ * NOTE(review): presumably the lock guards against a torn read of the
+ * 64-bit i_pos on 32-bit builds - confirm against the writers of i_pos.
+ */
+static inline loff_t fat_i_pos_read(struct msdos_sb_info *sbi,
+                                        struct inode *inode)
+{
+        loff_t i_pos;
+#if BITS_PER_LONG == 32
+        spin_lock(&sbi->inode_hash_lock);
+#endif
+        i_pos = MSDOS_I(inode)->i_pos;
+#if BITS_PER_LONG == 32
+        spin_unlock(&sbi->inode_hash_lock);
+#endif
+        return i_pos;
+}
 static inline void fat16_towchar(wchar_t *dst, const __u8 *src, size_t len)
 {
 #ifdef __BIG_ENDIAN
@@ -271,6 +296,8 @@ extern int fat_dir_empty(struct inode *dir);
 extern int fat_subdirs(struct inode *dir);
 extern int fat_scan(struct inode *dir, const unsigned char *name,
                    struct fat_slot_info *sinfo);
+extern int fat_scan_logstart(struct inode *dir, int i_logstart,
+                             struct fat_slot_info *sinfo);
 extern int fat_get_dotdot_entry(struct inode *dir, struct buffer_head **bh,
                                struct msdos_dir_entry **de);
 extern int fat_alloc_new_dir(struct inode *dir, struct timespec *ts);
@@ -348,6 +375,7 @@ extern struct inode *fat_build_inode(struct super_block *sb,
 extern int fat_sync_inode(struct inode *inode);
 extern int fat_fill_super(struct super_block *sb, void *data, int silent,
                          int isvfat, void (*setup)(struct super_block *));
+extern int fat_fill_inode(struct inode *inode, struct msdos_dir_entry *de);
 extern int fat_flush_inodes(struct super_block *sb, struct inode *i1,
                            struct inode *i2);
@@ -382,12 +410,8 @@ int fat_cache_init(void);
 void fat_cache_destroy(void);
 /* fat/nfs.c */
-struct fid;
+extern const struct export_operations fat_export_ops;
-extern struct dentry *fat_fh_to_dentry(struct super_block *sb, struct fid *fid,
+extern const struct export_operations fat_export_ops_nostale;
-                                       int fh_len, int fh_type);
-extern struct dentry *fat_fh_to_parent(struct super_block *sb, struct fid *fid,
-                                       int fh_len, int fh_type);
-extern struct dentry *fat_get_parent(struct dentry *child_dir);
 /* helper for printk */
 typedef unsigned long long      llu;
diff --git a/fs/fat/file.c b/fs/fat/file.c
index 3978f8ca1823..b0b632e50ddb 100644
--- a/fs/fat/file.c
+++ b/fs/fat/file.c
@@ -306,6 +306,11 @@ int fat_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat)
        struct inode *inode = dentry->d_inode;
        generic_fillattr(inode, stat);
        stat->blksize = MSDOS_SB(inode->i_sb)->cluster_size;
+        if (MSDOS_SB(inode->i_sb)->options.nfs == FAT_NFS_NOSTALE_RO) {
+                /* Use i_pos for ino. This is used as fileid of nfs. */
+                stat->ino = fat_i_pos_read(MSDOS_SB(inode->i_sb), inode);
+        }
        return 0;
 }
 EXPORT_SYMBOL_GPL(fat_getattr);
diff --git a/fs/fat/inode.c b/fs/fat/inode.c
index acf6e479b443..4ff901632b26 100644
--- a/fs/fat/inode.c
+++ b/fs/fat/inode.c
@@ -18,7 +18,6 @@
 #include <linux/pagemap.h>
 #include <linux/mpage.h>
 #include <linux/buffer_head.h>
-#include <linux/exportfs.h>
 #include <linux/mount.h>
 #include <linux/vfs.h>
 #include <linux/parser.h>
@@ -385,7 +384,7 @@ static int fat_calc_dir_size(struct inode *inode)
 }
 /* doesn't deal with root inode */
-static int fat_fill_inode(struct inode *inode, struct msdos_dir_entry *de)
+int fat_fill_inode(struct inode *inode, struct msdos_dir_entry *de)
 {
        struct msdos_sb_info *sbi = MSDOS_SB(inode->i_sb);
        int error;
@@ -444,12 +443,25 @@ static int fat_fill_inode(struct inode *inode, struct msdos_dir_entry *de)
        return 0;
 }
+/*
+ * Take nfs_build_inode_lock, but only on nfs=nostale_ro mounts; for any
+ * other nfs setting this does nothing.  fat_build_inode() calls it before
+ * its lookup of i_pos and drops it again via fat_unlock_build_inode().
+ */
+static inline void fat_lock_build_inode(struct msdos_sb_info *sbi)
+{
+        if (sbi->options.nfs != FAT_NFS_NOSTALE_RO)
+                return;
+        mutex_lock(&sbi->nfs_build_inode_lock);
+}
+/*
+ * Counterpart of fat_lock_build_inode(): release nfs_build_inode_lock on
+ * nfs=nostale_ro mounts, and do nothing otherwise.  The condition must
+ * stay identical to the one used when locking.
+ */
+static inline void fat_unlock_build_inode(struct msdos_sb_info *sbi)
+{
+        if (sbi->options.nfs != FAT_NFS_NOSTALE_RO)
+                return;
+        mutex_unlock(&sbi->nfs_build_inode_lock);
+}
 struct inode *fat_build_inode(struct super_block *sb,
                        struct msdos_dir_entry *de, loff_t i_pos)
 {
        struct inode *inode;
        int err;
+        fat_lock_build_inode(MSDOS_SB(sb));
        inode = fat_iget(sb, i_pos);
        if (inode)
                goto out;
@@ -469,6 +481,7 @@ struct inode *fat_build_inode(struct super_block *sb,
        fat_attach(inode, i_pos);
        insert_inode_hash(inode);
 out:
+        fat_unlock_build_inode(MSDOS_SB(sb));
        return inode;
 }
@@ -655,20 +668,6 @@ static int fat_statfs(struct dentry *dentry, struct kstatfs *buf)
        return 0;
 }
-static inline loff_t fat_i_pos_read(struct msdos_sb_info *sbi,
-                                    struct inode *inode)
-{
-        loff_t i_pos;
-#if BITS_PER_LONG == 32
-        spin_lock(&sbi->inode_hash_lock);
-#endif
-        i_pos = MSDOS_I(inode)->i_pos;
-#if BITS_PER_LONG == 32
-        spin_unlock(&sbi->inode_hash_lock);
-#endif
-        return i_pos;
-}
 static int __fat_write_inode(struct inode *inode, int wait)
 {
        struct super_block *sb = inode->i_sb;
@@ -676,7 +675,8 @@ static int __fat_write_inode(struct inode *inode, int wait)
        struct buffer_head *bh;
        struct msdos_dir_entry *raw_entry;
        loff_t i_pos;
-        int err;
+        sector_t blocknr;
+        int err, offset;
        if (inode->i_ino == MSDOS_ROOT_INO)
                return 0;
@@ -686,7 +686,8 @@ retry:
        if (!i_pos)
                return 0;
-        bh = sb_bread(sb, i_pos >> sbi->dir_per_block_bits);
+        fat_get_blknr_offset(sbi, i_pos, &blocknr, &offset);
+        bh = sb_bread(sb, blocknr);
        if (!bh) {
                fat_msg(sb, KERN_ERR, "unable to read inode block "
                       "for updating (i_pos %lld)", i_pos);
@@ -699,8 +700,7 @@ retry:
                goto retry;
        }
-        raw_entry = &((struct msdos_dir_entry *) (bh->b_data))
+        raw_entry = &((struct msdos_dir_entry *) (bh->b_data))[offset];
-            [i_pos & (sbi->dir_per_block - 1)];
        if (S_ISDIR(inode->i_mode))
                raw_entry->size = 0;
        else
@@ -761,12 +761,6 @@ static const struct super_operations fat_sops = {
        .show_options   = fat_show_options,
 };
-static const struct export_operations fat_export_ops = {
-        .fh_to_dentry   = fat_fh_to_dentry,
-        .fh_to_parent   = fat_fh_to_parent,
-        .get_parent     = fat_get_parent,
-};
 static int fat_show_options(struct seq_file *m, struct dentry *root)
 {
        struct msdos_sb_info *sbi = MSDOS_SB(root->d_sb);
@@ -814,8 +808,6 @@ static int fat_show_options(struct seq_file *m, struct dentry *root)
                seq_puts(m, ",usefree");
        if (opts->quiet)
                seq_puts(m, ",quiet");
-        if (opts->nfs)
-                seq_puts(m, ",nfs");
        if (opts->showexec)
                seq_puts(m, ",showexec");
        if (opts->sys_immutable)
@@ -849,6 +841,10 @@ static int fat_show_options(struct seq_file *m, struct dentry *root)
                seq_puts(m, ",errors=panic");
        else
                seq_puts(m, ",errors=remount-ro");
+        if (opts->nfs == FAT_NFS_NOSTALE_RO)
+                seq_puts(m, ",nfs=nostale_ro");
+        else if (opts->nfs)
+                seq_puts(m, ",nfs=stale_rw");
        if (opts->discard)
                seq_puts(m, ",discard");
@@ -865,7 +861,7 @@ enum {
        Opt_uni_xl_no, Opt_uni_xl_yes, Opt_nonumtail_no, Opt_nonumtail_yes,
        Opt_obsolete, Opt_flush, Opt_tz_utc, Opt_rodir, Opt_err_cont,
        Opt_err_panic, Opt_err_ro, Opt_discard, Opt_nfs, Opt_time_offset,
-        Opt_err,
+        Opt_nfs_stale_rw, Opt_nfs_nostale_ro, Opt_err,
 };
 static const match_table_t fat_tokens = {
@@ -895,7 +891,9 @@ static const match_table_t fat_tokens = {
        {Opt_err_panic, "errors=panic"},
        {Opt_err_ro, "errors=remount-ro"},
        {Opt_discard, "discard"},
-        {Opt_nfs, "nfs"},
+        {Opt_nfs_stale_rw, "nfs"},
+        {Opt_nfs_stale_rw, "nfs=stale_rw"},
+        {Opt_nfs_nostale_ro, "nfs=nostale_ro"},
        {Opt_obsolete, "conv=binary"},
        {Opt_obsolete, "conv=text"},
        {Opt_obsolete, "conv=auto"},
@@ -1092,6 +1090,12 @@ static int parse_options(struct super_block *sb, char *options, int is_vfat,
                case Opt_err_ro:
                        opts->errors = FAT_ERRORS_RO;
                        break;
+                case Opt_nfs_stale_rw:
+                        opts->nfs = FAT_NFS_STALE_RW;
+                        break;
+                case Opt_nfs_nostale_ro:
+                        opts->nfs = FAT_NFS_NOSTALE_RO;
+                        break;
                /* msdos specific */
                case Opt_dots:
@@ -1150,9 +1154,6 @@ static int parse_options(struct super_block *sb, char *options, int is_vfat,
                case Opt_discard:
                        opts->discard = 1;
                        break;
-                case Opt_nfs:
-                        opts->nfs = 1;
-                        break;
                /* obsolete mount options */
                case Opt_obsolete:
@@ -1183,6 +1184,10 @@ out:
                opts->allow_utime = ~opts->fs_dmask & (S_IWGRP | S_IWOTH);
        if (opts->unicode_xlate)
                opts->utf8 = 0;
+        if (opts->nfs == FAT_NFS_NOSTALE_RO) {
+                sb->s_flags |= MS_RDONLY;
+                sb->s_export_op = &fat_export_ops_nostale;
+        }
        return 0;
 }
@@ -1193,7 +1198,7 @@ static int fat_read_root(struct inode *inode)
        struct msdos_sb_info *sbi = MSDOS_SB(sb);
        int error;
-        MSDOS_I(inode)->i_pos = 0;
+        MSDOS_I(inode)->i_pos = MSDOS_ROOT_INO;
        inode->i_uid = sbi->options.fs_uid;
        inode->i_gid = sbi->options.fs_gid;
        inode->i_version++;
@@ -1256,6 +1261,7 @@ int fat_fill_super(struct super_block *sb, void *data, int silent, int isvfat,
        sb->s_magic = MSDOS_SUPER_MAGIC;
        sb->s_op = &fat_sops;
        sb->s_export_op = &fat_export_ops;
+        mutex_init(&sbi->nfs_build_inode_lock);
        ratelimit_state_init(&sbi->ratelimit, DEFAULT_RATELIMIT_INTERVAL,
                             DEFAULT_RATELIMIT_BURST);
diff --git a/fs/fat/nfs.c b/fs/fat/nfs.c
index 499c10438ca2..93e14933dcb6 100644
--- a/fs/fat/nfs.c
+++ b/fs/fat/nfs.c
@@ -14,6 +14,18 @@
 #include <linux/exportfs.h>
 #include "fat.h"
+/*
+ * Payload of the file handles produced by the nfs=nostale_ro export
+ * operations.  An inode is identified by its i_generation and its i_pos,
+ * the latter split into a 32-bit low and a 16-bit high part.  A handle
+ * without parent information consists of the first three 32-bit words,
+ * i.e. everything up to and including parent_i_pos_hi; a handle with
+ * parent information is the whole structure.
+ */
+struct fat_fid {
+        u32 i_gen;              /* inode->i_generation */
+        u32 i_pos_low;          /* i_pos bits 0..31 */
+        u16 i_pos_hi;           /* i_pos bits 32..47 */
+        u16 parent_i_pos_hi;    /* parent i_pos bits 32..47 */
+        u32 parent_i_pos_low;   /* parent i_pos bits 0..31 */
+        u32 parent_i_gen;       /* parent->i_generation */
+};
+/* Handle lengths, counted in 32-bit words. */
+#define FAT_FID_SIZE_WITHOUT_PARENT 3
+#define FAT_FID_SIZE_WITH_PARENT (sizeof(struct fat_fid) / sizeof(u32))
 /**
 * Look up a directory inode given its starting cluster.
 */
@@ -38,63 +50,252 @@ static struct inode *fat_dget(struct super_block *sb, int i_logstart)
        return inode;
 }
-static struct inode *fat_nfs_get_inode(struct super_block *sb,
+static struct inode *fat_ilookup(struct super_block *sb, u64 ino, loff_t i_pos)
-                                       u64 ino, u32 generation)
 {
-        struct inode *inode;
+        if (MSDOS_SB(sb)->options.nfs == FAT_NFS_NOSTALE_RO)
+                return fat_iget(sb, i_pos);
-        if ((ino < MSDOS_ROOT_INO) || (ino == MSDOS_FSINFO_INO))
+        else {
-                return NULL;
+                if ((ino < MSDOS_ROOT_INO) || (ino == MSDOS_FSINFO_INO))
+                        return NULL;
+                return ilookup(sb, ino);
+        }
+}
+static struct inode *__fat_nfs_get_inode(struct super_block *sb,
+                                       u64 ino, u32 generation, loff_t i_pos)
+{
+        struct inode *inode = fat_ilookup(sb, ino, i_pos);
-        inode = ilookup(sb, ino);
        if (inode && generation && (inode->i_generation != generation)) {
                iput(inode);
                inode = NULL;
        }
+        if (inode == NULL && MSDOS_SB(sb)->options.nfs == FAT_NFS_NOSTALE_RO) {
+                struct buffer_head *bh = NULL;
+                struct msdos_dir_entry *de ;
+                sector_t blocknr;
+                int offset;
+                fat_get_blknr_offset(MSDOS_SB(sb), i_pos, &blocknr, &offset);
+                bh = sb_bread(sb, blocknr);
+                if (!bh) {
+                        fat_msg(sb, KERN_ERR,
+                                "unable to read block(%llu) for building NFS inode",
+                                (llu)blocknr);
+                        return inode;
+                }
+                de = (struct msdos_dir_entry *)bh->b_data;
+                /* If a file is deleted on server and client is not updated
+                 * yet, we must not build the inode upon a lookup call.
+                 */
+                if (IS_FREE(de[offset].name))
+                        inode = NULL;
+                else
+                        inode = fat_build_inode(sb, &de[offset], i_pos);
+                brelse(bh);
+        }
        return inode;
 }
+/*
+ * Inode lookup callback handed to generic_fh_to_dentry() and
+ * generic_fh_to_parent().  Those handles carry only an inode number and a
+ * generation, so no on-disk position is available; i_pos is passed as 0
+ * and is only consulted by the lookup on nfs=nostale_ro mounts.
+ */
+static struct inode *fat_nfs_get_inode(struct super_block *sb,
+                                       u64 ino, u32 generation)
+{
+        const loff_t no_i_pos = 0;
+        return __fat_nfs_get_inode(sb, ino, generation, no_i_pos);
+}
+/*
+ * Encode the file handle of @inode for an nfs=nostale_ro mount.
+ *
+ * @fh is filled in as a struct fat_fid.  On entry *@lenp is the room
+ * available in @fh, in 32-bit words; on return it is the number of words
+ * used, or the number required if the buffer was too small.  The handle
+ * records i_generation and i_pos of @inode and, when @parent is non-NULL,
+ * the same pair for @parent.
+ *
+ * Returns FILEID_FAT_WITHOUT_PARENT or FILEID_FAT_WITH_PARENT on success
+ * and FILEID_INVALID when *@lenp is too small.
+ */
+static int
+fat_encode_fh_nostale(struct inode *inode, __u32 *fh, int *lenp,
+                      struct inode *parent)
+{
+        struct msdos_sb_info *sbi = MSDOS_SB(inode->i_sb);
+        struct fat_fid *fid = (struct fat_fid *) fh;
+        /*
+         * Kept as a signed int: FAT_FID_SIZE_WITH_PARENT is a sizeof
+         * expression, and comparing *lenp against it directly would turn a
+         * negative length into a huge unsigned value that passes the check.
+         */
+        int needed = FAT_FID_SIZE_WITHOUT_PARENT;
+        loff_t i_pos;
+        if (parent)
+                needed = FAT_FID_SIZE_WITH_PARENT;
+        if (*lenp < needed) {
+                *lenp = needed;
+                return FILEID_INVALID;
+        }
+        i_pos = fat_i_pos_read(sbi, inode);
+        fid->i_gen = inode->i_generation;
+        fid->i_pos_low = i_pos & 0xFFFFFFFF;
+        fid->i_pos_hi = (i_pos >> 32) & 0xFFFF;
+        /*
+         * parent_i_pos_hi shares the third word with i_pos_hi, so it is part
+         * of the short handle as well.  Always give it a defined value
+         * instead of returning whatever the caller's buffer happened to hold.
+         */
+        fid->parent_i_pos_hi = 0;
+        if (!parent) {
+                *lenp = FAT_FID_SIZE_WITHOUT_PARENT;
+                return FILEID_FAT_WITHOUT_PARENT;
+        }
+        i_pos = fat_i_pos_read(sbi, parent);
+        fid->parent_i_pos_hi = (i_pos >> 32) & 0xFFFF;
+        fid->parent_i_pos_low = i_pos & 0xFFFFFFFF;
+        fid->parent_i_gen = parent->i_generation;
+        *lenp = FAT_FID_SIZE_WITH_PARENT;
+        return FILEID_FAT_WITH_PARENT;
+}
 /**
 * Map a NFS file handle to a corresponding dentry.
 * The dentry may or may not be connected to the filesystem root.
 */
-struct dentry *fat_fh_to_dentry(struct super_block *sb, struct fid *fid,
+static struct dentry *fat_fh_to_dentry(struct super_block *sb, struct fid *fid,
                                int fh_len, int fh_type)
 {
        return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
                                    fat_nfs_get_inode);
 }
+/*
+ * Map an nfs=nostale_ro file handle to a dentry.
+ *
+ * Only FILEID_FAT_WITHOUT_PARENT and FILEID_FAT_WITH_PARENT handles that
+ * are at least as long as their type requires are accepted; any other
+ * handle yields NULL.  The inode is looked up, or rebuilt from disk, using
+ * the i_pos and generation stored in the handle, and the result is handed
+ * to d_obtain_alias().
+ */
+static struct dentry *fat_fh_to_dentry_nostale(struct super_block *sb,
+                                               struct fid *fh, int fh_len,
+                                               int fh_type)
+{
+        struct fat_fid *fid = (struct fat_fid *)fh;
+        loff_t i_pos;
+        if (fh_type == FILEID_FAT_WITHOUT_PARENT) {
+                if (fh_len < FAT_FID_SIZE_WITHOUT_PARENT)
+                        return NULL;
+        } else if (fh_type == FILEID_FAT_WITH_PARENT) {
+                if (fh_len < FAT_FID_SIZE_WITH_PARENT)
+                        return NULL;
+        } else {
+                return NULL;
+        }
+        /* Reassemble i_pos from its 16-bit high and 32-bit low parts. */
+        i_pos = ((loff_t)fid->i_pos_hi << 32) | fid->i_pos_low;
+        return d_obtain_alias(__fat_nfs_get_inode(sb, 0, fid->i_gen, i_pos));
+}
 /*
 * Find the parent for a file specified by NFS handle.
 * This requires that the handle contain the i_ino of the parent.
 */
-struct dentry *fat_fh_to_parent(struct super_block *sb, struct fid *fid,
+static struct dentry *fat_fh_to_parent(struct super_block *sb, struct fid *fid,
                                int fh_len, int fh_type)
 {
        return generic_fh_to_parent(sb, fid, fh_len, fh_type,
                                    fat_nfs_get_inode);
 }
+/*
+ * Find the parent recorded in an nfs=nostale_ro file handle.
+ *
+ * A handle shorter than FAT_FID_SIZE_WITH_PARENT yields NULL.  For a
+ * FILEID_FAT_WITH_PARENT handle the parent inode is looked up, or rebuilt
+ * from disk, using the parent i_pos and generation stored in the handle;
+ * for any other type d_obtain_alias() is called with a NULL inode.
+ */
+static struct dentry *fat_fh_to_parent_nostale(struct super_block *sb,
+                                               struct fid *fh, int fh_len,
+                                               int fh_type)
+{
+        struct fat_fid *fid = (struct fat_fid *)fh;
+        struct inode *parent = NULL;
+        if (fh_len < FAT_FID_SIZE_WITH_PARENT)
+                return NULL;
+        if (fh_type == FILEID_FAT_WITH_PARENT) {
+                /* Reassemble the parent's i_pos from its two stored parts. */
+                loff_t i_pos = ((loff_t)fid->parent_i_pos_hi << 32) |
+                               fid->parent_i_pos_low;
+                parent = __fat_nfs_get_inode(sb, 0, fid->parent_i_gen, i_pos);
+        }
+        return d_obtain_alias(parent);
+}
+/*
+ * Rebuild the inode of a parent directory that has no cached inode, given
+ * only its start cluster (@parent_logstart).
+ *
+ * The first block of that directory is read and the start clusters stored
+ * in its first two entries are used: entry 0 names the cluster to search
+ * for and entry 1 the directory to search in (presumably the "." and ".."
+ * entries - TODO confirm).  If the directory to search has no cached inode
+ * either, a temporary inode is filled in from entry 1 just for the scan.
+ *
+ * Returns NULL if the block cannot be read, the temporary inode cannot be
+ * allocated or the scan finds nothing; otherwise whatever
+ * fat_build_inode() returns for the matching entry.
+ */
+static
+struct inode *fat_rebuild_parent(struct super_block *sb, int parent_logstart)
+{
+        struct msdos_sb_info *sbi = MSDOS_SB(sb);
+        struct fat_slot_info sinfo;
+        struct msdos_dir_entry *de;
+        struct buffer_head *parent_bh;
+        struct inode *grand;
+        struct inode *parent = NULL;
+        int self_clus, grand_clus;
+        parent_bh = sb_bread(sb, fat_clus_to_blknr(sbi, parent_logstart));
+        if (!parent_bh) {
+                fat_msg(sb, KERN_ERR,
+                        "unable to read cluster of parent directory");
+                return NULL;
+        }
+        de = (struct msdos_dir_entry *) parent_bh->b_data;
+        self_clus = fat_get_start(sbi, &de[0]);
+        grand_clus = fat_get_start(sbi, &de[1]);
+        grand = fat_dget(sb, grand_clus);
+        if (!grand) {
+                /* Not cached: build a throw-away inode to scan through. */
+                grand = new_inode(sb);
+                if (!grand) {
+                        brelse(parent_bh);
+                        return NULL;
+                }
+                grand->i_ino = iunique(sb, MSDOS_ROOT_INO);
+                /* NOTE(review): the result of fat_fill_inode() is ignored. */
+                fat_fill_inode(grand, &de[1]);
+                MSDOS_I(grand)->i_pos = -1;
+        }
+        /*
+         * NOTE(review): if fat_scan_logstart() returns with a buffer held in
+         * sinfo, nothing below releases it - confirm against its definition.
+         */
+        if (fat_scan_logstart(grand, self_clus, &sinfo) == 0)
+                parent = fat_build_inode(sb, sinfo.de, sinfo.i_pos);
+        brelse(parent_bh);
+        iput(grand);
+        return parent;
+}
 /*
 * Find the parent for a directory that is not currently connected to
 * the filesystem root.
 *
 * On entry, the caller holds child_dir->d_inode->i_mutex.
 */
-struct dentry *fat_get_parent(struct dentry *child_dir)
+static struct dentry *fat_get_parent(struct dentry *child_dir)
 {
        struct super_block *sb = child_dir->d_sb;
        struct buffer_head *bh = NULL;
        struct msdos_dir_entry *de;
        struct inode *parent_inode = NULL;
+        struct msdos_sb_info *sbi = MSDOS_SB(sb);
        if (!fat_get_dotdot_entry(child_dir->d_inode, &bh, &de)) {
-                int parent_logstart = fat_get_start(MSDOS_SB(sb), de);
+                int parent_logstart = fat_get_start(sbi, de);
                parent_inode = fat_dget(sb, parent_logstart);
+                if (!parent_inode && sbi->options.nfs == FAT_NFS_NOSTALE_RO)
+                        parent_inode = fat_rebuild_parent(sb, parent_logstart);
        }
        brelse(bh);
        return d_obtain_alias(parent_inode);
 }
+/*
+ * Export operations that fat_fill_super() installs by default.  Handle
+ * decoding goes through the generic_fh_to_*() helpers; no encode_fh is
+ * supplied here.
+ */
+const struct export_operations fat_export_ops = {
+        .get_parent     = fat_get_parent,
+        .fh_to_parent   = fat_fh_to_parent,
+        .fh_to_dentry   = fat_fh_to_dentry,
+};
+/*
+ * Export operations that parse_options() selects for nfs=nostale_ro.
+ * Handles are encoded and decoded as struct fat_fid, i.e. by i_pos and
+ * generation.
+ */
+const struct export_operations fat_export_ops_nostale = {
+        .get_parent     = fat_get_parent,
+        .fh_to_parent   = fat_fh_to_parent_nostale,
+        .fh_to_dentry   = fat_fh_to_dentry_nostale,
+        .encode_fh      = fat_encode_fh_nostale,
+};
diff --git a/fs/fs-writeback.c b/fs/fs-writeback.c
index 21f46fb3a101..798d4458a4d3 100644
--- a/fs/fs-writeback.c
+++ b/fs/fs-writeback.c
@@ -1028,6 +1028,7 @@ int bdi_writeback_thread(void *data)
        struct backing_dev_info *bdi = wb->bdi;
        long pages_written;
+        set_worker_desc("flush-%s", dev_name(bdi->dev));
        current->flags |= PF_SWAPWRITE;
        set_freezable();
        wb->last_active = jiffies;
diff --git a/fs/fscache/stats.c b/fs/fscache/stats.c
index 8179e8bc4a3d..40d13c70ef51 100644
--- a/fs/fscache/stats.c
+++ b/fs/fscache/stats.c
@@ -287,5 +287,5 @@ const struct file_operations fscache_stats_fops = {
        .open           = fscache_stats_open,
        .read           = seq_read,
        .llseek         = seq_lseek,
-        .release        = seq_release,
+        .release        = single_release,
 };
diff --git a/fs/gfs2/aops.c b/fs/gfs2/aops.c
index 24f414f0ce61..9883694f1e7c 100644
--- a/fs/gfs2/aops.c
+++ b/fs/gfs2/aops.c
@@ -1055,7 +1055,7 @@ int gfs2_releasepage(struct page *page, gfp_t gfp_mask)
                if (atomic_read(&bh->b_count))
                        goto cannot_release;
                bd = bh->b_private;
-                if (bd && bd->bd_ail)
+                if (bd && bd->bd_tr)
                        goto cannot_release;
                if (buffer_pinned(bh) || buffer_dirty(bh))
                        goto not_possible;
diff --git a/fs/gfs2/bmap.c b/fs/gfs2/bmap.c
index 5e83657f046e..1dc9a13ce6bb 100644
--- a/fs/gfs2/bmap.c
+++ b/fs/gfs2/bmap.c
@@ -787,7 +787,7 @@ static int do_strip(struct gfs2_inode *ip, struct buffer_head *dibh,
                goto out_rlist;
        if (gfs2_rs_active(ip->i_res)) /* needs to be done with the rgrp glock held */
-                gfs2_rs_deltree(ip, ip->i_res);
+                gfs2_rs_deltree(ip->i_res);
        error = gfs2_trans_begin(sdp, rg_blocks + RES_DINODE +
                                 RES_INDIRECT + RES_STATFS + RES_QUOTA,
diff --git a/fs/gfs2/file.c b/fs/gfs2/file.c
index 019f45e45097..d79c2dadc536 100644
--- a/fs/gfs2/file.c
+++ b/fs/gfs2/file.c
@@ -923,8 +923,11 @@ static int gfs2_lock(struct file *file, int cmd, struct file_lock *fl)
                cmd = F_SETLK;
                fl->fl_type = F_UNLCK;
        }
-        if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
+        if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
+                if (fl->fl_type == F_UNLCK)
+                        posix_lock_file_wait(file, fl);
                return -EIO;
+        }
        if (IS_GETLK(cmd))
                return dlm_posix_get(ls->ls_dlm, ip->i_no_addr, file, fl);
        else if (fl->fl_type == F_UNLCK)
diff --git a/fs/gfs2/glock.c b/fs/gfs2/glock.c
index cf3515546739..9435384562a2 100644
--- a/fs/gfs2/glock.c
+++ b/fs/gfs2/glock.c
@@ -912,7 +912,7 @@ int gfs2_glock_wait(struct gfs2_holder *gh)
 */
 static void handle_callback(struct gfs2_glock *gl, unsigned int state,
-                            unsigned long delay)
+                            unsigned long delay, bool remote)
 {
        int bit = delay ? GLF_PENDING_DEMOTE : GLF_DEMOTE;
@@ -925,8 +925,8 @@ static void handle_callback(struct gfs2_glock *gl, unsigned int state,
                gl->gl_demote_state = LM_ST_UNLOCKED;
        }
        if (gl->gl_ops->go_callback)
-                gl->gl_ops->go_callback(gl);
+                gl->gl_ops->go_callback(gl, remote);
-        trace_gfs2_demote_rq(gl);
+        trace_gfs2_demote_rq(gl, remote);
 }
 void gfs2_print_dbg(struct seq_file *seq, const char *fmt, ...)
@@ -1017,11 +1017,11 @@ do_cancel:
        return;
 trap_recursive:
-        print_symbol(KERN_ERR "original: %s\n", gh2->gh_ip);
+        printk(KERN_ERR "original: %pSR\n", (void *)gh2->gh_ip);
        printk(KERN_ERR "pid: %d\n", pid_nr(gh2->gh_owner_pid));
        printk(KERN_ERR "lock type: %d req lock state : %d\n",
               gh2->gh_gl->gl_name.ln_type, gh2->gh_state);
-        print_symbol(KERN_ERR "new: %s\n", gh->gh_ip);
+        printk(KERN_ERR "new: %pSR\n", (void *)gh->gh_ip);
        printk(KERN_ERR "pid: %d\n", pid_nr(gh->gh_owner_pid));
        printk(KERN_ERR "lock type: %d req lock state : %d\n",
               gh->gh_gl->gl_name.ln_type, gh->gh_state);
@@ -1091,7 +1091,7 @@ void gfs2_glock_dq(struct gfs2_holder *gh)
        spin_lock(&gl->gl_spin);
        if (gh->gh_flags & GL_NOCACHE)
-                handle_callback(gl, LM_ST_UNLOCKED, 0);
+                handle_callback(gl, LM_ST_UNLOCKED, 0, false);
        list_del_init(&gh->gh_list);
        if (find_first_holder(gl) == NULL) {
@@ -1279,19 +1279,6 @@ void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
                gfs2_glock_dq(&ghs[num_gh]);
 }
-/**
- * gfs2_glock_dq_uninit_m - release multiple glocks
- * @num_gh: the number of structures
- * @ghs: an array of struct gfs2_holder structures
- *
- */
-void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
-{
-        while (num_gh--)
-                gfs2_glock_dq_uninit(&ghs[num_gh]);
-}
 void gfs2_glock_cb(struct gfs2_glock *gl, unsigned int state)
 {
        unsigned long delay = 0;
@@ -1309,7 +1296,7 @@ void gfs2_glock_cb(struct gfs2_glock *gl, unsigned int state)
        }
        spin_lock(&gl->gl_spin);
-        handle_callback(gl, state, delay);
+        handle_callback(gl, state, delay, true);
        spin_unlock(&gl->gl_spin);
        if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
                gfs2_glock_put(gl);
@@ -1422,7 +1409,7 @@ __acquires(&lru_lock)
                spin_unlock(&lru_lock);
                spin_lock(&gl->gl_spin);
                if (demote_ok(gl))
-                        handle_callback(gl, LM_ST_UNLOCKED, 0);
+                        handle_callback(gl, LM_ST_UNLOCKED, 0, false);
                WARN_ON(!test_and_clear_bit(GLF_LOCK, &gl->gl_flags));
                smp_mb__after_clear_bit();
                if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
@@ -1547,7 +1534,7 @@ static void clear_glock(struct gfs2_glock *gl)
        spin_lock(&gl->gl_spin);
        if (gl->gl_state != LM_ST_UNLOCKED)
-                handle_callback(gl, LM_ST_UNLOCKED, 0);
+                handle_callback(gl, LM_ST_UNLOCKED, 0, false);
        spin_unlock(&gl->gl_spin);
        gfs2_glock_hold(gl);
        if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
@@ -1590,6 +1577,7 @@ static void dump_glock_func(struct gfs2_glock *gl)
 void gfs2_gl_hash_clear(struct gfs2_sbd *sdp)
 {
        set_bit(SDF_SKIP_DLM_UNLOCK, &sdp->sd_flags);
+        flush_workqueue(glock_workqueue);
        glock_hash_walk(clear_glock, sdp);
        flush_workqueue(glock_workqueue);
        wait_event(sdp->sd_glock_wait, atomic_read(&sdp->sd_glock_disposal) == 0);
diff --git a/fs/gfs2/glock.h b/fs/gfs2/glock.h
index fd580b7861d5..69f66e3d22bf 100644
--- a/fs/gfs2/glock.h
+++ b/fs/gfs2/glock.h
@@ -201,7 +201,6 @@ extern int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
                             struct gfs2_holder *gh);
 extern int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs);
 extern void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs);
-extern void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs);
 extern int gfs2_dump_glock(struct seq_file *seq, const struct gfs2_glock *gl);
 #define GLOCK_BUG_ON(gl,x) do { if (unlikely(x)) { gfs2_dump_glock(NULL, gl); BUG(); } } while(0)
 extern __printf(2, 3)
diff --git a/fs/gfs2/glops.c b/fs/gfs2/glops.c
index 444b6503ebc4..c66e99c97571 100644
--- a/fs/gfs2/glops.c
+++ b/fs/gfs2/glops.c
@@ -515,12 +515,12 @@ static int trans_go_demote_ok(const struct gfs2_glock *gl)
 *
 * gl_spin lock is held while calling this
 */
-static void iopen_go_callback(struct gfs2_glock *gl)
+static void iopen_go_callback(struct gfs2_glock *gl, bool remote)
 {
        struct gfs2_inode *ip = (struct gfs2_inode *)gl->gl_object;
        struct gfs2_sbd *sdp = gl->gl_sbd;
-        if (sdp->sd_vfs->s_flags & MS_RDONLY)
+        if (!remote || (sdp->sd_vfs->s_flags & MS_RDONLY))
                return;
        if (gl->gl_demote_state == LM_ST_UNLOCKED &&
diff --git a/fs/gfs2/incore.h b/fs/gfs2/incore.h
index 156e42ec84ea..26aabd7caba7 100644
--- a/fs/gfs2/incore.h
+++ b/fs/gfs2/incore.h
@@ -31,7 +31,6 @@ struct gfs2_holder;
 struct gfs2_glock;
 struct gfs2_quota_data;
 struct gfs2_trans;
-struct gfs2_ail;
 struct gfs2_jdesc;
 struct gfs2_sbd;
 struct lm_lockops;
@@ -53,7 +52,7 @@ struct gfs2_log_header_host {
 struct gfs2_log_operations {
        void (*lo_before_commit) (struct gfs2_sbd *sdp);
-        void (*lo_after_commit) (struct gfs2_sbd *sdp, struct gfs2_ail *ai);
+        void (*lo_after_commit) (struct gfs2_sbd *sdp, struct gfs2_trans *tr);
        void (*lo_before_scan) (struct gfs2_jdesc *jd,
                                struct gfs2_log_header_host *head, int pass);
        int (*lo_scan_elements) (struct gfs2_jdesc *jd, unsigned int start,
@@ -139,7 +138,7 @@ struct gfs2_bufdata {
        struct list_head bd_list;
        const struct gfs2_log_operations *bd_ops;
-        struct gfs2_ail *bd_ail;
+        struct gfs2_trans *bd_tr;
        struct list_head bd_ail_st_list;
        struct list_head bd_ail_gl_list;
 };
@@ -211,7 +210,7 @@ struct gfs2_glock_operations {
        int (*go_lock) (struct gfs2_holder *gh);
        void (*go_unlock) (struct gfs2_holder *gh);
        int (*go_dump)(struct seq_file *seq, const struct gfs2_glock *gl);
-        void (*go_callback) (struct gfs2_glock *gl);
+        void (*go_callback)(struct gfs2_glock *gl, bool remote);
        const int go_type;
        const unsigned long go_flags;
 #define GLOF_ASPACE 1
@@ -433,6 +432,7 @@ struct gfs2_trans {
        struct gfs2_holder tr_t_gh;
        int tr_touched;
+        int tr_attached;
        unsigned int tr_num_buf_new;
        unsigned int tr_num_databuf_new;
@@ -440,14 +440,12 @@ struct gfs2_trans {
        unsigned int tr_num_databuf_rm;
        unsigned int tr_num_revoke;
        unsigned int tr_num_revoke_rm;
-};
-struct gfs2_ail {
+        struct list_head tr_list;
-        struct list_head ai_list;
-        unsigned int ai_first;
+        unsigned int tr_first;
-        struct list_head ai_ail1_list;
+        struct list_head tr_ail1_list;
-        struct list_head ai_ail2_list;
+        struct list_head tr_ail2_list;
 };
 struct gfs2_journal_extent {
@@ -588,6 +586,7 @@ struct lm_lockstruct {
        struct dlm_lksb ls_control_lksb; /* control_lock */
        char ls_control_lvb[GDLM_LVB_SIZE]; /* control_lock lvb */
        struct completion ls_sync_wait; /* {control,mounted}_{lock,unlock} */
+        char *ls_lvb_bits;
        spinlock_t ls_recover_spin; /* protects following fields */
        unsigned long ls_recover_flags; /* DFL_ */
@@ -709,6 +708,7 @@ struct gfs2_sbd {
        spinlock_t sd_log_lock;
+        struct gfs2_trans *sd_log_tr;
        unsigned int sd_log_blks_reserved;
        unsigned int sd_log_commited_buf;
        unsigned int sd_log_commited_databuf;
diff --git a/fs/gfs2/inode.c b/fs/gfs2/inode.c
index cc00bd1d1f87..8833a4f264e3 100644
--- a/fs/gfs2/inode.c
+++ b/fs/gfs2/inode.c
@@ -392,11 +392,15 @@ static int alloc_dinode(struct gfs2_inode *ip, u32 flags)
        int error;
        int dblocks = 1;
-        error = gfs2_inplace_reserve(ip, RES_DINODE, flags);
+        error = gfs2_quota_lock_check(ip);
        if (error)
                goto out;
-        error = gfs2_trans_begin(sdp, RES_RG_BIT + RES_STATFS, 0);
+        error = gfs2_inplace_reserve(ip, RES_DINODE, flags);
+        if (error)
+                goto out_quota;
+        error = gfs2_trans_begin(sdp, RES_RG_BIT + RES_STATFS + RES_QUOTA, 0);
        if (error)
                goto out_ipreserv;
@@ -409,6 +413,8 @@ static int alloc_dinode(struct gfs2_inode *ip, u32 flags)
 out_ipreserv:
        gfs2_inplace_release(ip);
+out_quota:
+        gfs2_quota_unlock(ip);
 out:
        return error;
 }
@@ -440,59 +446,27 @@ static void gfs2_init_dir(struct buffer_head *dibh,
 */
 static void init_dinode(struct gfs2_inode *dip, struct gfs2_inode *ip,
-                        const char *symname, struct buffer_head **bhp)
+                        const char *symname)
 {
-        struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
        struct gfs2_dinode *di;
        struct buffer_head *dibh;
-        struct timespec tv = CURRENT_TIME;
        dibh = gfs2_meta_new(ip->i_gl, ip->i_no_addr);
        gfs2_trans_add_meta(ip->i_gl, dibh);
-        gfs2_metatype_set(dibh, GFS2_METATYPE_DI, GFS2_FORMAT_DI);
-        gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
        di = (struct gfs2_dinode *)dibh->b_data;
+        gfs2_dinode_out(ip, di);
-        di->di_num.no_formal_ino = cpu_to_be64(ip->i_no_formal_ino);
-        di->di_num.no_addr = cpu_to_be64(ip->i_no_addr);
-        di->di_mode = cpu_to_be32(ip->i_inode.i_mode);
-        di->di_uid = cpu_to_be32(i_uid_read(&ip->i_inode));
-        di->di_gid = cpu_to_be32(i_gid_read(&ip->i_inode));
-        di->di_nlink = 0;
-        di->di_size = cpu_to_be64(ip->i_inode.i_size);
-        di->di_blocks = cpu_to_be64(1);
-        di->di_atime = di->di_mtime = di->di_ctime = cpu_to_be64(tv.tv_sec);
        di->di_major = cpu_to_be32(MAJOR(ip->i_inode.i_rdev));
        di->di_minor = cpu_to_be32(MINOR(ip->i_inode.i_rdev));
-        di->di_goal_meta = di->di_goal_data = cpu_to_be64(ip->i_no_addr);
-        di->di_generation = cpu_to_be64(ip->i_generation);
-        di->di_flags = 0;
        di->__pad1 = 0;
-        di->di_payload_format = cpu_to_be32(S_ISDIR(ip->i_inode.i_mode) ? GFS2_FORMAT_DE : 0);
-        di->di_height = 0;
        di->__pad2 = 0;
        di->__pad3 = 0;
-        di->di_depth = 0;
-        di->di_entries = 0;
        memset(&di->__pad4, 0, sizeof(di->__pad4));
-        di->di_eattr = 0;
-        di->di_atime_nsec = cpu_to_be32(tv.tv_nsec);
-        di->di_mtime_nsec = cpu_to_be32(tv.tv_nsec);
-        di->di_ctime_nsec = cpu_to_be32(tv.tv_nsec);
        memset(&di->di_reserved, 0, sizeof(di->di_reserved));
+        gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
        switch(ip->i_inode.i_mode & S_IFMT) {
-        case S_IFREG:
-                if ((dip->i_diskflags & GFS2_DIF_INHERIT_JDATA) ||
-                    gfs2_tune_get(sdp, gt_new_files_jdata))
-                        di->di_flags |= cpu_to_be32(GFS2_DIF_JDATA);
-                break;
        case S_IFDIR:
-                di->di_flags |= cpu_to_be32(dip->i_diskflags &
-                                            GFS2_DIF_INHERIT_JDATA);
-                di->di_flags |= cpu_to_be32(GFS2_DIF_JDATA);
-                di->di_size = cpu_to_be64(sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode));
-                di->di_entries = cpu_to_be32(2);
                gfs2_init_dir(dibh, dip);
                break;
        case S_IFLNK:
@@ -501,63 +475,17 @@ static void init_dinode(struct gfs2_inode *dip, struct gfs2_inode *ip,
        }
        set_buffer_uptodate(dibh);
+        brelse(dibh);
-        *bhp = dibh;
-}
-static int make_dinode(struct gfs2_inode *dip, struct gfs2_inode *ip,
-                       const char *symname, struct buffer_head **bhp)
-{
-        struct inode *inode = &ip->i_inode;
-        struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
-        int error;
-        error = gfs2_rindex_update(sdp);
-        if (error)
-                return error;
-        error = gfs2_quota_lock(dip, inode->i_uid, inode->i_gid);
-        if (error)
-                return error;
-        error = gfs2_quota_check(dip, inode->i_uid, inode->i_gid);
-        if (error)
-                goto out_quota;
-        error = gfs2_trans_begin(sdp, RES_DINODE + RES_QUOTA, 0);
-        if (error)
-                goto out_quota;
-        init_dinode(dip, ip, symname, bhp);
-        gfs2_quota_change(dip, +1, inode->i_uid, inode->i_gid);
-        gfs2_trans_end(sdp);
-out_quota:
-        gfs2_quota_unlock(dip);
-        return error;
 }
 static int link_dinode(struct gfs2_inode *dip, const struct qstr *name,
-                       struct gfs2_inode *ip)
+                       struct gfs2_inode *ip, int arq)
 {
        struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
-        int alloc_required;
-        struct buffer_head *dibh;
        int error;
-        error = gfs2_rindex_update(sdp);
+        if (arq) {
-        if (error)
+                error = gfs2_quota_lock_check(dip);
-                return error;
-        error = gfs2_quota_lock(dip, NO_UID_QUOTA_CHANGE, NO_GID_QUOTA_CHANGE);
-        if (error)
-                goto fail;
-        error = alloc_required = gfs2_diradd_alloc_required(&dip->i_inode, name);
-        if (alloc_required < 0)
-                goto fail_quota_locks;
-        if (alloc_required) {
-                error = gfs2_quota_check(dip, dip->i_inode.i_uid, dip->i_inode.i_gid);
                if (error)
                        goto fail_quota_locks;
@@ -581,26 +509,12 @@ static int link_dinode(struct gfs2_inode *dip, const struct qstr *name,
        if (error)
                goto fail_end_trans;
-        error = gfs2_meta_inode_buffer(ip, &dibh);
-        if (error)
-                goto fail_end_trans;
-        set_nlink(&ip->i_inode, S_ISDIR(ip->i_inode.i_mode) ? 2 : 1);
-        gfs2_trans_add_meta(ip->i_gl, dibh);
-        gfs2_dinode_out(ip, dibh->b_data);
-        brelse(dibh);
-        return 0;
 fail_end_trans:
        gfs2_trans_end(sdp);
 fail_ipreserv:
-        if (alloc_required)
+        gfs2_inplace_release(dip);
-                gfs2_inplace_release(dip);
 fail_quota_locks:
        gfs2_quota_unlock(dip);
-fail:
        return error;
 }
@@ -650,8 +564,8 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
        struct gfs2_glock *io_gl;
        int error;
-        struct buffer_head *bh = NULL;
        u32 aflags = 0;
+        int arq;
        if (!name->len || name->len > GFS2_FNAMESIZE)
                return -ENAMETOOLONG;
@@ -660,6 +574,10 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        if (error)
                return error;
+        error = gfs2_rindex_update(sdp);
+        if (error)
+                return error;
        error = gfs2_glock_nq_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
        if (error)
                goto fail;
@@ -674,22 +592,48 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        if (error)
                goto fail_gunlock;
+        arq = error = gfs2_diradd_alloc_required(dir, name);
+        if (error < 0)
+                goto fail_gunlock;
        inode = new_inode(sdp->sd_vfs);
-        if (!inode) {
+        error = -ENOMEM;
-                gfs2_glock_dq_uninit(ghs);
+        if (!inode)
-                return -ENOMEM;
+                goto fail_gunlock;
-        }
        ip = GFS2_I(inode);
        error = gfs2_rs_alloc(ip);
        if (error)
                goto fail_free_inode;
-        set_bit(GIF_INVALID, &ip->i_flags);
        inode->i_mode = mode;
+        set_nlink(inode, S_ISDIR(mode) ? 2 : 1);
        inode->i_rdev = dev;
        inode->i_size = size;
+        inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME;
+        gfs2_set_inode_blocks(inode, 1);
        munge_mode_uid_gid(dip, inode);
        ip->i_goal = dip->i_goal;
+        ip->i_diskflags = 0;
+        ip->i_eattr = 0;
+        ip->i_height = 0;
+        ip->i_depth = 0;
+        ip->i_entries = 0;
+        switch(mode & S_IFMT) {
+        case S_IFREG:
+                if ((dip->i_diskflags & GFS2_DIF_INHERIT_JDATA) ||
+                    gfs2_tune_get(sdp, gt_new_files_jdata))
+                        ip->i_diskflags |= GFS2_DIF_JDATA;
+                gfs2_set_aops(inode);
+                break;
+        case S_IFDIR:
+                ip->i_diskflags |= (dip->i_diskflags & GFS2_DIF_INHERIT_JDATA);
+                ip->i_diskflags |= GFS2_DIF_JDATA;
+                ip->i_entries = 2;
+                break;
+        }
+        gfs2_set_inode_flags(inode);
        if ((GFS2_I(sdp->sd_root_dir->d_inode) == dip) ||
            (dip->i_diskflags & GFS2_DIF_TOPDIR))
@@ -708,10 +652,13 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        if (error)
                goto fail_free_inode;
-        error = make_dinode(dip, ip, symname, &bh);
+        error = gfs2_trans_begin(sdp, RES_DINODE, 0);
        if (error)
                goto fail_gunlock2;
+        init_dinode(dip, ip, symname);
+        gfs2_trans_end(sdp);
        error = gfs2_glock_get(sdp, ip->i_no_addr, &gfs2_iopen_glops, CREATE, &io_gl);
        if (error)
                goto fail_gunlock2;
@@ -725,10 +672,6 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        gfs2_set_iop(inode);
        insert_inode_hash(inode);
-        error = gfs2_inode_refresh(ip);
-        if (error)
-                goto fail_gunlock3;
        error = gfs2_acl_create(dip, inode);
        if (error)
                goto fail_gunlock3;
@@ -737,18 +680,13 @@ static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
        if (error)
                goto fail_gunlock3;
-        error = link_dinode(dip, name, ip);
+        error = link_dinode(dip, name, ip, arq);
        if (error)
                goto fail_gunlock3;
-        if (bh)
-                brelse(bh);
-        gfs2_trans_end(sdp);
-        gfs2_inplace_release(dip);
-        gfs2_quota_unlock(dip);
        mark_inode_dirty(inode);
-        gfs2_glock_dq_uninit_m(2, ghs);
+        gfs2_glock_dq_uninit(ghs);
+        gfs2_glock_dq_uninit(ghs + 1);
        d_instantiate(dentry, inode);
        return 0;
@@ -769,12 +707,12 @@ fail_free_inode:
 fail_gunlock:
        gfs2_glock_dq_uninit(ghs);
        if (inode && !IS_ERR(inode)) {
+                clear_nlink(inode);
+                mark_inode_dirty(inode);
                set_bit(GIF_ALLOC_FAILED, &GFS2_I(inode)->i_flags);
                iput(inode);
        }
 fail:
-        if (bh)
-                brelse(bh);
        return error;
 }
@@ -1151,7 +1089,9 @@ static int gfs2_symlink(struct inode *dir, struct dentry *dentry,
 static int gfs2_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
 {
-        return gfs2_create_inode(dir, dentry, S_IFDIR | mode, 0, NULL, 0, 0);
+        struct gfs2_sbd *sdp = GFS2_SB(dir);
+        unsigned dsize = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode);
+        return gfs2_create_inode(dir, dentry, S_IFDIR | mode, 0, NULL, dsize, 0);
 }
 /**
diff --git a/fs/gfs2/lock_dlm.c b/fs/gfs2/lock_dlm.c
index 9802de0f85e6..c8423d6de6c3 100644
--- a/fs/gfs2/lock_dlm.c
+++ b/fs/gfs2/lock_dlm.c
@@ -483,12 +483,8 @@ static void control_lvb_write(struct lm_lockstruct *ls, uint32_t lvb_gen,
 static int all_jid_bits_clear(char *lvb)
 {
-        int i;
+        return !memchr_inv(lvb + JID_BITMAP_OFFSET, 0,
-        for (i = JID_BITMAP_OFFSET; i < GDLM_LVB_SIZE; i++) {
+                        GDLM_LVB_SIZE - JID_BITMAP_OFFSET);
-                if (lvb[i])
-                        return 0;
-        }
-        return 1;
 }
 static void sync_wait_cb(void *arg)
@@ -580,7 +576,6 @@ static void gfs2_control_func(struct work_struct *work)
 {
        struct gfs2_sbd *sdp = container_of(work, struct gfs2_sbd, sd_control_work.work);
        struct lm_lockstruct *ls = &sdp->sd_lockstruct;
-        char lvb_bits[GDLM_LVB_SIZE];
        uint32_t block_gen, start_gen, lvb_gen, flags;
        int recover_set = 0;
        int write_lvb = 0;
@@ -634,7 +629,7 @@ static void gfs2_control_func(struct work_struct *work)
                return;
        }
-        control_lvb_read(ls, &lvb_gen, lvb_bits);
+        control_lvb_read(ls, &lvb_gen, ls->ls_lvb_bits);
        spin_lock(&ls->ls_recover_spin);
        if (block_gen != ls->ls_recover_block ||
@@ -664,10 +659,10 @@ static void gfs2_control_func(struct work_struct *work)
                        ls->ls_recover_result[i] = 0;
-                        if (!test_bit_le(i, lvb_bits + JID_BITMAP_OFFSET))
+                        if (!test_bit_le(i, ls->ls_lvb_bits + JID_BITMAP_OFFSET))
                                continue;
-                        __clear_bit_le(i, lvb_bits + JID_BITMAP_OFFSET);
+                        __clear_bit_le(i, ls->ls_lvb_bits + JID_BITMAP_OFFSET);
                        write_lvb = 1;
                }
        }
@@ -691,7 +686,7 @@ static void gfs2_control_func(struct work_struct *work)
                                continue;
                        if (ls->ls_recover_submit[i] < start_gen) {
                                ls->ls_recover_submit[i] = 0;
-                                __set_bit_le(i, lvb_bits + JID_BITMAP_OFFSET);
+                                __set_bit_le(i, ls->ls_lvb_bits + JID_BITMAP_OFFSET);
                        }
                }
                /* even if there are no bits to set, we need to write the
@@ -705,7 +700,7 @@ static void gfs2_control_func(struct work_struct *work)
        spin_unlock(&ls->ls_recover_spin);
        if (write_lvb) {
-                control_lvb_write(ls, start_gen, lvb_bits);
+                control_lvb_write(ls, start_gen, ls->ls_lvb_bits);
                flags = DLM_LKF_CONVERT | DLM_LKF_VALBLK;
        } else {
                flags = DLM_LKF_CONVERT;
@@ -725,7 +720,7 @@ static void gfs2_control_func(struct work_struct *work)
         */
        for (i = 0; i < recover_size; i++) {
-                if (test_bit_le(i, lvb_bits + JID_BITMAP_OFFSET)) {
+                if (test_bit_le(i, ls->ls_lvb_bits + JID_BITMAP_OFFSET)) {
                        fs_info(sdp, "recover generation %u jid %d\n",
                                start_gen, i);
                        gfs2_recover_set(sdp, i);
@@ -758,7 +753,6 @@ static void gfs2_control_func(struct work_struct *work)
 static int control_mount(struct gfs2_sbd *sdp)
 {
        struct lm_lockstruct *ls = &sdp->sd_lockstruct;
-        char lvb_bits[GDLM_LVB_SIZE];
        uint32_t start_gen, block_gen, mount_gen, lvb_gen;
        int mounted_mode;
        int retries = 0;
@@ -857,7 +851,7 @@ locks_done:
         * lvb_gen will be non-zero.
         */
-        control_lvb_read(ls, &lvb_gen, lvb_bits);
+        control_lvb_read(ls, &lvb_gen, ls->ls_lvb_bits);
        if (lvb_gen == 0xFFFFFFFF) {
                /* special value to force mount attempts to fail */
@@ -887,7 +881,7 @@ locks_done:
         * and all lvb bits to be clear (no pending journal recoveries.)
         */
-        if (!all_jid_bits_clear(lvb_bits)) {
+        if (!all_jid_bits_clear(ls->ls_lvb_bits)) {
                /* journals need recovery, wait until all are clear */
                fs_info(sdp, "control_mount wait for journal recovery\n");
                goto restart;
@@ -949,7 +943,6 @@ static int dlm_recovery_wait(void *word)
 static int control_first_done(struct gfs2_sbd *sdp)
 {
        struct lm_lockstruct *ls = &sdp->sd_lockstruct;
-        char lvb_bits[GDLM_LVB_SIZE];
        uint32_t start_gen, block_gen;
        int error;
@@ -991,8 +984,8 @@ restart:
        memset(ls->ls_recover_result, 0, ls->ls_recover_size*sizeof(uint32_t));
        spin_unlock(&ls->ls_recover_spin);
-        memset(lvb_bits, 0, sizeof(lvb_bits));
+        memset(ls->ls_lvb_bits, 0, GDLM_LVB_SIZE);
-        control_lvb_write(ls, start_gen, lvb_bits);
+        control_lvb_write(ls, start_gen, ls->ls_lvb_bits);
        error = mounted_lock(sdp, DLM_LOCK_PR, DLM_LKF_CONVERT);
        if (error)
@@ -1022,6 +1015,12 @@ static int set_recover_size(struct gfs2_sbd *sdp, struct dlm_slot *slots,
        uint32_t old_size, new_size;
        int i, max_jid;
+        if (!ls->ls_lvb_bits) {
+                ls->ls_lvb_bits = kzalloc(GDLM_LVB_SIZE, GFP_NOFS);
+                if (!ls->ls_lvb_bits)
+                        return -ENOMEM;
+        }
        max_jid = 0;
        for (i = 0; i < num_slots; i++) {
                if (max_jid < slots[i].slot - 1)
@@ -1057,6 +1056,7 @@ static int set_recover_size(struct gfs2_sbd *sdp, struct dlm_slot *slots,
 static void free_recover_size(struct lm_lockstruct *ls)
 {
+        kfree(ls->ls_lvb_bits);
        kfree(ls->ls_recover_submit);
        kfree(ls->ls_recover_result);
        ls->ls_recover_submit = NULL;
@@ -1205,6 +1205,7 @@ static int gdlm_mount(struct gfs2_sbd *sdp, const char *table)
        ls->ls_recover_size = 0;
        ls->ls_recover_submit = NULL;
        ls->ls_recover_result = NULL;
+        ls->ls_lvb_bits = NULL;
        error = set_recover_size(sdp, NULL, 0);
        if (error)
diff --git a/fs/gfs2/log.c b/fs/gfs2/log.c
index 9a2ca8be7647..b404f4853034 100644
--- a/fs/gfs2/log.c
+++ b/fs/gfs2/log.c
@@ -73,7 +73,7 @@ unsigned int gfs2_struct2blk(struct gfs2_sbd *sdp, unsigned int nstruct,
 void gfs2_remove_from_ail(struct gfs2_bufdata *bd)
 {
-        bd->bd_ail = NULL;
+        bd->bd_tr = NULL;
        list_del_init(&bd->bd_ail_st_list);
        list_del_init(&bd->bd_ail_gl_list);
        atomic_dec(&bd->bd_gl->gl_ail_count);
@@ -90,7 +90,7 @@ void gfs2_remove_from_ail(struct gfs2_bufdata *bd)
 static int gfs2_ail1_start_one(struct gfs2_sbd *sdp,
                               struct writeback_control *wbc,
-                               struct gfs2_ail *ai)
+                               struct gfs2_trans *tr)
 __releases(&sdp->sd_ail_lock)
 __acquires(&sdp->sd_ail_lock)
 {
@@ -99,15 +99,15 @@ __acquires(&sdp->sd_ail_lock)
        struct gfs2_bufdata *bd, *s;
        struct buffer_head *bh;
-        list_for_each_entry_safe_reverse(bd, s, &ai->ai_ail1_list, bd_ail_st_list) {
+        list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list, bd_ail_st_list) {
                bh = bd->bd_bh;
-                gfs2_assert(sdp, bd->bd_ail == ai);
+                gfs2_assert(sdp, bd->bd_tr == tr);
                if (!buffer_busy(bh)) {
                        if (!buffer_uptodate(bh))
                                gfs2_io_error_bh(sdp, bh);
-                        list_move(&bd->bd_ail_st_list, &ai->ai_ail2_list);
+                        list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list);
                        continue;
                }
@@ -116,7 +116,7 @@ __acquires(&sdp->sd_ail_lock)
                if (gl == bd->bd_gl)
                        continue;
                gl = bd->bd_gl;
-                list_move(&bd->bd_ail_st_list, &ai->ai_ail1_list);
+                list_move(&bd->bd_ail_st_list, &tr->tr_ail1_list);
                mapping = bh->b_page->mapping;
                if (!mapping)
                        continue;
@@ -144,15 +144,15 @@ __acquires(&sdp->sd_ail_lock)
 void gfs2_ail1_flush(struct gfs2_sbd *sdp, struct writeback_control *wbc)
 {
        struct list_head *head = &sdp->sd_ail1_list;
-        struct gfs2_ail *ai;
+        struct gfs2_trans *tr;
        trace_gfs2_ail_flush(sdp, wbc, 1);
        spin_lock(&sdp->sd_ail_lock);
 restart:
-        list_for_each_entry_reverse(ai, head, ai_list) {
+        list_for_each_entry_reverse(tr, head, tr_list) {
                if (wbc->nr_to_write <= 0)
                        break;
-                if (gfs2_ail1_start_one(sdp, wbc, ai))
+                if (gfs2_ail1_start_one(sdp, wbc, tr))
                        goto restart;
        }
        spin_unlock(&sdp->sd_ail_lock);
@@ -183,20 +183,20 @@ static void gfs2_ail1_start(struct gfs2_sbd *sdp)
 *
 */
-static void gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static void gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
        struct gfs2_bufdata *bd, *s;
        struct buffer_head *bh;
-        list_for_each_entry_safe_reverse(bd, s, &ai->ai_ail1_list,
+        list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list,
                                         bd_ail_st_list) {
                bh = bd->bd_bh;
-                gfs2_assert(sdp, bd->bd_ail == ai);
+                gfs2_assert(sdp, bd->bd_tr == tr);
                if (buffer_busy(bh))
                        continue;
                if (!buffer_uptodate(bh))
                        gfs2_io_error_bh(sdp, bh);
-                list_move(&bd->bd_ail_st_list, &ai->ai_ail2_list);
+                list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list);
        }
 }
@@ -210,14 +210,14 @@ static void gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
 static int gfs2_ail1_empty(struct gfs2_sbd *sdp)
 {
-        struct gfs2_ail *ai, *s;
+        struct gfs2_trans *tr, *s;
        int ret;
        spin_lock(&sdp->sd_ail_lock);
-        list_for_each_entry_safe_reverse(ai, s, &sdp->sd_ail1_list, ai_list) {
+        list_for_each_entry_safe_reverse(tr, s, &sdp->sd_ail1_list, tr_list) {
-                gfs2_ail1_empty_one(sdp, ai);
+                gfs2_ail1_empty_one(sdp, tr);
-                if (list_empty(&ai->ai_ail1_list))
+                if (list_empty(&tr->tr_ail1_list))
-                        list_move(&ai->ai_list, &sdp->sd_ail2_list);
+                        list_move(&tr->tr_list, &sdp->sd_ail2_list);
                else
                        break;
        }
@@ -229,13 +229,13 @@ static int gfs2_ail1_empty(struct gfs2_sbd *sdp)
 static void gfs2_ail1_wait(struct gfs2_sbd *sdp)
 {
-        struct gfs2_ail *ai;
+        struct gfs2_trans *tr;
        struct gfs2_bufdata *bd;
        struct buffer_head *bh;
        spin_lock(&sdp->sd_ail_lock);
-        list_for_each_entry_reverse(ai, &sdp->sd_ail1_list, ai_list) {
+        list_for_each_entry_reverse(tr, &sdp->sd_ail1_list, tr_list) {
-                list_for_each_entry(bd, &ai->ai_ail1_list, bd_ail_st_list) {
+                list_for_each_entry(bd, &tr->tr_ail1_list, bd_ail_st_list) {
                        bh = bd->bd_bh;
                        if (!buffer_locked(bh))
                                continue;
@@ -256,40 +256,40 @@ static void gfs2_ail1_wait(struct gfs2_sbd *sdp)
 *
 */
-static void gfs2_ail2_empty_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static void gfs2_ail2_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
-        struct list_head *head = &ai->ai_ail2_list;
+        struct list_head *head = &tr->tr_ail2_list;
        struct gfs2_bufdata *bd;
        while (!list_empty(head)) {
                bd = list_entry(head->prev, struct gfs2_bufdata,
                                bd_ail_st_list);
-                gfs2_assert(sdp, bd->bd_ail == ai);
+                gfs2_assert(sdp, bd->bd_tr == tr);
                gfs2_remove_from_ail(bd);
        }
 }
 static void ail2_empty(struct gfs2_sbd *sdp, unsigned int new_tail)
 {
-        struct gfs2_ail *ai, *safe;
+        struct gfs2_trans *tr, *safe;
        unsigned int old_tail = sdp->sd_log_tail;
        int wrap = (new_tail < old_tail);
        int a, b, rm;
        spin_lock(&sdp->sd_ail_lock);
-        list_for_each_entry_safe(ai, safe, &sdp->sd_ail2_list, ai_list) {
+        list_for_each_entry_safe(tr, safe, &sdp->sd_ail2_list, tr_list) {
-                a = (old_tail <= ai->ai_first);
+                a = (old_tail <= tr->tr_first);
-                b = (ai->ai_first < new_tail);
+                b = (tr->tr_first < new_tail);
                rm = (wrap) ? (a || b) : (a && b);
                if (!rm)
                        continue;
-                gfs2_ail2_empty_one(sdp, ai);
+                gfs2_ail2_empty_one(sdp, tr);
-                list_del(&ai->ai_list);
+                list_del(&tr->tr_list);
-                gfs2_assert_warn(sdp, list_empty(&ai->ai_ail1_list));
+                gfs2_assert_warn(sdp, list_empty(&tr->tr_ail1_list));
-                gfs2_assert_warn(sdp, list_empty(&ai->ai_ail2_list));
+                gfs2_assert_warn(sdp, list_empty(&tr->tr_ail2_list));
-                kfree(ai);
+                kfree(tr);
        }
        spin_unlock(&sdp->sd_ail_lock);
@@ -435,7 +435,7 @@ static unsigned int calc_reserved(struct gfs2_sbd *sdp)
 static unsigned int current_tail(struct gfs2_sbd *sdp)
 {
-        struct gfs2_ail *ai;
+        struct gfs2_trans *tr;
        unsigned int tail;
        spin_lock(&sdp->sd_ail_lock);
@@ -443,8 +443,9 @@ static unsigned int current_tail(struct gfs2_sbd *sdp)
        if (list_empty(&sdp->sd_ail1_list)) {
                tail = sdp->sd_log_head;
        } else {
-                ai = list_entry(sdp->sd_ail1_list.prev, struct gfs2_ail, ai_list);
+                tr = list_entry(sdp->sd_ail1_list.prev, struct gfs2_trans,
-                tail = ai->ai_first;
+                                tr_list);
+                tail = tr->tr_first;
        }
        spin_unlock(&sdp->sd_ail_lock);
@@ -600,7 +601,7 @@ static void log_write_header(struct gfs2_sbd *sdp, u32 flags)
 void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl)
 {
-        struct gfs2_ail *ai;
+        struct gfs2_trans *tr;
        down_write(&sdp->sd_log_flush_lock);
@@ -611,9 +612,12 @@ void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl)
        }
        trace_gfs2_log_flush(sdp, 1);
-        ai = kzalloc(sizeof(struct gfs2_ail), GFP_NOFS | __GFP_NOFAIL);
+        tr = sdp->sd_log_tr;
-        INIT_LIST_HEAD(&ai->ai_ail1_list);
+        if (tr) {
-        INIT_LIST_HEAD(&ai->ai_ail2_list);
+                sdp->sd_log_tr = NULL;
+                INIT_LIST_HEAD(&tr->tr_ail1_list);
+                INIT_LIST_HEAD(&tr->tr_ail2_list);
+        }
        if (sdp->sd_log_num_buf != sdp->sd_log_commited_buf) {
                printk(KERN_INFO "GFS2: log buf %u %u\n", sdp->sd_log_num_buf,
@@ -630,7 +634,8 @@ void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl)
        sdp->sd_log_flush_head = sdp->sd_log_head;
        sdp->sd_log_flush_wrapped = 0;
-        ai->ai_first = sdp->sd_log_flush_head;
+        if (tr)
+                tr->tr_first = sdp->sd_log_flush_head;
        gfs2_ordered_write(sdp);
        lops_before_commit(sdp);
@@ -643,7 +648,7 @@ void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl)
                trace_gfs2_log_blocks(sdp, -1);
                log_write_header(sdp, 0);
        }
-        lops_after_commit(sdp, ai);
+        lops_after_commit(sdp, tr);
        gfs2_log_lock(sdp);
        sdp->sd_log_head = sdp->sd_log_flush_head;
@@ -653,16 +658,16 @@ void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl)
        sdp->sd_log_commited_revoke = 0;
        spin_lock(&sdp->sd_ail_lock);
-        if (!list_empty(&ai->ai_ail1_list)) {
+        if (tr && !list_empty(&tr->tr_ail1_list)) {
-                list_add(&ai->ai_list, &sdp->sd_ail1_list);
+                list_add(&tr->tr_list, &sdp->sd_ail1_list);
-                ai = NULL;
+                tr = NULL;
        }
        spin_unlock(&sdp->sd_ail_lock);
        gfs2_log_unlock(sdp);
        trace_gfs2_log_flush(sdp, 0);
        up_write(&sdp->sd_log_flush_lock);
-        kfree(ai);
+        kfree(tr);
 }
 static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
@@ -687,6 +692,12 @@ static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
                             sdp->sd_jdesc->jd_blocks);
        sdp->sd_log_blks_reserved = reserved;
+        if (sdp->sd_log_tr == NULL &&
+            (tr->tr_num_buf_new || tr->tr_num_databuf_new)) {
+                gfs2_assert_withdraw(sdp, tr->tr_t_gh.gh_gl);
+                sdp->sd_log_tr = tr;
+                tr->tr_attached = 1;
+        }
        gfs2_log_unlock(sdp);
 }
@@ -708,7 +719,6 @@ static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 void gfs2_log_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
        log_refund(sdp, tr);
-        up_read(&sdp->sd_log_flush_lock);
        if (atomic_read(&sdp->sd_log_pinned) > atomic_read(&sdp->sd_log_thresh1) ||
            ((sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free)) >
diff --git a/fs/gfs2/lops.c b/fs/gfs2/lops.c
index a5055977a214..7318abf9d0fb 100644
--- a/fs/gfs2/lops.c
+++ b/fs/gfs2/lops.c
@@ -53,8 +53,8 @@ void gfs2_pin(struct gfs2_sbd *sdp, struct buffer_head *bh)
         * to in-place disk block, remove it from the AIL.
         */
        spin_lock(&sdp->sd_ail_lock);
-        if (bd->bd_ail)
+        if (bd->bd_tr)
-                list_move(&bd->bd_ail_st_list, &bd->bd_ail->ai_ail2_list);
+                list_move(&bd->bd_ail_st_list, &bd->bd_tr->tr_ail2_list);
        spin_unlock(&sdp->sd_ail_lock);
        get_bh(bh);
        atomic_inc(&sdp->sd_log_pinned);
@@ -94,7 +94,7 @@ static void maybe_release_space(struct gfs2_bufdata *bd)
 */
 static void gfs2_unpin(struct gfs2_sbd *sdp, struct buffer_head *bh,
-                       struct gfs2_ail *ai)
+                       struct gfs2_trans *tr)
 {
        struct gfs2_bufdata *bd = bh->b_private;
@@ -109,7 +109,7 @@ static void gfs2_unpin(struct gfs2_sbd *sdp, struct buffer_head *bh,
                maybe_release_space(bd);
        spin_lock(&sdp->sd_ail_lock);
-        if (bd->bd_ail) {
+        if (bd->bd_tr) {
                list_del(&bd->bd_ail_st_list);
                brelse(bh);
        } else {
@@ -117,8 +117,8 @@ static void gfs2_unpin(struct gfs2_sbd *sdp, struct buffer_head *bh,
                list_add(&bd->bd_ail_gl_list, &gl->gl_ail_list);
                atomic_inc(&gl->gl_ail_count);
        }
-        bd->bd_ail = ai;
+        bd->bd_tr = tr;
-        list_add(&bd->bd_ail_st_list, &ai->ai_ail1_list);
+        list_add(&bd->bd_ail_st_list, &tr->tr_ail1_list);
        spin_unlock(&sdp->sd_ail_lock);
        clear_bit(GLF_LFLUSH, &bd->bd_gl->gl_flags);
@@ -480,17 +480,22 @@ static void buf_lo_before_commit(struct gfs2_sbd *sdp)
                           &sdp->sd_log_le_buf, 0);
 }
-static void buf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static void buf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
        struct list_head *head = &sdp->sd_log_le_buf;
        struct gfs2_bufdata *bd;
+        if (tr == NULL) {
+                gfs2_assert(sdp, list_empty(head));
+                return;
+        }
        while (!list_empty(head)) {
                bd = list_entry(head->next, struct gfs2_bufdata, bd_list);
                list_del_init(&bd->bd_list);
                sdp->sd_log_num_buf--;
-                gfs2_unpin(sdp, bd->bd_bh, ai);
+                gfs2_unpin(sdp, bd->bd_bh, tr);
        }
        gfs2_assert_warn(sdp, !sdp->sd_log_num_buf);
 }
@@ -613,7 +618,7 @@ static void revoke_lo_before_commit(struct gfs2_sbd *sdp)
        gfs2_log_write_page(sdp, page);
 }
-static void revoke_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static void revoke_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
        struct list_head *head = &sdp->sd_log_le_revoke;
        struct gfs2_bufdata *bd;
@@ -791,16 +796,21 @@ static void databuf_lo_after_scan(struct gfs2_jdesc *jd, int error, int pass)
                jd->jd_jid, sdp->sd_replayed_blocks, sdp->sd_found_blocks);
 }
-static void databuf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static void databuf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr)
 {
        struct list_head *head = &sdp->sd_log_le_databuf;
        struct gfs2_bufdata *bd;
+        if (tr == NULL) {
+                gfs2_assert(sdp, list_empty(head));
+                return;
+        }
        while (!list_empty(head)) {
                bd = list_entry(head->next, struct gfs2_bufdata, bd_list);
                list_del_init(&bd->bd_list);
                sdp->sd_log_num_databuf--;
-                gfs2_unpin(sdp, bd->bd_bh, ai);
+                gfs2_unpin(sdp, bd->bd_bh, tr);
        }
        gfs2_assert_warn(sdp, !sdp->sd_log_num_databuf);
 }
diff --git a/fs/gfs2/lops.h b/fs/gfs2/lops.h
index ba77b7da8325..87e062e05c92 100644
--- a/fs/gfs2/lops.h
+++ b/fs/gfs2/lops.h
@@ -55,12 +55,13 @@ static inline void lops_before_commit(struct gfs2_sbd *sdp)
                        gfs2_log_ops[x]->lo_before_commit(sdp);
 }
-static inline void lops_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
+static inline void lops_after_commit(struct gfs2_sbd *sdp,
+                                     struct gfs2_trans *tr)
 {
        int x;
        for (x = 0; gfs2_log_ops[x]; x++)
                if (gfs2_log_ops[x]->lo_after_commit)
-                        gfs2_log_ops[x]->lo_after_commit(sdp, ai);
+                        gfs2_log_ops[x]->lo_after_commit(sdp, tr);
 }
 static inline void lops_before_scan(struct gfs2_jdesc *jd,
diff --git a/fs/gfs2/meta_io.c b/fs/gfs2/meta_io.c
index b059bbb5059e..1a89afb68472 100644
--- a/fs/gfs2/meta_io.c
+++ b/fs/gfs2/meta_io.c
@@ -295,7 +295,7 @@ void gfs2_remove_from_journal(struct buffer_head *bh, struct gfs2_trans *tr, int
        }
        if (bd) {
                spin_lock(&sdp->sd_ail_lock);
-                if (bd->bd_ail) {
+                if (bd->bd_tr) {
                        gfs2_remove_from_ail(bd);
                        bh->b_private = NULL;
                        bd->bd_bh = NULL;
diff --git a/fs/gfs2/rgrp.c b/fs/gfs2/rgrp.c
index d1f51fd73f86..0c5a575b513e 100644
--- a/fs/gfs2/rgrp.c
+++ b/fs/gfs2/rgrp.c
@@ -576,7 +576,7 @@ int gfs2_rs_alloc(struct gfs2_inode *ip)
        RB_CLEAR_NODE(&ip->i_res->rs_node);
 out:
        up_write(&ip->i_rw_mutex);
-        return 0;
+        return error;
 }
 static void dump_rs(struct seq_file *seq, const struct gfs2_blkreserv *rs)
@@ -592,7 +592,7 @@ static void dump_rs(struct seq_file *seq, const struct gfs2_blkreserv *rs)
 * @rs: The reservation to remove
 *
 */
-static void __rs_deltree(struct gfs2_inode *ip, struct gfs2_blkreserv *rs)
+static void __rs_deltree(struct gfs2_blkreserv *rs)
 {
        struct gfs2_rgrpd *rgd;
@@ -605,7 +605,7 @@ static void __rs_deltree(struct gfs2_inode *ip, struct gfs2_blkreserv *rs)
        RB_CLEAR_NODE(&rs->rs_node);
        if (rs->rs_free) {
-                /* return reserved blocks to the rgrp and the ip */
+                /* return reserved blocks to the rgrp */
                BUG_ON(rs->rs_rbm.rgd->rd_reserved < rs->rs_free);
                rs->rs_rbm.rgd->rd_reserved -= rs->rs_free;
                rs->rs_free = 0;
@@ -619,14 +619,14 @@ static void __rs_deltree(struct gfs2_inode *ip, struct gfs2_blkreserv *rs)
 * @rs: The reservation to remove
 *
 */
-void gfs2_rs_deltree(struct gfs2_inode *ip, struct gfs2_blkreserv *rs)
+void gfs2_rs_deltree(struct gfs2_blkreserv *rs)
 {
        struct gfs2_rgrpd *rgd;
        rgd = rs->rs_rbm.rgd;
        if (rgd) {
                spin_lock(&rgd->rd_rsspin);
-                __rs_deltree(ip, rs);
+                __rs_deltree(rs);
                spin_unlock(&rgd->rd_rsspin);
        }
 }
@@ -640,7 +640,7 @@ void gfs2_rs_delete(struct gfs2_inode *ip)
 {
        down_write(&ip->i_rw_mutex);
        if (ip->i_res) {
-                gfs2_rs_deltree(ip, ip->i_res);
+                gfs2_rs_deltree(ip->i_res);
                BUG_ON(ip->i_res->rs_free);
                kmem_cache_free(gfs2_rsrv_cachep, ip->i_res);
                ip->i_res = NULL;
@@ -664,7 +664,7 @@ static void return_all_reservations(struct gfs2_rgrpd *rgd)
        spin_lock(&rgd->rd_rsspin);
        while ((n = rb_first(&rgd->rd_rstree))) {
                rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
-                __rs_deltree(NULL, rs);
+                __rs_deltree(rs);
        }
        spin_unlock(&rgd->rd_rsspin);
 }
@@ -1181,12 +1181,9 @@ int gfs2_rgrp_send_discards(struct gfs2_sbd *sdp, u64 offset,
                             const struct gfs2_bitmap *bi, unsigned minlen, u64 *ptrimmed)
 {
        struct super_block *sb = sdp->sd_vfs;
-        struct block_device *bdev = sb->s_bdev;
-        const unsigned int sects_per_blk = sdp->sd_sb.sb_bsize /
-                                           bdev_logical_block_size(sb->s_bdev);
        u64 blk;
        sector_t start = 0;
-        sector_t nr_sects = 0;
+        sector_t nr_blks = 0;
        int rv;
        unsigned int x;
        u32 trimmed = 0;
@@ -1206,35 +1203,34 @@ int gfs2_rgrp_send_discards(struct gfs2_sbd *sdp, u64 offset,
                if (diff == 0)
                        continue;
                blk = offset + ((bi->bi_start + x) * GFS2_NBBY);
-                blk *= sects_per_blk; /* convert to sectors */
                while(diff) {
                        if (diff & 1) {
-                                if (nr_sects == 0)
+                                if (nr_blks == 0)
                                        goto start_new_extent;
-                                if ((start + nr_sects) != blk) {
+                                if ((start + nr_blks) != blk) {
-                                        if (nr_sects >= minlen) {
+                                        if (nr_blks >= minlen) {
-                                                rv = blkdev_issue_discard(bdev,
+                                                rv = sb_issue_discard(sb,
-                                                        start, nr_sects,
+                                                        start, nr_blks,
                                                        GFP_NOFS, 0);
                                                if (rv)
                                                        goto fail;
-                                                trimmed += nr_sects;
+                                                trimmed += nr_blks;
                                        }
-                                        nr_sects = 0;
+                                        nr_blks = 0;
 start_new_extent:
                                        start = blk;
                                }
-                                nr_sects += sects_per_blk;
+                                nr_blks++;
                        }
                        diff >>= 2;
-                        blk += sects_per_blk;
+                        blk++;
                }
        }
-        if (nr_sects >= minlen) {
+        if (nr_blks >= minlen) {
-                rv = blkdev_issue_discard(bdev, start, nr_sects, GFP_NOFS, 0);
+                rv = sb_issue_discard(sb, start, nr_blks, GFP_NOFS, 0);
                if (rv)
                        goto fail;
-                trimmed += nr_sects;
+                trimmed += nr_blks;
        }
        if (ptrimmed)
                *ptrimmed = trimmed;
@@ -1878,7 +1874,7 @@ int gfs2_inplace_reserve(struct gfs2_inode *ip, u32 requested, u32 aflags)
                /* Drop reservation, if we couldn't use reserved rgrp */
                if (gfs2_rs_active(rs))
-                        gfs2_rs_deltree(ip, rs);
+                        gfs2_rs_deltree(rs);
 check_rgrp:
                /* Check for unlinked inodes which can be reclaimed */
                if (rs->rs_rbm.rgd->rd_flags & GFS2_RDF_CHECK)
@@ -2091,7 +2087,7 @@ static void gfs2_adjust_reservation(struct gfs2_inode *ip,
                        if (rs->rs_free && !ret)
                                goto out;
                }
-                __rs_deltree(ip, rs);
+                __rs_deltree(rs);
        }
 out:
        spin_unlock(&rgd->rd_rsspin);
@@ -2184,13 +2180,7 @@ int gfs2_alloc_blocks(struct gfs2_inode *ip, u64 *bn, unsigned int *nblocks,
        if (dinode)
                gfs2_trans_add_unrevoke(sdp, block, 1);
-        /*
+        gfs2_quota_change(ip, *nblocks, ip->i_inode.i_uid, ip->i_inode.i_gid);
-         * This needs reviewing to see why we cannot do the quota change
-         * at this point in the dinode case.
-         */
-        if (ndata)
-                gfs2_quota_change(ip, ndata, ip->i_inode.i_uid,
-                                  ip->i_inode.i_gid);
        rbm.rgd->rd_free_clone -= *nblocks;
        trace_gfs2_block_alloc(ip, rbm.rgd, block, *nblocks,
diff --git a/fs/gfs2/rgrp.h b/fs/gfs2/rgrp.h
index 842185853f6b..5b3f4a896e6c 100644
--- a/fs/gfs2/rgrp.h
+++ b/fs/gfs2/rgrp.h
@@ -47,7 +47,7 @@ extern int gfs2_alloc_blocks(struct gfs2_inode *ip, u64 *bn, unsigned int *n,
                             bool dinode, u64 *generation);
 extern int gfs2_rs_alloc(struct gfs2_inode *ip);
-extern void gfs2_rs_deltree(struct gfs2_inode *ip, struct gfs2_blkreserv *rs);
+extern void gfs2_rs_deltree(struct gfs2_blkreserv *rs);
 extern void gfs2_rs_delete(struct gfs2_inode *ip);
 extern void __gfs2_free_blocks(struct gfs2_inode *ip, u64 bstart, u32 blen, int meta);
 extern void gfs2_free_meta(struct gfs2_inode *ip, u64 bstart, u32 blen);
diff --git a/fs/gfs2/super.c b/fs/gfs2/super.c
index cab77b8ba84f..917c8e1eb4ae 100644
--- a/fs/gfs2/super.c
+++ b/fs/gfs2/super.c
@@ -1512,7 +1512,7 @@ out_truncate:
 out_unlock:
        /* Error path for case 1 */
        if (gfs2_rs_active(ip->i_res))
-                gfs2_rs_deltree(ip, ip->i_res);
+                gfs2_rs_deltree(ip->i_res);
        if (test_bit(HIF_HOLDER, &ip->i_iopen_gh.gh_iflags))
                gfs2_glock_dq(&ip->i_iopen_gh);
diff --git a/fs/gfs2/trace_gfs2.h b/fs/gfs2/trace_gfs2.h
index 2ee13e841e9f..20c007d747ab 100644
--- a/fs/gfs2/trace_gfs2.h
+++ b/fs/gfs2/trace_gfs2.h
@@ -159,9 +159,9 @@ TRACE_EVENT(gfs2_glock_put,
 /* Callback (local or remote) requesting lock demotion */
 TRACE_EVENT(gfs2_demote_rq,
-        TP_PROTO(const struct gfs2_glock *gl),
+        TP_PROTO(const struct gfs2_glock *gl, bool remote),
-        TP_ARGS(gl),
+        TP_ARGS(gl, remote),
        TP_STRUCT__entry(
                __field(        dev_t,  dev                     )
@@ -170,6 +170,7 @@ TRACE_EVENT(gfs2_demote_rq,
                __field(        u8,     cur_state               )
                __field(        u8,     dmt_state               )
                __field(        unsigned long,  flags           )
+                __field(        bool,   remote                  )
        ),
        TP_fast_assign(
@@ -179,14 +180,16 @@ TRACE_EVENT(gfs2_demote_rq,
                __entry->cur_state      = glock_trace_state(gl->gl_state);
                __entry->dmt_state      = glock_trace_state(gl->gl_demote_state);
                __entry->flags          = gl->gl_flags  | (gl->gl_object ? (1UL<<GLF_OBJECT) : 0);
+                __entry->remote         = remote;
        ),
-        TP_printk("%u,%u glock %d:%lld demote %s to %s flags:%s",
+        TP_printk("%u,%u glock %d:%lld demote %s to %s flags:%s %s",
                  MAJOR(__entry->dev), MINOR(__entry->dev), __entry->gltype,
                  (unsigned long long)__entry->glnum,
                  glock_trace_name(__entry->cur_state),
                  glock_trace_name(__entry->dmt_state),
-                  show_glock_flags(__entry->flags))
+                  show_glock_flags(__entry->flags),
+                  __entry->remote ? "remote" : "local")
 );
diff --git a/fs/gfs2/trans.c b/fs/gfs2/trans.c
index 88162fae27a5..7374907742a8 100644
--- a/fs/gfs2/trans.c
+++ b/fs/gfs2/trans.c
@@ -96,7 +96,8 @@ static void gfs2_log_release(struct gfs2_sbd *sdp, unsigned int blks)
 static void gfs2_print_trans(const struct gfs2_trans *tr)
 {
-        print_symbol(KERN_WARNING "GFS2: Transaction created at: %s\n", tr->tr_ip);
+        printk(KERN_WARNING "GFS2: Transaction created at: %pSR\n",
+               (void *)tr->tr_ip);
        printk(KERN_WARNING "GFS2: blocks=%u revokes=%u reserved=%u touched=%d\n",
               tr->tr_blocks, tr->tr_revokes, tr->tr_reserved, tr->tr_touched);
        printk(KERN_WARNING "GFS2: Buf %u/%u Databuf %u/%u Revoke %u/%u\n",
@@ -135,8 +136,10 @@ void gfs2_trans_end(struct gfs2_sbd *sdp)
        if (tr->tr_t_gh.gh_gl) {
                gfs2_glock_dq(&tr->tr_t_gh);
                gfs2_holder_uninit(&tr->tr_t_gh);
-                kfree(tr);
+                if (!tr->tr_attached)
+                        kfree(tr);
        }
+        up_read(&sdp->sd_log_flush_lock);
        if (sdp->sd_vfs->s_flags & MS_SYNCHRONOUS)
                gfs2_log_flush(sdp, NULL);
diff --git a/fs/hfs/bfind.c b/fs/hfs/bfind.c
index 571abe97b42a..de69d8a24f6d 100644
--- a/fs/hfs/bfind.c
+++ b/fs/hfs/bfind.c
@@ -22,7 +22,8 @@ int hfs_find_init(struct hfs_btree *tree, struct hfs_find_data *fd)
                return -ENOMEM;
        fd->search_key = ptr;
        fd->key = ptr + tree->max_key_len + 2;
-        dprint(DBG_BNODE_REFS, "find_init: %d (%p)\n", tree->cnid, __builtin_return_address(0));
+        hfs_dbg(BNODE_REFS, "find_init: %d (%p)\n",
+                tree->cnid, __builtin_return_address(0));
        mutex_lock(&tree->tree_lock);
        return 0;
 }
@@ -31,7 +32,8 @@ void hfs_find_exit(struct hfs_find_data *fd)
 {
        hfs_bnode_put(fd->bnode);
        kfree(fd->search_key);
-        dprint(DBG_BNODE_REFS, "find_exit: %d (%p)\n", fd->tree->cnid, __builtin_return_address(0));
+        hfs_dbg(BNODE_REFS, "find_exit: %d (%p)\n",
+                fd->tree->cnid, __builtin_return_address(0));
        mutex_unlock(&fd->tree->tree_lock);
        fd->tree = NULL;
 }
@@ -135,8 +137,8 @@ int hfs_brec_find(struct hfs_find_data *fd)
        return res;
 invalid:
-        printk(KERN_ERR "hfs: inconsistency in B*Tree (%d,%d,%d,%u,%u)\n",
+        pr_err("inconsistency in B*Tree (%d,%d,%d,%u,%u)\n",
-                height, bnode->height, bnode->type, nidx, parent);
+               height, bnode->height, bnode->type, nidx, parent);
        res = -EIO;
 release:
        hfs_bnode_put(bnode);
diff --git a/fs/hfs/bitmap.c b/fs/hfs/bitmap.c
index c6e97366e8ac..28307bc9ec1e 100644
--- a/fs/hfs/bitmap.c
+++ b/fs/hfs/bitmap.c
@@ -158,7 +158,7 @@ u32 hfs_vbm_search_free(struct super_block *sb, u32 goal, u32 *num_bits)
                }
        }
-        dprint(DBG_BITMAP, "alloc_bits: %u,%u\n", pos, *num_bits);
+        hfs_dbg(BITMAP, "alloc_bits: %u,%u\n", pos, *num_bits);
        HFS_SB(sb)->free_ablocks -= *num_bits;
        hfs_bitmap_dirty(sb);
 out:
@@ -200,7 +200,7 @@ int hfs_clear_vbm_bits(struct super_block *sb, u16 start, u16 count)
        if (!count)
                return 0;
-        dprint(DBG_BITMAP, "clear_bits: %u,%u\n", start, count);
+        hfs_dbg(BITMAP, "clear_bits: %u,%u\n", start, count);
        /* are all of the bits in range? */
        if ((start + count) > HFS_SB(sb)->fs_ablocks)
                return -2;
diff --git a/fs/hfs/bnode.c b/fs/hfs/bnode.c
index cdb41a1f6a64..f3b1a15ccd59 100644
--- a/fs/hfs/bnode.c
+++ b/fs/hfs/bnode.c
@@ -100,7 +100,7 @@ void hfs_bnode_copy(struct hfs_bnode *dst_node, int dst,
        struct hfs_btree *tree;
        struct page *src_page, *dst_page;
-        dprint(DBG_BNODE_MOD, "copybytes: %u,%u,%u\n", dst, src, len);
+        hfs_dbg(BNODE_MOD, "copybytes: %u,%u,%u\n", dst, src, len);
        if (!len)
                return;
        tree = src_node->tree;
@@ -120,7 +120,7 @@ void hfs_bnode_move(struct hfs_bnode *node, int dst, int src, int len)
        struct page *page;
        void *ptr;
-        dprint(DBG_BNODE_MOD, "movebytes: %u,%u,%u\n", dst, src, len);
+        hfs_dbg(BNODE_MOD, "movebytes: %u,%u,%u\n", dst, src, len);
        if (!len)
                return;
        src += node->page_offset;
@@ -138,16 +138,16 @@ void hfs_bnode_dump(struct hfs_bnode *node)
        __be32 cnid;
        int i, off, key_off;
-        dprint(DBG_BNODE_MOD, "bnode: %d\n", node->this);
+        hfs_dbg(BNODE_MOD, "bnode: %d\n", node->this);
        hfs_bnode_read(node, &desc, 0, sizeof(desc));
-        dprint(DBG_BNODE_MOD, "%d, %d, %d, %d, %d\n",
+        hfs_dbg(BNODE_MOD, "%d, %d, %d, %d, %d\n",
                be32_to_cpu(desc.next), be32_to_cpu(desc.prev),
                desc.type, desc.height, be16_to_cpu(desc.num_recs));
        off = node->tree->node_size - 2;
        for (i = be16_to_cpu(desc.num_recs); i >= 0; off -= 2, i--) {
                key_off = hfs_bnode_read_u16(node, off);
-                dprint(DBG_BNODE_MOD, " %d", key_off);
+                hfs_dbg_cont(BNODE_MOD, " %d", key_off);
                if (i && node->type == HFS_NODE_INDEX) {
                        int tmp;
@@ -155,17 +155,18 @@ void hfs_bnode_dump(struct hfs_bnode *node)
                                tmp = (hfs_bnode_read_u8(node, key_off) | 1) + 1;
                        else
                                tmp = node->tree->max_key_len + 1;
-                        dprint(DBG_BNODE_MOD, " (%d,%d", tmp, hfs_bnode_read_u8(node, key_off));
+                        hfs_dbg_cont(BNODE_MOD, " (%d,%d",
+                                     tmp, hfs_bnode_read_u8(node, key_off));
                        hfs_bnode_read(node, &cnid, key_off + tmp, 4);
-                        dprint(DBG_BNODE_MOD, ",%d)", be32_to_cpu(cnid));
+                        hfs_dbg_cont(BNODE_MOD, ",%d)", be32_to_cpu(cnid));
                } else if (i && node->type == HFS_NODE_LEAF) {
                        int tmp;
                        tmp = hfs_bnode_read_u8(node, key_off);
-                        dprint(DBG_BNODE_MOD, " (%d)", tmp);
+                        hfs_dbg_cont(BNODE_MOD, " (%d)", tmp);
                }
        }
-        dprint(DBG_BNODE_MOD, "\n");
+        hfs_dbg_cont(BNODE_MOD, "\n");
 }
 void hfs_bnode_unlink(struct hfs_bnode *node)
@@ -220,7 +221,7 @@ struct hfs_bnode *hfs_bnode_findhash(struct hfs_btree *tree, u32 cnid)
        struct hfs_bnode *node;
        if (cnid >= tree->node_count) {
-                printk(KERN_ERR "hfs: request for non-existent node %d in B*Tree\n", cnid);
+                pr_err("request for non-existent node %d in B*Tree\n", cnid);
                return NULL;
        }
@@ -243,7 +244,7 @@ static struct hfs_bnode *__hfs_bnode_create(struct hfs_btree *tree, u32 cnid)
        loff_t off;
        if (cnid >= tree->node_count) {
-                printk(KERN_ERR "hfs: request for non-existent node %d in B*Tree\n", cnid);
+                pr_err("request for non-existent node %d in B*Tree\n", cnid);
                return NULL;
        }
@@ -257,8 +258,8 @@ static struct hfs_bnode *__hfs_bnode_create(struct hfs_btree *tree, u32 cnid)
        node->this = cnid;
        set_bit(HFS_BNODE_NEW, &node->flags);
        atomic_set(&node->refcnt, 1);
-        dprint(DBG_BNODE_REFS, "new_node(%d:%d): 1\n",
+        hfs_dbg(BNODE_REFS, "new_node(%d:%d): 1\n",
-               node->tree->cnid, node->this);
+                node->tree->cnid, node->this);
        init_waitqueue_head(&node->lock_wq);
        spin_lock(&tree->hash_lock);
        node2 = hfs_bnode_findhash(tree, cnid);
@@ -301,7 +302,7 @@ void hfs_bnode_unhash(struct hfs_bnode *node)
 {
        struct hfs_bnode **p;
-        dprint(DBG_BNODE_REFS, "remove_node(%d:%d): %d\n",
+        hfs_dbg(BNODE_REFS, "remove_node(%d:%d): %d\n",
                node->tree->cnid, node->this, atomic_read(&node->refcnt));
        for (p = &node->tree->node_hash[hfs_bnode_hash(node->this)];
             *p && *p != node; p = &(*p)->next_hash)
@@ -443,8 +444,9 @@ void hfs_bnode_get(struct hfs_bnode *node)
 {
        if (node) {
                atomic_inc(&node->refcnt);
-                dprint(DBG_BNODE_REFS, "get_node(%d:%d): %d\n",
+                hfs_dbg(BNODE_REFS, "get_node(%d:%d): %d\n",
-                       node->tree->cnid, node->this, atomic_read(&node->refcnt));
+                        node->tree->cnid, node->this,
+                        atomic_read(&node->refcnt));
        }
 }
@@ -455,8 +457,9 @@ void hfs_bnode_put(struct hfs_bnode *node)
                struct hfs_btree *tree = node->tree;
                int i;
-                dprint(DBG_BNODE_REFS, "put_node(%d:%d): %d\n",
+                hfs_dbg(BNODE_REFS, "put_node(%d:%d): %d\n",
-                       node->tree->cnid, node->this, atomic_read(&node->refcnt));
+                        node->tree->cnid, node->this,
+                        atomic_read(&node->refcnt));
                BUG_ON(!atomic_read(&node->refcnt));
                if (!atomic_dec_and_lock(&node->refcnt, &tree->hash_lock))
                        return;
diff --git a/fs/hfs/brec.c b/fs/hfs/brec.c
index 92fb358ce824..9f4ee7f52026 100644
--- a/fs/hfs/brec.c
+++ b/fs/hfs/brec.c
@@ -47,15 +47,13 @@ u16 hfs_brec_keylen(struct hfs_bnode *node, u16 rec)
                if (node->tree->attributes & HFS_TREE_BIGKEYS) {
                        retval = hfs_bnode_read_u16(node, recoff) + 2;
                        if (retval > node->tree->max_key_len + 2) {
-                                printk(KERN_ERR "hfs: keylen %d too large\n",
+                                pr_err("keylen %d too large\n", retval);
-                                        retval);
                                retval = 0;
                        }
                } else {
                        retval = (hfs_bnode_read_u8(node, recoff) | 1) + 1;
                        if (retval > node->tree->max_key_len + 1) {
-                                printk(KERN_ERR "hfs: keylen %d too large\n",
+                                pr_err("keylen %d too large\n", retval);
-                                        retval);
                                retval = 0;
                        }
                }
@@ -94,7 +92,8 @@ again:
        end_rec_off = tree->node_size - (node->num_recs + 1) * 2;
        end_off = hfs_bnode_read_u16(node, end_rec_off);
        end_rec_off -= 2;
-        dprint(DBG_BNODE_MOD, "insert_rec: %d, %d, %d, %d\n", rec, size, end_off, end_rec_off);
+        hfs_dbg(BNODE_MOD, "insert_rec: %d, %d, %d, %d\n",
+                rec, size, end_off, end_rec_off);
        if (size > end_rec_off - end_off) {
                if (new_node)
                        panic("not enough room!\n");
@@ -190,7 +189,8 @@ again:
                mark_inode_dirty(tree->inode);
        }
        hfs_bnode_dump(node);
-        dprint(DBG_BNODE_MOD, "remove_rec: %d, %d\n", fd->record, fd->keylength + fd->entrylength);
+        hfs_dbg(BNODE_MOD, "remove_rec: %d, %d\n",
+                fd->record, fd->keylength + fd->entrylength);
        if (!--node->num_recs) {
                hfs_bnode_unlink(node);
                if (!node->parent)
@@ -240,7 +240,7 @@ static struct hfs_bnode *hfs_bnode_split(struct hfs_find_data *fd)
        if (IS_ERR(new_node))
                return new_node;
        hfs_bnode_get(node);
-        dprint(DBG_BNODE_MOD, "split_nodes: %d - %d - %d\n",
+        hfs_dbg(BNODE_MOD, "split_nodes: %d - %d - %d\n",
                node->this, new_node->this, node->next);
        new_node->next = node->next;
        new_node->prev = node->this;
@@ -374,7 +374,8 @@ again:
                newkeylen = (hfs_bnode_read_u8(node, 14) | 1) + 1;
        else
                fd->keylength = newkeylen = tree->max_key_len + 1;
-        dprint(DBG_BNODE_MOD, "update_rec: %d, %d, %d\n", rec, fd->keylength, newkeylen);
+        hfs_dbg(BNODE_MOD, "update_rec: %d, %d, %d\n",
+                rec, fd->keylength, newkeylen);
        rec_off = tree->node_size - (rec + 2) * 2;
        end_rec_off = tree->node_size - (parent->num_recs + 1) * 2;
@@ -385,7 +386,7 @@ again:
                end_off = hfs_bnode_read_u16(parent, end_rec_off);
                if (end_rec_off - end_off < diff) {
-                        printk(KERN_DEBUG "hfs: splitting index node...\n");
+                        printk(KERN_DEBUG "splitting index node...\n");
                        fd->bnode = parent;
                        new_node = hfs_bnode_split(fd);
                        if (IS_ERR(new_node))
diff --git a/fs/hfs/btree.c b/fs/hfs/btree.c
index 1cbdeea1db44..1ab19e660e69 100644
--- a/fs/hfs/btree.c
+++ b/fs/hfs/btree.c
@@ -48,7 +48,7 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id, btree_keycmp ke
                                    mdb->drXTFlSize, be32_to_cpu(mdb->drXTClpSiz));
                if (HFS_I(tree->inode)->alloc_blocks >
                                        HFS_I(tree->inode)->first_blocks) {
-                        printk(KERN_ERR "hfs: invalid btree extent records\n");
+                        pr_err("invalid btree extent records\n");
                        unlock_new_inode(tree->inode);
                        goto free_inode;
                }
@@ -60,8 +60,7 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id, btree_keycmp ke
                                    mdb->drCTFlSize, be32_to_cpu(mdb->drCTClpSiz));
                if (!HFS_I(tree->inode)->first_blocks) {
-                        printk(KERN_ERR "hfs: invalid btree extent records "
+                        pr_err("invalid btree extent records (0 size)\n");
-                                                                "(0 size).\n");
                        unlock_new_inode(tree->inode);
                        goto free_inode;
                }
@@ -100,15 +99,15 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id, btree_keycmp ke
        switch (id) {
        case HFS_EXT_CNID:
                if (tree->max_key_len != HFS_MAX_EXT_KEYLEN) {
-                        printk(KERN_ERR "hfs: invalid extent max_key_len %d\n",
+                        pr_err("invalid extent max_key_len %d\n",
-                                tree->max_key_len);
+                               tree->max_key_len);
                        goto fail_page;
                }
                break;
        case HFS_CAT_CNID:
                if (tree->max_key_len != HFS_MAX_CAT_KEYLEN) {
-                        printk(KERN_ERR "hfs: invalid catalog max_key_len %d\n",
+                        pr_err("invalid catalog max_key_len %d\n",
-                                tree->max_key_len);
+                               tree->max_key_len);
                        goto fail_page;
                }
                break;
@@ -146,8 +145,9 @@ void hfs_btree_close(struct hfs_btree *tree)
                while ((node = tree->node_hash[i])) {
                        tree->node_hash[i] = node->next_hash;
                        if (atomic_read(&node->refcnt))
-                                printk(KERN_ERR "hfs: node %d:%d still has %d user(s)!\n",
+                                pr_err("node %d:%d still has %d user(s)!\n",
-                                        node->tree->cnid, node->this, atomic_read(&node->refcnt));
+                                       node->tree->cnid, node->this,
+                                       atomic_read(&node->refcnt));
                        hfs_bnode_free(node);
                        tree->node_hash_cnt--;
                }
@@ -290,7 +290,7 @@ struct hfs_bnode *hfs_bmap_alloc(struct hfs_btree *tree)
                kunmap(*pagep);
                nidx = node->next;
                if (!nidx) {
-                        printk(KERN_DEBUG "hfs: create new bmap node...\n");
+                        printk(KERN_DEBUG "create new bmap node...\n");
                        next_node = hfs_bmap_new_bmap(node, idx);
                } else
                        next_node = hfs_bnode_find(tree, nidx);
@@ -316,7 +316,7 @@ void hfs_bmap_free(struct hfs_bnode *node)
        u32 nidx;
        u8 *data, byte, m;
-        dprint(DBG_BNODE_MOD, "btree_free_node: %u\n", node->this);
+        hfs_dbg(BNODE_MOD, "btree_free_node: %u\n", node->this);
        tree = node->tree;
        nidx = node->this;
        node = hfs_bnode_find(tree, 0);
@@ -331,7 +331,8 @@ void hfs_bmap_free(struct hfs_bnode *node)
                hfs_bnode_put(node);
                if (!i) {
                        /* panic */;
-                        printk(KERN_CRIT "hfs: unable to free bnode %u. bmap not found!\n", node->this);
+                        pr_crit("unable to free bnode %u. bmap not found!\n",
+                                node->this);
                        return;
                }
                node = hfs_bnode_find(tree, i);
@@ -339,7 +340,8 @@ void hfs_bmap_free(struct hfs_bnode *node)
                        return;
                if (node->type != HFS_NODE_MAP) {
                        /* panic */;
-                        printk(KERN_CRIT "hfs: invalid bmap found! (%u,%d)\n", node->this, node->type);
+                        pr_crit("invalid bmap found! (%u,%d)\n",
+                                node->this, node->type);
                        hfs_bnode_put(node);
                        return;
                }
@@ -352,7 +354,8 @@ void hfs_bmap_free(struct hfs_bnode *node)
        m = 1 << (~nidx & 7);
        byte = data[off];
        if (!(byte & m)) {
-                printk(KERN_CRIT "hfs: trying to free free bnode %u(%d)\n", node->this, node->type);
+                pr_crit("trying to free free bnode %u(%d)\n",
+                        node->this, node->type);
                kunmap(page);
                hfs_bnode_put(node);
                return;
diff --git a/fs/hfs/catalog.c b/fs/hfs/catalog.c
index 424b0337f524..ff0316b925a5 100644
--- a/fs/hfs/catalog.c
+++ b/fs/hfs/catalog.c
@@ -87,12 +87,15 @@ int hfs_cat_create(u32 cnid, struct inode *dir, struct qstr *str, struct inode *
        int entry_size;
        int err;
-        dprint(DBG_CAT_MOD, "create_cat: %s,%u(%d)\n", str->name, cnid, inode->i_nlink);
+        hfs_dbg(CAT_MOD, "create_cat: %s,%u(%d)\n",
+                str->name, cnid, inode->i_nlink);
        if (dir->i_size >= HFS_MAX_VALENCE)
                return -ENOSPC;
        sb = dir->i_sb;
-        hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        err = hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        if (err)
+                return err;
        hfs_cat_build_key(sb, fd.search_key, cnid, NULL);
        entry_size = hfs_cat_build_thread(sb, &entry, S_ISDIR(inode->i_mode) ?
@@ -184,14 +187,14 @@ int hfs_cat_find_brec(struct super_block *sb, u32 cnid,
        type = rec.type;
        if (type != HFS_CDR_THD && type != HFS_CDR_FTH) {
-                printk(KERN_ERR "hfs: found bad thread record in catalog\n");
+                pr_err("found bad thread record in catalog\n");
                return -EIO;
        }
        fd->search_key->cat.ParID = rec.thread.ParID;
        len = fd->search_key->cat.CName.len = rec.thread.CName.len;
        if (len > HFS_NAMELEN) {
-                printk(KERN_ERR "hfs: bad catalog namelength\n");
+                pr_err("bad catalog namelength\n");
                return -EIO;
        }
        memcpy(fd->search_key->cat.CName.name, rec.thread.CName.name, len);
@@ -212,9 +215,11 @@ int hfs_cat_delete(u32 cnid, struct inode *dir, struct qstr *str)
        struct list_head *pos;
        int res, type;
-        dprint(DBG_CAT_MOD, "delete_cat: %s,%u\n", str ? str->name : NULL, cnid);
+        hfs_dbg(CAT_MOD, "delete_cat: %s,%u\n", str ? str->name : NULL, cnid);
        sb = dir->i_sb;
-        hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        res = hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        if (res)
+                return res;
        hfs_cat_build_key(sb, fd.search_key, dir->i_ino, str);
        res = hfs_brec_find(&fd);
@@ -278,10 +283,13 @@ int hfs_cat_move(u32 cnid, struct inode *src_dir, struct qstr *src_name,
        int entry_size, type;
        int err;
-        dprint(DBG_CAT_MOD, "rename_cat: %u - %lu,%s - %lu,%s\n", cnid, src_dir->i_ino, src_name->name,
+        hfs_dbg(CAT_MOD, "rename_cat: %u - %lu,%s - %lu,%s\n",
+                cnid, src_dir->i_ino, src_name->name,
                dst_dir->i_ino, dst_name->name);
        sb = src_dir->i_sb;
-        hfs_find_init(HFS_SB(sb)->cat_tree, &src_fd);
+        err = hfs_find_init(HFS_SB(sb)->cat_tree, &src_fd);
+        if (err)
+                return err;
        dst_fd = src_fd;
        /* find the old dir entry and read the data */
diff --git a/fs/hfs/dir.c b/fs/hfs/dir.c
index 5f7f1abd5f6d..17c22a8fd40a 100644
--- a/fs/hfs/dir.c
+++ b/fs/hfs/dir.c
@@ -25,7 +25,9 @@ static struct dentry *hfs_lookup(struct inode *dir, struct dentry *dentry,
        struct inode *inode = NULL;
        int res;
-        hfs_find_init(HFS_SB(dir->i_sb)->cat_tree, &fd);
+        res = hfs_find_init(HFS_SB(dir->i_sb)->cat_tree, &fd);
+        if (res)
+                return ERR_PTR(res);
        hfs_cat_build_key(dir->i_sb, fd.search_key, dir->i_ino, &dentry->d_name);
        res = hfs_brec_read(&fd, &rec, sizeof(rec));
        if (res) {
@@ -63,7 +65,9 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
        if (filp->f_pos >= inode->i_size)
                return 0;
-        hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        err = hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        if (err)
+                return err;
        hfs_cat_build_key(sb, fd.search_key, inode->i_ino, NULL);
        err = hfs_brec_find(&fd);
        if (err)
@@ -84,12 +88,12 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
                hfs_bnode_read(fd.bnode, &entry, fd.entryoffset, fd.entrylength);
                if (entry.type != HFS_CDR_THD) {
-                        printk(KERN_ERR "hfs: bad catalog folder thread\n");
+                        pr_err("bad catalog folder thread\n");
                        err = -EIO;
                        goto out;
                }
                //if (fd.entrylength < HFS_MIN_THREAD_SZ) {
-                //      printk(KERN_ERR "hfs: truncated catalog thread\n");
+                //      pr_err("truncated catalog thread\n");
                //      err = -EIO;
                //      goto out;
                //}
@@ -108,7 +112,7 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
        for (;;) {
                if (be32_to_cpu(fd.key->cat.ParID) != inode->i_ino) {
-                        printk(KERN_ERR "hfs: walked past end of dir\n");
+                        pr_err("walked past end of dir\n");
                        err = -EIO;
                        goto out;
                }
@@ -123,7 +127,7 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
                len = hfs_mac2asc(sb, strbuf, &fd.key->cat.CName);
                if (type == HFS_CDR_DIR) {
                        if (fd.entrylength < sizeof(struct hfs_cat_dir)) {
-                                printk(KERN_ERR "hfs: small dir entry\n");
+                                pr_err("small dir entry\n");
                                err = -EIO;
                                goto out;
                        }
@@ -132,7 +136,7 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
                                break;
                } else if (type == HFS_CDR_FIL) {
                        if (fd.entrylength < sizeof(struct hfs_cat_file)) {
-                                printk(KERN_ERR "hfs: small file entry\n");
+                                pr_err("small file entry\n");
                                err = -EIO;
                                goto out;
                        }
@@ -140,7 +144,7 @@ static int hfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
                                    be32_to_cpu(entry.file.FlNum), DT_REG))
                                break;
                } else {
-                        printk(KERN_ERR "hfs: bad catalog entry type %d\n", type);
+                        pr_err("bad catalog entry type %d\n", type);
                        err = -EIO;
                        goto out;
                }
diff --git a/fs/hfs/extent.c b/fs/hfs/extent.c
index a67955a0c36f..e33a0d36a93e 100644
--- a/fs/hfs/extent.c
+++ b/fs/hfs/extent.c
@@ -107,7 +107,7 @@ static u16 hfs_ext_lastblock(struct hfs_extent *ext)
        return be16_to_cpu(ext->block) + be16_to_cpu(ext->count);
 }
-static void __hfs_ext_write_extent(struct inode *inode, struct hfs_find_data *fd)
+static int __hfs_ext_write_extent(struct inode *inode, struct hfs_find_data *fd)
 {
        int res;
@@ -116,26 +116,31 @@ static void __hfs_ext_write_extent(struct inode *inode, struct hfs_find_data *fd
        res = hfs_brec_find(fd);
        if (HFS_I(inode)->flags & HFS_FLG_EXT_NEW) {
                if (res != -ENOENT)
-                        return;
+                        return res;
                hfs_brec_insert(fd, HFS_I(inode)->cached_extents, sizeof(hfs_extent_rec));
                HFS_I(inode)->flags &= ~(HFS_FLG_EXT_DIRTY|HFS_FLG_EXT_NEW);
        } else {
                if (res)
-                        return;
+                        return res;
                hfs_bnode_write(fd->bnode, HFS_I(inode)->cached_extents, fd->entryoffset, fd->entrylength);
                HFS_I(inode)->flags &= ~HFS_FLG_EXT_DIRTY;
        }
+        return 0;
 }
-void hfs_ext_write_extent(struct inode *inode)
+int hfs_ext_write_extent(struct inode *inode)
 {
        struct hfs_find_data fd;
+        int res = 0;
        if (HFS_I(inode)->flags & HFS_FLG_EXT_DIRTY) {
-                hfs_find_init(HFS_SB(inode->i_sb)->ext_tree, &fd);
+                res = hfs_find_init(HFS_SB(inode->i_sb)->ext_tree, &fd);
-                __hfs_ext_write_extent(inode, &fd);
+                if (res)
+                        return res;
+                res = __hfs_ext_write_extent(inode, &fd);
                hfs_find_exit(&fd);
        }
+        return res;
 }
 static inline int __hfs_ext_read_extent(struct hfs_find_data *fd, struct hfs_extent *extent,
@@ -161,8 +166,11 @@ static inline int __hfs_ext_cache_extent(struct hfs_find_data *fd, struct inode
 {
        int res;
-        if (HFS_I(inode)->flags & HFS_FLG_EXT_DIRTY)
+        if (HFS_I(inode)->flags & HFS_FLG_EXT_DIRTY) {
-                __hfs_ext_write_extent(inode, fd);
+                res = __hfs_ext_write_extent(inode, fd);
+                if (res)
+                        return res;
+        }
        res = __hfs_ext_read_extent(fd, HFS_I(inode)->cached_extents, inode->i_ino,
                                    block, HFS_IS_RSRC(inode) ? HFS_FK_RSRC : HFS_FK_DATA);
@@ -185,9 +193,11 @@ static int hfs_ext_read_extent(struct inode *inode, u16 block)
            block < HFS_I(inode)->cached_start + HFS_I(inode)->cached_blocks)
                return 0;
-        hfs_find_init(HFS_SB(inode->i_sb)->ext_tree, &fd);
+        res = hfs_find_init(HFS_SB(inode->i_sb)->ext_tree, &fd);
-        res = __hfs_ext_cache_extent(&fd, inode, block);
+        if (!res) {
-        hfs_find_exit(&fd);
+                res = __hfs_ext_cache_extent(&fd, inode, block);
+                hfs_find_exit(&fd);
+        }
        return res;
 }
@@ -195,11 +205,12 @@ static void hfs_dump_extent(struct hfs_extent *extent)
 {
        int i;
-        dprint(DBG_EXTENT, "   ");
+        hfs_dbg(EXTENT, "   ");
        for (i = 0; i < 3; i++)
-                dprint(DBG_EXTENT, " %u:%u", be16_to_cpu(extent[i].block),
+                hfs_dbg_cont(EXTENT, " %u:%u",
-                                 be16_to_cpu(extent[i].count));
+                             be16_to_cpu(extent[i].block),
-        dprint(DBG_EXTENT, "\n");
+                             be16_to_cpu(extent[i].count));
+        hfs_dbg_cont(EXTENT, "\n");
 }
 static int hfs_add_extent(struct hfs_extent *extent, u16 offset,
@@ -298,7 +309,9 @@ int hfs_free_fork(struct super_block *sb, struct hfs_cat_file *file, int type)
        if (total_blocks == blocks)
                return 0;
-        hfs_find_init(HFS_SB(sb)->ext_tree, &fd);
+        res = hfs_find_init(HFS_SB(sb)->ext_tree, &fd);
+        if (res)
+                return res;
        do {
                res = __hfs_ext_read_extent(&fd, extent, cnid, total_blocks, type);
                if (res)
@@ -392,10 +405,10 @@ int hfs_extend_file(struct inode *inode)
                goto out;
        }
-        dprint(DBG_EXTENT, "extend %lu: %u,%u\n", inode->i_ino, start, len);
+        hfs_dbg(EXTENT, "extend %lu: %u,%u\n", inode->i_ino, start, len);
        if (HFS_I(inode)->alloc_blocks == HFS_I(inode)->first_blocks) {
                if (!HFS_I(inode)->first_blocks) {
-                        dprint(DBG_EXTENT, "first extents\n");
+                        hfs_dbg(EXTENT, "first extents\n");
                        /* no extents yet */
                        HFS_I(inode)->first_extents[0].block = cpu_to_be16(start);
                        HFS_I(inode)->first_extents[0].count = cpu_to_be16(len);
@@ -437,8 +450,10 @@ out:
        return res;
 insert_extent:
-        dprint(DBG_EXTENT, "insert new extent\n");
+        hfs_dbg(EXTENT, "insert new extent\n");
-        hfs_ext_write_extent(inode);
+        res = hfs_ext_write_extent(inode);
+        if (res)
+                goto out;
        memset(HFS_I(inode)->cached_extents, 0, sizeof(hfs_extent_rec));
        HFS_I(inode)->cached_extents[0].block = cpu_to_be16(start);
@@ -460,13 +475,13 @@ void hfs_file_truncate(struct inode *inode)
        u32 size;
        int res;
-        dprint(DBG_INODE, "truncate: %lu, %Lu -> %Lu\n", inode->i_ino,
+        hfs_dbg(INODE, "truncate: %lu, %Lu -> %Lu\n",
-               (long long)HFS_I(inode)->phys_size, inode->i_size);
+                inode->i_ino, (long long)HFS_I(inode)->phys_size,
+                inode->i_size);
        if (inode->i_size > HFS_I(inode)->phys_size) {
                struct address_space *mapping = inode->i_mapping;
                void *fsdata;
                struct page *page;
-                int res;
                /* XXX: Can use generic_cont_expand? */
                size = inode->i_size - 1;
@@ -488,7 +503,12 @@ void hfs_file_truncate(struct inode *inode)
                goto out;
        mutex_lock(&HFS_I(inode)->extents_lock);
-        hfs_find_init(HFS_SB(sb)->ext_tree, &fd);
+        res = hfs_find_init(HFS_SB(sb)->ext_tree, &fd);
+        if (res) {
+                mutex_unlock(&HFS_I(inode)->extents_lock);
+                /* XXX: hfs_file_truncate() returns void; error cannot be reported */
+                return;
+        }
        while (1) {
                if (alloc_cnt == HFS_I(inode)->first_blocks) {
                        hfs_free_extents(sb, HFS_I(inode)->first_extents,
diff --git a/fs/hfs/hfs_fs.h b/fs/hfs/hfs_fs.h
index 693df9fe52b2..a73b11839a41 100644
--- a/fs/hfs/hfs_fs.h
+++ b/fs/hfs/hfs_fs.h
@@ -9,6 +9,12 @@
 #ifndef _LINUX_HFS_FS_H
 #define _LINUX_HFS_FS_H
+#ifdef pr_fmt
+#undef pr_fmt
+#endif
+#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
 #include <linux/slab.h>
 #include <linux/types.h>
 #include <linux/mutex.h>
@@ -34,8 +40,18 @@
 //#define DBG_MASK      (DBG_CAT_MOD|DBG_BNODE_REFS|DBG_INODE|DBG_EXTENT)
 #define DBG_MASK        (0)
-#define dprint(flg, fmt, args...) \
+#define hfs_dbg(flg, fmt, ...)                                  \
-        if (flg & DBG_MASK) printk(fmt , ## args)
+do {                                                            \
+        if (DBG_##flg & DBG_MASK)                               \
+                printk(KERN_DEBUG pr_fmt(fmt), ##__VA_ARGS__);  \
+} while (0)
+#define hfs_dbg_cont(flg, fmt, ...)                             \
+do {                                                            \
+        if (DBG_##flg & DBG_MASK)                               \
+                pr_cont(fmt, ##__VA_ARGS__);                    \
+} while (0)
 /*
 * struct hfs_inode_info
@@ -174,7 +190,7 @@ extern const struct inode_operations hfs_dir_inode_operations;
 /* extent.c */
 extern int hfs_ext_keycmp(const btree_key *, const btree_key *);
 extern int hfs_free_fork(struct super_block *, struct hfs_cat_file *, int);
-extern void hfs_ext_write_extent(struct inode *);
+extern int hfs_ext_write_extent(struct inode *);
 extern int hfs_extend_file(struct inode *);
 extern void hfs_file_truncate(struct inode *);
diff --git a/fs/hfs/inode.c b/fs/hfs/inode.c
index 3031dfdd2358..716e1aafb2e2 100644
--- a/fs/hfs/inode.c
+++ b/fs/hfs/inode.c
@@ -237,7 +237,7 @@ void hfs_delete_inode(struct inode *inode)
 {
        struct super_block *sb = inode->i_sb;
-        dprint(DBG_INODE, "delete_inode: %lu\n", inode->i_ino);
+        hfs_dbg(INODE, "delete_inode: %lu\n", inode->i_ino);
        if (S_ISDIR(inode->i_mode)) {
                HFS_SB(sb)->folder_count--;
                if (HFS_I(inode)->cat_key.ParID == cpu_to_be32(HFS_ROOT_CNID))
@@ -416,9 +416,12 @@ int hfs_write_inode(struct inode *inode, struct writeback_control *wbc)
        struct inode *main_inode = inode;
        struct hfs_find_data fd;
        hfs_cat_rec rec;
+        int res;
-        dprint(DBG_INODE, "hfs_write_inode: %lu\n", inode->i_ino);
+        hfs_dbg(INODE, "hfs_write_inode: %lu\n", inode->i_ino);
-        hfs_ext_write_extent(inode);
+        res = hfs_ext_write_extent(inode);
+        if (res)
+                return res;
        if (inode->i_ino < HFS_FIRSTUSER_CNID) {
                switch (inode->i_ino) {
@@ -515,7 +518,11 @@ static struct dentry *hfs_file_lookup(struct inode *dir, struct dentry *dentry,
        if (!inode)
                return ERR_PTR(-ENOMEM);
-        hfs_find_init(HFS_SB(dir->i_sb)->cat_tree, &fd);
+        res = hfs_find_init(HFS_SB(dir->i_sb)->cat_tree, &fd);
+        if (res) {
+                iput(inode);
+                return ERR_PTR(res);
+        }
        fd.search_key->cat = HFS_I(dir)->cat_key;
        res = hfs_brec_read(&fd, &rec, sizeof(rec));
        if (!res) {
diff --git a/fs/hfs/mdb.c b/fs/hfs/mdb.c
index b7ec224910c5..aa3f0d6d043c 100644
--- a/fs/hfs/mdb.c
+++ b/fs/hfs/mdb.c
@@ -48,7 +48,7 @@ static int hfs_get_last_session(struct super_block *sb,
                        *start = (sector_t)te.cdte_addr.lba << 2;
                        return 0;
                }
-                printk(KERN_ERR "hfs: invalid session number or type of track\n");
+                pr_err("invalid session number or type of track\n");
                return -EINVAL;
        }
        ms_info.addr_format = CDROM_LBA;
@@ -101,7 +101,7 @@ int hfs_mdb_get(struct super_block *sb)
        HFS_SB(sb)->alloc_blksz = size = be32_to_cpu(mdb->drAlBlkSiz);
        if (!size || (size & (HFS_SECTOR_SIZE - 1))) {
-                printk(KERN_ERR "hfs: bad allocation block size %d\n", size);
+                pr_err("bad allocation block size %d\n", size);
                goto out_bh;
        }
@@ -118,7 +118,7 @@ int hfs_mdb_get(struct super_block *sb)
                size >>= 1;
        brelse(bh);
        if (!sb_set_blocksize(sb, size)) {
-                printk(KERN_ERR "hfs: unable to set blocksize to %u\n", size);
+                pr_err("unable to set blocksize to %u\n", size);
                goto out;
        }
@@ -162,8 +162,8 @@ int hfs_mdb_get(struct super_block *sb)
        }
        if (!HFS_SB(sb)->alt_mdb) {
-                printk(KERN_WARNING "hfs: unable to locate alternate MDB\n");
+                pr_warn("unable to locate alternate MDB\n");
-                printk(KERN_WARNING "hfs: continuing without an alternate MDB\n");
+                pr_warn("continuing without an alternate MDB\n");
        }
        HFS_SB(sb)->bitmap = (__be32 *)__get_free_pages(GFP_KERNEL, PAGE_SIZE < 8192 ? 1 : 0);
@@ -178,7 +178,7 @@ int hfs_mdb_get(struct super_block *sb)
        while (size) {
                bh = sb_bread(sb, off >> sb->s_blocksize_bits);
                if (!bh) {
-                        printk(KERN_ERR "hfs: unable to read volume bitmap\n");
+                        pr_err("unable to read volume bitmap\n");
                        goto out;
                }
                off2 = off & (sb->s_blocksize - 1);
@@ -192,23 +192,22 @@ int hfs_mdb_get(struct super_block *sb)
        HFS_SB(sb)->ext_tree = hfs_btree_open(sb, HFS_EXT_CNID, hfs_ext_keycmp);
        if (!HFS_SB(sb)->ext_tree) {
-                printk(KERN_ERR "hfs: unable to open extent tree\n");
+                pr_err("unable to open extent tree\n");
                goto out;
        }
        HFS_SB(sb)->cat_tree = hfs_btree_open(sb, HFS_CAT_CNID, hfs_cat_keycmp);
        if (!HFS_SB(sb)->cat_tree) {
-                printk(KERN_ERR "hfs: unable to open catalog tree\n");
+                pr_err("unable to open catalog tree\n");
                goto out;
        }
        attrib = mdb->drAtrb;
        if (!(attrib & cpu_to_be16(HFS_SB_ATTRIB_UNMNT))) {
-                printk(KERN_WARNING "hfs: filesystem was not cleanly unmounted, "
+                pr_warn("filesystem was not cleanly unmounted, running fsck.hfs is recommended.  mounting read-only.\n");
-                         "running fsck.hfs is recommended.  mounting read-only.\n");
                sb->s_flags |= MS_RDONLY;
        }
        if ((attrib & cpu_to_be16(HFS_SB_ATTRIB_SLOCK))) {
-                printk(KERN_WARNING "hfs: filesystem is marked locked, mounting read-only.\n");
+                pr_warn("filesystem is marked locked, mounting read-only.\n");
                sb->s_flags |= MS_RDONLY;
        }
        if (!(sb->s_flags & MS_RDONLY)) {
@@ -312,7 +311,7 @@ void hfs_mdb_commit(struct super_block *sb)
                while (size) {
                        bh = sb_bread(sb, block);
                        if (!bh) {
-                                printk(KERN_ERR "hfs: unable to read volume bitmap\n");
+                                pr_err("unable to read volume bitmap\n");
                                break;
                        }
                        len = min((int)sb->s_blocksize - off, size);
diff --git a/fs/hfs/super.c b/fs/hfs/super.c
index bbaaa8a4ee64..2d2039e754cd 100644
--- a/fs/hfs/super.c
+++ b/fs/hfs/super.c
@@ -117,12 +117,11 @@ static int hfs_remount(struct super_block *sb, int *flags, char *data)
                return 0;
        if (!(*flags & MS_RDONLY)) {
                if (!(HFS_SB(sb)->mdb->drAtrb & cpu_to_be16(HFS_SB_ATTRIB_UNMNT))) {
-                        printk(KERN_WARNING "hfs: filesystem was not cleanly unmounted, "
+                        pr_warn("filesystem was not cleanly unmounted, running fsck.hfs is recommended.  leaving read-only.\n");
-                               "running fsck.hfs is recommended.  leaving read-only.\n");
                        sb->s_flags |= MS_RDONLY;
                        *flags |= MS_RDONLY;
                } else if (HFS_SB(sb)->mdb->drAtrb & cpu_to_be16(HFS_SB_ATTRIB_SLOCK)) {
-                        printk(KERN_WARNING "hfs: filesystem is marked locked, leaving read-only.\n");
+                        pr_warn("filesystem is marked locked, leaving read-only.\n");
                        sb->s_flags |= MS_RDONLY;
                        *flags |= MS_RDONLY;
                }
@@ -253,29 +252,29 @@ static int parse_options(char *options, struct hfs_sb_info *hsb)
                switch (token) {
                case opt_uid:
                        if (match_int(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: uid requires an argument\n");
+                                pr_err("uid requires an argument\n");
                                return 0;
                        }
                        hsb->s_uid = make_kuid(current_user_ns(), (uid_t)tmp);
                        if (!uid_valid(hsb->s_uid)) {
-                                printk(KERN_ERR "hfs: invalid uid %d\n", tmp);
+                                pr_err("invalid uid %d\n", tmp);
                                return 0;
                        }
                        break;
                case opt_gid:
                        if (match_int(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: gid requires an argument\n");
+                                pr_err("gid requires an argument\n");
                                return 0;
                        }
                        hsb->s_gid = make_kgid(current_user_ns(), (gid_t)tmp);
                        if (!gid_valid(hsb->s_gid)) {
-                                printk(KERN_ERR "hfs: invalid gid %d\n", tmp);
+                                pr_err("invalid gid %d\n", tmp);
                                return 0;
                        }
                        break;
                case opt_umask:
                        if (match_octal(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: umask requires a value\n");
+                                pr_err("umask requires a value\n");
                                return 0;
                        }
                        hsb->s_file_umask = (umode_t)tmp;
@@ -283,39 +282,39 @@ static int parse_options(char *options, struct hfs_sb_info *hsb)
                        break;
                case opt_file_umask:
                        if (match_octal(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: file_umask requires a value\n");
+                                pr_err("file_umask requires a value\n");
                                return 0;
                        }
                        hsb->s_file_umask = (umode_t)tmp;
                        break;
                case opt_dir_umask:
                        if (match_octal(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: dir_umask requires a value\n");
+                                pr_err("dir_umask requires a value\n");
                                return 0;
                        }
                        hsb->s_dir_umask = (umode_t)tmp;
                        break;
                case opt_part:
                        if (match_int(&args[0], &hsb->part)) {
-                                printk(KERN_ERR "hfs: part requires an argument\n");
+                                pr_err("part requires an argument\n");
                                return 0;
                        }
                        break;
                case opt_session:
                        if (match_int(&args[0], &hsb->session)) {
-                                printk(KERN_ERR "hfs: session requires an argument\n");
+                                pr_err("session requires an argument\n");
                                return 0;
                        }
                        break;
                case opt_type:
                        if (match_fourchar(&args[0], &hsb->s_type)) {
-                                printk(KERN_ERR "hfs: type requires a 4 character value\n");
+                                pr_err("type requires a 4 character value\n");
                                return 0;
                        }
                        break;
                case opt_creator:
                        if (match_fourchar(&args[0], &hsb->s_creator)) {
-                                printk(KERN_ERR "hfs: creator requires a 4 character value\n");
+                                pr_err("creator requires a 4 character value\n");
                                return 0;
                        }
                        break;
@@ -324,14 +323,14 @@ static int parse_options(char *options, struct hfs_sb_info *hsb)
                        break;
                case opt_codepage:
                        if (hsb->nls_disk) {
-                                printk(KERN_ERR "hfs: unable to change codepage\n");
+                                pr_err("unable to change codepage\n");
                                return 0;
                        }
                        p = match_strdup(&args[0]);
                        if (p)
                                hsb->nls_disk = load_nls(p);
                        if (!hsb->nls_disk) {
-                                printk(KERN_ERR "hfs: unable to load codepage \"%s\"\n", p);
+                                pr_err("unable to load codepage \"%s\"\n", p);
                                kfree(p);
                                return 0;
                        }
@@ -339,14 +338,14 @@ static int parse_options(char *options, struct hfs_sb_info *hsb)
                        break;
                case opt_iocharset:
                        if (hsb->nls_io) {
-                                printk(KERN_ERR "hfs: unable to change iocharset\n");
+                                pr_err("unable to change iocharset\n");
                                return 0;
                        }
                        p = match_strdup(&args[0]);
                        if (p)
                                hsb->nls_io = load_nls(p);
                        if (!hsb->nls_io) {
-                                printk(KERN_ERR "hfs: unable to load iocharset \"%s\"\n", p);
+                                pr_err("unable to load iocharset \"%s\"\n", p);
                                kfree(p);
                                return 0;
                        }
@@ -360,7 +359,7 @@ static int parse_options(char *options, struct hfs_sb_info *hsb)
        if (hsb->nls_disk && !hsb->nls_io) {
                hsb->nls_io = load_nls_default();
                if (!hsb->nls_io) {
-                        printk(KERN_ERR "hfs: unable to load default iocharset\n");
+                        pr_err("unable to load default iocharset\n");
                        return 0;
                }
        }
@@ -400,7 +399,7 @@ static int hfs_fill_super(struct super_block *sb, void *data, int silent)
        res = -EINVAL;
        if (!parse_options((char *)data, sbi)) {
-                printk(KERN_ERR "hfs: unable to parse mount options.\n");
+                pr_err("unable to parse mount options\n");
                goto bail;
        }
@@ -411,14 +410,16 @@ static int hfs_fill_super(struct super_block *sb, void *data, int silent)
        res = hfs_mdb_get(sb);
        if (res) {
                if (!silent)
-                        printk(KERN_WARNING "hfs: can't find a HFS filesystem on dev %s.\n",
+                        pr_warn("can't find a HFS filesystem on dev %s\n",
                                hfs_mdb_name(sb));
                res = -EINVAL;
                goto bail;
        }
        /* try to get the root inode */
-        hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        res = hfs_find_init(HFS_SB(sb)->cat_tree, &fd);
+        if (res)
+                goto bail_no_root;
        res = hfs_cat_find_brec(sb, HFS_ROOT_CNID, &fd);
        if (!res) {
                if (fd.entrylength > sizeof(rec) || fd.entrylength < 0) {
@@ -447,7 +448,7 @@ static int hfs_fill_super(struct super_block *sb, void *data, int silent)
        return 0;
 bail_no_root:
-        printk(KERN_ERR "hfs: get root inode failed.\n");
+        pr_err("get root inode failed\n");
 bail:
        hfs_mdb_put(sb);
        return res;
diff --git a/fs/hfsplus/attributes.c b/fs/hfsplus/attributes.c
index 8d691f124714..0f47890299c4 100644
--- a/fs/hfsplus/attributes.c
+++ b/fs/hfsplus/attributes.c
@@ -56,7 +56,7 @@ int hfsplus_attr_build_key(struct super_block *sb, hfsplus_btree_key *key,
        if (name) {
                len = strlen(name);
                if (len > HFSPLUS_ATTR_MAX_STRLEN) {
-                        printk(KERN_ERR "hfs: invalid xattr name's length\n");
+                        pr_err("invalid xattr name's length\n");
                        return -EINVAL;
                }
                hfsplus_asc2uni(sb,
@@ -166,10 +166,10 @@ int hfsplus_find_attr(struct super_block *sb, u32 cnid,
 {
        int err = 0;
-        dprint(DBG_ATTR_MOD, "find_attr: %s,%d\n", name ? name : NULL, cnid);
+        hfs_dbg(ATTR_MOD, "find_attr: %s,%d\n", name ? name : NULL, cnid);
        if (!HFSPLUS_SB(sb)->attr_tree) {
-                printk(KERN_ERR "hfs: attributes file doesn't exist\n");
+                pr_err("attributes file doesn't exist\n");
                return -EINVAL;
        }
@@ -228,11 +228,11 @@ int hfsplus_create_attr(struct inode *inode,
        int entry_size;
        int err;
-        dprint(DBG_ATTR_MOD, "create_attr: %s,%ld\n",
+        hfs_dbg(ATTR_MOD, "create_attr: %s,%ld\n",
                name ? name : NULL, inode->i_ino);
        if (!HFSPLUS_SB(sb)->attr_tree) {
-                printk(KERN_ERR "hfs: attributes file doesn't exist\n");
+                pr_err("attributes file doesn't exist\n");
                return -EINVAL;
        }
@@ -307,10 +307,10 @@ static int __hfsplus_delete_attr(struct inode *inode, u32 cnid,
                break;
        case HFSPLUS_ATTR_FORK_DATA:
        case HFSPLUS_ATTR_EXTENTS:
-                printk(KERN_ERR "hfs: only inline data xattr are supported\n");
+                pr_err("only inline data xattr are supported\n");
                return -EOPNOTSUPP;
        default:
-                printk(KERN_ERR "hfs: invalid extended attribute record\n");
+                pr_err("invalid extended attribute record\n");
                return -ENOENT;
        }
@@ -328,11 +328,11 @@ int hfsplus_delete_attr(struct inode *inode, const char *name)
        struct super_block *sb = inode->i_sb;
        struct hfs_find_data fd;
-        dprint(DBG_ATTR_MOD, "delete_attr: %s,%ld\n",
+        hfs_dbg(ATTR_MOD, "delete_attr: %s,%ld\n",
                name ? name : NULL, inode->i_ino);
        if (!HFSPLUS_SB(sb)->attr_tree) {
-                printk(KERN_ERR "hfs: attributes file doesn't exist\n");
+                pr_err("attributes file doesn't exist\n");
                return -EINVAL;
        }
@@ -346,7 +346,7 @@ int hfsplus_delete_attr(struct inode *inode, const char *name)
                if (err)
                        goto out;
        } else {
-                printk(KERN_ERR "hfs: invalid extended attribute name\n");
+                pr_err("invalid extended attribute name\n");
                err = -EINVAL;
                goto out;
        }
@@ -369,10 +369,10 @@ int hfsplus_delete_all_attrs(struct inode *dir, u32 cnid)
        int err = 0;
        struct hfs_find_data fd;
-        dprint(DBG_ATTR_MOD, "delete_all_attrs: %d\n", cnid);
+        hfs_dbg(ATTR_MOD, "delete_all_attrs: %d\n", cnid);
        if (!HFSPLUS_SB(dir->i_sb)->attr_tree) {
-                printk(KERN_ERR "hfs: attributes file doesn't exist\n");
+                pr_err("attributes file doesn't exist\n");
                return -EINVAL;
        }
@@ -384,7 +384,7 @@ int hfsplus_delete_all_attrs(struct inode *dir, u32 cnid)
                err = hfsplus_find_attr(dir->i_sb, cnid, NULL, &fd);
                if (err) {
                        if (err != -ENOENT)
-                                printk(KERN_ERR "hfs: xattr search failed.\n");
+                                pr_err("xattr search failed\n");
                        goto end_delete_all;
                }
diff --git a/fs/hfsplus/bfind.c b/fs/hfsplus/bfind.c
index d73c98d1ee99..c1422d91cd36 100644
--- a/fs/hfsplus/bfind.c
+++ b/fs/hfsplus/bfind.c
@@ -22,7 +22,7 @@ int hfs_find_init(struct hfs_btree *tree, struct hfs_find_data *fd)
                return -ENOMEM;
        fd->search_key = ptr;
        fd->key = ptr + tree->max_key_len + 2;
-        dprint(DBG_BNODE_REFS, "find_init: %d (%p)\n",
+        hfs_dbg(BNODE_REFS, "find_init: %d (%p)\n",
                tree->cnid, __builtin_return_address(0));
        switch (tree->cnid) {
        case HFSPLUS_CAT_CNID:
@@ -44,7 +44,7 @@ void hfs_find_exit(struct hfs_find_data *fd)
 {
        hfs_bnode_put(fd->bnode);
        kfree(fd->search_key);
-        dprint(DBG_BNODE_REFS, "find_exit: %d (%p)\n",
+        hfs_dbg(BNODE_REFS, "find_exit: %d (%p)\n",
                fd->tree->cnid, __builtin_return_address(0));
        mutex_unlock(&fd->tree->tree_lock);
        fd->tree = NULL;
@@ -56,7 +56,8 @@ int hfs_find_1st_rec_by_cnid(struct hfs_bnode *bnode,
                                int *end,
                                int *cur_rec)
 {
-        __be32 cur_cnid, search_cnid;
+        __be32 cur_cnid;
+        __be32 search_cnid;
        if (bnode->tree->cnid == HFSPLUS_EXT_CNID) {
                cur_cnid = fd->key->ext.cnid;
@@ -67,8 +68,11 @@ int hfs_find_1st_rec_by_cnid(struct hfs_bnode *bnode,
        } else if (bnode->tree->cnid == HFSPLUS_ATTR_CNID) {
                cur_cnid = fd->key->attr.cnid;
                search_cnid = fd->search_key->attr.cnid;
-        } else
+        } else {
+                cur_cnid = 0;   /* silence used-uninitialized warning */
+                search_cnid = 0;
                BUG();
+        }
        if (cur_cnid == search_cnid) {
                (*end) = (*cur_rec);
@@ -204,7 +208,7 @@ int hfs_brec_find(struct hfs_find_data *fd, search_strategy_t do_key_compare)
        return res;
 invalid:
-        printk(KERN_ERR "hfs: inconsistency in B*Tree (%d,%d,%d,%u,%u)\n",
+        pr_err("inconsistency in B*Tree (%d,%d,%d,%u,%u)\n",
                height, bnode->height, bnode->type, nidx, parent);
        res = -EIO;
 release:
diff --git a/fs/hfsplus/bitmap.c b/fs/hfsplus/bitmap.c
index 6feefc0cb48a..d2954451519e 100644
--- a/fs/hfsplus/bitmap.c
+++ b/fs/hfsplus/bitmap.c
@@ -30,7 +30,7 @@ int hfsplus_block_allocate(struct super_block *sb, u32 size,
        if (!len)
                return size;
-        dprint(DBG_BITMAP, "block_allocate: %u,%u,%u\n", size, offset, len);
+        hfs_dbg(BITMAP, "block_allocate: %u,%u,%u\n", size, offset, len);
        mutex_lock(&sbi->alloc_mutex);
        mapping = sbi->alloc_file->i_mapping;
        page = read_mapping_page(mapping, offset / PAGE_CACHE_BITS, NULL);
@@ -89,14 +89,14 @@ int hfsplus_block_allocate(struct super_block *sb, u32 size,
                else
                        end = pptr + ((size + 31) & (PAGE_CACHE_BITS - 1)) / 32;
        }
-        dprint(DBG_BITMAP, "bitmap full\n");
+        hfs_dbg(BITMAP, "bitmap full\n");
        start = size;
        goto out;
 found:
        start = offset + (curr - pptr) * 32 + i;
        if (start >= size) {
-                dprint(DBG_BITMAP, "bitmap full\n");
+                hfs_dbg(BITMAP, "bitmap full\n");
                goto out;
        }
        /* do any partial u32 at the start */
@@ -154,7 +154,7 @@ done:
        *max = offset + (curr - pptr) * 32 + i - start;
        sbi->free_blocks -= *max;
        hfsplus_mark_mdb_dirty(sb);
-        dprint(DBG_BITMAP, "-> %u,%u\n", start, *max);
+        hfs_dbg(BITMAP, "-> %u,%u\n", start, *max);
 out:
        mutex_unlock(&sbi->alloc_mutex);
        return start;
@@ -173,7 +173,7 @@ int hfsplus_block_free(struct super_block *sb, u32 offset, u32 count)
        if (!count)
                return 0;
-        dprint(DBG_BITMAP, "block_free: %u,%u\n", offset, count);
+        hfs_dbg(BITMAP, "block_free: %u,%u\n", offset, count);
        /* are all of the bits in range? */
        if ((offset + count) > sbi->total_blocks)
                return -ENOENT;
@@ -238,8 +238,7 @@ out:
        return 0;
 kaboom:
-        printk(KERN_CRIT "hfsplus: unable to mark blocks free: error %ld\n",
+        pr_crit("unable to mark blocks free: error %ld\n", PTR_ERR(page));
-                        PTR_ERR(page));
        mutex_unlock(&sbi->alloc_mutex);
        return -EIO;
diff --git a/fs/hfsplus/bnode.c b/fs/hfsplus/bnode.c
index f31ac6f404f1..11c860204520 100644
--- a/fs/hfsplus/bnode.c
+++ b/fs/hfsplus/bnode.c
@@ -130,7 +130,7 @@ void hfs_bnode_copy(struct hfs_bnode *dst_node, int dst,
        struct page **src_page, **dst_page;
        int l;
-        dprint(DBG_BNODE_MOD, "copybytes: %u,%u,%u\n", dst, src, len);
+        hfs_dbg(BNODE_MOD, "copybytes: %u,%u,%u\n", dst, src, len);
        if (!len)
                return;
        tree = src_node->tree;
@@ -188,7 +188,7 @@ void hfs_bnode_move(struct hfs_bnode *node, int dst, int src, int len)
        struct page **src_page, **dst_page;
        int l;
-        dprint(DBG_BNODE_MOD, "movebytes: %u,%u,%u\n", dst, src, len);
+        hfs_dbg(BNODE_MOD, "movebytes: %u,%u,%u\n", dst, src, len);
        if (!len)
                return;
        src += node->page_offset;
@@ -302,16 +302,16 @@ void hfs_bnode_dump(struct hfs_bnode *node)
        __be32 cnid;
        int i, off, key_off;
-        dprint(DBG_BNODE_MOD, "bnode: %d\n", node->this);
+        hfs_dbg(BNODE_MOD, "bnode: %d\n", node->this);
        hfs_bnode_read(node, &desc, 0, sizeof(desc));
-        dprint(DBG_BNODE_MOD, "%d, %d, %d, %d, %d\n",
+        hfs_dbg(BNODE_MOD, "%d, %d, %d, %d, %d\n",
                be32_to_cpu(desc.next), be32_to_cpu(desc.prev),
                desc.type, desc.height, be16_to_cpu(desc.num_recs));
        off = node->tree->node_size - 2;
        for (i = be16_to_cpu(desc.num_recs); i >= 0; off -= 2, i--) {
                key_off = hfs_bnode_read_u16(node, off);
-                dprint(DBG_BNODE_MOD, " %d", key_off);
+                hfs_dbg(BNODE_MOD, " %d", key_off);
                if (i && node->type == HFS_NODE_INDEX) {
                        int tmp;
@@ -320,17 +320,17 @@ void hfs_bnode_dump(struct hfs_bnode *node)
                                tmp = hfs_bnode_read_u16(node, key_off) + 2;
                        else
                                tmp = node->tree->max_key_len + 2;
-                        dprint(DBG_BNODE_MOD, " (%d", tmp);
+                        hfs_dbg_cont(BNODE_MOD, " (%d", tmp);
                        hfs_bnode_read(node, &cnid, key_off + tmp, 4);
-                        dprint(DBG_BNODE_MOD, ",%d)", be32_to_cpu(cnid));
+                        hfs_dbg_cont(BNODE_MOD, ",%d)", be32_to_cpu(cnid));
                } else if (i && node->type == HFS_NODE_LEAF) {
                        int tmp;
                        tmp = hfs_bnode_read_u16(node, key_off);
-                        dprint(DBG_BNODE_MOD, " (%d)", tmp);
+                        hfs_dbg_cont(BNODE_MOD, " (%d)", tmp);
                }
        }
-        dprint(DBG_BNODE_MOD, "\n");
+        hfs_dbg_cont(BNODE_MOD, "\n");
 }
 void hfs_bnode_unlink(struct hfs_bnode *node)
@@ -366,7 +366,7 @@ void hfs_bnode_unlink(struct hfs_bnode *node)
        /* move down? */
        if (!node->prev && !node->next)
-                dprint(DBG_BNODE_MOD, "hfs_btree_del_level\n");
+                hfs_dbg(BNODE_MOD, "hfs_btree_del_level\n");
        if (!node->parent) {
                tree->root = 0;
                tree->depth = 0;
@@ -386,7 +386,7 @@ struct hfs_bnode *hfs_bnode_findhash(struct hfs_btree *tree, u32 cnid)
        struct hfs_bnode *node;
        if (cnid >= tree->node_count) {
-                printk(KERN_ERR "hfs: request for non-existent node "
+                pr_err("request for non-existent node "
                                "%d in B*Tree\n",
                        cnid);
                return NULL;
@@ -409,7 +409,7 @@ static struct hfs_bnode *__hfs_bnode_create(struct hfs_btree *tree, u32 cnid)
        loff_t off;
        if (cnid >= tree->node_count) {
-                printk(KERN_ERR "hfs: request for non-existent node "
+                pr_err("request for non-existent node "
                                "%d in B*Tree\n",
                        cnid);
                return NULL;
@@ -425,8 +425,8 @@ static struct hfs_bnode *__hfs_bnode_create(struct hfs_btree *tree, u32 cnid)
        node->this = cnid;
        set_bit(HFS_BNODE_NEW, &node->flags);
        atomic_set(&node->refcnt, 1);
-        dprint(DBG_BNODE_REFS, "new_node(%d:%d): 1\n",
+        hfs_dbg(BNODE_REFS, "new_node(%d:%d): 1\n",
-               node->tree->cnid, node->this);
+                node->tree->cnid, node->this);
        init_waitqueue_head(&node->lock_wq);
        spin_lock(&tree->hash_lock);
        node2 = hfs_bnode_findhash(tree, cnid);
@@ -470,7 +470,7 @@ void hfs_bnode_unhash(struct hfs_bnode *node)
 {
        struct hfs_bnode **p;
-        dprint(DBG_BNODE_REFS, "remove_node(%d:%d): %d\n",
+        hfs_dbg(BNODE_REFS, "remove_node(%d:%d): %d\n",
                node->tree->cnid, node->this, atomic_read(&node->refcnt));
        for (p = &node->tree->node_hash[hfs_bnode_hash(node->this)];
             *p && *p != node; p = &(*p)->next_hash)
@@ -588,7 +588,7 @@ struct hfs_bnode *hfs_bnode_create(struct hfs_btree *tree, u32 num)
        node = hfs_bnode_findhash(tree, num);
        spin_unlock(&tree->hash_lock);
        if (node) {
-                printk(KERN_CRIT "new node %u already hashed?\n", num);
+                pr_crit("new node %u already hashed?\n", num);
                WARN_ON(1);
                return node;
        }
@@ -620,7 +620,7 @@ void hfs_bnode_get(struct hfs_bnode *node)
 {
        if (node) {
                atomic_inc(&node->refcnt);
-                dprint(DBG_BNODE_REFS, "get_node(%d:%d): %d\n",
+                hfs_dbg(BNODE_REFS, "get_node(%d:%d): %d\n",
                        node->tree->cnid, node->this,
                        atomic_read(&node->refcnt));
        }
@@ -633,7 +633,7 @@ void hfs_bnode_put(struct hfs_bnode *node)
                struct hfs_btree *tree = node->tree;
                int i;
-                dprint(DBG_BNODE_REFS, "put_node(%d:%d): %d\n",
+                hfs_dbg(BNODE_REFS, "put_node(%d:%d): %d\n",
                        node->tree->cnid, node->this,
                        atomic_read(&node->refcnt));
                BUG_ON(!atomic_read(&node->refcnt));
diff --git a/fs/hfsplus/brec.c b/fs/hfsplus/brec.c
index 298d4e45604b..6e560d56094b 100644
--- a/fs/hfsplus/brec.c
+++ b/fs/hfsplus/brec.c
@@ -45,13 +45,13 @@ u16 hfs_brec_keylen(struct hfs_bnode *node, u16 rec)
                if (!recoff)
                        return 0;
                if (recoff > node->tree->node_size - 2) {
-                        printk(KERN_ERR "hfs: recoff %d too large\n", recoff);
+                        pr_err("recoff %d too large\n", recoff);
                        return 0;
                }
                retval = hfs_bnode_read_u16(node, recoff) + 2;
                if (retval > node->tree->max_key_len + 2) {
-                        printk(KERN_ERR "hfs: keylen %d too large\n",
+                        pr_err("keylen %d too large\n",
                                retval);
                        retval = 0;
                }
@@ -90,7 +90,7 @@ again:
        end_rec_off = tree->node_size - (node->num_recs + 1) * 2;
        end_off = hfs_bnode_read_u16(node, end_rec_off);
        end_rec_off -= 2;
-        dprint(DBG_BNODE_MOD, "insert_rec: %d, %d, %d, %d\n",
+        hfs_dbg(BNODE_MOD, "insert_rec: %d, %d, %d, %d\n",
                rec, size, end_off, end_rec_off);
        if (size > end_rec_off - end_off) {
                if (new_node)
@@ -191,7 +191,7 @@ again:
                mark_inode_dirty(tree->inode);
        }
        hfs_bnode_dump(node);
-        dprint(DBG_BNODE_MOD, "remove_rec: %d, %d\n",
+        hfs_dbg(BNODE_MOD, "remove_rec: %d, %d\n",
                fd->record, fd->keylength + fd->entrylength);
        if (!--node->num_recs) {
                hfs_bnode_unlink(node);
@@ -244,7 +244,7 @@ static struct hfs_bnode *hfs_bnode_split(struct hfs_find_data *fd)
        if (IS_ERR(new_node))
                return new_node;
        hfs_bnode_get(node);
-        dprint(DBG_BNODE_MOD, "split_nodes: %d - %d - %d\n",
+        hfs_dbg(BNODE_MOD, "split_nodes: %d - %d - %d\n",
                node->this, new_node->this, node->next);
        new_node->next = node->next;
        new_node->prev = node->this;
@@ -379,7 +379,7 @@ again:
                newkeylen = hfs_bnode_read_u16(node, 14) + 2;
        else
                fd->keylength = newkeylen = tree->max_key_len + 2;
-        dprint(DBG_BNODE_MOD, "update_rec: %d, %d, %d\n",
+        hfs_dbg(BNODE_MOD, "update_rec: %d, %d, %d\n",
                rec, fd->keylength, newkeylen);
        rec_off = tree->node_size - (rec + 2) * 2;
@@ -391,7 +391,7 @@ again:
                end_off = hfs_bnode_read_u16(parent, end_rec_off);
                if (end_rec_off - end_off < diff) {
-                        dprint(DBG_BNODE_MOD, "hfs: splitting index node.\n");
+                        hfs_dbg(BNODE_MOD, "splitting index node\n");
                        fd->bnode = parent;
                        new_node = hfs_bnode_split(fd);
                        if (IS_ERR(new_node))
diff --git a/fs/hfsplus/btree.c b/fs/hfsplus/btree.c
index efb689c21a95..0c6540c91167 100644
--- a/fs/hfsplus/btree.c
+++ b/fs/hfsplus/btree.c
@@ -40,8 +40,7 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id)
        tree->inode = inode;
        if (!HFSPLUS_I(tree->inode)->first_blocks) {
-                printk(KERN_ERR
+                pr_err("invalid btree extent records (0 size)\n");
-                       "hfs: invalid btree extent records (0 size).\n");
                goto free_inode;
        }
@@ -68,12 +67,12 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id)
        switch (id) {
        case HFSPLUS_EXT_CNID:
                if (tree->max_key_len != HFSPLUS_EXT_KEYLEN - sizeof(u16)) {
-                        printk(KERN_ERR "hfs: invalid extent max_key_len %d\n",
+                        pr_err("invalid extent max_key_len %d\n",
                                tree->max_key_len);
                        goto fail_page;
                }
                if (tree->attributes & HFS_TREE_VARIDXKEYS) {
-                        printk(KERN_ERR "hfs: invalid extent btree flag\n");
+                        pr_err("invalid extent btree flag\n");
                        goto fail_page;
                }
@@ -81,12 +80,12 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id)
                break;
        case HFSPLUS_CAT_CNID:
                if (tree->max_key_len != HFSPLUS_CAT_KEYLEN - sizeof(u16)) {
-                        printk(KERN_ERR "hfs: invalid catalog max_key_len %d\n",
+                        pr_err("invalid catalog max_key_len %d\n",
                                tree->max_key_len);
                        goto fail_page;
                }
                if (!(tree->attributes & HFS_TREE_VARIDXKEYS)) {
-                        printk(KERN_ERR "hfs: invalid catalog btree flag\n");
+                        pr_err("invalid catalog btree flag\n");
                        goto fail_page;
                }
@@ -100,19 +99,19 @@ struct hfs_btree *hfs_btree_open(struct super_block *sb, u32 id)
                break;
        case HFSPLUS_ATTR_CNID:
                if (tree->max_key_len != HFSPLUS_ATTR_KEYLEN - sizeof(u16)) {
-                        printk(KERN_ERR "hfs: invalid attributes max_key_len %d\n",
+                        pr_err("invalid attributes max_key_len %d\n",
                                tree->max_key_len);
                        goto fail_page;
                }
                tree->keycmp = hfsplus_attr_bin_cmp_key;
                break;
        default:
-                printk(KERN_ERR "hfs: unknown B*Tree requested\n");
+                pr_err("unknown B*Tree requested\n");
                goto fail_page;
        }
        if (!(tree->attributes & HFS_TREE_BIGKEYS)) {
-                printk(KERN_ERR "hfs: invalid btree flag\n");
+                pr_err("invalid btree flag\n");
                goto fail_page;
        }
@@ -155,7 +154,7 @@ void hfs_btree_close(struct hfs_btree *tree)
                while ((node = tree->node_hash[i])) {
                        tree->node_hash[i] = node->next_hash;
                        if (atomic_read(&node->refcnt))
-                                printk(KERN_CRIT "hfs: node %d:%d "
+                                pr_crit("node %d:%d "
                                                "still has %d user(s)!\n",
                                        node->tree->cnid, node->this,
                                        atomic_read(&node->refcnt));
@@ -303,7 +302,7 @@ struct hfs_bnode *hfs_bmap_alloc(struct hfs_btree *tree)
                kunmap(*pagep);
                nidx = node->next;
                if (!nidx) {
-                        dprint(DBG_BNODE_MOD, "hfs: create new bmap node.\n");
+                        hfs_dbg(BNODE_MOD, "create new bmap node\n");
                        next_node = hfs_bmap_new_bmap(node, idx);
                } else
                        next_node = hfs_bnode_find(tree, nidx);
@@ -329,7 +328,7 @@ void hfs_bmap_free(struct hfs_bnode *node)
        u32 nidx;
        u8 *data, byte, m;
-        dprint(DBG_BNODE_MOD, "btree_free_node: %u\n", node->this);
+        hfs_dbg(BNODE_MOD, "btree_free_node: %u\n", node->this);
        BUG_ON(!node->this);
        tree = node->tree;
        nidx = node->this;
@@ -345,7 +344,7 @@ void hfs_bmap_free(struct hfs_bnode *node)
                hfs_bnode_put(node);
                if (!i) {
                        /* panic */;
-                        printk(KERN_CRIT "hfs: unable to free bnode %u. "
+                        pr_crit("unable to free bnode %u. "
                                        "bmap not found!\n",
                                node->this);
                        return;
@@ -355,7 +354,7 @@ void hfs_bmap_free(struct hfs_bnode *node)
                        return;
                if (node->type != HFS_NODE_MAP) {
                        /* panic */;
-                        printk(KERN_CRIT "hfs: invalid bmap found! "
+                        pr_crit("invalid bmap found! "
                                        "(%u,%d)\n",
                                node->this, node->type);
                        hfs_bnode_put(node);
@@ -370,7 +369,7 @@ void hfs_bmap_free(struct hfs_bnode *node)
        m = 1 << (~nidx & 7);
        byte = data[off];
        if (!(byte & m)) {
-                printk(KERN_CRIT "hfs: trying to free free bnode "
+                pr_crit("trying to free free bnode "
                                "%u(%d)\n",
                        node->this, node->type);
                kunmap(page);
diff --git a/fs/hfsplus/catalog.c b/fs/hfsplus/catalog.c
index 840d71edd193..968ce411db53 100644
--- a/fs/hfsplus/catalog.c
+++ b/fs/hfsplus/catalog.c
@@ -188,12 +188,12 @@ int hfsplus_find_cat(struct super_block *sb, u32 cnid,
        type = be16_to_cpu(tmp.type);
        if (type != HFSPLUS_FOLDER_THREAD && type != HFSPLUS_FILE_THREAD) {
-                printk(KERN_ERR "hfs: found bad thread record in catalog\n");
+                pr_err("found bad thread record in catalog\n");
                return -EIO;
        }
        if (be16_to_cpu(tmp.thread.nodeName.length) > 255) {
-                printk(KERN_ERR "hfs: catalog name length corrupted\n");
+                pr_err("catalog name length corrupted\n");
                return -EIO;
        }
@@ -212,7 +212,7 @@ int hfsplus_create_cat(u32 cnid, struct inode *dir,
        int entry_size;
        int err;
-        dprint(DBG_CAT_MOD, "create_cat: %s,%u(%d)\n",
+        hfs_dbg(CAT_MOD, "create_cat: %s,%u(%d)\n",
                str->name, cnid, inode->i_nlink);
        err = hfs_find_init(HFSPLUS_SB(sb)->cat_tree, &fd);
        if (err)
@@ -271,8 +271,7 @@ int hfsplus_delete_cat(u32 cnid, struct inode *dir, struct qstr *str)
        int err, off;
        u16 type;
-        dprint(DBG_CAT_MOD, "delete_cat: %s,%u\n",
+        hfs_dbg(CAT_MOD, "delete_cat: %s,%u\n", str ? str->name : NULL, cnid);
-                str ? str->name : NULL, cnid);
        err = hfs_find_init(HFSPLUS_SB(sb)->cat_tree, &fd);
        if (err)
                return err;
@@ -361,7 +360,7 @@ int hfsplus_rename_cat(u32 cnid,
        int entry_size, type;
        int err;
-        dprint(DBG_CAT_MOD, "rename_cat: %u - %lu,%s - %lu,%s\n",
+        hfs_dbg(CAT_MOD, "rename_cat: %u - %lu,%s - %lu,%s\n",
                cnid, src_dir->i_ino, src_name->name,
                dst_dir->i_ino, dst_name->name);
        err = hfs_find_init(HFSPLUS_SB(sb)->cat_tree, &src_fd);
diff --git a/fs/hfsplus/dir.c b/fs/hfsplus/dir.c
index 031c24e50521..a37ac934732f 100644
--- a/fs/hfsplus/dir.c
+++ b/fs/hfsplus/dir.c
@@ -103,7 +103,7 @@ again:
                } else if (!dentry->d_fsdata)
                        dentry->d_fsdata = (void *)(unsigned long)cnid;
        } else {
-                printk(KERN_ERR "hfs: invalid catalog entry type in lookup\n");
+                pr_err("invalid catalog entry type in lookup\n");
                err = -EIO;
                goto fail;
        }
@@ -159,12 +159,12 @@ static int hfsplus_readdir(struct file *filp, void *dirent, filldir_t filldir)
                hfs_bnode_read(fd.bnode, &entry, fd.entryoffset,
                        fd.entrylength);
                if (be16_to_cpu(entry.type) != HFSPLUS_FOLDER_THREAD) {
-                        printk(KERN_ERR "hfs: bad catalog folder thread\n");
+                        pr_err("bad catalog folder thread\n");
                        err = -EIO;
                        goto out;
                }
                if (fd.entrylength < HFSPLUS_MIN_THREAD_SZ) {
-                        printk(KERN_ERR "hfs: truncated catalog thread\n");
+                        pr_err("truncated catalog thread\n");
                        err = -EIO;
                        goto out;
                }
@@ -183,7 +183,7 @@ static int hfsplus_readdir(struct file *filp, void *dirent, filldir_t filldir)
        for (;;) {
                if (be32_to_cpu(fd.key->cat.parent) != inode->i_ino) {
-                        printk(KERN_ERR "hfs: walked past end of dir\n");
+                        pr_err("walked past end of dir\n");
                        err = -EIO;
                        goto out;
                }
@@ -203,7 +203,7 @@ static int hfsplus_readdir(struct file *filp, void *dirent, filldir_t filldir)
                if (type == HFSPLUS_FOLDER) {
                        if (fd.entrylength <
                                        sizeof(struct hfsplus_cat_folder)) {
-                                printk(KERN_ERR "hfs: small dir entry\n");
+                                pr_err("small dir entry\n");
                                err = -EIO;
                                goto out;
                        }
@@ -216,7 +216,7 @@ static int hfsplus_readdir(struct file *filp, void *dirent, filldir_t filldir)
                                break;
                } else if (type == HFSPLUS_FILE) {
                        if (fd.entrylength < sizeof(struct hfsplus_cat_file)) {
-                                printk(KERN_ERR "hfs: small file entry\n");
+                                pr_err("small file entry\n");
                                err = -EIO;
                                goto out;
                        }
@@ -224,7 +224,7 @@ static int hfsplus_readdir(struct file *filp, void *dirent, filldir_t filldir)
                                    be32_to_cpu(entry.file.id), DT_REG))
                                break;
                } else {
-                        printk(KERN_ERR "hfs: bad catalog entry type\n");
+                        pr_err("bad catalog entry type\n");
                        err = -EIO;
                        goto out;
                }
diff --git a/fs/hfsplus/extents.c b/fs/hfsplus/extents.c
index a94f0f779d5e..fbb212fbb1ef 100644
--- a/fs/hfsplus/extents.c
+++ b/fs/hfsplus/extents.c
@@ -83,7 +83,7 @@ static u32 hfsplus_ext_lastblock(struct hfsplus_extent *ext)
        return be32_to_cpu(ext->start_block) + be32_to_cpu(ext->block_count);
 }
-static void __hfsplus_ext_write_extent(struct inode *inode,
+static int __hfsplus_ext_write_extent(struct inode *inode,
                struct hfs_find_data *fd)
 {
        struct hfsplus_inode_info *hip = HFSPLUS_I(inode);
@@ -98,13 +98,13 @@ static void __hfsplus_ext_write_extent(struct inode *inode,
        res = hfs_brec_find(fd, hfs_find_rec_by_key);
        if (hip->extent_state & HFSPLUS_EXT_NEW) {
                if (res != -ENOENT)
-                        return;
+                        return res;
                hfs_brec_insert(fd, hip->cached_extents,
                                sizeof(hfsplus_extent_rec));
                hip->extent_state &= ~(HFSPLUS_EXT_DIRTY | HFSPLUS_EXT_NEW);
        } else {
                if (res)
-                        return;
+                        return res;
                hfs_bnode_write(fd->bnode, hip->cached_extents,
                                fd->entryoffset, fd->entrylength);
                hip->extent_state &= ~HFSPLUS_EXT_DIRTY;
@@ -117,11 +117,13 @@ static void __hfsplus_ext_write_extent(struct inode *inode,
         * to explicily mark the inode dirty, too.
         */
        set_bit(HFSPLUS_I_EXT_DIRTY, &hip->flags);
+        return 0;
 }
 static int hfsplus_ext_write_extent_locked(struct inode *inode)
 {
-        int res;
+        int res = 0;
        if (HFSPLUS_I(inode)->extent_state & HFSPLUS_EXT_DIRTY) {
                struct hfs_find_data fd;
@@ -129,10 +131,10 @@ static int hfsplus_ext_write_extent_locked(struct inode *inode)
                res = hfs_find_init(HFSPLUS_SB(inode->i_sb)->ext_tree, &fd);
                if (res)
                        return res;
-                __hfsplus_ext_write_extent(inode, &fd);
+                res = __hfsplus_ext_write_extent(inode, &fd);
                hfs_find_exit(&fd);
        }
-        return 0;
+        return res;
 }
 int hfsplus_ext_write_extent(struct inode *inode)
@@ -175,8 +177,11 @@ static inline int __hfsplus_ext_cache_extent(struct hfs_find_data *fd,
        WARN_ON(!mutex_is_locked(&hip->extents_lock));
-        if (hip->extent_state & HFSPLUS_EXT_DIRTY)
+        if (hip->extent_state & HFSPLUS_EXT_DIRTY) {
-                __hfsplus_ext_write_extent(inode, fd);
+                res = __hfsplus_ext_write_extent(inode, fd);
+                if (res)
+                        return res;
+        }
        res = __hfsplus_ext_read_extent(fd, hip->cached_extents, inode->i_ino,
                                        block, HFSPLUS_IS_RSRC(inode) ?
@@ -265,7 +270,7 @@ int hfsplus_get_block(struct inode *inode, sector_t iblock,
        mutex_unlock(&hip->extents_lock);
 done:
-        dprint(DBG_EXTENT, "get_block(%lu): %llu - %u\n",
+        hfs_dbg(EXTENT, "get_block(%lu): %llu - %u\n",
                inode->i_ino, (long long)iblock, dblock);
        mask = (1 << sbi->fs_shift) - 1;
@@ -288,11 +293,12 @@ static void hfsplus_dump_extent(struct hfsplus_extent *extent)
 {
        int i;
-        dprint(DBG_EXTENT, "   ");
+        hfs_dbg(EXTENT, "   ");
        for (i = 0; i < 8; i++)
-                dprint(DBG_EXTENT, " %u:%u", be32_to_cpu(extent[i].start_block),
+                hfs_dbg_cont(EXTENT, " %u:%u",
-                                 be32_to_cpu(extent[i].block_count));
+                             be32_to_cpu(extent[i].start_block),
-        dprint(DBG_EXTENT, "\n");
+                             be32_to_cpu(extent[i].block_count));
+        hfs_dbg_cont(EXTENT, "\n");
 }
 static int hfsplus_add_extent(struct hfsplus_extent *extent, u32 offset,
@@ -348,8 +354,8 @@ found:
                if (count <= block_nr) {
                        err = hfsplus_block_free(sb, start, count);
                        if (err) {
-                                printk(KERN_ERR "hfs: can't free extent\n");
+                                pr_err("can't free extent\n");
-                                dprint(DBG_EXTENT, " start: %u count: %u\n",
+                                hfs_dbg(EXTENT, " start: %u count: %u\n",
                                        start, count);
                        }
                        extent->block_count = 0;
@@ -359,8 +365,8 @@ found:
                        count -= block_nr;
                        err = hfsplus_block_free(sb, start + count, block_nr);
                        if (err) {
-                                printk(KERN_ERR "hfs: can't free extent\n");
+                                pr_err("can't free extent\n");
-                                dprint(DBG_EXTENT, " start: %u count: %u\n",
+                                hfs_dbg(EXTENT, " start: %u count: %u\n",
                                        start, count);
                        }
                        extent->block_count = cpu_to_be32(count);
@@ -432,7 +438,7 @@ int hfsplus_file_extend(struct inode *inode)
        if (sbi->alloc_file->i_size * 8 <
            sbi->total_blocks - sbi->free_blocks + 8) {
                /* extend alloc file */
-                printk(KERN_ERR "hfs: extend alloc file! "
+                pr_err("extend alloc file! "
                                "(%llu,%u,%u)\n",
                        sbi->alloc_file->i_size * 8,
                        sbi->total_blocks, sbi->free_blocks);
@@ -459,11 +465,11 @@ int hfsplus_file_extend(struct inode *inode)
                }
        }
-        dprint(DBG_EXTENT, "extend %lu: %u,%u\n", inode->i_ino, start, len);
+        hfs_dbg(EXTENT, "extend %lu: %u,%u\n", inode->i_ino, start, len);
        if (hip->alloc_blocks <= hip->first_blocks) {
                if (!hip->first_blocks) {
-                        dprint(DBG_EXTENT, "first extents\n");
+                        hfs_dbg(EXTENT, "first extents\n");
                        /* no extents yet */
                        hip->first_extents[0].start_block = cpu_to_be32(start);
                        hip->first_extents[0].block_count = cpu_to_be32(len);
@@ -500,7 +506,7 @@ out:
        return res;
 insert_extent:
-        dprint(DBG_EXTENT, "insert new extent\n");
+        hfs_dbg(EXTENT, "insert new extent\n");
        res = hfsplus_ext_write_extent_locked(inode);
        if (res)
                goto out;
@@ -525,15 +531,14 @@ void hfsplus_file_truncate(struct inode *inode)
        u32 alloc_cnt, blk_cnt, start;
        int res;
-        dprint(DBG_INODE, "truncate: %lu, %llu -> %llu\n",
+        hfs_dbg(INODE, "truncate: %lu, %llu -> %llu\n",
-                inode->i_ino, (long long)hip->phys_size,
+                inode->i_ino, (long long)hip->phys_size, inode->i_size);
-                inode->i_size);
        if (inode->i_size > hip->phys_size) {
                struct address_space *mapping = inode->i_mapping;
                struct page *page;
                void *fsdata;
-                u32 size = inode->i_size;
+                loff_t size = inode->i_size;
                res = pagecache_write_begin(NULL, mapping, size, 0,
                                                AOP_FLAG_UNINTERRUPTIBLE,
diff --git a/fs/hfsplus/hfsplus_fs.h b/fs/hfsplus/hfsplus_fs.h
index 05b11f36024c..60b0a3388b26 100644
--- a/fs/hfsplus/hfsplus_fs.h
+++ b/fs/hfsplus/hfsplus_fs.h
@@ -10,6 +10,12 @@
 #ifndef _LINUX_HFSPLUS_FS_H
 #define _LINUX_HFSPLUS_FS_H
+#ifdef pr_fmt
+#undef pr_fmt
+#endif
+#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
 #include <linux/fs.h>
 #include <linux/mutex.h>
 #include <linux/buffer_head.h>
@@ -32,9 +38,17 @@
 #endif
 #define DBG_MASK        (0)
-#define dprint(flg, fmt, args...) \
+#define hfs_dbg(flg, fmt, ...)                                  \
-        if (flg & DBG_MASK) \
+do {                                                            \
-                printk(fmt , ## args)
+        if (DBG_##flg & DBG_MASK)                               \
+                printk(KERN_DEBUG pr_fmt(fmt), ##__VA_ARGS__);  \
+} while (0)
+#define hfs_dbg_cont(flg, fmt, ...)                             \
+do {                                                            \
+        if (DBG_##flg & DBG_MASK)                               \
+                pr_cont(fmt, ##__VA_ARGS__);                    \
+} while (0)
 /* Runtime config options */
 #define HFSPLUS_DEF_CR_TYPE    0x3F3F3F3F  /* '????' */
diff --git a/fs/hfsplus/inode.c b/fs/hfsplus/inode.c
index 160ccc9cdb4b..7faaa964968e 100644
--- a/fs/hfsplus/inode.c
+++ b/fs/hfsplus/inode.c
@@ -357,7 +357,7 @@ int hfsplus_file_fsync(struct file *file, loff_t start, loff_t end,
                        if (!error)
                                error = error2;
                } else {
-                        printk(KERN_ERR "hfs: sync non-existent attributes tree\n");
+                        pr_err("sync non-existent attributes tree\n");
                }
        }
@@ -573,7 +573,7 @@ int hfsplus_cat_read_inode(struct inode *inode, struct hfs_find_data *fd)
                inode->i_ctime = hfsp_mt2ut(file->attribute_mod_date);
                HFSPLUS_I(inode)->create_date = file->create_date;
        } else {
-                printk(KERN_ERR "hfs: bad catalog entry used to create inode\n");
+                pr_err("bad catalog entry used to create inode\n");
                res = -EIO;
        }
        return res;
diff --git a/fs/hfsplus/options.c b/fs/hfsplus/options.c
index ed257c671615..968eab5bc1f5 100644
--- a/fs/hfsplus/options.c
+++ b/fs/hfsplus/options.c
@@ -113,67 +113,67 @@ int hfsplus_parse_options(char *input, struct hfsplus_sb_info *sbi)
                switch (token) {
                case opt_creator:
                        if (match_fourchar(&args[0], &sbi->creator)) {
-                                printk(KERN_ERR "hfs: creator requires a 4 character value\n");
+                                pr_err("creator requires a 4 character value\n");
                                return 0;
                        }
                        break;
                case opt_type:
                        if (match_fourchar(&args[0], &sbi->type)) {
-                                printk(KERN_ERR "hfs: type requires a 4 character value\n");
+                                pr_err("type requires a 4 character value\n");
                                return 0;
                        }
                        break;
                case opt_umask:
                        if (match_octal(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: umask requires a value\n");
+                                pr_err("umask requires a value\n");
                                return 0;
                        }
                        sbi->umask = (umode_t)tmp;
                        break;
                case opt_uid:
                        if (match_int(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: uid requires an argument\n");
+                                pr_err("uid requires an argument\n");
                                return 0;
                        }
                        sbi->uid = make_kuid(current_user_ns(), (uid_t)tmp);
                        if (!uid_valid(sbi->uid)) {
-                                printk(KERN_ERR "hfs: invalid uid specified\n");
+                                pr_err("invalid uid specified\n");
                                return 0;
                        }
                        break;
                case opt_gid:
                        if (match_int(&args[0], &tmp)) {
-                                printk(KERN_ERR "hfs: gid requires an argument\n");
+                                pr_err("gid requires an argument\n");
                                return 0;
                        }
                        sbi->gid = make_kgid(current_user_ns(), (gid_t)tmp);
                        if (!gid_valid(sbi->gid)) {
-                                printk(KERN_ERR "hfs: invalid gid specified\n");
+                                pr_err("invalid gid specified\n");
                                return 0;
                        }
                        break;
                case opt_part:
                        if (match_int(&args[0], &sbi->part)) {
-                                printk(KERN_ERR "hfs: part requires an argument\n");
+                                pr_err("part requires an argument\n");
                                return 0;
                        }
                        break;
                case opt_session:
                        if (match_int(&args[0], &sbi->session)) {
-                                printk(KERN_ERR "hfs: session requires an argument\n");
+                                pr_err("session requires an argument\n");
                                return 0;
                        }
                        break;
                case opt_nls:
                        if (sbi->nls) {
-                                printk(KERN_ERR "hfs: unable to change nls mapping\n");
+                                pr_err("unable to change nls mapping\n");
                                return 0;
                        }
                        p = match_strdup(&args[0]);
                        if (p)
                                sbi->nls = load_nls(p);
                        if (!sbi->nls) {
-                                printk(KERN_ERR "hfs: unable to load "
+                                pr_err("unable to load "
                                                "nls mapping \"%s\"\n",
                                        p);
                                kfree(p);
diff --git a/fs/hfsplus/super.c b/fs/hfsplus/super.c
index 7b87284e46dc..4c4d142cf890 100644
--- a/fs/hfsplus/super.c
+++ b/fs/hfsplus/super.c
@@ -132,7 +132,7 @@ static int hfsplus_system_write_inode(struct inode *inode)
        if (tree) {
                int err = hfs_btree_write(tree);
                if (err) {
-                        printk(KERN_ERR "hfs: b-tree write err: %d, ino %lu\n",
+                        pr_err("b-tree write err: %d, ino %lu\n",
                                        err, inode->i_ino);
                        return err;
                }
@@ -145,7 +145,7 @@ static int hfsplus_write_inode(struct inode *inode,
 {
        int err;
-        dprint(DBG_INODE, "hfsplus_write_inode: %lu\n", inode->i_ino);
+        hfs_dbg(INODE, "hfsplus_write_inode: %lu\n", inode->i_ino);
        err = hfsplus_ext_write_extent(inode);
        if (err)
@@ -160,7 +160,7 @@ static int hfsplus_write_inode(struct inode *inode,
 static void hfsplus_evict_inode(struct inode *inode)
 {
-        dprint(DBG_INODE, "hfsplus_evict_inode: %lu\n", inode->i_ino);
+        hfs_dbg(INODE, "hfsplus_evict_inode: %lu\n", inode->i_ino);
        truncate_inode_pages(&inode->i_data, 0);
        clear_inode(inode);
        if (HFSPLUS_IS_RSRC(inode)) {
@@ -179,7 +179,7 @@ static int hfsplus_sync_fs(struct super_block *sb, int wait)
        if (!wait)
                return 0;
-        dprint(DBG_SUPER, "hfsplus_sync_fs\n");
+        hfs_dbg(SUPER, "hfsplus_sync_fs\n");
        /*
         * Explicitly write out the special metadata inodes.
@@ -251,7 +251,7 @@ static void delayed_sync_fs(struct work_struct *work)
        err = hfsplus_sync_fs(sbi->alloc_file->i_sb, 1);
        if (err)
-                printk(KERN_ERR "hfs: delayed sync fs err %d\n", err);
+                pr_err("delayed sync fs err %d\n", err);
 }
 void hfsplus_mark_mdb_dirty(struct super_block *sb)
@@ -275,7 +275,7 @@ static void hfsplus_put_super(struct super_block *sb)
 {
        struct hfsplus_sb_info *sbi = HFSPLUS_SB(sb);
-        dprint(DBG_SUPER, "hfsplus_put_super\n");
+        hfs_dbg(SUPER, "hfsplus_put_super\n");
        cancel_delayed_work_sync(&sbi->sync_work);
@@ -333,25 +333,19 @@ static int hfsplus_remount(struct super_block *sb, int *flags, char *data)
                        return -EINVAL;
                if (!(vhdr->attributes & cpu_to_be32(HFSPLUS_VOL_UNMNT))) {
-                        printk(KERN_WARNING "hfs: filesystem was "
+                        pr_warn("filesystem was not cleanly unmounted, running fsck.hfsplus is recommended.  leaving read-only.\n");
-                                        "not cleanly unmounted, "
-                                        "running fsck.hfsplus is recommended.  "
-                                        "leaving read-only.\n");
                        sb->s_flags |= MS_RDONLY;
                        *flags |= MS_RDONLY;
                } else if (force) {
                        /* nothing */
                } else if (vhdr->attributes &
                                cpu_to_be32(HFSPLUS_VOL_SOFTLOCK)) {
-                        printk(KERN_WARNING "hfs: filesystem is marked locked, "
+                        pr_warn("filesystem is marked locked, leaving read-only.\n");
-                                        "leaving read-only.\n");
                        sb->s_flags |= MS_RDONLY;
                        *flags |= MS_RDONLY;
                } else if (vhdr->attributes &
                                cpu_to_be32(HFSPLUS_VOL_JOURNALED)) {
-                        printk(KERN_WARNING "hfs: filesystem is "
+                        pr_warn("filesystem is marked journaled, leaving read-only.\n");
-                                        "marked journaled, "
-                                        "leaving read-only.\n");
                        sb->s_flags |= MS_RDONLY;
                        *flags |= MS_RDONLY;
                }
@@ -397,7 +391,7 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        err = -EINVAL;
        if (!hfsplus_parse_options(data, sbi)) {
-                printk(KERN_ERR "hfs: unable to parse mount options\n");
+                pr_err("unable to parse mount options\n");
                goto out_unload_nls;
        }
@@ -405,14 +399,14 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        nls = sbi->nls;
        sbi->nls = load_nls("utf8");
        if (!sbi->nls) {
-                printk(KERN_ERR "hfs: unable to load nls for utf8\n");
+                pr_err("unable to load nls for utf8\n");
                goto out_unload_nls;
        }
        /* Grab the volume header */
        if (hfsplus_read_wrapper(sb)) {
                if (!silent)
-                        printk(KERN_WARNING "hfs: unable to find HFS+ superblock\n");
+                        pr_warn("unable to find HFS+ superblock\n");
                goto out_unload_nls;
        }
        vhdr = sbi->s_vhdr;
@@ -421,7 +415,7 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        sb->s_magic = HFSPLUS_VOLHEAD_SIG;
        if (be16_to_cpu(vhdr->version) < HFSPLUS_MIN_VERSION ||
            be16_to_cpu(vhdr->version) > HFSPLUS_CURRENT_VERSION) {
-                printk(KERN_ERR "hfs: wrong filesystem version\n");
+                pr_err("wrong filesystem version\n");
                goto out_free_vhdr;
        }
        sbi->total_blocks = be32_to_cpu(vhdr->total_blocks);
@@ -445,7 +439,7 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        if ((last_fs_block > (sector_t)(~0ULL) >> (sbi->alloc_blksz_shift - 9)) ||
            (last_fs_page > (pgoff_t)(~0ULL))) {
-                printk(KERN_ERR "hfs: filesystem size too large.\n");
+                pr_err("filesystem size too large\n");
                goto out_free_vhdr;
        }
@@ -454,22 +448,16 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        sb->s_maxbytes = MAX_LFS_FILESIZE;
        if (!(vhdr->attributes & cpu_to_be32(HFSPLUS_VOL_UNMNT))) {
-                printk(KERN_WARNING "hfs: Filesystem was "
+                pr_warn("Filesystem was not cleanly unmounted, running fsck.hfsplus is recommended.  mounting read-only.\n");
-                                "not cleanly unmounted, "
-                                "running fsck.hfsplus is recommended.  "
-                                "mounting read-only.\n");
                sb->s_flags |= MS_RDONLY;
        } else if (test_and_clear_bit(HFSPLUS_SB_FORCE, &sbi->flags)) {
                /* nothing */
        } else if (vhdr->attributes & cpu_to_be32(HFSPLUS_VOL_SOFTLOCK)) {
-                printk(KERN_WARNING "hfs: Filesystem is marked locked, mounting read-only.\n");
+                pr_warn("Filesystem is marked locked, mounting read-only.\n");
                sb->s_flags |= MS_RDONLY;
        } else if ((vhdr->attributes & cpu_to_be32(HFSPLUS_VOL_JOURNALED)) &&
                        !(sb->s_flags & MS_RDONLY)) {
-                printk(KERN_WARNING "hfs: write access to "
+                pr_warn("write access to a journaled filesystem is not supported, use the force option at your own risk, mounting read-only.\n");
-                                "a journaled filesystem is not supported, "
-                                "use the force option at your own risk, "
-                                "mounting read-only.\n");
                sb->s_flags |= MS_RDONLY;
        }
@@ -478,18 +466,18 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        /* Load metadata objects (B*Trees) */
        sbi->ext_tree = hfs_btree_open(sb, HFSPLUS_EXT_CNID);
        if (!sbi->ext_tree) {
-                printk(KERN_ERR "hfs: failed to load extents file\n");
+                pr_err("failed to load extents file\n");
                goto out_free_vhdr;
        }
        sbi->cat_tree = hfs_btree_open(sb, HFSPLUS_CAT_CNID);
        if (!sbi->cat_tree) {
-                printk(KERN_ERR "hfs: failed to load catalog file\n");
+                pr_err("failed to load catalog file\n");
                goto out_close_ext_tree;
        }
        if (vhdr->attr_file.total_blocks != 0) {
                sbi->attr_tree = hfs_btree_open(sb, HFSPLUS_ATTR_CNID);
                if (!sbi->attr_tree) {
-                        printk(KERN_ERR "hfs: failed to load attributes file\n");
+                        pr_err("failed to load attributes file\n");
                        goto out_close_cat_tree;
                }
        }
@@ -497,7 +485,7 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        inode = hfsplus_iget(sb, HFSPLUS_ALLOC_CNID);
        if (IS_ERR(inode)) {
-                printk(KERN_ERR "hfs: failed to load allocation file\n");
+                pr_err("failed to load allocation file\n");
                err = PTR_ERR(inode);
                goto out_close_attr_tree;
        }
@@ -506,7 +494,7 @@ static int hfsplus_fill_super(struct super_block *sb, void *data, int silent)
        /* Load the root directory */
        root = hfsplus_iget(sb, HFSPLUS_ROOT_CNID);
        if (IS_ERR(root)) {
-                printk(KERN_ERR "hfs: failed to load root directory\n");
+                pr_err("failed to load root directory\n");
                err = PTR_ERR(root);
                goto out_put_alloc_file;
        }
diff --git a/fs/hfsplus/wrapper.c b/fs/hfsplus/wrapper.c
index 90effcccca9a..b51a6079108d 100644
--- a/fs/hfsplus/wrapper.c
+++ b/fs/hfsplus/wrapper.c
@@ -156,7 +156,7 @@ static int hfsplus_get_last_session(struct super_block *sb,
                        *start = (sector_t)te.cdte_addr.lba << 2;
                        return 0;
                }
-                printk(KERN_ERR "hfs: invalid session number or type of track\n");
+                pr_err("invalid session number or type of track\n");
                return -EINVAL;
        }
        ms_info.addr_format = CDROM_LBA;
@@ -234,8 +234,7 @@ reread:
        error = -EINVAL;
        if (sbi->s_backup_vhdr->signature != sbi->s_vhdr->signature) {
-                printk(KERN_WARNING
+                pr_warn("invalid secondary volume header\n");
-                        "hfs: invalid secondary volume header\n");
                goto out_free_backup_vhdr;
        }
@@ -259,8 +258,7 @@ reread:
                blocksize >>= 1;
        if (sb_set_blocksize(sb, blocksize) != blocksize) {
-                printk(KERN_ERR "hfs: unable to set blocksize to %u!\n",
+                pr_err("unable to set blocksize to %u!\n", blocksize);
-                        blocksize);
                goto out_free_backup_vhdr;
        }
diff --git a/fs/hfsplus/xattr.c b/fs/hfsplus/xattr.c
index e8a4b0815c61..f66346155df5 100644
--- a/fs/hfsplus/xattr.c
+++ b/fs/hfsplus/xattr.c
@@ -107,19 +107,19 @@ int __hfsplus_setxattr(struct inode *inode, const char *name,
        err = hfs_find_init(HFSPLUS_SB(inode->i_sb)->cat_tree, &cat_fd);
        if (err) {
-                printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                pr_err("can't init xattr find struct\n");
                return err;
        }
        err = hfsplus_find_cat(inode->i_sb, inode->i_ino, &cat_fd);
        if (err) {
-                printk(KERN_ERR "hfs: catalog searching failed\n");
+                pr_err("catalog searching failed\n");
                goto end_setxattr;
        }
        if (!strcmp_xattr_finder_info(name)) {
                if (flags & XATTR_CREATE) {
-                        printk(KERN_ERR "hfs: xattr exists yet\n");
+                        pr_err("xattr exists yet\n");
                        err = -EOPNOTSUPP;
                        goto end_setxattr;
                }
@@ -165,7 +165,7 @@ int __hfsplus_setxattr(struct inode *inode, const char *name,
        if (hfsplus_attr_exists(inode, name)) {
                if (flags & XATTR_CREATE) {
-                        printk(KERN_ERR "hfs: xattr exists yet\n");
+                        pr_err("xattr exists yet\n");
                        err = -EOPNOTSUPP;
                        goto end_setxattr;
                }
@@ -177,7 +177,7 @@ int __hfsplus_setxattr(struct inode *inode, const char *name,
                        goto end_setxattr;
        } else {
                if (flags & XATTR_REPLACE) {
-                        printk(KERN_ERR "hfs: cannot replace xattr\n");
+                        pr_err("cannot replace xattr\n");
                        err = -EOPNOTSUPP;
                        goto end_setxattr;
                }
@@ -210,7 +210,7 @@ int __hfsplus_setxattr(struct inode *inode, const char *name,
                                    cat_entry_flags);
                hfsplus_mark_inode_dirty(inode, HFSPLUS_I_CAT_DIRTY);
        } else {
-                printk(KERN_ERR "hfs: invalid catalog entry type\n");
+                pr_err("invalid catalog entry type\n");
                err = -EIO;
                goto end_setxattr;
        }
@@ -269,7 +269,7 @@ static ssize_t hfsplus_getxattr_finder_info(struct dentry *dentry,
        if (size >= record_len) {
                res = hfs_find_init(HFSPLUS_SB(inode->i_sb)->cat_tree, &fd);
                if (res) {
-                        printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                        pr_err("can't init xattr find struct\n");
                        return res;
                }
                res = hfsplus_find_cat(inode->i_sb, inode->i_ino, &fd);
@@ -340,13 +340,13 @@ ssize_t hfsplus_getxattr(struct dentry *dentry, const char *name,
        entry = hfsplus_alloc_attr_entry();
        if (!entry) {
-                printk(KERN_ERR "hfs: can't allocate xattr entry\n");
+                pr_err("can't allocate xattr entry\n");
                return -ENOMEM;
        }
        res = hfs_find_init(HFSPLUS_SB(inode->i_sb)->attr_tree, &fd);
        if (res) {
-                printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                pr_err("can't init xattr find struct\n");
                goto failed_getxattr_init;
        }
@@ -355,7 +355,7 @@ ssize_t hfsplus_getxattr(struct dentry *dentry, const char *name,
                if (res == -ENOENT)
                        res = -ENODATA;
                else
-                        printk(KERN_ERR "hfs: xattr searching failed\n");
+                        pr_err("xattr searching failed\n");
                goto out;
        }
@@ -368,17 +368,17 @@ ssize_t hfsplus_getxattr(struct dentry *dentry, const char *name,
                                offsetof(struct hfsplus_attr_inline_data,
                                length));
                if (record_length > HFSPLUS_MAX_INLINE_DATA_SIZE) {
-                        printk(KERN_ERR "hfs: invalid xattr record size\n");
+                        pr_err("invalid xattr record size\n");
                        res = -EIO;
                        goto out;
                }
        } else if (record_type == HFSPLUS_ATTR_FORK_DATA ||
                        record_type == HFSPLUS_ATTR_EXTENTS) {
-                printk(KERN_ERR "hfs: only inline data xattr are supported\n");
+                pr_err("only inline data xattr are supported\n");
                res = -EOPNOTSUPP;
                goto out;
        } else {
-                printk(KERN_ERR "hfs: invalid xattr record\n");
+                pr_err("invalid xattr record\n");
                res = -EIO;
                goto out;
        }
@@ -427,7 +427,7 @@ static ssize_t hfsplus_listxattr_finder_info(struct dentry *dentry,
        res = hfs_find_init(HFSPLUS_SB(inode->i_sb)->cat_tree, &fd);
        if (res) {
-                printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                pr_err("can't init xattr find struct\n");
                return res;
        }
@@ -506,7 +506,7 @@ ssize_t hfsplus_listxattr(struct dentry *dentry, char *buffer, size_t size)
        err = hfs_find_init(HFSPLUS_SB(inode->i_sb)->attr_tree, &fd);
        if (err) {
-                printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                pr_err("can't init xattr find struct\n");
                return err;
        }
@@ -525,8 +525,7 @@ ssize_t hfsplus_listxattr(struct dentry *dentry, char *buffer, size_t size)
        for (;;) {
                key_len = hfs_bnode_read_u16(fd.bnode, fd.keyoffset);
                if (key_len == 0 || key_len > fd.tree->max_key_len) {
-                        printk(KERN_ERR "hfs: invalid xattr key length: %d\n",
+                        pr_err("invalid xattr key length: %d\n", key_len);
-                                                        key_len);
                        res = -EIO;
                        goto end_listxattr;
                }
@@ -541,7 +540,7 @@ ssize_t hfsplus_listxattr(struct dentry *dentry, char *buffer, size_t size)
                if (hfsplus_uni2asc(inode->i_sb,
                        (const struct hfsplus_unistr *)&fd.key->attr.key_name,
                                        strbuf, &xattr_name_len)) {
-                        printk(KERN_ERR "hfs: unicode conversion failed\n");
+                        pr_err("unicode conversion failed\n");
                        res = -EIO;
                        goto end_listxattr;
                }
@@ -598,13 +597,13 @@ int hfsplus_removexattr(struct dentry *dentry, const char *name)
        err = hfs_find_init(HFSPLUS_SB(inode->i_sb)->cat_tree, &cat_fd);
        if (err) {
-                printk(KERN_ERR "hfs: can't init xattr find struct\n");
+                pr_err("can't init xattr find struct\n");
                return err;
        }
        err = hfsplus_find_cat(inode->i_sb, inode->i_ino, &cat_fd);
        if (err) {
-                printk(KERN_ERR "hfs: catalog searching failed\n");
+                pr_err("catalog searching failed\n");
                goto end_removexattr;
        }
@@ -643,7 +642,7 @@ int hfsplus_removexattr(struct dentry *dentry, const char *name)
                                flags);
                hfsplus_mark_inode_dirty(inode, HFSPLUS_I_CAT_DIRTY);
        } else {
-                printk(KERN_ERR "hfs: invalid catalog entry type\n");
+                pr_err("invalid catalog entry type\n");
                err = -EIO;
                goto end_removexattr;
        }
diff --git a/fs/hugetlbfs/inode.c b/fs/hugetlbfs/inode.c
index 84e3d856e91d..523464e62849 100644
--- a/fs/hugetlbfs/inode.c
+++ b/fs/hugetlbfs/inode.c
@@ -110,7 +110,7 @@ static int hugetlbfs_file_mmap(struct file *file, struct vm_area_struct *vma)
         * way when do_mmap_pgoff unwinds (may be important on powerpc
         * and ia64).
         */
-        vma->vm_flags |= VM_HUGETLB | VM_DONTEXPAND | VM_DONTDUMP;
+        vma->vm_flags |= VM_HUGETLB | VM_DONTEXPAND;
        vma->vm_ops = &hugetlb_vm_ops;
        if (vma->vm_pgoff & (~huge_page_mask(h) >> PAGE_SHIFT))
diff --git a/fs/inode.c b/fs/inode.c
index f5f7c06c36fb..a898b3d43ccf 100644
--- a/fs/inode.c
+++ b/fs/inode.c
@@ -725,7 +725,7 @@ void prune_icache_sb(struct super_block *sb, int nr_to_scan)
                 * inode to the back of the list so we don't spin on it.
                 */
                if (!spin_trylock(&inode->i_lock)) {
-                        list_move_tail(&inode->i_lru, &sb->s_inode_lru);
+                        list_move(&inode->i_lru, &sb->s_inode_lru);
                        continue;
                }
diff --git a/fs/jbd/commit.c b/fs/jbd/commit.c
index 86b39b167c23..11bb11f48b3a 100644
--- a/fs/jbd/commit.c
+++ b/fs/jbd/commit.c
@@ -162,8 +162,17 @@ static void journal_do_submit_data(struct buffer_head **wbuf, int bufs,
        for (i = 0; i < bufs; i++) {
                wbuf[i]->b_end_io = end_buffer_write_sync;
-                /* We use-up our safety reference in submit_bh() */
+                /*
-                submit_bh(write_op, wbuf[i]);
+                 * Here we write back pagecache data that may be mmapped. Since
+                 * we cannot afford to clean the page and set PageWriteback
+                 * here due to lock ordering (page lock ranks above transaction
+                 * start), the data can change while IO is in flight. Tell the
+                 * block layer it should bounce the bio pages if stable data
+                 * during write is required.
+                 *
+                 * We use up our safety reference in submit_bh().
+                 */
+                _submit_bh(write_op, wbuf[i], 1 << BIO_SNAP_STABLE);
        }
 }
@@ -667,7 +676,17 @@ start_journal_io:
                                clear_buffer_dirty(bh);
                                set_buffer_uptodate(bh);
                                bh->b_end_io = journal_end_buffer_io_sync;
-                                submit_bh(write_op, bh);
+                                /*
+                                 * In data=journal mode, here we can end up
+                                 * writing pagecache data that might be
+                                 * mmapped. Since we can't afford to clean the
+                                 * page and set PageWriteback (see the comment
+                                 * near the other use of _submit_bh()), the
+                                 * data can change while the write is in
+                                 * flight.  Tell the block layer to bounce the
+                                 * bio pages if stable pages are required.
+                                 */
+                                _submit_bh(write_op, bh, 1 << BIO_SNAP_STABLE);
                        }
                        cond_resched();
diff --git a/fs/jbd/journal.c b/fs/jbd/journal.c
index 81cc7eaff863..865c4308acb6 100644
--- a/fs/jbd/journal.c
+++ b/fs/jbd/journal.c
@@ -310,8 +310,6 @@ int journal_write_metadata_buffer(transaction_t *transaction,
        new_bh = alloc_buffer_head(GFP_NOFS|__GFP_NOFAIL);
        /* keep subsequent assertions sane */
-        new_bh->b_state = 0;
-        init_buffer(new_bh, NULL, NULL);
        atomic_set(&new_bh->b_count, 1);
        new_jh = journal_add_journal_head(new_bh);      /* This sleeps */
diff --git a/fs/jbd2/journal.c b/fs/jbd2/journal.c
index 886ec2faa9b4..f6c5ba027f4f 100644
--- a/fs/jbd2/journal.c
+++ b/fs/jbd2/journal.c
@@ -367,8 +367,6 @@ retry_alloc:
        }
        /* keep subsequent assertions sane */
-        new_bh->b_state = 0;
-        init_buffer(new_bh, NULL, NULL);
        atomic_set(&new_bh->b_count, 1);
        new_jh = jbd2_journal_add_journal_head(new_bh); /* This sleeps */
diff --git a/fs/lockd/clntlock.c b/fs/lockd/clntlock.c
index 0796c45d0d4d..01bfe7662751 100644
--- a/fs/lockd/clntlock.c
+++ b/fs/lockd/clntlock.c
@@ -144,6 +144,9 @@ int nlmclnt_block(struct nlm_wait *block, struct nlm_rqst *req, long timeout)
                        timeout);
        if (ret < 0)
                return -ERESTARTSYS;
+        /* Reset the lock status after a server reboot so we resend */
+        if (block->b_status == nlm_lck_denied_grace_period)
+                block->b_status = nlm_lck_blocked;
        req->a_res.status = block->b_status;
        return 0;
 }
diff --git a/fs/lockd/clntproc.c b/fs/lockd/clntproc.c
index 7e529c3c45c0..9760ecb9b60f 100644
--- a/fs/lockd/clntproc.c
+++ b/fs/lockd/clntproc.c
@@ -550,9 +550,6 @@ again:
                status = nlmclnt_block(block, req, NLMCLNT_POLL_TIMEOUT);
                if (status < 0)
                        break;
-                /* Resend the blocking lock request after a server reboot */
-                if (resp->status ==  nlm_lck_denied_grace_period)
-                        continue;
                if (resp->status != nlm_lck_blocked)
                        break;
        }
diff --git a/fs/namespace.c b/fs/namespace.c
index d581e45c0a9f..341d3f564082 100644
--- a/fs/namespace.c
+++ b/fs/namespace.c
@@ -1690,7 +1690,7 @@ static int do_loopback(struct path *path, const char *old_name,
        if (IS_ERR(mnt)) {
                err = PTR_ERR(mnt);
-                goto out;
+                goto out2;
        }
        err = graft_tree(mnt, path);
diff --git a/fs/nfs/callback.c b/fs/nfs/callback.c
index 5088b57b078a..cff089a412c7 100644
--- a/fs/nfs/callback.c
+++ b/fs/nfs/callback.c
@@ -125,6 +125,9 @@ nfs41_callback_svc(void *vrqstp)
        set_freezable();
        while (!kthread_should_stop()) {
+                if (try_to_freeze())
+                        continue;
                prepare_to_wait(&serv->sv_cb_waitq, &wq, TASK_INTERRUPTIBLE);
                spin_lock_bh(&serv->sv_cb_lock);
                if (!list_empty(&serv->sv_cb_list)) {
diff --git a/fs/nfs/callback_proc.c b/fs/nfs/callback_proc.c
index 2960512792c2..a13d26ede254 100644
--- a/fs/nfs/callback_proc.c
+++ b/fs/nfs/callback_proc.c
@@ -500,7 +500,7 @@ __be32 nfs4_callback_recallany(struct cb_recallanyargs *args, void *dummy,
                     &args->craa_type_mask))
                pnfs_recall_all_layouts(cps->clp);
        if (flags)
-                nfs_expire_all_delegation_types(cps->clp, flags);
+                nfs_expire_unused_delegation_types(cps->clp, flags);
 out:
        dprintk("%s: exit with status = %d\n", __func__, ntohl(status));
        return status;
diff --git a/fs/nfs/client.c b/fs/nfs/client.c
index 84d8eae203a7..c513b0cc835f 100644
--- a/fs/nfs/client.c
+++ b/fs/nfs/client.c
@@ -593,6 +593,8 @@ int nfs_create_rpc_client(struct nfs_client *clp,
                args.flags |= RPC_CLNT_CREATE_DISCRTRY;
        if (test_bit(NFS_CS_NORESVPORT, &clp->cl_flags))
                args.flags |= RPC_CLNT_CREATE_NONPRIVPORT;
+        if (test_bit(NFS_CS_INFINITE_SLOTS, &clp->cl_flags))
+                args.flags |= RPC_CLNT_CREATE_INFINITE_SLOTS;
        if (!IS_ERR(clp->cl_rpcclient))
                return 0;
diff --git a/fs/nfs/delegation.c b/fs/nfs/delegation.c
index 6390a4b5fee7..57db3244f4d9 100644
--- a/fs/nfs/delegation.c
+++ b/fs/nfs/delegation.c
@@ -64,17 +64,15 @@ int nfs4_have_delegation(struct inode *inode, fmode_t flags)
        return ret;
 }
-static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_state *state)
+static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
 {
        struct inode *inode = state->inode;
        struct file_lock *fl;
        int status = 0;
        if (inode->i_flock == NULL)
-                return 0;
-        if (inode->i_flock == NULL)
                goto out;
        /* Protect inode->i_flock using the file locks lock */
        lock_flocks();
        for (fl = inode->i_flock; fl != NULL; fl = fl->fl_next) {
@@ -83,7 +81,7 @@ static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_
                if (nfs_file_open_context(fl->fl_file) != ctx)
                        continue;
                unlock_flocks();
-                status = nfs4_lock_delegation_recall(state, fl);
+                status = nfs4_lock_delegation_recall(fl, state, stateid);
                if (status < 0)
                        goto out;
                lock_flocks();
@@ -120,7 +118,7 @@ again:
                seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
                err = nfs4_open_delegation_recall(ctx, state, stateid);
                if (!err)
-                        err = nfs_delegation_claim_locks(ctx, state);
+                        err = nfs_delegation_claim_locks(ctx, state, stateid);
                if (!err && read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
                        err = -EAGAIN;
                mutex_unlock(&sp->so_delegreturn_mutex);
@@ -389,6 +387,24 @@ out:
        return err;
 }
+static bool nfs_delegation_need_return(struct nfs_delegation *delegation)
+{       /*
+         * Consume the pending-return flags on @delegation and report whether
+         * the delegation should be returned.  Both NFS_DELEGATION_RETURN and
+         * NFS_DELEGATION_RETURN_IF_CLOSED are tested and cleared on every
+         * call, whatever the result.
+         */
+        bool ret = false;
+        if (test_and_clear_bit(NFS_DELEGATION_RETURN, &delegation->flags))
+                ret = true;     /* explicit request: return unconditionally */
+        if (test_and_clear_bit(NFS_DELEGATION_RETURN_IF_CLOSED, &delegation->flags) && !ret) {
+                struct inode *inode;
+                spin_lock(&delegation->lock);   /* held while delegation->inode is read and checked */
+                inode = delegation->inode;
+                if (inode && list_empty(&NFS_I(inode)->open_files))
+                        ret = true;     /* conditional request and the inode has no open files */
+                spin_unlock(&delegation->lock);
+        }
+        return ret;
+}
 /**
 * nfs_client_return_marked_delegations - return previously marked delegations
 * @clp: nfs_client to process
@@ -411,8 +427,7 @@ restart:
        list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) {
                list_for_each_entry_rcu(delegation, &server->delegations,
                                                                super_list) {
-                        if (!test_and_clear_bit(NFS_DELEGATION_RETURN,
+                        if (!nfs_delegation_need_return(delegation))
-                                                        &delegation->flags))
                                continue;
                        inode = nfs_delegation_grab_inode(delegation);
                        if (inode == NULL)
@@ -471,6 +486,13 @@ int nfs4_inode_return_delegation(struct inode *inode)
        return err;
 }
+static void nfs_mark_return_if_closed_delegation(struct nfs_server *server,
+                struct nfs_delegation *delegation)
+{       /*
+         * Set NFS_DELEGATION_RETURN_IF_CLOSED on @delegation and set
+         * NFS4CLNT_DELEGRETURN in the state of @server's nfs_client.
+         */
+        set_bit(NFS_DELEGATION_RETURN_IF_CLOSED, &delegation->flags);
+        set_bit(NFS4CLNT_DELEGRETURN, &server->nfs_client->cl_state);
+}
 static void nfs_mark_return_delegation(struct nfs_server *server,
                struct nfs_delegation *delegation)
 {
@@ -478,6 +500,45 @@ static void nfs_mark_return_delegation(struct nfs_server *server,
        set_bit(NFS4CLNT_DELEGRETURN, &server->nfs_client->cl_state);
 }
+static bool nfs_server_mark_return_all_delegations(struct nfs_server *server)
+{       /*
+         * Mark every delegation on @server's delegations list for return.
+         * Returns true if at least one delegation was marked, false if the
+         * list was empty.  The list is walked with list_for_each_entry_rcu();
+         * NOTE(review): callers are presumably expected to hold
+         * rcu_read_lock() -- confirm.
+         */
+        struct nfs_delegation *delegation;
+        bool ret = false;
+        list_for_each_entry_rcu(delegation, &server->delegations, super_list) {
+                nfs_mark_return_delegation(server, delegation);
+                ret = true;
+        }
+        return ret;
+}
+static void nfs_client_mark_return_all_delegations(struct nfs_client *clp)
+{       /*
+         * Mark the delegations of every server on @clp's cl_superblocks list
+         * for return.  The whole walk runs inside rcu_read_lock().
+         */
+        struct nfs_server *server;
+        rcu_read_lock();
+        list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link)
+                nfs_server_mark_return_all_delegations(server); /* result unused here */
+        rcu_read_unlock();
+}
+static void nfs_delegation_run_state_manager(struct nfs_client *clp)
+{       /* Schedule the state manager only when NFS4CLNT_DELEGRETURN is set on @clp. */
+        if (test_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state))
+                nfs4_schedule_state_manager(clp);
+}
+/**
+ * nfs_expire_all_delegations - mark all of a client's delegations for return
+ * @clp: client to process
+ *
+ * Marks the delegations of every server attached to @clp for return, then
+ * schedules the state manager if NFS4CLNT_DELEGRETURN is set on @clp.
+ */
+void nfs_expire_all_delegations(struct nfs_client *clp)
+{
+        nfs_client_mark_return_all_delegations(clp);
+        nfs_delegation_run_state_manager(clp);
+}
 /**
 * nfs_super_return_all_delegations - return delegations for one superblock
 * @sb: sb to process
@@ -486,24 +547,22 @@ static void nfs_mark_return_delegation(struct nfs_server *server,
 void nfs_server_return_all_delegations(struct nfs_server *server)
 {
        struct nfs_client *clp = server->nfs_client;
-        struct nfs_delegation *delegation;
+        bool need_wait;
        if (clp == NULL)
                return;
        rcu_read_lock();
-        list_for_each_entry_rcu(delegation, &server->delegations, super_list) {
+        need_wait = nfs_server_mark_return_all_delegations(server);
-                spin_lock(&delegation->lock);
-                set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
-                spin_unlock(&delegation->lock);
-        }
        rcu_read_unlock();
-        if (nfs_client_return_marked_delegations(clp) != 0)
+        if (need_wait) {
                nfs4_schedule_state_manager(clp);
+                nfs4_wait_clnt_recover(clp);
+        }
 }
-static void nfs_mark_return_all_delegation_types(struct nfs_server *server,
+static void nfs_mark_return_unused_delegation_types(struct nfs_server *server,
                                                 fmode_t flags)
 {
        struct nfs_delegation *delegation;
@@ -512,27 +571,21 @@ static void nfs_mark_return_all_delegation_types(struct nfs_server *server,
                if ((delegation->type == (FMODE_READ|FMODE_WRITE)) && !(flags & FMODE_WRITE))
                        continue;
                if (delegation->type & flags)
-                        nfs_mark_return_delegation(server, delegation);
+                        nfs_mark_return_if_closed_delegation(server, delegation);
        }
 }
-static void nfs_client_mark_return_all_delegation_types(struct nfs_client *clp,
+static void nfs_client_mark_return_unused_delegation_types(struct nfs_client *clp,
                                                        fmode_t flags)
 {
        struct nfs_server *server;
        rcu_read_lock();
        list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link)
-                nfs_mark_return_all_delegation_types(server, flags);
+                nfs_mark_return_unused_delegation_types(server, flags); /* @flags passed through unchanged */
        rcu_read_unlock();
 }
-static void nfs_delegation_run_state_manager(struct nfs_client *clp)
-{
-        if (test_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state))
-                nfs4_schedule_state_manager(clp);
-}
 void nfs_remove_bad_delegation(struct inode *inode)
 {
        struct nfs_delegation *delegation;
@@ -546,27 +599,17 @@ void nfs_remove_bad_delegation(struct inode *inode)
 EXPORT_SYMBOL_GPL(nfs_remove_bad_delegation);
 /**
- * nfs_expire_all_delegation_types
+ * nfs_expire_unused_delegation_types - mark delegations return-if-closed
 * @clp: client to process
 * @flags: delegation types to expire
 *
 */
-void nfs_expire_all_delegation_types(struct nfs_client *clp, fmode_t flags)
+void nfs_expire_unused_delegation_types(struct nfs_client *clp, fmode_t flags)
 {
-        nfs_client_mark_return_all_delegation_types(clp, flags);
+        nfs_client_mark_return_unused_delegation_types(clp, flags); /* per-server marking pass */
        nfs_delegation_run_state_manager(clp);
 }
-/**
- * nfs_expire_all_delegations
- * @clp: client to process
- *
- */
-void nfs_expire_all_delegations(struct nfs_client *clp)
-{
-        nfs_expire_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
-}
 static void nfs_mark_return_unreferenced_delegations(struct nfs_server *server)
 {
        struct nfs_delegation *delegation;
@@ -574,7 +617,7 @@ static void nfs_mark_return_unreferenced_delegations(struct nfs_server *server)
        list_for_each_entry_rcu(delegation, &server->delegations, super_list) {
                if (test_and_clear_bit(NFS_DELEGATION_REFERENCED, &delegation->flags))
                        continue;
-                nfs_mark_return_delegation(server, delegation);
+                nfs_mark_return_if_closed_delegation(server, delegation);
        }
 }
diff --git a/fs/nfs/delegation.h b/fs/nfs/delegation.h
index d54d4fca6793..9a79c7a99d6d 100644
--- a/fs/nfs/delegation.h
+++ b/fs/nfs/delegation.h
@@ -28,6 +28,7 @@ struct nfs_delegation {
 enum {
        NFS_DELEGATION_NEED_RECLAIM = 0,
        NFS_DELEGATION_RETURN,
+        NFS_DELEGATION_RETURN_IF_CLOSED,
        NFS_DELEGATION_REFERENCED,
        NFS_DELEGATION_RETURNING,
 };
@@ -41,7 +42,7 @@ void nfs_inode_return_delegation_noreclaim(struct inode *inode);
 struct inode *nfs_delegation_find_inode(struct nfs_client *clp, const struct nfs_fh *fhandle);
 void nfs_server_return_all_delegations(struct nfs_server *);
 void nfs_expire_all_delegations(struct nfs_client *clp);
-void nfs_expire_all_delegation_types(struct nfs_client *clp, fmode_t flags);
+void nfs_expire_unused_delegation_types(struct nfs_client *clp, fmode_t flags);
 void nfs_expire_unreferenced_delegations(struct nfs_client *clp);
 int nfs_client_return_marked_delegations(struct nfs_client *clp);
 int nfs_delegations_present(struct nfs_client *clp);
@@ -53,7 +54,7 @@ void nfs_delegation_reap_unclaimed(struct nfs_client *clp);
 /* NFSv4 delegation-related procedures */
 int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync);
 int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid);
-int nfs4_lock_delegation_recall(struct nfs4_state *state, struct file_lock *fl);
+int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid);
 bool nfs4_copy_delegation_stateid(nfs4_stateid *dst, struct inode *inode, fmode_t flags);
 void nfs_mark_delegation_referenced(struct nfs_delegation *delegation);
diff --git a/fs/nfs/dir.c b/fs/nfs/dir.c
index f23f455be42b..e093e73178b7 100644
--- a/fs/nfs/dir.c
+++ b/fs/nfs/dir.c
@@ -1486,6 +1486,8 @@ static int nfs4_lookup_revalidate(struct dentry *dentry, unsigned int flags)
                goto no_open;
        if (d_mountpoint(dentry))
                goto no_open;
+        if (NFS_SB(dentry->d_sb)->caps & NFS_CAP_ATOMIC_OPEN_V1)
+                goto no_open;
        inode = dentry->d_inode;
        parent = dget_parent(dentry);
diff --git a/fs/nfs/file.c b/fs/nfs/file.c
index 29f4a48a0ee6..a87a44f84113 100644
--- a/fs/nfs/file.c
+++ b/fs/nfs/file.c
@@ -744,6 +744,7 @@ static int
 do_unlk(struct file *filp, int cmd, struct file_lock *fl, int is_local)
 {
        struct inode *inode = filp->f_mapping->host;
+        struct nfs_lock_context *l_ctx;
        int status;
        /*
@@ -752,6 +753,14 @@ do_unlk(struct file *filp, int cmd, struct file_lock *fl, int is_local)
         */
        nfs_sync_mapping(filp->f_mapping);
+        l_ctx = nfs_get_lock_context(nfs_file_open_context(filp));
+        if (!IS_ERR(l_ctx)) {
+                status = nfs_iocounter_wait(&l_ctx->io_count);
+                nfs_put_lock_context(l_ctx);
+                if (status < 0)
+                        return status;
+        }
        /* NOTE: special case
         *      If we're signalled while cleaning up locks on process exit, we
         *      still need to complete the unlock.
diff --git a/fs/nfs/inode.c b/fs/nfs/inode.c
index 1f941674b089..c1c7a9d78722 100644
--- a/fs/nfs/inode.c
+++ b/fs/nfs/inode.c
@@ -561,20 +561,22 @@ static void nfs_init_lock_context(struct nfs_lock_context *l_ctx)
        l_ctx->lockowner.l_owner = current->files;
        l_ctx->lockowner.l_pid = current->tgid;
        INIT_LIST_HEAD(&l_ctx->list);
+        nfs_iocounter_init(&l_ctx->io_count);
 }
 static struct nfs_lock_context *__nfs_find_lock_context(struct nfs_open_context *ctx)
 {
-        struct nfs_lock_context *pos;
+        struct nfs_lock_context *head = &ctx->lock_context; /* entry embedded in ctx */
+        struct nfs_lock_context *pos = head; /* embedded entry is examined first */
-        list_for_each_entry(pos, &ctx->lock_context.list, list) {
+        do { /* "continue" below jumps to the while condition, which advances pos */
                if (pos->lockowner.l_owner != current->files)
                        continue;
                if (pos->lockowner.l_pid != current->tgid)
                        continue;
                atomic_inc(&pos->count);
                return pos;
-        }
+        } while ((pos = list_entry(pos->list.next, typeof(*pos), list)) != head); /* stop once the walk wraps back to head */
        return NULL;
 }
diff --git a/fs/nfs/internal.h b/fs/nfs/internal.h
index 541c9ebdbc5a..91e59a39fc08 100644
--- a/fs/nfs/internal.h
+++ b/fs/nfs/internal.h
@@ -229,6 +229,13 @@ extern void nfs_pgheader_init(struct nfs_pageio_descriptor *desc,
                              struct nfs_pgio_header *hdr,
                              void (*release)(struct nfs_pgio_header *hdr));
 void nfs_set_pgio_error(struct nfs_pgio_header *hdr, int error, loff_t pos);
+int nfs_iocounter_wait(struct nfs_io_counter *c);
+static inline void nfs_iocounter_init(struct nfs_io_counter *c)
+{ /* Reset @c: clear all flags and set the atomic I/O count to zero. */
+        c->flags = 0;
+        atomic_set(&c->io_count, 0);
+}
 /* nfs2xdr.c */
 extern struct rpc_procinfo nfs_procedures[];
diff --git a/fs/nfs/nfs4_fs.h b/fs/nfs/nfs4_fs.h
index 944c9a5c1039..553a83cc4106 100644
--- a/fs/nfs/nfs4_fs.h
+++ b/fs/nfs/nfs4_fs.h
@@ -36,6 +36,7 @@ enum nfs4_client_state {
 struct nfs4_minor_version_ops {
        u32     minor_version;
+        unsigned init_caps;
        int     (*call_sync)(struct rpc_clnt *clnt,
                        struct nfs_server *server,
@@ -143,12 +144,14 @@ struct nfs4_lock_state {
 enum {
        LK_STATE_IN_USE,
        NFS_DELEGATED_STATE,            /* Current stateid is delegation */
+        NFS_OPEN_STATE,                 /* OPEN stateid is set */
        NFS_O_RDONLY_STATE,             /* OPEN stateid has read-only state */
        NFS_O_WRONLY_STATE,             /* OPEN stateid has write-only state */
        NFS_O_RDWR_STATE,               /* OPEN stateid has read/write state */
        NFS_STATE_RECLAIM_REBOOT,       /* OPEN stateid server rebooted */
        NFS_STATE_RECLAIM_NOGRACE,      /* OPEN stateid needs to recover state */
        NFS_STATE_POSIX_LOCKS,          /* Posix locks are supported */
+        NFS_STATE_RECOVERY_FAILED,      /* OPEN stateid state recovery failed */
 };
 struct nfs4_state {
@@ -233,6 +236,10 @@ extern struct rpc_clnt *nfs4_proc_lookup_mountpoint(struct inode *, struct qstr
 extern int nfs4_proc_secinfo(struct inode *, const struct qstr *, struct nfs4_secinfo_flavors *);
 extern int nfs4_release_lockowner(struct nfs4_lock_state *);
 extern const struct xattr_handler *nfs4_xattr_handlers[];
+extern int nfs4_set_rw_stateid(nfs4_stateid *stateid,
+                const struct nfs_open_context *ctx,
+                const struct nfs_lock_context *l_ctx,
+                fmode_t fmode);
 #if defined(CONFIG_NFS_V4_1)
 static inline struct nfs4_session *nfs4_get_session(const struct nfs_server *server)
@@ -347,13 +354,13 @@ extern int nfs4_wait_clnt_recover(struct nfs_client *clp);
 extern int nfs4_client_recover_expired_lease(struct nfs_client *clp);
 extern void nfs4_schedule_state_manager(struct nfs_client *);
 extern void nfs4_schedule_path_down_recovery(struct nfs_client *clp);
-extern void nfs4_schedule_stateid_recovery(const struct nfs_server *, struct nfs4_state *);
+extern int nfs4_schedule_stateid_recovery(const struct nfs_server *, struct nfs4_state *);
 extern void nfs41_handle_sequence_flag_errors(struct nfs_client *clp, u32 flags);
 extern void nfs41_handle_server_scope(struct nfs_client *,
                                      struct nfs41_server_scope **);
 extern void nfs4_put_lock_state(struct nfs4_lock_state *lsp);
 extern int nfs4_set_lock_state(struct nfs4_state *state, struct file_lock *fl);
-extern void nfs4_select_rw_stateid(nfs4_stateid *, struct nfs4_state *,
+extern int nfs4_select_rw_stateid(nfs4_stateid *, struct nfs4_state *,
                fmode_t, const struct nfs_lockowner *);
 extern struct nfs_seqid *nfs_alloc_seqid(struct nfs_seqid_counter *counter, gfp_t gfp_mask);
@@ -412,6 +419,11 @@ static inline bool nfs4_stateid_match(const nfs4_stateid *dst, const nfs4_statei
        return memcmp(dst, src, sizeof(*dst)) == 0;
 }
+static inline bool nfs4_valid_open_stateid(const struct nfs4_state *state)
+{ /* True unless NFS_STATE_RECOVERY_FAILED is set in state->flags. */
+        return test_bit(NFS_STATE_RECOVERY_FAILED, &state->flags) == 0;
+}
 #else
 #define nfs4_close_state(a, b) do { } while (0)
diff --git a/fs/nfs/nfs4client.c b/fs/nfs/nfs4client.c
index ac4fc9a8fdbc..947b0c908aa9 100644
--- a/fs/nfs/nfs4client.c
+++ b/fs/nfs/nfs4client.c
@@ -198,8 +198,12 @@ struct nfs_client *nfs4_init_client(struct nfs_client *clp,
        /* Check NFS protocol revision and initialize RPC op vector */
        clp->rpc_ops = &nfs_v4_clientops;
+        if (clp->cl_minorversion != 0)
+                __set_bit(NFS_CS_INFINITE_SLOTS, &clp->cl_flags);
        __set_bit(NFS_CS_DISCRTRY, &clp->cl_flags);
-        error = nfs_create_rpc_client(clp, timeparms, authflavour);
+        error = nfs_create_rpc_client(clp, timeparms, RPC_AUTH_GSS_KRB5I);
+        if (error == -EINVAL)
+                error = nfs_create_rpc_client(clp, timeparms, RPC_AUTH_NULL);
        if (error < 0)
                goto error;
@@ -300,7 +304,7 @@ int nfs40_walk_client_list(struct nfs_client *new,
                           struct rpc_cred *cred)
 {
        struct nfs_net *nn = net_generic(new->cl_net, nfs_net_id);
-        struct nfs_client *pos, *n, *prev = NULL;
+        struct nfs_client *pos, *prev = NULL;
        struct nfs4_setclientid_res clid = {
                .clientid       = new->cl_clientid,
                .confirm        = new->cl_confirm,
@@ -308,10 +312,23 @@ int nfs40_walk_client_list(struct nfs_client *new,
        int status = -NFS4ERR_STALE_CLIENTID;
        spin_lock(&nn->nfs_client_lock);
-        list_for_each_entry_safe(pos, n, &nn->nfs_client_list, cl_share_link) {
+        list_for_each_entry(pos, &nn->nfs_client_list, cl_share_link) {
                /* If "pos" isn't marked ready, we can't trust the
                 * remaining fields in "pos" */
-                if (pos->cl_cons_state < NFS_CS_READY)
+                if (pos->cl_cons_state > NFS_CS_READY) {
+                        atomic_inc(&pos->cl_count);
+                        spin_unlock(&nn->nfs_client_lock);
+                        if (prev)
+                                nfs_put_client(prev);
+                        prev = pos;
+                        status = nfs_wait_client_init_complete(pos);
+                        spin_lock(&nn->nfs_client_lock);
+                        if (status < 0)
+                                continue;
+                }
+                if (pos->cl_cons_state != NFS_CS_READY)
                        continue;
                if (pos->rpc_ops != new->rpc_ops)
@@ -423,16 +440,16 @@ int nfs41_walk_client_list(struct nfs_client *new,
                           struct rpc_cred *cred)
 {
        struct nfs_net *nn = net_generic(new->cl_net, nfs_net_id);
-        struct nfs_client *pos, *n, *prev = NULL;
+        struct nfs_client *pos, *prev = NULL;
        int status = -NFS4ERR_STALE_CLIENTID;
        spin_lock(&nn->nfs_client_lock);
-        list_for_each_entry_safe(pos, n, &nn->nfs_client_list, cl_share_link) {
+        list_for_each_entry(pos, &nn->nfs_client_list, cl_share_link) {
                /* If "pos" isn't marked ready, we can't trust the
                 * remaining fields in "pos", especially the client
                 * ID and serverowner fields.  Wait for CREATE_SESSION
                 * to finish. */
-                if (pos->cl_cons_state < NFS_CS_READY) {
+                if (pos->cl_cons_state > NFS_CS_READY) {
                        atomic_inc(&pos->cl_count);
                        spin_unlock(&nn->nfs_client_lock);
@@ -440,18 +457,17 @@ int nfs41_walk_client_list(struct nfs_client *new,
                                nfs_put_client(prev);
                        prev = pos;
-                        nfs4_schedule_lease_recovery(pos);
                        status = nfs_wait_client_init_complete(pos);
-                        if (status < 0) {
+                        if (status == 0) {
-                                nfs_put_client(pos);
+                                nfs4_schedule_lease_recovery(pos);
-                                spin_lock(&nn->nfs_client_lock);
+                                status = nfs4_wait_clnt_recover(pos);
-                                continue;
                        }
-                        status = pos->cl_cons_state;
                        spin_lock(&nn->nfs_client_lock);
                        if (status < 0)
                                continue;
                }
+                if (pos->cl_cons_state != NFS_CS_READY)
+                        continue;
                if (pos->rpc_ops != new->rpc_ops)
                        continue;
@@ -469,17 +485,18 @@ int nfs41_walk_client_list(struct nfs_client *new,
                        continue;
                atomic_inc(&pos->cl_count);
-                spin_unlock(&nn->nfs_client_lock);
+                *result = pos;
+                status = 0;
                dprintk("NFS: <-- %s using nfs_client = %p ({%d})\n",
                        __func__, pos, atomic_read(&pos->cl_count));
+                break;
-                *result = pos;
-                return 0;
        }
        /* No matching nfs_client found. */
        spin_unlock(&nn->nfs_client_lock);
        dprintk("NFS: <-- %s status = %d\n", __func__, status);
+        if (prev)
+                nfs_put_client(prev);
        return status;
 }
 #endif  /* CONFIG_NFS_V4_1 */
@@ -717,6 +734,19 @@ static int nfs4_server_common_setup(struct nfs_server *server,
        if (error < 0)
                goto out;
+        /* Set the basic capabilities */
+        server->caps |= server->nfs_client->cl_mvops->init_caps;
+        if (server->flags & NFS_MOUNT_NORDIRPLUS)
+                        server->caps &= ~NFS_CAP_READDIRPLUS;
+        /*
+         * Don't use NFS uid/gid mapping if we're using AUTH_SYS or lower
+         * authentication.
+         */
+        if (nfs4_disable_idmapping &&
+                        server->client->cl_auth->au_flavor == RPC_AUTH_UNIX)
+                server->caps |= NFS_CAP_UIDGID_NOMAP;
        /* Probe the root fh to retrieve its FSID and filehandle */
        error = nfs4_get_rootfh(server, mntfh);
        if (error < 0)
@@ -760,9 +790,6 @@ static int nfs4_init_server(struct nfs_server *server,
        /* Initialise the client representation from the mount data */
        server->flags = data->flags;
-        server->caps |= NFS_CAP_ATOMIC_OPEN|NFS_CAP_CHANGE_ATTR|NFS_CAP_POSIX_LOCK;
-        if (!(data->flags & NFS_MOUNT_NORDIRPLUS))
-                        server->caps |= NFS_CAP_READDIRPLUS;
        server->options = data->options;
        /* Get a client record */
@@ -779,13 +806,6 @@ static int nfs4_init_server(struct nfs_server *server,
        if (error < 0)
                goto error;
-        /*
-         * Don't use NFS uid/gid mapping if we're using AUTH_SYS or lower
-         * authentication.
-         */
-        if (nfs4_disable_idmapping && data->auth_flavors[0] == RPC_AUTH_UNIX)
-                server->caps |= NFS_CAP_UIDGID_NOMAP;
        if (data->rsize)
                server->rsize = nfs_block_size(data->rsize, NULL);
        if (data->wsize)
@@ -863,7 +883,6 @@ struct nfs_server *nfs4_create_referral_server(struct nfs_clone_mount *data,
        /* Initialise the client representation from the parent server */
        nfs_server_copy_userdata(server, parent_server);
-        server->caps |= NFS_CAP_ATOMIC_OPEN|NFS_CAP_CHANGE_ATTR;
        /* Get a client representation.
         * Note: NFSv4 always uses TCP, */
diff --git a/fs/nfs/nfs4filelayout.c b/fs/nfs/nfs4filelayout.c
index 4fb234d3aefb..22d10623f5ee 100644
--- a/fs/nfs/nfs4filelayout.c
+++ b/fs/nfs/nfs4filelayout.c
@@ -158,11 +158,14 @@ static int filelayout_async_handle_error(struct rpc_task *task,
        case -NFS4ERR_OPENMODE:
                if (state == NULL)
                        break;
-                nfs4_schedule_stateid_recovery(mds_server, state);
+                if (nfs4_schedule_stateid_recovery(mds_server, state) < 0)
+                        goto out_bad_stateid;
                goto wait_on_recovery;
        case -NFS4ERR_EXPIRED:
-                if (state != NULL)
+                if (state != NULL) {
-                        nfs4_schedule_stateid_recovery(mds_server, state);
+                        if (nfs4_schedule_stateid_recovery(mds_server, state) < 0)
+                                goto out_bad_stateid;
+                }
                nfs4_schedule_lease_recovery(mds_client);
                goto wait_on_recovery;
        /* DS session errors */
@@ -226,6 +229,9 @@ reset:
 out:
        task->tk_status = 0;
        return -EAGAIN;
+out_bad_stateid:
+        task->tk_status = -EIO;
+        return 0;
 wait_on_recovery:
        rpc_sleep_on(&mds_client->cl_rpcwaitq, task, NULL);
        if (test_bit(NFS4CLNT_MANAGER_RUNNING, &mds_client->cl_state) == 0)
@@ -299,6 +305,10 @@ static void filelayout_read_prepare(struct rpc_task *task, void *data)
 {
        struct nfs_read_data *rdata = data;
+        if (unlikely(test_bit(NFS_CONTEXT_BAD, &rdata->args.context->flags))) {
+                rpc_exit(task, -EIO);
+                return;
+        }
        if (filelayout_reset_to_mds(rdata->header->lseg)) {
                dprintk("%s task %u reset io to MDS\n", __func__, task->tk_pid);
                filelayout_reset_read(rdata);
@@ -307,10 +317,13 @@ static void filelayout_read_prepare(struct rpc_task *task, void *data)
        }
        rdata->read_done_cb = filelayout_read_done_cb;
-        nfs41_setup_sequence(rdata->ds_clp->cl_session,
+        if (nfs41_setup_sequence(rdata->ds_clp->cl_session,
                        &rdata->args.seq_args,
                        &rdata->res.seq_res,
-                        task);
+                        task))
+                return;
+        nfs4_set_rw_stateid(&rdata->args.stateid, rdata->args.context,
+                        rdata->args.lock_context, FMODE_READ);
 }
 static void filelayout_read_call_done(struct rpc_task *task, void *data)
@@ -401,16 +414,23 @@ static void filelayout_write_prepare(struct rpc_task *task, void *data)
 {
        struct nfs_write_data *wdata = data;
+        if (unlikely(test_bit(NFS_CONTEXT_BAD, &wdata->args.context->flags))) {
+                rpc_exit(task, -EIO);
+                return;
+        }
        if (filelayout_reset_to_mds(wdata->header->lseg)) {
                dprintk("%s task %u reset io to MDS\n", __func__, task->tk_pid);
                filelayout_reset_write(wdata);
                rpc_exit(task, 0);
                return;
        }
-        nfs41_setup_sequence(wdata->ds_clp->cl_session,
+        if (nfs41_setup_sequence(wdata->ds_clp->cl_session,
                        &wdata->args.seq_args,
                        &wdata->res.seq_res,
-                        task);
+                        task))
+                return;
+        nfs4_set_rw_stateid(&wdata->args.stateid, wdata->args.context,
+                        wdata->args.lock_context, FMODE_WRITE);
 }
 static void filelayout_write_call_done(struct rpc_task *task, void *data)
diff --git a/fs/nfs/nfs4namespace.c b/fs/nfs/nfs4namespace.c
index 0dd766079e1c..cdb0b41a4810 100644
--- a/fs/nfs/nfs4namespace.c
+++ b/fs/nfs/nfs4namespace.c
@@ -134,33 +134,38 @@ static size_t nfs_parse_server_name(char *string, size_t len,
        return ret;
 }
+/**
+ * nfs_find_best_sec - Find a security mechanism supported locally
+ * @flavors: List of security tuples returned by SECINFO procedure
+ *
+ * Return the pseudoflavor of the first security mechanism in
+ * "flavors" that is locally supported.  Return RPC_AUTH_UNIX if
+ * no matching flavor is found in the array.  The "flavors" array
+ * is searched in the order returned from the server, per RFC 3530
+ * recommendation.
+ */
 rpc_authflavor_t nfs_find_best_sec(struct nfs4_secinfo_flavors *flavors)
 {
-        struct gss_api_mech *mech;
+        rpc_authflavor_t pseudoflavor;
-        struct xdr_netobj oid;
+        struct nfs4_secinfo4 *secinfo;
-        int i;
+        unsigned int i;
-        rpc_authflavor_t pseudoflavor = RPC_AUTH_UNIX;
        for (i = 0; i < flavors->num_flavors; i++) {
-                struct nfs4_secinfo_flavor *flavor;
+                secinfo = &flavors->flavors[i];
-                flavor = &flavors->flavors[i];
+                switch (secinfo->flavor) { /* flavors not listed below are skipped */
-                if (flavor->flavor == RPC_AUTH_NULL || flavor->flavor == RPC_AUTH_UNIX) {
+                case RPC_AUTH_NULL:
-                        pseudoflavor = flavor->flavor;
+                case RPC_AUTH_UNIX:
-                        break;
+                case RPC_AUTH_GSS:
-                } else if (flavor->flavor == RPC_AUTH_GSS) {
+                        pseudoflavor = rpcauth_get_pseudoflavor(secinfo->flavor,
-                        oid.len  = flavor->gss.sec_oid4.len;
+                                                        &secinfo->flavor_info);
-                        oid.data = flavor->gss.sec_oid4.data;
+                        if (pseudoflavor != RPC_AUTH_MAXFLAVOR) /* MAXFLAVOR: move on to the next tuple */
-                        mech = gss_mech_get_by_OID(&oid);
+                                return pseudoflavor;
-                        if (!mech)
-                                continue;
-                        pseudoflavor = gss_svc_to_pseudoflavor(mech, flavor->gss.service);
-                        gss_mech_put(mech);
                        break;
                }
        }
-        return pseudoflavor;
+        return RPC_AUTH_UNIX;
 }
 static rpc_authflavor_t nfs4_negotiate_security(struct inode *inode, struct qstr *name)
diff --git a/fs/nfs/nfs4proc.c b/fs/nfs/nfs4proc.c
index 26431cf62ddb..9da4bd55eb30 100644
--- a/fs/nfs/nfs4proc.c
+++ b/fs/nfs/nfs4proc.c
@@ -107,6 +107,8 @@ static int nfs4_map_errors(int err)
                return -EPROTONOSUPPORT;
        case -NFS4ERR_ACCESS:
                return -EACCES;
+        case -NFS4ERR_FILE_OPEN:
+                return -EBUSY;
        default:
                dprintk("%s could not handle NFSv4 error %d\n",
                                __func__, -err);
@@ -295,19 +297,30 @@ static int nfs4_handle_exception(struct nfs_server *server, int errorcode, struc
                        }
                        if (state == NULL)
                                break;
-                        nfs4_schedule_stateid_recovery(server, state);
+                        ret = nfs4_schedule_stateid_recovery(server, state);
+                        if (ret < 0)
+                                break;
                        goto wait_on_recovery;
                case -NFS4ERR_DELEG_REVOKED:
                case -NFS4ERR_ADMIN_REVOKED:
                case -NFS4ERR_BAD_STATEID:
+                        if (inode != NULL && nfs4_have_delegation(inode, FMODE_READ)) {
+                                nfs_remove_bad_delegation(inode);
+                                exception->retry = 1;
+                                break;
+                        }
                        if (state == NULL)
                                break;
-                        nfs_remove_bad_delegation(state->inode);
+                        ret = nfs4_schedule_stateid_recovery(server, state);
-                        nfs4_schedule_stateid_recovery(server, state);
+                        if (ret < 0)
+                                break;
                        goto wait_on_recovery;
                case -NFS4ERR_EXPIRED:
-                        if (state != NULL)
+                        if (state != NULL) {
-                                nfs4_schedule_stateid_recovery(server, state);
+                                ret = nfs4_schedule_stateid_recovery(server, state);
+                                if (ret < 0)
+                                        break;
+                        }
                case -NFS4ERR_STALE_STATEID:
                case -NFS4ERR_STALE_CLIENTID:
                        nfs4_schedule_lease_recovery(clp);
@@ -756,10 +769,40 @@ struct nfs4_opendata {
        struct iattr attrs;
        unsigned long timestamp;
        unsigned int rpc_done : 1;
+        unsigned int is_recover : 1;
        int rpc_status;
        int cancelled;
 };
+static bool nfs4_clear_cap_atomic_open_v1(struct nfs_server *server,
+                int err, struct nfs4_exception *exception)
+{ /* On -EINVAL with the V1 cap set: drop the cap and request a retry. */
+        if (err != -EINVAL)
+                return false;
+        if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
+                return false; /* cap already clear, nothing to drop */
+        server->caps &= ~NFS_CAP_ATOMIC_OPEN_V1; /* NOTE(review): plain RMW, no lock taken here - confirm callers serialize */
+        exception->retry = 1;
+        return true; /* true only when the cap was just cleared */
+}
+static enum open_claim_type4
+nfs4_map_atomic_open_claim(struct nfs_server *server,
+                enum open_claim_type4 claim)
+{ /* Without NFS_CAP_ATOMIC_OPEN_V1, map *_FH claim types to non-FH ones. */
+        if (server->caps & NFS_CAP_ATOMIC_OPEN_V1)
+                return claim; /* cap set: claim is used as requested */
+        switch (claim) {
+        default:
+                return claim; /* claim types not listed below pass through unchanged */
+        case NFS4_OPEN_CLAIM_FH:
+                return NFS4_OPEN_CLAIM_NULL;
+        case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
+                return NFS4_OPEN_CLAIM_DELEGATE_CUR;
+        case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
+                return NFS4_OPEN_CLAIM_DELEGATE_PREV;
+        }
+}
 static void nfs4_init_opendata_res(struct nfs4_opendata *p)
 {
@@ -775,6 +818,7 @@ static void nfs4_init_opendata_res(struct nfs4_opendata *p)
 static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
                struct nfs4_state_owner *sp, fmode_t fmode, int flags,
                const struct iattr *attrs,
+                enum open_claim_type4 claim,
                gfp_t gfp_mask)
 {
        struct dentry *parent = dget_parent(dentry);
@@ -793,7 +837,6 @@ static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
        p->dir = parent;
        p->owner = sp;
        atomic_inc(&sp->so_count);
-        p->o_arg.fh = NFS_FH(dir);
        p->o_arg.open_flags = flags;
        p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
        /* don't put an ACCESS op in OPEN compound if O_EXCL, because ACCESS
@@ -811,7 +854,19 @@ static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
        p->o_arg.server = server;
        p->o_arg.bitmask = server->attr_bitmask;
        p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
-        p->o_arg.claim = NFS4_OPEN_CLAIM_NULL;
+        p->o_arg.claim = nfs4_map_atomic_open_claim(server, claim);
+        switch (p->o_arg.claim) {
+        case NFS4_OPEN_CLAIM_NULL:
+        case NFS4_OPEN_CLAIM_DELEGATE_CUR:
+        case NFS4_OPEN_CLAIM_DELEGATE_PREV:
+                p->o_arg.fh = NFS_FH(dir);
+                break;
+        case NFS4_OPEN_CLAIM_PREVIOUS:
+        case NFS4_OPEN_CLAIM_FH:
+        case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
+        case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
+                p->o_arg.fh = NFS_FH(dentry->d_inode);
+        }
        if (attrs != NULL && attrs->ia_valid != 0) {
                __be32 verf[2];
@@ -924,6 +979,7 @@ static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *
        if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
                nfs4_stateid_copy(&state->stateid, stateid);
        nfs4_stateid_copy(&state->open_stateid, stateid);
+        set_bit(NFS_OPEN_STATE, &state->flags);
        switch (fmode) {
                case FMODE_READ:
                        set_bit(NFS_O_RDONLY_STATE, &state->flags);
@@ -1046,9 +1102,12 @@ static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
                /* Save the delegation */
                nfs4_stateid_copy(&stateid, &delegation->stateid);
                rcu_read_unlock();
-                ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
+                nfs_release_seqid(opendata->o_arg.seqid);
-                if (ret != 0)
+                if (!opendata->is_recover) {
-                        goto out;
+                        ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
+                        if (ret != 0)
+                                goto out;
+                }
                ret = -EAGAIN;
                /* Try to update the stateid using the delegation */
@@ -1193,11 +1252,13 @@ static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *
        return ERR_PTR(-ENOENT);
 }
-static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx, struct nfs4_state *state)
+static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx,
+                struct nfs4_state *state, enum open_claim_type4 claim)
 {
        struct nfs4_opendata *opendata;
-        opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0, NULL, GFP_NOFS);
+        opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0,
+                        NULL, claim, GFP_NOFS);
        if (opendata == NULL)
                return ERR_PTR(-ENOMEM);
        opendata->state = state;
@@ -1233,6 +1294,7 @@ static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *
        /* memory barrier prior to reading state->n_* */
        clear_bit(NFS_DELEGATED_STATE, &state->flags);
+        clear_bit(NFS_OPEN_STATE, &state->flags);
        smp_rmb();
        if (state->n_rdwr != 0) {
                clear_bit(NFS_O_RDWR_STATE, &state->flags);
@@ -1283,11 +1345,10 @@ static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state
        fmode_t delegation_type = 0;
        int status;
-        opendata = nfs4_open_recoverdata_alloc(ctx, state);
+        opendata = nfs4_open_recoverdata_alloc(ctx, state,
+                        NFS4_OPEN_CLAIM_PREVIOUS);
        if (IS_ERR(opendata))
                return PTR_ERR(opendata);
-        opendata->o_arg.claim = NFS4_OPEN_CLAIM_PREVIOUS;
-        opendata->o_arg.fh = NFS_FH(state->inode);
        rcu_read_lock();
        delegation = rcu_dereference(NFS_I(state->inode)->delegation);
        if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
@@ -1306,6 +1367,8 @@ static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state
        int err;
        do {
                err = _nfs4_do_open_reclaim(ctx, state);
+                if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
+                        continue;
                if (err != -NFS4ERR_DELAY)
                        break;
                nfs4_handle_exception(server, err, &exception);
@@ -1320,71 +1383,72 @@ static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *sta
        ctx = nfs4_state_find_open_context(state);
        if (IS_ERR(ctx))
-                return PTR_ERR(ctx);
+                return -EAGAIN;
        ret = nfs4_do_open_reclaim(ctx, state);
        put_nfs_open_context(ctx);
        return ret;
 }
-static int _nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
+static int nfs4_handle_delegation_recall_error(struct nfs_server *server, struct nfs4_state *state, const nfs4_stateid *stateid, int err)
 {
-        struct nfs4_opendata *opendata;
+        switch (err) {
-        int ret;
+                default:
+                        printk(KERN_ERR "NFS: %s: unhandled error "
-        opendata = nfs4_open_recoverdata_alloc(ctx, state);
+                                        "%d.\n", __func__, err);
-        if (IS_ERR(opendata))
+                case 0:
-                return PTR_ERR(opendata);
+                case -ENOENT:
-        opendata->o_arg.claim = NFS4_OPEN_CLAIM_DELEGATE_CUR;
+                case -ESTALE:
-        nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
+                        break;
-        ret = nfs4_open_recover(opendata, state);
+                case -NFS4ERR_BADSESSION:
-        nfs4_opendata_put(opendata);
+                case -NFS4ERR_BADSLOT:
-        return ret;
+                case -NFS4ERR_BAD_HIGH_SLOT:
+                case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
+                case -NFS4ERR_DEADSESSION:
+                        set_bit(NFS_DELEGATED_STATE, &state->flags);
+                        nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
+                        return -EAGAIN;
+                case -NFS4ERR_STALE_CLIENTID:
+                case -NFS4ERR_STALE_STATEID:
+                        set_bit(NFS_DELEGATED_STATE, &state->flags);
+                case -NFS4ERR_EXPIRED:
+                        /* Don't recall a delegation if it was lost */
+                        nfs4_schedule_lease_recovery(server->nfs_client);
+                        return -EAGAIN;
+                case -NFS4ERR_DELEG_REVOKED:
+                case -NFS4ERR_ADMIN_REVOKED:
+                case -NFS4ERR_BAD_STATEID:
+                case -NFS4ERR_OPENMODE:
+                        nfs_inode_find_state_and_recover(state->inode,
+                                        stateid);
+                        nfs4_schedule_stateid_recovery(server, state);
+                        return 0;
+                case -NFS4ERR_DELAY:
+                case -NFS4ERR_GRACE:
+                        set_bit(NFS_DELEGATED_STATE, &state->flags);
+                        ssleep(1);
+                        return -EAGAIN;
+                case -ENOMEM:
+                case -NFS4ERR_DENIED:
+                        /* kill_proc(fl->fl_pid, SIGLOST, 1); */
+                        return 0;
+        }
+        return err;
 }
 int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
 {
-        struct nfs4_exception exception = { };
        struct nfs_server *server = NFS_SERVER(state->inode);
+        struct nfs4_opendata *opendata;
        int err;
-        do {
-                err = _nfs4_open_delegation_recall(ctx, state, stateid);
+        opendata = nfs4_open_recoverdata_alloc(ctx, state,
-                switch (err) {
+                        NFS4_OPEN_CLAIM_DELEG_CUR_FH);
-                        case 0:
+        if (IS_ERR(opendata))
-                        case -ENOENT:
+                return PTR_ERR(opendata);
-                        case -ESTALE:
+        nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
-                                goto out;
+        err = nfs4_open_recover(opendata, state);
-                        case -NFS4ERR_BADSESSION:
+        nfs4_opendata_put(opendata);
-                        case -NFS4ERR_BADSLOT:
+        return nfs4_handle_delegation_recall_error(server, state, stateid, err);
-                        case -NFS4ERR_BAD_HIGH_SLOT:
-                        case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
-                        case -NFS4ERR_DEADSESSION:
-                                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                                nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
-                                err = -EAGAIN;
-                                goto out;
-                        case -NFS4ERR_STALE_CLIENTID:
-                        case -NFS4ERR_STALE_STATEID:
-                                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                        case -NFS4ERR_EXPIRED:
-                                /* Don't recall a delegation if it was lost */
-                                nfs4_schedule_lease_recovery(server->nfs_client);
-                                err = -EAGAIN;
-                                goto out;
-                        case -NFS4ERR_DELEG_REVOKED:
-                        case -NFS4ERR_ADMIN_REVOKED:
-                        case -NFS4ERR_BAD_STATEID:
-                                nfs_inode_find_state_and_recover(state->inode,
-                                                stateid);
-                                nfs4_schedule_stateid_recovery(server, state);
-                        case -ENOMEM:
-                                err = 0;
-                                goto out;
-                }
-                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                err = nfs4_handle_exception(server, err, &exception);
-        } while (exception.retry);
-out:
-        return err;
 }
 static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
@@ -1467,6 +1531,7 @@ static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
 {
        struct nfs4_opendata *data = calldata;
        struct nfs4_state_owner *sp = data->owner;
+        struct nfs_client *clp = sp->so_server->nfs_client;
        if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
                goto out_wait;
@@ -1482,15 +1547,20 @@ static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
                rcu_read_lock();
                delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
                if (data->o_arg.claim != NFS4_OPEN_CLAIM_DELEGATE_CUR &&
+                    data->o_arg.claim != NFS4_OPEN_CLAIM_DELEG_CUR_FH &&
                    can_open_delegated(delegation, data->o_arg.fmode))
                        goto unlock_no_action;
                rcu_read_unlock();
        }
        /* Update client id. */
-        data->o_arg.clientid = sp->so_server->nfs_client->cl_clientid;
+        data->o_arg.clientid = clp->cl_clientid;
-        if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS) {
+        switch (data->o_arg.claim) {
-                task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
+        case NFS4_OPEN_CLAIM_PREVIOUS:
+        case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
+        case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
                data->o_arg.open_bitmap = &nfs4_open_noattr_bitmap[0];
+        case NFS4_OPEN_CLAIM_FH:
+                task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
                nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
        }
        data->timestamp = jiffies;
@@ -1499,6 +1569,16 @@ static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
                                &data->o_res.seq_res,
                                task) != 0)
                nfs_release_seqid(data->o_arg.seqid);
+        /* Set the create mode (note dependency on the session type) */
+        data->o_arg.createmode = NFS4_CREATE_UNCHECKED;
+        if (data->o_arg.open_flags & O_EXCL) {
+                data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE;
+                if (nfs4_has_persistent_session(clp))
+                        data->o_arg.createmode = NFS4_CREATE_GUARDED;
+                else if (clp->cl_mvops->minor_version > 0)
+                        data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE4_1;
+        }
        return;
 unlock_no_action:
        rcu_read_unlock();
@@ -1594,8 +1674,11 @@ static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
        data->rpc_done = 0;
        data->rpc_status = 0;
        data->cancelled = 0;
-        if (isrecover)
+        data->is_recover = 0;
+        if (isrecover) {
                nfs4_set_sequence_privileged(&o_arg->seq_args);
+                data->is_recover = 1;
+        }
        task = rpc_run_task(&task_setup_data);
        if (IS_ERR(task))
                return PTR_ERR(task);
@@ -1720,7 +1803,8 @@ static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *s
        struct nfs4_opendata *opendata;
        int ret;
-        opendata = nfs4_open_recoverdata_alloc(ctx, state);
+        opendata = nfs4_open_recoverdata_alloc(ctx, state,
+                        NFS4_OPEN_CLAIM_FH);
        if (IS_ERR(opendata))
                return PTR_ERR(opendata);
        ret = nfs4_open_recover(opendata, state);
@@ -1738,6 +1822,8 @@ static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state
        do {
                err = _nfs4_open_expired(ctx, state);
+                if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
+                        continue;
                switch (err) {
                default:
                        goto out;
@@ -1758,7 +1844,7 @@ static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *sta
        ctx = nfs4_state_find_open_context(state);
        if (IS_ERR(ctx))
-                return PTR_ERR(ctx);
+                return -EAGAIN;
        ret = nfs4_do_open_expired(ctx, state);
        put_nfs_open_context(ctx);
        return ret;
@@ -1820,6 +1906,7 @@ static int nfs41_check_open_stateid(struct nfs4_state *state)
                clear_bit(NFS_O_RDONLY_STATE, &state->flags);
                clear_bit(NFS_O_WRONLY_STATE, &state->flags);
                clear_bit(NFS_O_RDWR_STATE, &state->flags);
+                clear_bit(NFS_OPEN_STATE, &state->flags);
        }
        return status;
 }
@@ -1880,10 +1967,8 @@ static int _nfs4_open_and_get_state(struct nfs4_opendata *opendata,
        if (ret != 0)
                goto out;
-        if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq)) {
+        if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
                nfs4_schedule_stateid_recovery(server, state);
-                nfs4_wait_clnt_recover(server->nfs_client);
-        }
        *res = state;
 out:
        return ret;
@@ -1905,6 +1990,7 @@ static int _nfs4_do_open(struct inode *dir,
        struct nfs4_state     *state = NULL;
        struct nfs_server       *server = NFS_SERVER(dir);
        struct nfs4_opendata *opendata;
+        enum open_claim_type4 claim = NFS4_OPEN_CLAIM_NULL;
        int status;
        /* Protect against reboot recovery conflicts */
@@ -1920,7 +2006,10 @@ static int _nfs4_do_open(struct inode *dir,
        if (dentry->d_inode != NULL)
                nfs4_return_incompatible_delegation(dentry->d_inode, fmode);
        status = -ENOMEM;
-        opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr, GFP_KERNEL);
+        if (dentry->d_inode)
+                claim = NFS4_OPEN_CLAIM_FH;
+        opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr,
+                        claim, GFP_KERNEL);
        if (opendata == NULL)
                goto err_put_state_owner;
@@ -1937,7 +2026,8 @@ static int _nfs4_do_open(struct inode *dir,
        if (status != 0)
                goto err_opendata_put;
-        if (opendata->o_arg.open_flags & O_EXCL) {
+        if ((opendata->o_arg.open_flags & O_EXCL) &&
+            (opendata->o_arg.createmode != NFS4_CREATE_GUARDED)) {
                nfs4_exclusive_attrset(opendata, sattr);
                nfs_fattr_init(opendata->o_res.f_attr);
@@ -1978,6 +2068,7 @@ static struct nfs4_state *nfs4_do_open(struct inode *dir,
                                        struct rpc_cred *cred,
                                        struct nfs4_threshold **ctx_th)
 {
+        struct nfs_server *server = NFS_SERVER(dir);
        struct nfs4_exception exception = { };
        struct nfs4_state *res;
        int status;
@@ -2021,7 +2112,9 @@ static struct nfs4_state *nfs4_do_open(struct inode *dir,
                        exception.retry = 1;
                        continue;
                }
-                res = ERR_PTR(nfs4_handle_exception(NFS_SERVER(dir),
+                if (nfs4_clear_cap_atomic_open_v1(server, status, &exception))
+                        continue;
+                res = ERR_PTR(nfs4_handle_exception(server,
                                        status, &exception));
        } while (exception.retry);
        return res;
@@ -2049,20 +2142,25 @@ static int _nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
                .rpc_cred       = cred,
        };
        unsigned long timestamp = jiffies;
+        fmode_t fmode;
+        bool truncate;
        int status;
        nfs_fattr_init(fattr);
-        if (state != NULL) {
+        /* Servers should only apply open mode checks for file size changes */
+        truncate = (sattr->ia_valid & ATTR_SIZE) ? true : false;
+        fmode = truncate ? FMODE_WRITE : FMODE_READ;
+        if (nfs4_copy_delegation_stateid(&arg.stateid, inode, fmode)) {
+                /* Use that stateid */
+        } else if (truncate && state != NULL && nfs4_valid_open_stateid(state)) {
                struct nfs_lockowner lockowner = {
                        .l_owner = current->files,
                        .l_pid = current->tgid,
                };
                nfs4_select_rw_stateid(&arg.stateid, state, FMODE_WRITE,
                                &lockowner);
-        } else if (nfs4_copy_delegation_stateid(&arg.stateid, inode,
-                                FMODE_WRITE)) {
-                /* Use that stateid */
        } else
                nfs4_stateid_copy(&arg.stateid, &zero_stateid);
@@ -2086,6 +2184,13 @@ static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
                err = _nfs4_do_setattr(inode, cred, fattr, sattr, state);
                switch (err) {
                case -NFS4ERR_OPENMODE:
+                        if (!(sattr->ia_valid & ATTR_SIZE)) {
+                                pr_warn_once("NFSv4: server %s is incorrectly "
+                                                "applying open mode checks to "
+                                                "a SETATTR that is not "
+                                                "changing file size.\n",
+                                                server->nfs_client->cl_hostname);
+                        }
                        if (state && !(state->state & FMODE_WRITE)) {
                                err = -EBADF;
                                if (sattr->ia_valid & ATTR_OPEN)
@@ -2129,11 +2234,19 @@ static void nfs4_close_clear_stateid_flags(struct nfs4_state *state,
                fmode_t fmode)
 {
        spin_lock(&state->owner->so_lock);
-        if (!(fmode & FMODE_READ))
+        clear_bit(NFS_O_RDWR_STATE, &state->flags);
+        switch (fmode & (FMODE_READ|FMODE_WRITE)) {
+        case FMODE_WRITE:
                clear_bit(NFS_O_RDONLY_STATE, &state->flags);
-        if (!(fmode & FMODE_WRITE))
+                break;
+        case FMODE_READ:
                clear_bit(NFS_O_WRONLY_STATE, &state->flags);
-        clear_bit(NFS_O_RDWR_STATE, &state->flags);
+                break;
+        case 0:
+                clear_bit(NFS_O_RDONLY_STATE, &state->flags);
+                clear_bit(NFS_O_WRONLY_STATE, &state->flags);
+                clear_bit(NFS_OPEN_STATE, &state->flags);
+        }
        spin_unlock(&state->owner->so_lock);
 }
@@ -2201,6 +2314,8 @@ static void nfs4_close_prepare(struct rpc_task *task, void *data)
                        calldata->arg.fmode &= ~FMODE_WRITE;
                }
        }
+        if (!nfs4_valid_open_stateid(state))
+                call_close = 0;
        spin_unlock(&state->owner->so_lock);
        if (!call_close) {
@@ -2211,8 +2326,10 @@ static void nfs4_close_prepare(struct rpc_task *task, void *data)
        if (calldata->arg.fmode == 0) {
                task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
                if (calldata->roc &&
-                    pnfs_roc_drain(inode, &calldata->roc_barrier, task))
+                    pnfs_roc_drain(inode, &calldata->roc_barrier, task)) {
+                        nfs_release_seqid(calldata->arg.seqid);
                        goto out_wait;
+                    }
        }
        nfs_fattr_init(calldata->res.fattr);
@@ -2443,7 +2560,7 @@ static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandl
        auth = rpcauth_create(flavor, server->client);
        if (IS_ERR(auth)) {
-                ret = -EIO;
+                ret = -EACCES;
                goto out;
        }
        ret = nfs4_lookup_root(server, fhandle, info);
@@ -2451,27 +2568,36 @@ out:
        return ret;
 }
+/*
+ * Retry pseudoroot lookup with various security flavors.  We do this when:
+ *
+ *   NFSv4.0: the PUTROOTFH operation returns NFS4ERR_WRONGSEC
+ *   NFSv4.1: the server does not support the SECINFO_NO_NAME operation
+ *
+ * Returns zero on success, or a negative NFS4ERR value, or a
+ * negative errno value.
+ */
 static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
                              struct nfs_fsinfo *info)
 {
-        int i, len, status = 0;
+        /* Per 3530bis 15.33.5 */
-        rpc_authflavor_t flav_array[NFS_MAX_SECFLAVORS];
+        static const rpc_authflavor_t flav_array[] = {
+                RPC_AUTH_GSS_KRB5P,
-        len = rpcauth_list_flavors(flav_array, ARRAY_SIZE(flav_array));
+                RPC_AUTH_GSS_KRB5I,
-        if (len < 0)
+                RPC_AUTH_GSS_KRB5,
-                return len;
+                RPC_AUTH_UNIX,                  /* courtesy */
+                RPC_AUTH_NULL,
-        for (i = 0; i < len; i++) {
+        };
-                /* AUTH_UNIX is the default flavor if none was specified,
+        int status = -EPERM;
-                 * thus has already been tried. */
+        size_t i;
-                if (flav_array[i] == RPC_AUTH_UNIX)
-                        continue;
+        for (i = 0; i < ARRAY_SIZE(flav_array); i++) {
                status = nfs4_lookup_root_sec(server, fhandle, info, flav_array[i]);
                if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
                        continue;
                break;
        }
        /*
         * -EACCESS could mean that the user doesn't have correct permissions
         * to access the mount.  It could also mean that we tried to mount
@@ -2484,24 +2610,36 @@ static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
        return status;
 }
-/*
+static int nfs4_do_find_root_sec(struct nfs_server *server,
- * get the file handle for the "/" directory on the server
+                struct nfs_fh *fhandle, struct nfs_fsinfo *info)
+{
+        int mv = server->nfs_client->cl_minorversion;
+        return nfs_v4_minor_ops[mv]->find_root_sec(server, fhandle, info);
+}
+/**
+ * nfs4_proc_get_rootfh - get file handle for server's pseudoroot
+ * @server: initialized nfs_server handle
+ * @fhandle: we fill in the pseudo-fs root file handle
+ * @info: we fill in an FSINFO struct
+ *
+ * Returns zero on success, or a negative errno.
 */
 int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
                         struct nfs_fsinfo *info)
 {
-        int minor_version = server->nfs_client->cl_minorversion;
+        int status;
-        int status = nfs4_lookup_root(server, fhandle, info);
-        if ((status == -NFS4ERR_WRONGSEC) && !(server->flags & NFS_MOUNT_SECFLAVOUR))
+        status = nfs4_lookup_root(server, fhandle, info);
-                /*
+        if ((status == -NFS4ERR_WRONGSEC) &&
-                 * A status of -NFS4ERR_WRONGSEC will be mapped to -EPERM
+            !(server->flags & NFS_MOUNT_SECFLAVOUR))
-                 * by nfs4_map_errors() as this function exits.
+                status = nfs4_do_find_root_sec(server, fhandle, info);
-                 */
-                status = nfs_v4_minor_ops[minor_version]->find_root_sec(server, fhandle, info);
        if (status == 0)
                status = nfs4_server_capabilities(server, fhandle);
        if (status == 0)
                status = nfs4_do_fsinfo(server, fhandle, info);
        return nfs4_map_errors(status);
 }
@@ -3380,12 +3518,21 @@ static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
 static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
 {
        struct nfs4_exception exception = { };
+        unsigned long now = jiffies;
        int err;
        do {
-                err = nfs4_handle_exception(server,
+                err = _nfs4_do_fsinfo(server, fhandle, fsinfo);
-                                _nfs4_do_fsinfo(server, fhandle, fsinfo),
+                if (err == 0) {
-                                &exception);
+                        struct nfs_client *clp = server->nfs_client;
+                        spin_lock(&clp->cl_lock);
+                        clp->cl_lease_time = fsinfo->lease_time * HZ;
+                        clp->cl_last_renewal = now;
+                        spin_unlock(&clp->cl_lock);
+                        break;
+                }
+                err = nfs4_handle_exception(server, err, &exception);
        } while (exception.retry);
        return err;
 }
@@ -3445,6 +3592,46 @@ static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
        return err;
 }
+int nfs4_set_rw_stateid(nfs4_stateid *stateid,
+                const struct nfs_open_context *ctx,
+                const struct nfs_lock_context *l_ctx,
+                fmode_t fmode)
+{
+        const struct nfs_lockowner *lockowner = NULL;
+        if (l_ctx != NULL)
+                lockowner = &l_ctx->lockowner;
+        return nfs4_select_rw_stateid(stateid, ctx->state, fmode, lockowner);
+}
+EXPORT_SYMBOL_GPL(nfs4_set_rw_stateid);
+static bool nfs4_stateid_is_current(nfs4_stateid *stateid,
+                const struct nfs_open_context *ctx,
+                const struct nfs_lock_context *l_ctx,
+                fmode_t fmode)
+{
+        nfs4_stateid current_stateid;
+        if (nfs4_set_rw_stateid(&current_stateid, ctx, l_ctx, fmode))
+                return false;
+        return nfs4_stateid_match(stateid, &current_stateid);
+}
+static bool nfs4_error_stateid_expired(int err)
+{
+        switch (err) {
+        case -NFS4ERR_DELEG_REVOKED:
+        case -NFS4ERR_ADMIN_REVOKED:
+        case -NFS4ERR_BAD_STATEID:
+        case -NFS4ERR_STALE_STATEID:
+        case -NFS4ERR_OLD_STATEID:
+        case -NFS4ERR_OPENMODE:
+        case -NFS4ERR_EXPIRED:
+                return true;
+        }
+        return false;
+}
 void __nfs4_read_done_cb(struct nfs_read_data *data)
 {
        nfs_invalidate_atime(data->header->inode);
@@ -3465,6 +3652,20 @@ static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_read_data *data)
        return 0;
 }
+static bool nfs4_read_stateid_changed(struct rpc_task *task,
+                struct nfs_readargs *args)
+{
+        if (!nfs4_error_stateid_expired(task->tk_status) ||
+                nfs4_stateid_is_current(&args->stateid,
+                                args->context,
+                                args->lock_context,
+                                FMODE_READ))
+                return false;
+        rpc_restart_call_prepare(task);
+        return true;
+}
 static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
 {
@@ -3472,7 +3673,8 @@ static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
        if (!nfs4_sequence_done(task, &data->res.seq_res))
                return -EAGAIN;
+        if (nfs4_read_stateid_changed(task, &data->args))
+                return -EAGAIN;
        return data->read_done_cb ? data->read_done_cb(task, data) :
                                    nfs4_read_done_cb(task, data);
 }
@@ -3487,10 +3689,13 @@ static void nfs4_proc_read_setup(struct nfs_read_data *data, struct rpc_message
 static void nfs4_proc_read_rpc_prepare(struct rpc_task *task, struct nfs_read_data *data)
 {
-        nfs4_setup_sequence(NFS_SERVER(data->header->inode),
+        if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
                        &data->args.seq_args,
                        &data->res.seq_res,
-                        task);
+                        task))
+                return;
+        nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
+                        data->args.lock_context, FMODE_READ);
 }
 static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data)
@@ -3508,10 +3713,26 @@ static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data
        return 0;
 }
+static bool nfs4_write_stateid_changed(struct rpc_task *task,
+                struct nfs_writeargs *args)
+{
+        if (!nfs4_error_stateid_expired(task->tk_status) ||
+                nfs4_stateid_is_current(&args->stateid,
+                                args->context,
+                                args->lock_context,
+                                FMODE_WRITE))
+                return false;
+        rpc_restart_call_prepare(task);
+        return true;
+}
 static int nfs4_write_done(struct rpc_task *task, struct nfs_write_data *data)
 {
        if (!nfs4_sequence_done(task, &data->res.seq_res))
                return -EAGAIN;
+        if (nfs4_write_stateid_changed(task, &data->args))
+                return -EAGAIN;
        return data->write_done_cb ? data->write_done_cb(task, data) :
                nfs4_write_done_cb(task, data);
 }
@@ -3551,10 +3772,13 @@ static void nfs4_proc_write_setup(struct nfs_write_data *data, struct rpc_messag
 static void nfs4_proc_write_rpc_prepare(struct rpc_task *task, struct nfs_write_data *data)
 {
-        nfs4_setup_sequence(NFS_SERVER(data->header->inode),
+        if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
                        &data->args.seq_args,
                        &data->res.seq_res,
-                        task);
+                        task))
+                return;
+        nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
+                        data->args.lock_context, FMODE_WRITE);
 }
 static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
@@ -3656,7 +3880,7 @@ static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred,
                return -ENOMEM;
        data->client = clp;
        data->timestamp = jiffies;
-        return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_SOFT,
+        return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT,
                        &nfs4_renew_ops, data);
 }
@@ -3670,7 +3894,7 @@ static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
        unsigned long now = jiffies;
        int status;
-        status = rpc_call_sync(clp->cl_rpcclient, &msg, 0);
+        status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
        if (status < 0)
                return status;
        do_renew_lease(clp, now);
@@ -3980,11 +4204,14 @@ nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server,
                case -NFS4ERR_OPENMODE:
                        if (state == NULL)
                                break;
-                        nfs4_schedule_stateid_recovery(server, state);
+                        if (nfs4_schedule_stateid_recovery(server, state) < 0)
+                                goto stateid_invalid;
                        goto wait_on_recovery;
                case -NFS4ERR_EXPIRED:
-                        if (state != NULL)
+                        if (state != NULL) {
-                                nfs4_schedule_stateid_recovery(server, state);
+                                if (nfs4_schedule_stateid_recovery(server, state) < 0)
+                                        goto stateid_invalid;
+                        }
                case -NFS4ERR_STALE_STATEID:
                case -NFS4ERR_STALE_CLIENTID:
                        nfs4_schedule_lease_recovery(clp);
@@ -4016,6 +4243,9 @@ nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server,
        }
        task->tk_status = nfs4_map_errors(task->tk_status);
        return 0;
+stateid_invalid:
+        task->tk_status = -EIO;
+        return 0;
 wait_on_recovery:
        rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
        if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
@@ -4143,27 +4373,17 @@ int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
                struct nfs4_setclientid_res *arg,
                struct rpc_cred *cred)
 {
-        struct nfs_fsinfo fsinfo;
        struct rpc_message msg = {
                .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
                .rpc_argp = arg,
-                .rpc_resp = &fsinfo,
                .rpc_cred = cred,
        };
-        unsigned long now;
        int status;
        dprintk("NFS call  setclientid_confirm auth=%s, (client ID %llx)\n",
                clp->cl_rpcclient->cl_auth->au_ops->au_name,
                clp->cl_clientid);
-        now = jiffies;
        status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
-        if (status == 0) {
-                spin_lock(&clp->cl_lock);
-                clp->cl_lease_time = fsinfo.lease_time * HZ;
-                clp->cl_last_renewal = now;
-                spin_unlock(&clp->cl_lock);
-        }
        dprintk("NFS reply setclientid_confirm: %d\n", status);
        return status;
 }
@@ -4627,17 +4847,23 @@ static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
                if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0) {
                        goto out_release_lock_seqid;
                }
-                data->arg.open_stateid = &state->stateid;
+                data->arg.open_stateid = &state->open_stateid;
                data->arg.new_lock_owner = 1;
                data->res.open_seqid = data->arg.open_seqid;
        } else
                data->arg.new_lock_owner = 0;
+        if (!nfs4_valid_open_stateid(state)) {
+                data->rpc_status = -EBADF;
+                task->tk_action = NULL;
+                goto out_release_open_seqid;
+        }
        data->timestamp = jiffies;
        if (nfs4_setup_sequence(data->server,
                                &data->arg.seq_args,
                                &data->res.seq_res,
                                task) == 0)
                return;
+out_release_open_seqid:
        nfs_release_seqid(data->arg.open_seqid);
 out_release_lock_seqid:
        nfs_release_seqid(data->arg.lock_seqid);
@@ -4983,58 +5209,16 @@ nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
        return status;
 }
-int nfs4_lock_delegation_recall(struct nfs4_state *state, struct file_lock *fl)
+int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid)
 {
        struct nfs_server *server = NFS_SERVER(state->inode);
-        struct nfs4_exception exception = { };
        int err;
        err = nfs4_set_lock_state(state, fl);
        if (err != 0)
-                goto out;
+                return err;
-        do {
+        err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
-                err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
+        return nfs4_handle_delegation_recall_error(server, state, stateid, err);
-                switch (err) {
-                        default:
-                                printk(KERN_ERR "NFS: %s: unhandled error "
-                                        "%d.\n", __func__, err);
-                        case 0:
-                        case -ESTALE:
-                                goto out;
-                        case -NFS4ERR_STALE_CLIENTID:
-                        case -NFS4ERR_STALE_STATEID:
-                                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                        case -NFS4ERR_EXPIRED:
-                                nfs4_schedule_lease_recovery(server->nfs_client);
-                                err = -EAGAIN;
-                                goto out;
-                        case -NFS4ERR_BADSESSION:
-                        case -NFS4ERR_BADSLOT:
-                        case -NFS4ERR_BAD_HIGH_SLOT:
-                        case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
-                        case -NFS4ERR_DEADSESSION:
-                                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                                nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
-                                err = -EAGAIN;
-                                goto out;
-                        case -NFS4ERR_DELEG_REVOKED:
-                        case -NFS4ERR_ADMIN_REVOKED:
-                        case -NFS4ERR_BAD_STATEID:
-                        case -NFS4ERR_OPENMODE:
-                                nfs4_schedule_stateid_recovery(server, state);
-                                err = 0;
-                                goto out;
-                        case -ENOMEM:
-                        case -NFS4ERR_DENIED:
-                                /* kill_proc(fl->fl_pid, SIGLOST, 1); */
-                                err = 0;
-                                goto out;
-                }
-                set_bit(NFS_DELEGATED_STATE, &state->flags);
-                err = nfs4_handle_exception(server, err, &exception);
-        } while (exception.retry);
-out:
-        return err;
 }
 struct nfs_release_lockowner_data {
@@ -5848,7 +6032,7 @@ static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
                .rpc_client = clp->cl_rpcclient,
                .rpc_message = &msg,
                .callback_ops = &nfs41_sequence_ops,
-                .flags = RPC_TASK_ASYNC | RPC_TASK_SOFT,
+                .flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
        };
        if (!atomic_inc_not_zero(&clp->cl_count))
@@ -6725,6 +6909,10 @@ static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
 static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
        .minor_version = 0,
+        .init_caps = NFS_CAP_READDIRPLUS
+                | NFS_CAP_ATOMIC_OPEN
+                | NFS_CAP_CHANGE_ATTR
+                | NFS_CAP_POSIX_LOCK,
        .call_sync = _nfs4_call_sync,
        .match_stateid = nfs4_match_stateid,
        .find_root_sec = nfs4_find_root_sec,
@@ -6736,6 +6924,12 @@ static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
 #if defined(CONFIG_NFS_V4_1)
 static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
        .minor_version = 1,
+        .init_caps = NFS_CAP_READDIRPLUS
+                | NFS_CAP_ATOMIC_OPEN
+                | NFS_CAP_CHANGE_ATTR
+                | NFS_CAP_POSIX_LOCK
+                | NFS_CAP_STATEID_NFSV41
+                | NFS_CAP_ATOMIC_OPEN_V1,
        .call_sync = nfs4_call_sync_sequence,
        .match_stateid = nfs41_match_stateid,
        .find_root_sec = nfs41_find_root_sec,
diff --git a/fs/nfs/nfs4state.c b/fs/nfs/nfs4state.c
index 6ace365c6334..0b32f9483b7a 100644
--- a/fs/nfs/nfs4state.c
+++ b/fs/nfs/nfs4state.c
@@ -154,18 +154,6 @@ struct rpc_cred *nfs4_get_machine_cred_locked(struct nfs_client *clp)
        return cred;
 }
-static void nfs4_clear_machine_cred(struct nfs_client *clp)
-{
-        struct rpc_cred *cred;
-        spin_lock(&clp->cl_lock);
-        cred = clp->cl_machine_cred;
-        clp->cl_machine_cred = NULL;
-        spin_unlock(&clp->cl_lock);
-        if (cred != NULL)
-                put_rpccred(cred);
-}
 static struct rpc_cred *
 nfs4_get_renew_cred_server_locked(struct nfs_server *server)
 {
@@ -699,6 +687,8 @@ __nfs4_find_state_byowner(struct inode *inode, struct nfs4_state_owner *owner)
        list_for_each_entry(state, &nfsi->open_states, inode_states) {
                if (state->owner != owner)
                        continue;
+                if (!nfs4_valid_open_stateid(state))
+                        continue;
                if (atomic_inc_not_zero(&state->count))
                        return state;
        }
@@ -987,13 +977,14 @@ int nfs4_set_lock_state(struct nfs4_state *state, struct file_lock *fl)
        return 0;
 }
-static bool nfs4_copy_lock_stateid(nfs4_stateid *dst, struct nfs4_state *state,
+static int nfs4_copy_lock_stateid(nfs4_stateid *dst,
+                struct nfs4_state *state,
                const struct nfs_lockowner *lockowner)
 {
        struct nfs4_lock_state *lsp;
        fl_owner_t fl_owner;
        pid_t fl_pid;
-        bool ret = false;
+        int ret = -ENOENT;
        if (lockowner == NULL)
@@ -1008,7 +999,10 @@ static bool nfs4_copy_lock_stateid(nfs4_stateid *dst, struct nfs4_state *state,
        lsp = __nfs4_find_lock_state(state, fl_owner, fl_pid, NFS4_ANY_LOCK_TYPE);
        if (lsp != NULL && test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0) {
                nfs4_stateid_copy(dst, &lsp->ls_stateid);
-                ret = true;
+                ret = 0;
+                smp_rmb();
+                if (!list_empty(&lsp->ls_seqid.list))
+                        ret = -EWOULDBLOCK;
        }
        spin_unlock(&state->state_lock);
        nfs4_put_lock_state(lsp);
@@ -1016,28 +1010,44 @@ out:
        return ret;
 }
-static void nfs4_copy_open_stateid(nfs4_stateid *dst, struct nfs4_state *state)
+static int nfs4_copy_open_stateid(nfs4_stateid *dst, struct nfs4_state *state)
 {
+        const nfs4_stateid *src;
+        int ret;
        int seq;
        do {
+                src = &zero_stateid;
                seq = read_seqbegin(&state->seqlock);
-                nfs4_stateid_copy(dst, &state->stateid);
+                if (test_bit(NFS_OPEN_STATE, &state->flags))
+                        src = &state->open_stateid;
+                nfs4_stateid_copy(dst, src);
+                ret = 0;
+                smp_rmb();
+                if (!list_empty(&state->owner->so_seqid.list))
+                        ret = -EWOULDBLOCK;
        } while (read_seqretry(&state->seqlock, seq));
+        return ret;
 }
 /*
 * Byte-range lock aware utility to initialize the stateid of read/write
 * requests.
 */
-void nfs4_select_rw_stateid(nfs4_stateid *dst, struct nfs4_state *state,
+int nfs4_select_rw_stateid(nfs4_stateid *dst, struct nfs4_state *state,
                fmode_t fmode, const struct nfs_lockowner *lockowner)
 {
+        int ret = 0;
        if (nfs4_copy_delegation_stateid(dst, state->inode, fmode))
-                return;
+                goto out;
-        if (nfs4_copy_lock_stateid(dst, state, lockowner))
+        ret = nfs4_copy_lock_stateid(dst, state, lockowner);
-                return;
+        if (ret != -ENOENT)
-        nfs4_copy_open_stateid(dst, state);
+                goto out;
+        ret = nfs4_copy_open_stateid(dst, state);
+out:
+        if (nfs_server_capable(state->inode, NFS_CAP_STATEID_NFSV41))
+                dst->seqid = 0;
+        return ret;
 }
 struct nfs_seqid *nfs_alloc_seqid(struct nfs_seqid_counter *counter, gfp_t gfp_mask)
@@ -1286,14 +1296,17 @@ static int nfs4_state_mark_reclaim_nograce(struct nfs_client *clp, struct nfs4_s
        return 1;
 }
-void nfs4_schedule_stateid_recovery(const struct nfs_server *server, struct nfs4_state *state)
+int nfs4_schedule_stateid_recovery(const struct nfs_server *server, struct nfs4_state *state)
 {
        struct nfs_client *clp = server->nfs_client;
+        if (!nfs4_valid_open_stateid(state))
+                return -EBADF;
        nfs4_state_mark_reclaim_nograce(clp, state);
        dprintk("%s: scheduling stateid recovery for server %s\n", __func__,
                        clp->cl_hostname);
        nfs4_schedule_state_manager(clp);
+        return 0;
 }
 EXPORT_SYMBOL_GPL(nfs4_schedule_stateid_recovery);
@@ -1323,6 +1336,27 @@ void nfs_inode_find_state_and_recover(struct inode *inode,
                nfs4_schedule_state_manager(clp);
 }
+static void nfs4_state_mark_open_context_bad(struct nfs4_state *state)
+{
+        struct inode *inode = state->inode;
+        struct nfs_inode *nfsi = NFS_I(inode);
+        struct nfs_open_context *ctx;
+        spin_lock(&inode->i_lock);
+        list_for_each_entry(ctx, &nfsi->open_files, list) {
+                if (ctx->state != state)
+                        continue;
+                set_bit(NFS_CONTEXT_BAD, &ctx->flags);
+        }
+        spin_unlock(&inode->i_lock);
+}
+static void nfs4_state_mark_recovery_failed(struct nfs4_state *state, int error)
+{
+        set_bit(NFS_STATE_RECOVERY_FAILED, &state->flags);
+        nfs4_state_mark_open_context_bad(state);
+}
 static int nfs4_reclaim_locks(struct nfs4_state *state, const struct nfs4_state_recovery_ops *ops)
 {
@@ -1398,6 +1432,8 @@ restart:
        list_for_each_entry(state, &sp->so_states, open_states) {
                if (!test_and_clear_bit(ops->state_flag_bit, &state->flags))
                        continue;
+                if (!nfs4_valid_open_stateid(state))
+                        continue;
                if (state->state == 0)
                        continue;
                atomic_inc(&state->count);
@@ -1430,11 +1466,10 @@ restart:
                                 * Open state on this file cannot be recovered
                                 * All we can do is revert to using the zero stateid.
                                 */
-                                memset(&state->stateid, 0,
+                                nfs4_state_mark_recovery_failed(state, status);
-                                        sizeof(state->stateid));
-                                /* Mark the file as being 'closed' */
-                                state->state = 0;
                                break;
+                        case -EAGAIN:
+                                ssleep(1);
                        case -NFS4ERR_ADMIN_REVOKED:
                        case -NFS4ERR_STALE_STATEID:
                        case -NFS4ERR_BAD_STATEID:
@@ -1696,6 +1731,10 @@ static int nfs4_check_lease(struct nfs_client *clp)
        }
        status = ops->renew_lease(clp, cred);
        put_rpccred(cred);
+        if (status == -ETIMEDOUT) {
+                set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state);
+                return 0;
+        }
 out:
        return nfs4_recovery_handle_error(clp, status);
 }
@@ -1725,10 +1764,6 @@ static int nfs4_handle_reclaim_lease_error(struct nfs_client *clp, int status)
                clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
                return -EPERM;
        case -EACCES:
-                if (clp->cl_machine_cred == NULL)
-                        return -EACCES;
-                /* Handle case where the user hasn't set up machine creds */
-                nfs4_clear_machine_cred(clp);
        case -NFS4ERR_DELAY:
        case -ETIMEDOUT:
        case -EAGAIN:
@@ -1823,31 +1858,18 @@ int nfs4_discover_server_trunking(struct nfs_client *clp,
 {
        const struct nfs4_state_recovery_ops *ops =
                                clp->cl_mvops->reboot_recovery_ops;
-        rpc_authflavor_t *flavors, flav, save;
        struct rpc_clnt *clnt;
        struct rpc_cred *cred;
-        int i, len, status;
+        int i, status;
        dprintk("NFS: %s: testing '%s'\n", __func__, clp->cl_hostname);
-        len = NFS_MAX_SECFLAVORS;
-        flavors = kcalloc(len, sizeof(*flavors), GFP_KERNEL);
-        if (flavors == NULL) {
-                status = -ENOMEM;
-                goto out;
-        }
-        len = rpcauth_list_flavors(flavors, len);
-        if (len < 0) {
-                status = len;
-                goto out_free;
-        }
        clnt = clp->cl_rpcclient;
-        save = clnt->cl_auth->au_flavor;
        i = 0;
        mutex_lock(&nfs_clid_init_mutex);
-        status  = -ENOENT;
 again:
+        status  = -ENOENT;
        cred = ops->get_clid_cred(clp);
        if (cred == NULL)
                goto out_unlock;
@@ -1857,12 +1879,6 @@ again:
        switch (status) {
        case 0:
                break;
-        case -EACCES:
-                if (clp->cl_machine_cred == NULL)
-                        break;
-                /* Handle case where the user hasn't set up machine creds */
-                nfs4_clear_machine_cred(clp);
        case -NFS4ERR_DELAY:
        case -ETIMEDOUT:
        case -EAGAIN:
@@ -1871,22 +1887,23 @@ again:
                dprintk("NFS: %s after status %d, retrying\n",
                        __func__, status);
                goto again;
+        case -EACCES:
+                if (i++)
+                        break;
        case -NFS4ERR_CLID_INUSE:
        case -NFS4ERR_WRONGSEC:
-                status = -EPERM;
+                clnt = rpc_clone_client_set_auth(clnt, RPC_AUTH_UNIX);
-                if (i >= len)
-                        break;
-                flav = flavors[i++];
-                if (flav == save)
-                        flav = flavors[i++];
-                clnt = rpc_clone_client_set_auth(clnt, flav);
                if (IS_ERR(clnt)) {
                        status = PTR_ERR(clnt);
                        break;
                }
-                clp->cl_rpcclient = clnt;
+                /* Note: this is safe because we haven't yet marked the
+                 * client as ready, so we are the only user of
+                 * clp->cl_rpcclient
+                 */
+                clnt = xchg(&clp->cl_rpcclient, clnt);
+                rpc_shutdown_client(clnt);
+                clnt = clp->cl_rpcclient;
                goto again;
        case -NFS4ERR_MINOR_VERS_MISMATCH:
@@ -1897,13 +1914,15 @@ again:
        case -NFS4ERR_NOT_SAME: /* FixMe: implement recovery
                                 * in nfs4_exchange_id */
                status = -EKEYEXPIRED;
+                break;
+        default:
+                pr_warn("NFS: %s unhandled error %d. Exiting with error EIO\n",
+                                __func__, status);
+                status = -EIO;
        }
 out_unlock:
        mutex_unlock(&nfs_clid_init_mutex);
-out_free:
-        kfree(flavors);
-out:
        dprintk("NFS: %s: status = %d\n", __func__, status);
        return status;
 }
diff --git a/fs/nfs/nfs4super.c b/fs/nfs/nfs4super.c
index 569b166cc050..a5e1a3026d48 100644
--- a/fs/nfs/nfs4super.c
+++ b/fs/nfs/nfs4super.c
@@ -252,6 +252,8 @@ struct dentry *nfs4_try_mount(int flags, const char *dev_name,
        dfprintk(MOUNT, "--> nfs4_try_mount()\n");
+        if (data->auth_flavors[0] == RPC_AUTH_MAXFLAVOR)
+                data->auth_flavors[0] = RPC_AUTH_UNIX;
        export_path = data->nfs_server.export_path;
        data->nfs_server.export_path = "/";
        root_mnt = nfs_do_root_mount(&nfs4_remote_fs_type, flags, mount_info,
diff --git a/fs/nfs/nfs4xdr.c b/fs/nfs/nfs4xdr.c
index e3edda554ac7..3c79c5878c6d 100644
--- a/fs/nfs/nfs4xdr.c
+++ b/fs/nfs/nfs4xdr.c
@@ -530,14 +530,10 @@ static int nfs4_stat_to_errno(int);
                                decode_setclientid_maxsz)
 #define NFS4_enc_setclientid_confirm_sz \
                                (compound_encode_hdr_maxsz + \
-                                encode_setclientid_confirm_maxsz + \
+                                encode_setclientid_confirm_maxsz)
-                                encode_putrootfh_maxsz + \
-                                encode_fsinfo_maxsz)
 #define NFS4_dec_setclientid_confirm_sz \
                                (compound_decode_hdr_maxsz + \
-                                decode_setclientid_confirm_maxsz + \
+                                decode_setclientid_confirm_maxsz)
-                                decode_putrootfh_maxsz + \
-                                decode_fsinfo_maxsz)
 #define NFS4_enc_lock_sz        (compound_encode_hdr_maxsz + \
                                encode_sequence_maxsz + \
                                encode_putfh_maxsz + \
@@ -1058,8 +1054,7 @@ static void encode_attrs(struct xdr_stream *xdr, const struct iattr *iap, const
        if (iap->ia_valid & ATTR_ATIME_SET) {
                bmval1 |= FATTR4_WORD1_TIME_ACCESS_SET;
                *p++ = cpu_to_be32(NFS4_SET_TO_CLIENT_TIME);
-                *p++ = cpu_to_be32(0);
+                p = xdr_encode_hyper(p, (s64)iap->ia_atime.tv_sec);
-                *p++ = cpu_to_be32(iap->ia_atime.tv_sec);
                *p++ = cpu_to_be32(iap->ia_atime.tv_nsec);
        }
        else if (iap->ia_valid & ATTR_ATIME) {
@@ -1069,8 +1064,7 @@ static void encode_attrs(struct xdr_stream *xdr, const struct iattr *iap, const
        if (iap->ia_valid & ATTR_MTIME_SET) {
                bmval1 |= FATTR4_WORD1_TIME_MODIFY_SET;
                *p++ = cpu_to_be32(NFS4_SET_TO_CLIENT_TIME);
-                *p++ = cpu_to_be32(0);
+                p = xdr_encode_hyper(p, (s64)iap->ia_mtime.tv_sec);
-                *p++ = cpu_to_be32(iap->ia_mtime.tv_sec);
                *p++ = cpu_to_be32(iap->ia_mtime.tv_nsec);
        }
        else if (iap->ia_valid & ATTR_MTIME) {
@@ -1366,33 +1360,28 @@ static inline void encode_openhdr(struct xdr_stream *xdr, const struct nfs_opena
 static inline void encode_createmode(struct xdr_stream *xdr, const struct nfs_openargs *arg)
 {
+        struct iattr dummy;
        __be32 *p;
-        struct nfs_client *clp;
        p = reserve_space(xdr, 4);
-        switch(arg->open_flags & O_EXCL) {
+        switch(arg->createmode) {
-        case 0:
+        case NFS4_CREATE_UNCHECKED:
                *p = cpu_to_be32(NFS4_CREATE_UNCHECKED);
                encode_attrs(xdr, arg->u.attrs, arg->server);
                break;
-        default:
+        case NFS4_CREATE_GUARDED:
-                clp = arg->server->nfs_client;
+                *p = cpu_to_be32(NFS4_CREATE_GUARDED);
-                if (clp->cl_mvops->minor_version > 0) {
+                encode_attrs(xdr, arg->u.attrs, arg->server);
-                        if (nfs4_has_persistent_session(clp)) {
+                break;
-                                *p = cpu_to_be32(NFS4_CREATE_GUARDED);
+        case NFS4_CREATE_EXCLUSIVE:
-                                encode_attrs(xdr, arg->u.attrs, arg->server);
+                *p = cpu_to_be32(NFS4_CREATE_EXCLUSIVE);
-                        } else {
+                encode_nfs4_verifier(xdr, &arg->u.verifier);
-                                struct iattr dummy;
+                break;
+        case NFS4_CREATE_EXCLUSIVE4_1:
-                                *p = cpu_to_be32(NFS4_CREATE_EXCLUSIVE4_1);
+                *p = cpu_to_be32(NFS4_CREATE_EXCLUSIVE4_1);
-                                encode_nfs4_verifier(xdr, &arg->u.verifier);
+                encode_nfs4_verifier(xdr, &arg->u.verifier);
-                                dummy.ia_valid = 0;
+                dummy.ia_valid = 0;
-                                encode_attrs(xdr, &dummy, arg->server);
+                encode_attrs(xdr, &dummy, arg->server);
-                        }
-                } else {
-                        *p = cpu_to_be32(NFS4_CREATE_EXCLUSIVE);
-                        encode_nfs4_verifier(xdr, &arg->u.verifier);
-                }
        }
 }
@@ -1459,6 +1448,23 @@ static inline void encode_claim_delegate_cur(struct xdr_stream *xdr, const struc
        encode_string(xdr, name->len, name->name);
 }
+static inline void encode_claim_fh(struct xdr_stream *xdr)
+{
+        __be32 *p;
+        p = reserve_space(xdr, 4);
+        *p = cpu_to_be32(NFS4_OPEN_CLAIM_FH);
+}
+static inline void encode_claim_delegate_cur_fh(struct xdr_stream *xdr, const nfs4_stateid *stateid)
+{
+        __be32 *p;
+        p = reserve_space(xdr, 4);
+        *p = cpu_to_be32(NFS4_OPEN_CLAIM_DELEG_CUR_FH);
+        encode_nfs4_stateid(xdr, stateid);
+}
 static void encode_open(struct xdr_stream *xdr, const struct nfs_openargs *arg, struct compound_hdr *hdr)
 {
        encode_op_hdr(xdr, OP_OPEN, decode_open_maxsz, hdr);
@@ -1474,6 +1480,12 @@ static void encode_open(struct xdr_stream *xdr, const struct nfs_openargs *arg,
        case NFS4_OPEN_CLAIM_DELEGATE_CUR:
                encode_claim_delegate_cur(xdr, arg->name, &arg->u.delegation);
                break;
+        case NFS4_OPEN_CLAIM_FH:
+                encode_claim_fh(xdr);
+                break;
+        case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
+                encode_claim_delegate_cur_fh(xdr, &arg->u.delegation);
+                break;
        default:
                BUG();
        }
@@ -1506,35 +1518,12 @@ static void encode_putrootfh(struct xdr_stream *xdr, struct compound_hdr *hdr)
        encode_op_hdr(xdr, OP_PUTROOTFH, decode_putrootfh_maxsz, hdr);
 }
-static void encode_open_stateid(struct xdr_stream *xdr,
-                const struct nfs_open_context *ctx,
-                const struct nfs_lock_context *l_ctx,
-                fmode_t fmode,
-                int zero_seqid)
-{
-        nfs4_stateid stateid;
-        if (ctx->state != NULL) {
-                const struct nfs_lockowner *lockowner = NULL;
-                if (l_ctx != NULL)
-                        lockowner = &l_ctx->lockowner;
-                nfs4_select_rw_stateid(&stateid, ctx->state,
-                                fmode, lockowner);
-                if (zero_seqid)
-                        stateid.seqid = 0;
-                encode_nfs4_stateid(xdr, &stateid);
-        } else
-                encode_nfs4_stateid(xdr, &zero_stateid);
-}
 static void encode_read(struct xdr_stream *xdr, const struct nfs_readargs *args, struct compound_hdr *hdr)
 {
        __be32 *p;
        encode_op_hdr(xdr, OP_READ, decode_read_maxsz, hdr);
-        encode_open_stateid(xdr, args->context, args->lock_context,
+        encode_nfs4_stateid(xdr, &args->stateid);
-                        FMODE_READ, hdr->minorversion);
        p = reserve_space(xdr, 12);
        p = xdr_encode_hyper(p, args->offset);
@@ -1670,8 +1659,7 @@ static void encode_write(struct xdr_stream *xdr, const struct nfs_writeargs *arg
        __be32 *p;
        encode_op_hdr(xdr, OP_WRITE, decode_write_maxsz, hdr);
-        encode_open_stateid(xdr, args->context, args->lock_context,
+        encode_nfs4_stateid(xdr, &args->stateid);
-                        FMODE_WRITE, hdr->minorversion);
        p = reserve_space(xdr, 16);
        p = xdr_encode_hyper(p, args->offset);
@@ -2609,12 +2597,9 @@ static void nfs4_xdr_enc_setclientid_confirm(struct rpc_rqst *req,
        struct compound_hdr hdr = {
                .nops   = 0,
        };
-        const u32 lease_bitmap[3] = { FATTR4_WORD0_LEASE_TIME };
        encode_compound_hdr(xdr, req, &hdr);
        encode_setclientid_confirm(xdr, arg, &hdr);
-        encode_putrootfh(xdr, &hdr);
-        encode_fsinfo(xdr, lease_bitmap, &hdr);
        encode_nops(&hdr);
 }
@@ -3497,8 +3482,11 @@ static int decode_pathname(struct xdr_stream *xdr, struct nfs4_pathname *path)
        if (n == 0)
                goto root_path;
        dprintk("pathname4: ");
-        path->ncomponents = 0;
+        if (n > NFS4_PATHNAME_MAXCOMPONENTS) {
-        while (path->ncomponents < n) {
+                dprintk("cannot parse %d components in path\n", n);
+                goto out_eio;
+        }
+        for (path->ncomponents = 0; path->ncomponents < n; path->ncomponents++) {
                struct nfs4_string *component = &path->components[path->ncomponents];
                status = decode_opaque_inline(xdr, &component->len, &component->data);
                if (unlikely(status != 0))
@@ -3507,12 +3495,6 @@ static int decode_pathname(struct xdr_stream *xdr, struct nfs4_pathname *path)
                        pr_cont("%s%.*s ",
                                (path->ncomponents != n ? "/ " : ""),
                                component->len, component->data);
-                if (path->ncomponents < NFS4_PATHNAME_MAXCOMPONENTS)
-                        path->ncomponents++;
-                else {
-                        dprintk("cannot parse %d components in path\n", n);
-                        goto out_eio;
-                }
        }
 out:
        return status;
@@ -3557,27 +3539,23 @@ static int decode_attr_fs_locations(struct xdr_stream *xdr, uint32_t *bitmap, st
        n = be32_to_cpup(p);
        if (n <= 0)
                goto out_eio;
-        res->nlocations = 0;
+        for (res->nlocations = 0; res->nlocations < n; res->nlocations++) {
-        while (res->nlocations < n) {
                u32 m;
-                struct nfs4_fs_location *loc = &res->locations[res->nlocations];
+                struct nfs4_fs_location *loc;
+                if (res->nlocations == NFS4_FS_LOCATIONS_MAXENTRIES)
+                        break;
+                loc = &res->locations[res->nlocations];
                p = xdr_inline_decode(xdr, 4);
                if (unlikely(!p))
                        goto out_overflow;
                m = be32_to_cpup(p);
-                loc->nservers = 0;
                dprintk("%s: servers:\n", __func__);
-                while (loc->nservers < m) {
+                for (loc->nservers = 0; loc->nservers < m; loc->nservers++) {
-                        struct nfs4_string *server = &loc->servers[loc->nservers];
+                        struct nfs4_string *server;
-                        status = decode_opaque_inline(xdr, &server->len, &server->data);
-                        if (unlikely(status != 0))
+                        if (loc->nservers == NFS4_FS_LOCATION_MAXSERVERS) {
-                                goto out_eio;
-                        dprintk("%s ", server->data);
-                        if (loc->nservers < NFS4_FS_LOCATION_MAXSERVERS)
-                                loc->nservers++;
-                        else {
                                unsigned int i;
                                dprintk("%s: using first %u of %u servers "
                                        "returned for location %u\n",
@@ -3591,13 +3569,17 @@ static int decode_attr_fs_locations(struct xdr_stream *xdr, uint32_t *bitmap, st
                                        if (unlikely(status != 0))
                                                goto out_eio;
                                }
+                                break;
                        }
+                        server = &loc->servers[loc->nservers];
+                        status = decode_opaque_inline(xdr, &server->len, &server->data);
+                        if (unlikely(status != 0))
+                                goto out_eio;
+                        dprintk("%s ", server->data);
                }
                status = decode_pathname(xdr, &loc->rootpath);
                if (unlikely(status != 0))
                        goto out_eio;
-                if (res->nlocations < NFS4_FS_LOCATIONS_MAXENTRIES)
-                        res->nlocations++;
        }
        if (res->nlocations != 0)
                status = NFS_ATTR_FATTR_V4_LOCATIONS;
@@ -5209,27 +5191,30 @@ static int decode_delegreturn(struct xdr_stream *xdr)
        return decode_op_hdr(xdr, OP_DELEGRETURN);
 }
-static int decode_secinfo_gss(struct xdr_stream *xdr, struct nfs4_secinfo_flavor *flavor)
+static int decode_secinfo_gss(struct xdr_stream *xdr,
+                              struct nfs4_secinfo4 *flavor)
 {
+        u32 oid_len;
        __be32 *p;
        p = xdr_inline_decode(xdr, 4);
        if (unlikely(!p))
                goto out_overflow;
-        flavor->gss.sec_oid4.len = be32_to_cpup(p);
+        oid_len = be32_to_cpup(p);
-        if (flavor->gss.sec_oid4.len > GSS_OID_MAX_LEN)
+        if (oid_len > GSS_OID_MAX_LEN)
                goto out_err;
-        p = xdr_inline_decode(xdr, flavor->gss.sec_oid4.len);
+        p = xdr_inline_decode(xdr, oid_len);
        if (unlikely(!p))
                goto out_overflow;
-        memcpy(flavor->gss.sec_oid4.data, p, flavor->gss.sec_oid4.len);
+        memcpy(flavor->flavor_info.oid.data, p, oid_len);
+        flavor->flavor_info.oid.len = oid_len;
        p = xdr_inline_decode(xdr, 8);
        if (unlikely(!p))
                goto out_overflow;
-        flavor->gss.qop4 = be32_to_cpup(p++);
+        flavor->flavor_info.qop = be32_to_cpup(p++);
-        flavor->gss.service = be32_to_cpup(p);
+        flavor->flavor_info.service = be32_to_cpup(p);
        return 0;
@@ -5242,10 +5227,10 @@ out_err:
 static int decode_secinfo_common(struct xdr_stream *xdr, struct nfs4_secinfo_res *res)
 {
-        struct nfs4_secinfo_flavor *sec_flavor;
+        struct nfs4_secinfo4 *sec_flavor;
+        unsigned int i, num_flavors;
        int status;
        __be32 *p;
-        int i, num_flavors;
        p = xdr_inline_decode(xdr, 4);
        if (unlikely(!p))
@@ -6648,8 +6633,7 @@ static int nfs4_xdr_dec_setclientid(struct rpc_rqst *req,
 * Decode SETCLIENTID_CONFIRM response
 */
 static int nfs4_xdr_dec_setclientid_confirm(struct rpc_rqst *req,
-                                            struct xdr_stream *xdr,
+                                            struct xdr_stream *xdr)
-                                            struct nfs_fsinfo *fsinfo)
 {
        struct compound_hdr hdr;
        int status;
@@ -6657,10 +6641,6 @@ static int nfs4_xdr_dec_setclientid_confirm(struct rpc_rqst *req,
        status = decode_compound_hdr(xdr, &hdr);
        if (!status)
                status = decode_setclientid_confirm(xdr);
-        if (!status)
-                status = decode_putrootfh(xdr);
-        if (!status)
-                status = decode_fsinfo(xdr, fsinfo);
        return status;
 }
diff --git a/fs/nfs/objlayout/objio_osd.c b/fs/nfs/objlayout/objio_osd.c
index 88f9611a945c..5457745dd4f1 100644
--- a/fs/nfs/objlayout/objio_osd.c
+++ b/fs/nfs/objlayout/objio_osd.c
@@ -234,7 +234,7 @@ static int __alloc_objio_seg(unsigned numdevs, gfp_t gfp_flags,
        lseg = kzalloc(lseg_size, gfp_flags);
        if (unlikely(!lseg)) {
-                dprintk("%s: Faild allocation numdevs=%d size=%zd\n", __func__,
+                dprintk("%s: Failed allocation numdevs=%d size=%zd\n", __func__,
                        numdevs, lseg_size);
                return -ENOMEM;
        }
diff --git a/fs/nfs/objlayout/objlayout.h b/fs/nfs/objlayout/objlayout.h
index 880ba086be94..87aa1dec6120 100644
--- a/fs/nfs/objlayout/objlayout.h
+++ b/fs/nfs/objlayout/objlayout.h
@@ -114,7 +114,7 @@ extern int objio_alloc_lseg(struct pnfs_layout_segment **outp,
        gfp_t gfp_flags);
 extern void objio_free_lseg(struct pnfs_layout_segment *lseg);
-/* objio_free_result will free these @oir structs recieved from
+/* objio_free_result will free these @oir structs received from
 * objlayout_{read,write}_done
 */
 extern void objio_free_result(struct objlayout_io_res *oir);
diff --git a/fs/nfs/pagelist.c b/fs/nfs/pagelist.c
index e56e846e9d2d..29cfb7ade121 100644
--- a/fs/nfs/pagelist.c
+++ b/fs/nfs/pagelist.c
@@ -84,6 +84,55 @@ nfs_page_free(struct nfs_page *p)
        kmem_cache_free(nfs_page_cachep, p);
 }
+/*
+ * nfs_iocounter_inc - atomically add one to the counter's io_count
+ * @c: nfs_io_counter to bump
+ */
+static void
+nfs_iocounter_inc(struct nfs_io_counter *c)
+{
+        atomic_inc(&c->io_count);
+}
+/*
+ * nfs_iocounter_dec - atomically drop one from the counter's io_count
+ * @c: nfs_io_counter to drop
+ *
+ * When the decrement brings io_count to zero, NFS_IO_INPROGRESS is
+ * cleared in c->flags and anyone waiting on that bit is woken.
+ */
+static void
+nfs_iocounter_dec(struct nfs_io_counter *c)
+{
+        if (atomic_dec_and_test(&c->io_count)) {
+                clear_bit(NFS_IO_INPROGRESS, &c->flags);
+                /*
+                 * NOTE(review): presumably orders the clear_bit() above
+                 * before the waiter check done by wake_up_bit() - confirm.
+                 */
+                smp_mb__after_clear_bit();
+                wake_up_bit(&c->flags, NFS_IO_INPROGRESS);
+        }
+}
+/*
+ * __nfs_iocounter_wait - sleep until the counter's io_count reads zero
+ * @c: nfs_io_counter to wait on
+ *
+ * Queues on the NFS_IO_INPROGRESS bit of c->flags, sets that bit, and
+ * sleeps killably through nfs_wait_bit_killable() until io_count reads
+ * zero or a wait fails.
+ *
+ * Returns 0 when io_count was seen at zero, otherwise the non-zero
+ * result of the nfs_wait_bit_killable() call that failed.
+ */
+static int
+__nfs_iocounter_wait(struct nfs_io_counter *c)
+{
+        wait_queue_head_t *wq = bit_waitqueue(&c->flags, NFS_IO_INPROGRESS);
+        DEFINE_WAIT_BIT(q, &c->flags, NFS_IO_INPROGRESS);
+        int ret = 0;
+        do {
+                /* Queue ourselves before re-checking, so a wakeup is not lost. */
+                prepare_to_wait(wq, &q.wait, TASK_KILLABLE);
+                set_bit(NFS_IO_INPROGRESS, &c->flags);
+                if (atomic_read(&c->io_count) == 0)
+                        break;
+                ret = nfs_wait_bit_killable(&c->flags);
+                /*
+                 * Leave the loop on a failed wait as well.  Without the
+                 * !ret test, a wait that keeps failing (e.g. because a
+                 * fatal signal is pending) would be retried back to back,
+                 * spinning here until io_count finally drained.
+                 */
+        } while (atomic_read(&c->io_count) != 0 && !ret);
+        finish_wait(wq, &q.wait);
+        return ret;
+}
+/**
+ * nfs_iocounter_wait - wait for i/o to complete
+ * @c: nfs_io_counter to use
+ *
+ * Fast path: when io_count already reads 0 this returns 0 at once,
+ * without touching any wait queue.  Otherwise the work is handed to
+ * __nfs_iocounter_wait() and its result is returned unchanged.
+ *
+ * returns -ERESTARTSYS if interrupted by a fatal signal.
+ * Otherwise returns 0 once the io_count hits 0.
+ */
+int
+nfs_iocounter_wait(struct nfs_io_counter *c)
+{
+        if (atomic_read(&c->io_count) == 0)
+                return 0;
+        return __nfs_iocounter_wait(c);
+}
 /**
 * nfs_create_request - Create an NFS read/write request.
 * @ctx: open context to use
@@ -104,6 +153,8 @@ nfs_create_request(struct nfs_open_context *ctx, struct inode *inode,
        struct nfs_page         *req;
        struct nfs_lock_context *l_ctx;
+        if (test_bit(NFS_CONTEXT_BAD, &ctx->flags))
+                return ERR_PTR(-EBADF);
        /* try to allocate the request struct */
        req = nfs_page_alloc();
        if (req == NULL)
@@ -116,6 +167,7 @@ nfs_create_request(struct nfs_open_context *ctx, struct inode *inode,
                return ERR_CAST(l_ctx);
        }
        req->wb_lock_context = l_ctx;
+        nfs_iocounter_inc(&l_ctx->io_count);
        /* Initialize the request struct. Initially, we assume a
         * long write-back delay. This will be adjusted in
@@ -175,6 +227,7 @@ static void nfs_clear_request(struct nfs_page *req)
                req->wb_page = NULL;
        }
        if (l_ctx != NULL) {
+                nfs_iocounter_dec(&l_ctx->io_count);
                nfs_put_lock_context(l_ctx);
                req->wb_lock_context = NULL;
        }
diff --git a/fs/nfs/pnfs.c b/fs/nfs/pnfs.c
index 4bdffe0ba025..c5bd758e5637 100644
--- a/fs/nfs/pnfs.c
+++ b/fs/nfs/pnfs.c
@@ -718,6 +718,8 @@ pnfs_choose_layoutget_stateid(nfs4_stateid *dst, struct pnfs_layout_hdr *lo,
        spin_lock(&lo->plh_inode->i_lock);
        if (pnfs_layoutgets_blocked(lo, 1)) {
                status = -EAGAIN;
+        } else if (!nfs4_valid_open_stateid(open_state)) {
+                status = -EBADF;
        } else if (list_empty(&lo->plh_segs)) {
                int seq;
diff --git a/fs/nfs/read.c b/fs/nfs/read.c
index a5e5d9899d56..70a26c651f09 100644
--- a/fs/nfs/read.c
+++ b/fs/nfs/read.c
@@ -514,6 +514,8 @@ void nfs_read_prepare(struct rpc_task *task, void *calldata)
 {
        struct nfs_read_data *data = calldata;
        NFS_PROTO(data->header->inode)->read_rpc_prepare(task, data);
+        if (unlikely(test_bit(NFS_CONTEXT_BAD, &data->args.context->flags)))
+                rpc_exit(task, -EIO);
 }
 static const struct rpc_call_ops nfs_read_common_ops = {
diff --git a/fs/nfs/super.c b/fs/nfs/super.c
index 2f8a29db0f1b..1bb071dca9ab 100644
--- a/fs/nfs/super.c
+++ b/fs/nfs/super.c
@@ -920,7 +920,7 @@ static struct nfs_parsed_mount_data *nfs_alloc_parsed_mount_data(void)
                data->mount_server.port = NFS_UNSPEC_PORT;
                data->nfs_server.port   = NFS_UNSPEC_PORT;
                data->nfs_server.protocol = XPRT_TRANSPORT_TCP;
-                data->auth_flavors[0]   = RPC_AUTH_UNIX;
+                data->auth_flavors[0]   = RPC_AUTH_MAXFLAVOR;
                data->auth_flavor_len   = 1;
                data->minorversion      = 0;
                data->need_mount        = true;
@@ -1608,49 +1608,57 @@ out_security_failure:
 }
 /*
- * Match the requested auth flavors with the list returned by
+ * Select a security flavor for this mount.  The selected flavor
- * the server.  Returns zero and sets the mount's authentication
+ * is planted in args->auth_flavors[0].
- * flavor on success; returns -EACCES if server does not support
- * the requested flavor.
+ *
+ * If args->auth_flavors[0] no longer holds RPC_AUTH_MAXFLAVOR (the
+ * value planted by nfs_alloc_parsed_mount_data()), it is left as is.
+ * Otherwise the server's list is scanned in order and the first entry
+ * that is AUTH_UNIX, or for which rpcauth_get_gssinfo() returns 0, is
+ * chosen; AUTH_NULL entries are skipped.  AUTH_UNIX is the fallback
+ * when the MNT version is not NFS_MNT3_VERSION, when the list is
+ * empty, or when no entry qualifies.  The resulting flavor is logged
+ * with dfprintk() in every case.
  */
-static int nfs_walk_authlist(struct nfs_parsed_mount_data *args,
+static void nfs_select_flavor(struct nfs_parsed_mount_data *args,
-                             struct nfs_mount_request *request)
+                              struct nfs_mount_request *request)
 {
-        unsigned int i, j, server_authlist_len = *(request->auth_flav_len);
+        unsigned int i, count = *(request->auth_flav_len);
+        rpc_authflavor_t flavor;
+        if (args->auth_flavors[0] != RPC_AUTH_MAXFLAVOR)
+                goto out;
+        /*
+         * The NFSv2 MNT operation does not return a flavor list.
+         */
+        if (args->mount_server.version != NFS_MNT3_VERSION)
+                goto out_default;
         /*
          * Certain releases of Linux's mountd return an empty
-         * flavor list.  To prevent behavioral regression with
+         * flavor list in some cases.
-         * these servers (ie. rejecting mounts that used to
-         * succeed), revert to pre-2.6.32 behavior (no checking)
-         * if the returned flavor list is empty.
          */
-        if (server_authlist_len == 0)
+        if (count == 0)
-                return 0;
+                goto out_default;
         /*
-         * We avoid sophisticated negotiating here, as there are
-         * plenty of cases where we can get it wrong, providing
-         * either too little or too much security.
-         *
          * RFC 2623, section 2.7 suggests we SHOULD prefer the
          * flavor listed first.  However, some servers list
-         * AUTH_NULL first.  Our caller plants AUTH_SYS, the
+         * AUTH_NULL first.  Avoid ever choosing AUTH_NULL.
-         * preferred default, in args->auth_flavors[0] if user
-         * didn't specify sec= mount option.
          */
-        for (i = 0; i < args->auth_flavor_len; i++)
+        for (i = 0; i < count; i++) {
-                for (j = 0; j < server_authlist_len; j++)
+                struct rpcsec_gss_info info;
-                        if (args->auth_flavors[i] == request->auth_flavs[j]) {
-                                dfprintk(MOUNT, "NFS: using auth flavor %d\n",
+                flavor = request->auth_flavs[i];
-                                        request->auth_flavs[j]);
+                switch (flavor) {
-                                args->auth_flavors[0] = request->auth_flavs[j];
+                case RPC_AUTH_UNIX:
-                                return 0;
+                        goto out_set;
-                        }
+                case RPC_AUTH_NULL:
+                        continue;
+                default:
+                        if (rpcauth_get_gssinfo(flavor, &info) == 0)
+                                goto out_set;
+                }
+        }
-        dfprintk(MOUNT, "NFS: server does not support requested auth flavor\n");
+out_default:
-        nfs_umount(request);
+        flavor = RPC_AUTH_UNIX;
-        return -EACCES;
+out_set:
+        args->auth_flavors[0] = flavor;
+out:
+        dfprintk(MOUNT, "NFS: using auth flavor %d\n", args->auth_flavors[0]);
 }
 /*
@@ -1713,12 +1721,8 @@ static int nfs_request_mount(struct nfs_parsed_mount_data *args,
                return status;
        }
-        /*
+        nfs_select_flavor(args, &request);
-         * MNTv1 (NFSv2) does not support auth flavor negotiation.
+        return 0;
-         */
-        if (args->mount_server.version != NFS_MNT3_VERSION)
-                return 0;
-        return nfs_walk_authlist(args, &request);
 }
 struct dentry *nfs_try_mount(int flags, const char *dev_name,
@@ -2381,10 +2385,9 @@ int nfs_clone_sb_security(struct super_block *s, struct dentry *mntroot,
                          struct nfs_mount_info *mount_info)
 {
        /* clone any lsm security options from the parent to the new sb */
-        security_sb_clone_mnt_opts(mount_info->cloned->sb, s);
        if (mntroot->d_inode->i_op != NFS_SB(s)->nfs_client->rpc_ops->dir_inode_ops)
                return -ESTALE;
-        return 0;
+        return security_sb_clone_mnt_opts(mount_info->cloned->sb, s);
 }
 EXPORT_SYMBOL_GPL(nfs_clone_sb_security);
diff --git a/fs/nfs/write.c b/fs/nfs/write.c
index c483cc50b82e..a2c7c28049d5 100644
--- a/fs/nfs/write.c
+++ b/fs/nfs/write.c
@@ -1251,6 +1251,8 @@ void nfs_write_prepare(struct rpc_task *task, void *calldata)
 {
        struct nfs_write_data *data = calldata;
        NFS_PROTO(data->header->inode)->write_rpc_prepare(task, data);
+        if (unlikely(test_bit(NFS_CONTEXT_BAD, &data->args.context->flags)))
+                rpc_exit(task, -EIO);
 }
 void nfs_commit_prepare(struct rpc_task *task, void *calldata)
diff --git a/fs/nfsd/nfs4state.c b/fs/nfsd/nfs4state.c
index 2e27430b9070..417c84877742 100644
--- a/fs/nfsd/nfs4state.c
+++ b/fs/nfsd/nfs4state.c
@@ -234,7 +234,6 @@ static struct nfs4_stid *nfs4_alloc_stid(struct nfs4_client *cl, struct
 kmem_cache *slab)
 {
        struct idr *stateids = &cl->cl_stateids;
-        static int min_stateid = 0;
        struct nfs4_stid *stid;
        int new_id;
@@ -242,7 +241,7 @@ kmem_cache *slab)
        if (!stid)
                return NULL;
-        new_id = idr_alloc(stateids, stid, min_stateid, 0, GFP_KERNEL);
+        new_id = idr_alloc_cyclic(stateids, stid, 0, 0, GFP_KERNEL);
        if (new_id < 0)
                goto out_free;
        stid->sc_client = cl;
@@ -261,10 +260,6 @@ kmem_cache *slab)
         * amount of time until an id is reused, by ensuring they always
         * "increase" (mod INT_MAX):
         */
-        min_stateid = new_id+1;
-        if (min_stateid == INT_MAX)
-                min_stateid = 0;
        return stid;
 out_free:
        kfree(stid);
diff --git a/fs/nfsd/nfs4xdr.c b/fs/nfsd/nfs4xdr.c
index 01168865dd37..2502951714b1 100644
--- a/fs/nfsd/nfs4xdr.c
+++ b/fs/nfsd/nfs4xdr.c
@@ -264,7 +264,7 @@ nfsd4_decode_fattr(struct nfsd4_compoundargs *argp, u32 *bmval,
                iattr->ia_valid |= ATTR_SIZE;
        }
        if (bmval[0] & FATTR4_WORD0_ACL) {
-                int nace;
+                u32 nace;
                struct nfs4_ace *ace;
                READ_BUF(4); len += 4;
@@ -3138,10 +3138,9 @@ nfsd4_encode_rename(struct nfsd4_compoundres *resp, __be32 nfserr, struct nfsd4_
 static __be32
 nfsd4_do_encode_secinfo(struct nfsd4_compoundres *resp,
-                         __be32 nfserr,struct svc_export *exp)
+                         __be32 nfserr, struct svc_export *exp)
 {
-        int i = 0;
+        u32 i, nflavs;
-        u32 nflavs;
        struct exp_flavor_info *flavs;
        struct exp_flavor_info def_flavs[2];
        __be32 *p;
@@ -3172,30 +3171,29 @@ nfsd4_do_encode_secinfo(struct nfsd4_compoundres *resp,
        WRITE32(nflavs);
        ADJUST_ARGS();
        for (i = 0; i < nflavs; i++) {
-                u32 flav = flavs[i].pseudoflavor;
+                struct rpcsec_gss_info info;
-                struct gss_api_mech *gm = gss_mech_get_by_pseudoflavor(flav);
-                if (gm) {
+                if (rpcauth_get_gssinfo(flavs[i].pseudoflavor, &info) == 0) {
                        RESERVE_SPACE(4);
                        WRITE32(RPC_AUTH_GSS);
                        ADJUST_ARGS();
-                        RESERVE_SPACE(4 + gm->gm_oid.len);
+                        RESERVE_SPACE(4 + info.oid.len);
-                        WRITE32(gm->gm_oid.len);
+                        WRITE32(info.oid.len);
-                        WRITEMEM(gm->gm_oid.data, gm->gm_oid.len);
+                        WRITEMEM(info.oid.data, info.oid.len);
                        ADJUST_ARGS();
                        RESERVE_SPACE(4);
-                        WRITE32(0); /* qop */
+                        WRITE32(info.qop);
                        ADJUST_ARGS();
                        RESERVE_SPACE(4);
-                        WRITE32(gss_pseudoflavor_to_service(gm, flav));
+                        WRITE32(info.service);
                        ADJUST_ARGS();
-                        gss_mech_put(gm);
                } else {
                        RESERVE_SPACE(4);
-                        WRITE32(flav);
+                        WRITE32(flavs[i].pseudoflavor);
                        ADJUST_ARGS();
                }
        }
 out:
        if (exp)
                exp_put(exp);
diff --git a/fs/nilfs2/inode.c b/fs/nilfs2/inode.c
index 6b49f14eac8c..cf02f5530713 100644
--- a/fs/nilfs2/inode.c
+++ b/fs/nilfs2/inode.c
@@ -175,6 +175,11 @@ static int nilfs_writepages(struct address_space *mapping,
        struct inode *inode = mapping->host;
        int err = 0;
+        if (inode->i_sb->s_flags & MS_RDONLY) {
+                nilfs_clear_dirty_pages(mapping, false);
+                return -EROFS;
+        }
        if (wbc->sync_mode == WB_SYNC_ALL)
                err = nilfs_construct_dsync_segment(inode->i_sb, inode,
                                                    wbc->range_start,
@@ -187,6 +192,18 @@ static int nilfs_writepage(struct page *page, struct writeback_control *wbc)
        struct inode *inode = page->mapping->host;
        int err;
+        if (inode->i_sb->s_flags & MS_RDONLY) {
+                /*
+                 * It means that filesystem was remounted in read-only
+                 * mode because of error or metadata corruption. But we
+                 * have dirty pages that try to be flushed in background.
+                 * So, here we simply discard this dirty page.
+                 */
+                nilfs_clear_dirty_page(page, false);
+                unlock_page(page);
+                return -EROFS;
+        }
        redirty_page_for_writepage(wbc, page);
        unlock_page(page);
diff --git a/fs/nilfs2/mdt.c b/fs/nilfs2/mdt.c
index f9897d09c693..c4dcd1db57ee 100644
--- a/fs/nilfs2/mdt.c
+++ b/fs/nilfs2/mdt.c
@@ -375,14 +375,25 @@ int nilfs_mdt_fetch_dirty(struct inode *inode)
 static int
 nilfs_mdt_write_page(struct page *page, struct writeback_control *wbc)
 {
-        struct inode *inode;
+        struct inode *inode = page->mapping->host;
        struct super_block *sb;
        int err = 0;
+        if (inode && (inode->i_sb->s_flags & MS_RDONLY)) {
+                /*
+                 * It means that filesystem was remounted in read-only
+                 * mode because of error or metadata corruption. But we
+                 * have dirty pages that try to be flushed in background.
+                 * So, here we simply discard this dirty page.
+                 */
+                nilfs_clear_dirty_page(page, false);
+                unlock_page(page);
+                return -EROFS;
+        }
        redirty_page_for_writepage(wbc, page);
        unlock_page(page);
-        inode = page->mapping->host;
        if (!inode)
                return 0;
@@ -561,10 +572,10 @@ void nilfs_mdt_restore_from_shadow_map(struct inode *inode)
        if (mi->mi_palloc_cache)
                nilfs_palloc_clear_cache(inode);
-        nilfs_clear_dirty_pages(inode->i_mapping);
+        nilfs_clear_dirty_pages(inode->i_mapping, true);
        nilfs_copy_back_pages(inode->i_mapping, &shadow->frozen_data);
-        nilfs_clear_dirty_pages(&ii->i_btnode_cache);
+        nilfs_clear_dirty_pages(&ii->i_btnode_cache, true);
        nilfs_copy_back_pages(&ii->i_btnode_cache, &shadow->frozen_btnodes);
        nilfs_bmap_restore(ii->i_bmap, &shadow->bmap_store);
diff --git a/fs/nilfs2/page.c b/fs/nilfs2/page.c
index 07f76db04ec7..0ba679866e50 100644
--- a/fs/nilfs2/page.c
+++ b/fs/nilfs2/page.c
@@ -370,7 +370,12 @@ repeat:
        goto repeat;
 }
-void nilfs_clear_dirty_pages(struct address_space *mapping)
+/**
+ * nilfs_clear_dirty_pages - discard dirty pages in address space
+ * @mapping: address space with dirty pages for discarding
+ * @silent: suppress [true] or print [false] warning messages
+ */
+void nilfs_clear_dirty_pages(struct address_space *mapping, bool silent)
 {
        struct pagevec pvec;
        unsigned int i;
@@ -382,25 +387,9 @@ void nilfs_clear_dirty_pages(struct address_space *mapping)
                                  PAGEVEC_SIZE)) {
                for (i = 0; i < pagevec_count(&pvec); i++) {
                        struct page *page = pvec.pages[i];
-                        struct buffer_head *bh, *head;
                        lock_page(page);
-                        ClearPageUptodate(page);
+                        nilfs_clear_dirty_page(page, silent);
-                        ClearPageMappedToDisk(page);
-                        bh = head = page_buffers(page);
-                        do {
-                                lock_buffer(bh);
-                                clear_buffer_dirty(bh);
-                                clear_buffer_nilfs_volatile(bh);
-                                clear_buffer_nilfs_checked(bh);
-                                clear_buffer_nilfs_redirected(bh);
-                                clear_buffer_uptodate(bh);
-                                clear_buffer_mapped(bh);
-                                unlock_buffer(bh);
-                                bh = bh->b_this_page;
-                        } while (bh != head);
-                        __nilfs_clear_page_dirty(page);
                        unlock_page(page);
                }
                pagevec_release(&pvec);
@@ -408,6 +397,51 @@ void nilfs_clear_dirty_pages(struct address_space *mapping)
        }
 }
+/**
+ * nilfs_clear_dirty_page - discard dirty page
+ * @page: dirty page that will be discarded
+ * @silent: suppress [true] or print [false] warning messages
+ *
+ * The caller must hold the page lock (checked with BUG_ON); the page is
+ * not unlocked here.  page->mapping->host is dereferenced without a NULL
+ * check, so the page's mapping must have a host inode.
+ *
+ * Clears the page's uptodate and mapped-to-disk flags.  If the page has
+ * buffers, each buffer is locked in turn and has its dirty,
+ * nilfs_volatile, nilfs_checked, nilfs_redirected, uptodate and mapped
+ * flags cleared.  Finally __nilfs_clear_page_dirty() is called on the
+ * page.  Unless @silent is set, one warning is printed for the page and
+ * one for every buffer discarded.
+ */
+void nilfs_clear_dirty_page(struct page *page, bool silent)
+{
+        struct inode *inode = page->mapping->host;
+        struct super_block *sb = inode->i_sb;
+        BUG_ON(!PageLocked(page));
+        if (!silent) {
+                nilfs_warning(sb, __func__,
+                                "discard page: offset %lld, ino %lu",
+                                page_offset(page), inode->i_ino);
+        }
+        ClearPageUptodate(page);
+        ClearPageMappedToDisk(page);
+        if (page_has_buffers(page)) {
+                struct buffer_head *bh, *head;
+                bh = head = page_buffers(page);
+                do {
+                        lock_buffer(bh);
+                        if (!silent) {
+                                nilfs_warning(sb, __func__,
+                                        "discard block %llu, size %zu",
+                                        (u64)bh->b_blocknr, bh->b_size);
+                        }
+                        clear_buffer_dirty(bh);
+                        clear_buffer_nilfs_volatile(bh);
+                        clear_buffer_nilfs_checked(bh);
+                        clear_buffer_nilfs_redirected(bh);
+                        clear_buffer_uptodate(bh);
+                        clear_buffer_mapped(bh);
+                        unlock_buffer(bh);
+                } while (bh = bh->b_this_page, bh != head);
+        }
+        __nilfs_clear_page_dirty(page);
+}
 unsigned nilfs_page_count_clean_buffers(struct page *page,
                                        unsigned from, unsigned to)
 {
diff --git a/fs/nilfs2/page.h b/fs/nilfs2/page.h
index fb7de71605a0..ef30c5c2426f 100644
--- a/fs/nilfs2/page.h
+++ b/fs/nilfs2/page.h
@@ -55,7 +55,8 @@ void nilfs_page_bug(struct page *);
 int nilfs_copy_dirty_pages(struct address_space *, struct address_space *);
 void nilfs_copy_back_pages(struct address_space *, struct address_space *);
-void nilfs_clear_dirty_pages(struct address_space *);
+void nilfs_clear_dirty_page(struct page *, bool);
+void nilfs_clear_dirty_pages(struct address_space *, bool);
 void nilfs_mapping_init(struct address_space *mapping, struct inode *inode,
                        struct backing_dev_info *bdi);
 unsigned nilfs_page_count_clean_buffers(struct page *, unsigned, unsigned);
diff --git a/fs/notify/fanotify/fanotify_user.c b/fs/notify/fanotify/fanotify_user.c
index 5d8444268a16..d0be29fa94cf 100644
--- a/fs/notify/fanotify/fanotify_user.c
+++ b/fs/notify/fanotify/fanotify_user.c
@@ -755,9 +755,9 @@ out_destroy_group:
        return fd;
 }
-SYSCALL_DEFINE(fanotify_mark)(int fanotify_fd, unsigned int flags,
+SYSCALL_DEFINE5(fanotify_mark, int, fanotify_fd, unsigned int, flags,
-                              __u64 mask, int dfd,
+                              __u64, mask, int, dfd,
-                              const char  __user * pathname)
+                              const char  __user *, pathname)
 {
        struct inode *inode = NULL;
        struct vfsmount *mnt = NULL;
@@ -857,17 +857,6 @@ fput_and_out:
        return ret;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_fanotify_mark(long fanotify_fd, long flags, __u64 mask,
-                                  long dfd, long pathname)
-{
-        return SYSC_fanotify_mark((int) fanotify_fd, (unsigned int) flags,
-                                  mask, (int) dfd,
-                                  (const char  __user *) pathname);
-}
-SYSCALL_ALIAS(sys_fanotify_mark, SyS_fanotify_mark);
-#endif
 /*
 * fanotify_user_setup - Our initialization function.  Note that we cannot return
 * error because we have compiled-in VFS hooks.  So an (unlikely) failure here
diff --git a/fs/notify/inotify/inotify_user.c b/fs/notify/inotify/inotify_user.c
index e0f7c1241a6a..c616a70e8cf9 100644
--- a/fs/notify/inotify/inotify_user.c
+++ b/fs/notify/inotify/inotify_user.c
@@ -359,7 +359,6 @@ static int inotify_find_inode(const char __user *dirname, struct path *path, uns
 }
 static int inotify_add_to_idr(struct idr *idr, spinlock_t *idr_lock,
-                              int *last_wd,
                              struct inotify_inode_mark *i_mark)
 {
        int ret;
@@ -367,11 +366,10 @@ static int inotify_add_to_idr(struct idr *idr, spinlock_t *idr_lock,
        idr_preload(GFP_KERNEL);
        spin_lock(idr_lock);
-        ret = idr_alloc(idr, i_mark, *last_wd + 1, 0, GFP_NOWAIT);
+        ret = idr_alloc_cyclic(idr, i_mark, 1, 0, GFP_NOWAIT);
        if (ret >= 0) {
                /* we added the mark to the idr, take a reference */
                i_mark->wd = ret;
-                *last_wd = i_mark->wd;
                fsnotify_get_mark(&i_mark->fsn_mark);
        }
@@ -572,7 +570,6 @@ static int inotify_update_existing_watch(struct fsnotify_group *group,
        int add = (arg & IN_MASK_ADD);
        int ret;
-        /* don't allow invalid bits: we don't want flags set */
        mask = inotify_arg_to_mask(arg);
        fsn_mark = fsnotify_find_inode_mark(group, inode);
@@ -623,7 +620,6 @@ static int inotify_new_watch(struct fsnotify_group *group,
        struct idr *idr = &group->inotify_data.idr;
        spinlock_t *idr_lock = &group->inotify_data.idr_lock;
-        /* don't allow invalid bits: we don't want flags set */
        mask = inotify_arg_to_mask(arg);
        tmp_i_mark = kmem_cache_alloc(inotify_inode_mark_cachep, GFP_KERNEL);
@@ -638,8 +634,7 @@ static int inotify_new_watch(struct fsnotify_group *group,
        if (atomic_read(&group->inotify_data.user->inotify_watches) >= inotify_max_user_watches)
                goto out_err;
-        ret = inotify_add_to_idr(idr, idr_lock, &group->inotify_data.last_wd,
+        ret = inotify_add_to_idr(idr, idr_lock, tmp_i_mark);
-                                 tmp_i_mark);
        if (ret)
                goto out_err;
@@ -697,7 +692,6 @@ static struct fsnotify_group *inotify_new_group(unsigned int max_events)
        spin_lock_init(&group->inotify_data.idr_lock);
        idr_init(&group->inotify_data.idr);
-        group->inotify_data.last_wd = 0;
        group->inotify_data.user = get_current_user();
        if (atomic_inc_return(&group->inotify_data.user->inotify_devs) >
@@ -751,6 +745,10 @@ SYSCALL_DEFINE3(inotify_add_watch, int, fd, const char __user *, pathname,
        int ret;
        unsigned flags = 0;
+        /* don't allow invalid bits: we don't want flags set */
+        if (unlikely(!(mask & ALL_INOTIFY_BITS)))
+                return -EINVAL;
        f = fdget(fd);
        if (unlikely(!f.file))
                return -EBADF;
diff --git a/fs/ocfs2/dlm/dlmrecovery.c b/fs/ocfs2/dlm/dlmrecovery.c
index eeac97bb3bfa..b3fdd1a323d6 100644
--- a/fs/ocfs2/dlm/dlmrecovery.c
+++ b/fs/ocfs2/dlm/dlmrecovery.c
@@ -1498,10 +1498,8 @@ leave:
        dlm_put(dlm);
        if (ret < 0) {
-                if (buf)
+                kfree(buf);
-                        kfree(buf);
+                kfree(item);
-                if (item)
-                        kfree(item);
                mlog_errno(ret);
        }
diff --git a/fs/ocfs2/ioctl.c b/fs/ocfs2/ioctl.c
index 752f0b26221d..0c60ef2d8056 100644
--- a/fs/ocfs2/ioctl.c
+++ b/fs/ocfs2/ioctl.c
@@ -101,13 +101,6 @@ static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
        if (!S_ISDIR(inode->i_mode))
                flags &= ~OCFS2_DIRSYNC_FL;
-        handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
-        if (IS_ERR(handle)) {
-                status = PTR_ERR(handle);
-                mlog_errno(status);
-                goto bail_unlock;
-        }
        oldflags = ocfs2_inode->ip_attr;
        flags = flags & mask;
        flags |= oldflags & ~mask;
@@ -120,7 +113,14 @@ static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
        if ((oldflags & OCFS2_IMMUTABLE_FL) || ((flags ^ oldflags) &
                (OCFS2_APPEND_FL | OCFS2_IMMUTABLE_FL))) {
                if (!capable(CAP_LINUX_IMMUTABLE))
-                        goto bail_commit;
+                        goto bail_unlock;
+        }
+        handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
+        if (IS_ERR(handle)) {
+                status = PTR_ERR(handle);
+                mlog_errno(status);
+                goto bail_unlock;
        }
        ocfs2_inode->ip_attr = flags;
@@ -130,8 +130,8 @@ static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
        if (status < 0)
                mlog_errno(status);
-bail_commit:
        ocfs2_commit_trans(osb, handle);
 bail_unlock:
        ocfs2_inode_unlock(inode, 1);
 bail:
@@ -706,8 +706,10 @@ int ocfs2_info_handle_freefrag(struct inode *inode,
        o2info_set_request_filled(&oiff->iff_req);
-        if (o2info_to_user(*oiff, req))
+        if (o2info_to_user(*oiff, req)) {
+                status = -EFAULT;
                goto bail;
+        }
        status = 0;
 bail:
diff --git a/fs/ocfs2/move_extents.c b/fs/ocfs2/move_extents.c
index 9f8dcadd9a50..f1fc172175b6 100644
--- a/fs/ocfs2/move_extents.c
+++ b/fs/ocfs2/move_extents.c
@@ -471,7 +471,7 @@ static int ocfs2_validate_and_adjust_move_goal(struct inode *inode,
        int ret, goal_bit = 0;
        struct buffer_head *gd_bh = NULL;
-        struct ocfs2_group_desc *bg = NULL;
+        struct ocfs2_group_desc *bg;
        struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
        int c_to_b = 1 << (osb->s_clustersize_bits -
                                        inode->i_sb->s_blocksize_bits);
@@ -482,13 +482,6 @@ static int ocfs2_validate_and_adjust_move_goal(struct inode *inode,
        range->me_goal = ocfs2_block_to_cluster_start(inode->i_sb,
                                                      range->me_goal);
        /*
-         * moving goal is not allowd to start with a group desc blok(#0 blk)
-         * let's compromise to the latter cluster.
-         */
-        if (range->me_goal == le64_to_cpu(bg->bg_blkno))
-                range->me_goal += c_to_b;
-        /*
         * validate goal sits within global_bitmap, and return the victim
         * group desc
         */
@@ -502,6 +495,13 @@ static int ocfs2_validate_and_adjust_move_goal(struct inode *inode,
        bg = (struct ocfs2_group_desc *)gd_bh->b_data;
        /*
+         * moving goal is not allowed to start with a group desc block (#0 blk)
+         * let's compromise to the latter cluster.
+         */
+        if (range->me_goal == le64_to_cpu(bg->bg_blkno))
+                range->me_goal += c_to_b;
+        /*
         * movement is not gonna cross two groups.
         */
        if ((le16_to_cpu(bg->bg_bits) - goal_bit) * osb->s_clustersize <
@@ -1057,42 +1057,40 @@ int ocfs2_ioctl_move_extents(struct file *filp, void __user *argp)
        struct inode *inode = file_inode(filp);
        struct ocfs2_move_extents range;
-        struct ocfs2_move_extents_context *context = NULL;
+        struct ocfs2_move_extents_context *context;
+        if (!argp)
+                return -EINVAL;
        status = mnt_want_write_file(filp);
        if (status)
                return status;
        if ((!S_ISREG(inode->i_mode)) || !(filp->f_mode & FMODE_WRITE))
-                goto out;
+                goto out_drop;
        if (inode->i_flags & (S_IMMUTABLE|S_APPEND)) {
                status = -EPERM;
-                goto out;
+                goto out_drop;
        }
        context = kzalloc(sizeof(struct ocfs2_move_extents_context), GFP_NOFS);
        if (!context) {
                status = -ENOMEM;
                mlog_errno(status);
-                goto out;
+                goto out_drop;
        }
        context->inode = inode;
        context->file = filp;
-        if (argp) {
+        if (copy_from_user(&range, argp, sizeof(range))) {
-                if (copy_from_user(&range, argp, sizeof(range))) {
+                status = -EFAULT;
-                        status = -EFAULT;
+                goto out_free;
-                        goto out;
-                }
-        } else {
-                status = -EINVAL;
-                goto out;
        }
        if (range.me_start > i_size_read(inode))
-                goto out;
+                goto out_free;
        if (range.me_start + range.me_len > i_size_read(inode))
                        range.me_len = i_size_read(inode) - range.me_start;
@@ -1124,25 +1122,24 @@ int ocfs2_ioctl_move_extents(struct file *filp, void __user *argp)
                status = ocfs2_validate_and_adjust_move_goal(inode, &range);
                if (status)
-                        goto out;
+                        goto out_copy;
        }
        status = ocfs2_move_extents(context);
        if (status)
                mlog_errno(status);
-out:
+out_copy:
        /*
         * movement/defragmentation may end up being partially completed,
         * that's the reason why we need to return userspace the finished
         * length and new_offset even if failure happens somewhere.
         */
-        if (argp) {
+        if (copy_to_user(argp, &range, sizeof(range)))
-                if (copy_to_user(argp, &range, sizeof(range)))
+                status = -EFAULT;
-                        status = -EFAULT;
-        }
+out_free:
        kfree(context);
+out_drop:
        mnt_drop_write_file(filp);
        return status;
diff --git a/fs/open.c b/fs/open.c
index 68354466879f..8c741002f947 100644
--- a/fs/open.c
+++ b/fs/open.c
@@ -197,10 +197,7 @@ out:
 SYSCALL_DEFINE2(ftruncate, unsigned int, fd, unsigned long, length)
 {
-        long ret = do_sys_ftruncate(fd, length, 1);
+        return do_sys_ftruncate(fd, length, 1);
-        /* avoid REGPARM breakage on x86: */
-        asmlinkage_protect(2, ret, fd, length);
-        return ret;
 }
 #ifdef CONFIG_COMPAT
@@ -212,32 +209,15 @@ COMPAT_SYSCALL_DEFINE2(ftruncate, unsigned int, fd, compat_ulong_t, length)
 /* LFS versions of truncate are only needed on 32 bit machines */
 #if BITS_PER_LONG == 32
-SYSCALL_DEFINE(truncate64)(const char __user * path, loff_t length)
+SYSCALL_DEFINE2(truncate64, const char __user *, path, loff_t, length)
 {
        return do_sys_truncate(path, length);
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_truncate64(long path, loff_t length)
-{
-        return SYSC_truncate64((const char __user *) path, length);
-}
-SYSCALL_ALIAS(sys_truncate64, SyS_truncate64);
-#endif
-SYSCALL_DEFINE(ftruncate64)(unsigned int fd, loff_t length)
+SYSCALL_DEFINE2(ftruncate64, unsigned int, fd, loff_t, length)
 {
-        long ret = do_sys_ftruncate(fd, length, 0);
+        return do_sys_ftruncate(fd, length, 0);
-        /* avoid REGPARM breakage on x86: */
-        asmlinkage_protect(2, ret, fd, length);
-        return ret;
-}
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_ftruncate64(long fd, loff_t length)
-{
-        return SYSC_ftruncate64((unsigned int) fd, length);
 }
-SYSCALL_ALIAS(sys_ftruncate64, SyS_ftruncate64);
-#endif
 #endif /* BITS_PER_LONG == 32 */
@@ -299,7 +279,7 @@ int do_fallocate(struct file *file, int mode, loff_t offset, loff_t len)
        return ret;
 }
-SYSCALL_DEFINE(fallocate)(int fd, int mode, loff_t offset, loff_t len)
+SYSCALL_DEFINE4(fallocate, int, fd, int, mode, loff_t, offset, loff_t, len)
 {
        struct fd f = fdget(fd);
        int error = -EBADF;
@@ -311,14 +291,6 @@ SYSCALL_DEFINE(fallocate)(int fd, int mode, loff_t offset, loff_t len)
        return error;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_fallocate(long fd, long mode, loff_t offset, loff_t len)
-{
-        return SYSC_fallocate((int)fd, (int)mode, offset, len);
-}
-SYSCALL_ALIAS(sys_fallocate, SyS_fallocate);
-#endif
 /*
 * access() needs to use the real uid/gid, not the effective uid/gid.
 * We do this by temporarily clearing all FS-related capabilities and
@@ -983,29 +955,19 @@ long do_sys_open(int dfd, const char __user *filename, int flags, umode_t mode)
 SYSCALL_DEFINE3(open, const char __user *, filename, int, flags, umode_t, mode)
 {
-        long ret;
        if (force_o_largefile())
                flags |= O_LARGEFILE;
-        ret = do_sys_open(AT_FDCWD, filename, flags, mode);
+        return do_sys_open(AT_FDCWD, filename, flags, mode);
-        /* avoid REGPARM breakage on x86: */
-        asmlinkage_protect(3, ret, filename, flags, mode);
-        return ret;
 }
 SYSCALL_DEFINE4(openat, int, dfd, const char __user *, filename, int, flags,
                umode_t, mode)
 {
-        long ret;
        if (force_o_largefile())
                flags |= O_LARGEFILE;
-        ret = do_sys_open(dfd, filename, flags, mode);
+        return do_sys_open(dfd, filename, flags, mode);
-        /* avoid REGPARM breakage on x86: */
-        asmlinkage_protect(4, ret, dfd, filename, flags, mode);
-        return ret;
 }
 #ifndef __alpha__
diff --git a/fs/proc/Makefile b/fs/proc/Makefile
index 712f24db9600..ab30716584f5 100644
--- a/fs/proc/Makefile
+++ b/fs/proc/Makefile
@@ -5,7 +5,7 @@
 obj-y   += proc.o
 proc-y                  := nommu.o task_nommu.o
-proc-$(CONFIG_MMU)      := mmu.o task_mmu.o
+proc-$(CONFIG_MMU)      := task_mmu.o
 proc-y       += inode.o root.o base.o generic.o array.o \
                fd.o
diff --git a/fs/proc/array.c b/fs/proc/array.c
index f7ed9ee46eb9..cbd0f1b324b9 100644
--- a/fs/proc/array.c
+++ b/fs/proc/array.c
@@ -143,6 +143,7 @@ static const char * const task_state_array[] = {
        "x (dead)",             /*  64 */
        "K (wakekill)",         /* 128 */
        "W (waking)",           /* 256 */
+        "P (parked)",           /* 512 */
 };
 static inline const char *get_task_state(struct task_struct *tsk)
diff --git a/fs/proc/base.c b/fs/proc/base.c
index 69078c7cef1f..3861bcec41ff 100644
--- a/fs/proc/base.c
+++ b/fs/proc/base.c
@@ -86,6 +86,7 @@
 #include <linux/fs_struct.h>
 #include <linux/slab.h>
 #include <linux/flex_array.h>
+#include <linux/posix-timers.h>
 #ifdef CONFIG_HARDWALL
 #include <asm/hardwall.h>
 #endif
@@ -1347,11 +1348,10 @@ static ssize_t comm_write(struct file *file, const char __user *buf,
        struct inode *inode = file_inode(file);
        struct task_struct *p;
        char buffer[TASK_COMM_LEN];
+        const size_t maxlen = sizeof(buffer) - 1;
        memset(buffer, 0, sizeof(buffer));
-        if (count > sizeof(buffer) - 1)
+        if (copy_from_user(buffer, buf, count > maxlen ? maxlen : count))
-                count = sizeof(buffer) - 1;
-        if (copy_from_user(buffer, buf, count))
                return -EFAULT;
        p = get_proc_task(inode);
@@ -2013,6 +2013,102 @@ static const struct file_operations proc_map_files_operations = {
        .llseek         = default_llseek,
 };
+/*
+ * Per-open iteration state for the /proc/<pid>/timers seq_file.
+ * Allocated by proc_timers_open(); ->task and ->sighand are filled in by
+ * timers_start() and cleared again by timers_stop().
+ */
+struct timers_private {
+        struct pid *pid;        /* set from proc_pid(inode) at open time */
+        struct task_struct *task;       /* reference obtained in timers_start() */
+        struct sighand_struct *sighand; /* result of lock_task_sighand(); NULL when not locked */
+        struct pid_namespace *ns;       /* inode->i_sb->s_fs_info; used by show_timer() for pid_nr_ns() */
+        unsigned long flags;    /* flags word passed to lock/unlock_task_sighand() */
+};
+/*
+ * seq_file ->start(): grab the target task, lock its sighand and position
+ * the iterator at *pos within task->signal->posix_timers.
+ *
+ * Returns ERR_PTR(-ESRCH) when get_pid_task() or lock_task_sighand() fails;
+ * timers_stop() undoes whatever was acquired here.
+ */
+static void *timers_start(struct seq_file *m, loff_t *pos)
+{
+        struct timers_private *priv = m->private;
+        struct task_struct *task;
+        task = get_pid_task(priv->pid, PIDTYPE_PID);
+        priv->task = task;
+        if (task == NULL)
+                return ERR_PTR(-ESRCH);
+        priv->sighand = lock_task_sighand(task, &priv->flags);
+        if (priv->sighand == NULL)
+                return ERR_PTR(-ESRCH);
+        return seq_list_start(&task->signal->posix_timers, *pos);
+}
+/* seq_file ->next(): advance to the following entry of the task's posix_timers list. */
+static void *timers_next(struct seq_file *m, void *v, loff_t *pos)
+{
+        struct timers_private *priv = m->private;
+        struct list_head *timers = &priv->task->signal->posix_timers;
+        return seq_list_next(v, timers, pos);
+}
+/*
+ * seq_file ->stop(): release what timers_start() acquired.  The sighand lock
+ * is dropped first, then the task reference; both fields are reset to NULL so
+ * a partially failed start is handled as well.
+ */
+static void timers_stop(struct seq_file *m, void *v)
+{
+        struct timers_private *priv = m->private;
+        struct task_struct *task = priv->task;
+        if (priv->sighand != NULL) {
+                unlock_task_sighand(task, &priv->flags);
+                priv->sighand = NULL;
+        }
+        if (task == NULL)
+                return;
+        put_task_struct(task);
+        priv->task = NULL;
+}
+/*
+ * seq_file ->show(): print one POSIX timer.
+ *
+ * @v is the list_head returned by timers_start()/timers_next(); it is the
+ * ->list member of a struct k_itimer.  Three lines are emitted per timer:
+ * its ID, the signal number and sigval pointer of its queued signal, and the
+ * notification method followed by the number of timer->it_pid in tp->ns.
+ *
+ * Always returns 0.
+ */
+static int show_timer(struct seq_file *m, void *v)
+{
+        struct k_itimer *timer;
+        struct timers_private *tp = m->private;
+        int notify;
+        /* Lookup table is never written: keep pointers and strings const. */
+        static const char * const nstr[] = {
+                [SIGEV_SIGNAL] = "signal",
+                [SIGEV_NONE] = "none",
+                [SIGEV_THREAD] = "thread",
+        };
+        timer = list_entry((struct list_head *)v, struct k_itimer, list);
+        notify = timer->it_sigev_notify;
+        seq_printf(m, "ID: %d\n", timer->it_id);
+        seq_printf(m, "signal: %d/%p\n", timer->sigq->info.si_signo,
+                        timer->sigq->info.si_value.sival_ptr);
+        /* SIGEV_THREAD_ID is reported separately, so mask it off before indexing nstr[]. */
+        seq_printf(m, "notify: %s/%s.%d\n",
+                nstr[notify & ~SIGEV_THREAD_ID],
+                (notify & SIGEV_THREAD_ID) ? "tid" : "pid",
+                pid_nr_ns(timer->it_pid, tp->ns));
+        return 0;
+}
+/* seq_file iterator used by proc_timers_open() to walk a task's POSIX timers. */
+static const struct seq_operations proc_timers_seq_ops = {
+        .show   = show_timer,
+        .start  = timers_start,
+        .stop   = timers_stop,
+        .next   = timers_next,
+};
+/*
+ * ->open() for the "timers" file: allocate the seq_file private state and
+ * record the pid and pid namespace the iterator will work with.
+ * Returns 0, or -ENOMEM when __seq_open_private() fails.
+ */
+static int proc_timers_open(struct inode *inode, struct file *file)
+{
+        struct timers_private *priv;
+        priv = __seq_open_private(file, &proc_timers_seq_ops, sizeof(*priv));
+        if (priv == NULL)
+                return -ENOMEM;
+        priv->ns = inode->i_sb->s_fs_info;
+        priv->pid = proc_pid(inode);
+        return 0;
+}
+/* File operations behind the "timers" entry registered in tgid_base_stuff[]. */
+static const struct file_operations proc_timers_operations = {
+        .release        = seq_release_private,
+        .llseek         = seq_lseek,
+        .read           = seq_read,
+        .open           = proc_timers_open,
+};
 #endif /* CONFIG_CHECKPOINT_RESTORE */
 static struct dentry *proc_pident_instantiate(struct inode *dir,
@@ -2583,6 +2679,9 @@ static const struct pid_entry tgid_base_stuff[] = {
        REG("gid_map",    S_IRUGO|S_IWUSR, proc_gid_map_operations),
        REG("projid_map", S_IRUGO|S_IWUSR, proc_projid_map_operations),
 #endif
+#ifdef CONFIG_CHECKPOINT_RESTORE
+        REG("timers",     S_IRUGO, proc_timers_operations),
+#endif
 };
 static int proc_tgid_base_readdir(struct file * filp,
diff --git a/fs/proc/generic.c b/fs/proc/generic.c
index 4b3b3ffb52f1..21e1a8f1659d 100644
--- a/fs/proc/generic.c
+++ b/fs/proc/generic.c
@@ -755,37 +755,8 @@ void pde_put(struct proc_dir_entry *pde)
                free_proc_entry(pde);
 }
-/*
+static void entry_rundown(struct proc_dir_entry *de)
- * Remove a /proc entry and free it if it's not currently in use.
- */
-void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
 {
-        struct proc_dir_entry **p;
-        struct proc_dir_entry *de = NULL;
-        const char *fn = name;
-        unsigned int len;
-        spin_lock(&proc_subdir_lock);
-        if (__xlate_proc_name(name, &parent, &fn) != 0) {
-                spin_unlock(&proc_subdir_lock);
-                return;
-        }
-        len = strlen(fn);
-        for (p = &parent->subdir; *p; p=&(*p)->next ) {
-                if (proc_match(len, fn, *p)) {
-                        de = *p;
-                        *p = de->next;
-                        de->next = NULL;
-                        break;
-                }
-        }
-        spin_unlock(&proc_subdir_lock);
-        if (!de) {
-                WARN(1, "name '%s'\n", name);
-                return;
-        }
        spin_lock(&de->pde_unload_lock);
        /*
         * Stop accepting new callers into module. If you're
@@ -817,6 +788,40 @@ void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
                spin_lock(&de->pde_unload_lock);
        }
        spin_unlock(&de->pde_unload_lock);
+}
+/*
+ * Remove a /proc entry and free it if it's not currently in use.
+ */
+void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
+{
+        struct proc_dir_entry **p;
+        struct proc_dir_entry *de = NULL;
+        const char *fn = name;
+        unsigned int len;
+        spin_lock(&proc_subdir_lock);
+        if (__xlate_proc_name(name, &parent, &fn) != 0) {
+                spin_unlock(&proc_subdir_lock);
+                return;
+        }
+        len = strlen(fn);
+        for (p = &parent->subdir; *p; p=&(*p)->next ) {
+                if (proc_match(len, fn, *p)) {
+                        de = *p;
+                        *p = de->next;
+                        de->next = NULL;
+                        break;
+                }
+        }
+        spin_unlock(&proc_subdir_lock);
+        if (!de) {
+                WARN(1, "name '%s'\n", name);
+                return;
+        }
+        entry_rundown(de);
        if (S_ISDIR(de->mode))
                parent->nlink--;
@@ -827,3 +832,57 @@ void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
        pde_put(de);
 }
 EXPORT_SYMBOL(remove_proc_entry);
+/*
+ * Remove the /proc entry @name (resolved relative to @parent) together with
+ * everything below it.
+ *
+ * Returns 0 on success, or -ENOENT when __xlate_proc_name() fails or no
+ * entry in the resolved parent matches the final path component.
+ */
+int remove_proc_subtree(const char *name, struct proc_dir_entry *parent)
+{
+        struct proc_dir_entry **p;
+        struct proc_dir_entry *root = NULL, *de, *next;
+        const char *fn = name;
+        unsigned int len;
+        spin_lock(&proc_subdir_lock);
+        if (__xlate_proc_name(name, &parent, &fn) != 0) {
+                spin_unlock(&proc_subdir_lock);
+                return -ENOENT;
+        }
+        len = strlen(fn);
+        /* Find the subtree root and unlink it from its parent's child list. */
+        for (p = &parent->subdir; *p; p=&(*p)->next ) {
+                if (proc_match(len, fn, *p)) {
+                        root = *p;
+                        *p = root->next;
+                        root->next = NULL;
+                        break;
+                }
+        }
+        if (!root) {
+                spin_unlock(&proc_subdir_lock);
+                return -ENOENT;
+        }
+        de = root;
+        /*
+         * Walk the subtree without recursion: keep detaching the first child
+         * and descending into it until an entry with no children is reached,
+         * tear that entry down, then step back up to its parent and repeat.
+         */
+        while (1) {
+                next = de->subdir;
+                if (next) {
+                        de->subdir = next->next;
+                        next->next = NULL;
+                        de = next;
+                        continue;
+                }
+                /* de has no children left; proc_subdir_lock is dropped before entry_rundown(). */
+                spin_unlock(&proc_subdir_lock);
+                entry_rundown(de);
+                next = de->parent;
+                if (S_ISDIR(de->mode))
+                        next->nlink--;
+                de->nlink = 0;
+                /* The root itself is released after the loop, with the lock not held. */
+                if (de == root)
+                        break;
+                pde_put(de);
+                /* Retake the lock before touching the parent's child list again. */
+                spin_lock(&proc_subdir_lock);
+                de = next;
+        }
+        pde_put(root);
+        return 0;
+}
+EXPORT_SYMBOL(remove_proc_subtree);
diff --git a/fs/proc/internal.h b/fs/proc/internal.h
index 85ff3a4598b3..75710357a517 100644
--- a/fs/proc/internal.h
+++ b/fs/proc/internal.h
@@ -30,24 +30,6 @@ extern int proc_net_init(void);
 static inline int proc_net_init(void) { return 0; }
 #endif
-struct vmalloc_info {
-        unsigned long   used;
-        unsigned long   largest_chunk;
-};
-#ifdef CONFIG_MMU
-#define VMALLOC_TOTAL (VMALLOC_END - VMALLOC_START)
-extern void get_vmalloc_info(struct vmalloc_info *vmi);
-#else
-#define VMALLOC_TOTAL 0UL
-#define get_vmalloc_info(vmi)                   \
-do {                                            \
-        (vmi)->used = 0;                        \
-        (vmi)->largest_chunk = 0;               \
-} while(0)
-#endif
 extern int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
                                struct pid *pid, struct task_struct *task);
 extern int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
diff --git a/fs/proc/kcore.c b/fs/proc/kcore.c
index eda6f017f272..f6a13f489e30 100644
--- a/fs/proc/kcore.c
+++ b/fs/proc/kcore.c
@@ -15,6 +15,7 @@
 #include <linux/capability.h>
 #include <linux/elf.h>
 #include <linux/elfcore.h>
+#include <linux/notifier.h>
 #include <linux/vmalloc.h>
 #include <linux/highmem.h>
 #include <linux/printk.h>
@@ -564,7 +565,6 @@ static const struct file_operations proc_kcore_operations = {
        .llseek         = default_llseek,
 };
-#ifdef CONFIG_MEMORY_HOTPLUG
 /* just remember that we have to update kcore */
 static int __meminit kcore_callback(struct notifier_block *self,
                                    unsigned long action, void *arg)
@@ -578,8 +578,11 @@ static int __meminit kcore_callback(struct notifier_block *self,
        }
        return NOTIFY_OK;
 }
-#endif
+/* Notifier block that proc_kcore_init() registers so kcore_callback() gets called. */
+static struct notifier_block kcore_callback_nb __meminitdata = {
+        .priority       = 0,
+        .notifier_call  = kcore_callback,
+};
 static struct kcore_list kcore_vmalloc;
@@ -631,7 +634,7 @@ static int __init proc_kcore_init(void)
        add_modules_range();
        /* Store direct-map area from physical memory map */
        kcore_update_ram();
-        hotplug_memory_notifier(kcore_callback, 0);
+        register_hotmemory_notifier(&kcore_callback_nb);
        return 0;
 }
diff --git a/fs/proc/meminfo.c b/fs/proc/meminfo.c
index 1efaaa19c4f3..5aa847a603c0 100644
--- a/fs/proc/meminfo.c
+++ b/fs/proc/meminfo.c
@@ -11,6 +11,7 @@
 #include <linux/swap.h>
 #include <linux/vmstat.h>
 #include <linux/atomic.h>
+#include <linux/vmalloc.h>
 #include <asm/page.h>
 #include <asm/pgtable.h>
 #include "internal.h"
diff --git a/fs/proc/mmu.c b/fs/proc/mmu.c
deleted file mode 100644
index 8ae221dfd010..000000000000
--- a/fs/proc/mmu.c
+++ /dev/null
@@ -1,60 +0,0 @@
-/* mmu.c: mmu memory info files
- *
- * Copyright (C) 2004 Red Hat, Inc. All Rights Reserved.
- * Written by David Howells (dhowells@redhat.com)
- *
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version
- * 2 of the License, or (at your option) any later version.
- */
-#include <linux/spinlock.h>
-#include <linux/vmalloc.h>
-#include <linux/highmem.h>
-#include <asm/pgtable.h>
-#include "internal.h"
-void get_vmalloc_info(struct vmalloc_info *vmi)
-{
-        struct vm_struct *vma;
-        unsigned long free_area_size;
-        unsigned long prev_end;
-        vmi->used = 0;
-        if (!vmlist) {
-                vmi->largest_chunk = VMALLOC_TOTAL;
-        }
-        else {
-                vmi->largest_chunk = 0;
-                prev_end = VMALLOC_START;
-                read_lock(&vmlist_lock);
-                for (vma = vmlist; vma; vma = vma->next) {
-                        unsigned long addr = (unsigned long) vma->addr;
-                        /*
-                         * Some archs keep another range for modules in vmlist
-                         */
-                        if (addr < VMALLOC_START)
-                                continue;
-                        if (addr >= VMALLOC_END)
-                                break;
-                        vmi->used += vma->size;
-                        free_area_size = addr - prev_end;
-                        if (vmi->largest_chunk < free_area_size)
-                                vmi->largest_chunk = free_area_size;
-                        prev_end = vma->size + addr;
-                }
-                if (VMALLOC_END - prev_end > vmi->largest_chunk)
-                        vmi->largest_chunk = VMALLOC_END - prev_end;
-                read_unlock(&vmlist_lock);
-        }
-}
diff --git a/fs/read_write.c b/fs/read_write.c
index e6ddc8dceb96..8274a794253b 100644
--- a/fs/read_write.c
+++ b/fs/read_write.c
@@ -128,7 +128,7 @@ EXPORT_SYMBOL(generic_file_llseek_size);
 *
 * This is a generic implemenation of ->llseek useable for all normal local
 * filesystems.  It just updates the file offset to the value specified by
- * @offset and @whence under i_mutex.
+ * @offset and @whence.
 */
 loff_t generic_file_llseek(struct file *file, loff_t offset, int whence)
 {
@@ -515,8 +515,8 @@ SYSCALL_DEFINE3(write, unsigned int, fd, const char __user *, buf,
        return ret;
 }
-SYSCALL_DEFINE(pread64)(unsigned int fd, char __user *buf,
+SYSCALL_DEFINE4(pread64, unsigned int, fd, char __user *, buf,
-                        size_t count, loff_t pos)
+                        size_t, count, loff_t, pos)
 {
        struct fd f;
        ssize_t ret = -EBADF;
@@ -534,17 +534,9 @@ SYSCALL_DEFINE(pread64)(unsigned int fd, char __user *buf,
        return ret;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_pread64(long fd, long buf, long count, loff_t pos)
-{
-        return SYSC_pread64((unsigned int) fd, (char __user *) buf,
-                            (size_t) count, pos);
-}
-SYSCALL_ALIAS(sys_pread64, SyS_pread64);
-#endif
-SYSCALL_DEFINE(pwrite64)(unsigned int fd, const char __user *buf,
+SYSCALL_DEFINE4(pwrite64, unsigned int, fd, const char __user *, buf,
-                         size_t count, loff_t pos)
+                         size_t, count, loff_t, pos)
 {
        struct fd f;
        ssize_t ret = -EBADF;
@@ -562,14 +554,6 @@ SYSCALL_DEFINE(pwrite64)(unsigned int fd, const char __user *buf,
        return ret;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_pwrite64(long fd, long buf, long count, loff_t pos)
-{
-        return SYSC_pwrite64((unsigned int) fd, (const char __user *) buf,
-                             (size_t) count, pos);
-}
-SYSCALL_ALIAS(sys_pwrite64, SyS_pwrite64);
-#endif
 /*
 * Reduce an iovec's length in-place.  Return the resulting number of segments
@@ -897,8 +881,8 @@ SYSCALL_DEFINE5(pwritev, unsigned long, fd, const struct iovec __user *, vec,
        return ret;
 }
-ssize_t do_sendfile(int out_fd, int in_fd, loff_t *ppos, size_t count,
+static ssize_t do_sendfile(int out_fd, int in_fd, loff_t *ppos,
-                    loff_t max)
+                           size_t count, loff_t max)
 {
        struct fd in, out;
        struct inode *in_inode, *out_inode;
@@ -1022,3 +1006,43 @@ SYSCALL_DEFINE4(sendfile64, int, out_fd, int, in_fd, loff_t __user *, offset, si
        return do_sendfile(out_fd, in_fd, NULL, count, 0);
 }
+#ifdef CONFIG_COMPAT
+/*
+ * Compat entry point for sendfile(2) with a compat_off_t offset.
+ *
+ * With a NULL @offset the call is forwarded without a position pointer.
+ * Otherwise the start offset is read from user space, the transfer is
+ * capped at MAX_NON_LFS, and the resulting position is written back;
+ * a failing user access on either side yields -EFAULT.
+ */
+COMPAT_SYSCALL_DEFINE4(sendfile, int, out_fd, int, in_fd,
+                compat_off_t __user *, offset, compat_size_t, count)
+{
+        loff_t pos;
+        off_t start;
+        ssize_t copied;
+        if (!offset)
+                return do_sendfile(out_fd, in_fd, NULL, count, 0);
+        if (unlikely(get_user(start, offset)))
+                return -EFAULT;
+        pos = start;
+        copied = do_sendfile(out_fd, in_fd, &pos, count, MAX_NON_LFS);
+        if (unlikely(put_user(pos, offset)))
+                return -EFAULT;
+        return copied;
+}
+/*
+ * Compat entry point for sendfile64(2).
+ *
+ * With a NULL @offset the call is forwarded without a position pointer.
+ * Otherwise the 64-bit start offset is copied in, do_sendfile() runs with a
+ * max of 0, and the resulting position is written back; a failing user
+ * access on either side yields -EFAULT.
+ */
+COMPAT_SYSCALL_DEFINE4(sendfile64, int, out_fd, int, in_fd,
+                compat_loff_t __user *, offset, compat_size_t, count)
+{
+        loff_t pos;
+        ssize_t copied;
+        if (!offset)
+                return do_sendfile(out_fd, in_fd, NULL, count, 0);
+        if (unlikely(copy_from_user(&pos, offset, sizeof(loff_t))))
+                return -EFAULT;
+        copied = do_sendfile(out_fd, in_fd, &pos, count, 0);
+        if (unlikely(put_user(pos, offset)))
+                return -EFAULT;
+        return copied;
+}
+#endif
diff --git a/fs/read_write.h b/fs/read_write.h
index d3e00ef67420..d07b954c6e0c 100644
--- a/fs/read_write.h
+++ b/fs/read_write.h
@@ -12,5 +12,3 @@ ssize_t do_sync_readv_writev(struct file *filp, const struct iovec *iov,
                unsigned long nr_segs, size_t len, loff_t *ppos, iov_fn_t fn);
 ssize_t do_loop_readv_writev(struct file *filp, struct iovec *iov,
                unsigned long nr_segs, loff_t *ppos, io_fn_t fn);
-ssize_t do_sendfile(int out_fd, int in_fd, loff_t *ppos, size_t count,
-                    loff_t max);
diff --git a/fs/reiserfs/xattr.c b/fs/reiserfs/xattr.c
index c196369fe408..4cce1d9552fb 100644
--- a/fs/reiserfs/xattr.c
+++ b/fs/reiserfs/xattr.c
@@ -187,8 +187,8 @@ fill_with_dentries(void *buf, const char *name, int namelen, loff_t offset,
        if (dbuf->count == ARRAY_SIZE(dbuf->dentries))
                return -ENOSPC;
-        if (name[0] == '.' && (name[1] == '\0' ||
+        if (name[0] == '.' && (namelen < 2 ||
-                               (name[1] == '.' && name[2] == '\0')))
+                               (namelen == 2 && name[1] == '.')))
                return 0;
        dentry = lookup_one_len(name, dbuf->xadir, namelen);
diff --git a/fs/signalfd.c b/fs/signalfd.c
index b53486961735..424b7b65321f 100644
--- a/fs/signalfd.c
+++ b/fs/signalfd.c
@@ -30,6 +30,7 @@
 #include <linux/signalfd.h>
 #include <linux/syscalls.h>
 #include <linux/proc_fs.h>
+#include <linux/compat.h>
 void signalfd_cleanup(struct sighand_struct *sighand)
 {
@@ -311,3 +312,33 @@ SYSCALL_DEFINE3(signalfd, int, ufd, sigset_t __user *, user_mask,
 {
        return sys_signalfd4(ufd, user_mask, sizemask, 0);
 }
+#ifdef CONFIG_COMPAT
+/*
+ * Compat entry point for signalfd4(2).
+ *
+ * Rejects any @sigsetsize other than sizeof(compat_sigset_t) with -EINVAL,
+ * converts the compat mask to a native sigset_t, stages that copy in the
+ * area returned by compat_alloc_user_space() and hands it to
+ * sys_signalfd4().  A failing user copy yields -EFAULT.
+ */
+COMPAT_SYSCALL_DEFINE4(signalfd4, int, ufd,
+                     const compat_sigset_t __user *,sigmask,
+                     compat_size_t, sigsetsize,
+                     int, flags)
+{
+        compat_sigset_t compat_mask;
+        sigset_t native_mask;
+        sigset_t __user *staged;
+        if (sigsetsize != sizeof(compat_sigset_t))
+                return -EINVAL;
+        if (copy_from_user(&compat_mask, sigmask, sizeof(compat_mask)))
+                return -EFAULT;
+        sigset_from_compat(&native_mask, &compat_mask);
+        staged = compat_alloc_user_space(sizeof(sigset_t));
+        if (copy_to_user(staged, &native_mask, sizeof(sigset_t)))
+                return -EFAULT;
+        return sys_signalfd4(ufd, staged, sizeof(sigset_t), flags);
+}
+/* Compat signalfd(2): the same as compat signalfd4 with flags fixed to 0. */
+COMPAT_SYSCALL_DEFINE3(signalfd, int, ufd,
+                     const compat_sigset_t __user *,sigmask,
+                     compat_size_t, sigsetsize)
+{
+        const int no_flags = 0;
+        return compat_sys_signalfd4(ufd, sigmask, sigsetsize, no_flags);
+}
+#endif
diff --git a/fs/splice.c b/fs/splice.c
index 29e394e49ddd..6b485b8753bd 100644
--- a/fs/splice.c
+++ b/fs/splice.c
@@ -31,6 +31,7 @@
 #include <linux/security.h>
 #include <linux/gfp.h>
 #include <linux/socket.h>
+#include <linux/compat.h>
 #include "internal.h"
 /*
@@ -1690,6 +1691,27 @@ SYSCALL_DEFINE4(vmsplice, int, fd, const struct iovec __user *, iov,
        return error;
 }
+#ifdef CONFIG_COMPAT
+/*
+ * Compat entry point for vmsplice(2).
+ *
+ * Rejects more than UIO_MAXIOV segments with -EINVAL, then rebuilds the
+ * compat iovec array as native struct iovec entries in the area returned by
+ * compat_alloc_user_space() and forwards to sys_vmsplice().  Any failing
+ * user access during the conversion yields -EFAULT.
+ */
+COMPAT_SYSCALL_DEFINE4(vmsplice, int, fd, const struct compat_iovec __user *, iov32,
+                    unsigned int, nr_segs, unsigned int, flags)
+{
+        struct iovec __user *native;
+        unsigned seg;
+        if (nr_segs > UIO_MAXIOV)
+                return -EINVAL;
+        native = compat_alloc_user_space(nr_segs * sizeof(struct iovec));
+        for (seg = 0; seg < nr_segs; seg++) {
+                struct compat_iovec ent;
+                /* Same access order as a single short-circuit chain: read both fields, then write both. */
+                if (get_user(ent.iov_base, &iov32[seg].iov_base))
+                        return -EFAULT;
+                if (get_user(ent.iov_len, &iov32[seg].iov_len))
+                        return -EFAULT;
+                if (put_user(compat_ptr(ent.iov_base), &native[seg].iov_base))
+                        return -EFAULT;
+                if (put_user(ent.iov_len, &native[seg].iov_len))
+                        return -EFAULT;
+        }
+        return sys_vmsplice(fd, native, nr_segs, flags);
+}
+#endif
 SYSCALL_DEFINE6(splice, int, fd_in, loff_t __user *, off_in,
                int, fd_out, loff_t __user *, off_out,
                size_t, len, unsigned int, flags)
diff --git a/fs/sync.c b/fs/sync.c
index 2c5d6639a66a..905f3f6b3d85 100644
--- a/fs/sync.c
+++ b/fs/sync.c
@@ -283,8 +283,8 @@ EXPORT_SYMBOL(generic_write_sync);
 * already-instantiated disk blocks, there are no guarantees here that the data
 * will be available after a crash.
 */
-SYSCALL_DEFINE(sync_file_range)(int fd, loff_t offset, loff_t nbytes,
+SYSCALL_DEFINE4(sync_file_range, int, fd, loff_t, offset, loff_t, nbytes,
-                                unsigned int flags)
+                                unsigned int, flags)
 {
        int ret;
        struct fd f;
@@ -365,29 +365,11 @@ out_put:
 out:
        return ret;
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_sync_file_range(long fd, loff_t offset, loff_t nbytes,
-                                    long flags)
-{
-        return SYSC_sync_file_range((int) fd, offset, nbytes,
-                                    (unsigned int) flags);
-}
-SYSCALL_ALIAS(sys_sync_file_range, SyS_sync_file_range);
-#endif
 /* It would be nice if people remember that not all the world's an i386
   when they introduce new system calls */
-SYSCALL_DEFINE(sync_file_range2)(int fd, unsigned int flags,
+SYSCALL_DEFINE4(sync_file_range2, int, fd, unsigned int, flags,
-                                 loff_t offset, loff_t nbytes)
+                                 loff_t, offset, loff_t, nbytes)
 {
        return sys_sync_file_range(fd, offset, nbytes, flags);
 }
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_sync_file_range2(long fd, long flags,
-                                     loff_t offset, loff_t nbytes)
-{
-        return SYSC_sync_file_range2((int) fd, (unsigned int) flags,
-                                     offset, nbytes);
-}
-SYSCALL_ALIAS(sys_sync_file_range2, SyS_sync_file_range2);
-#endif
diff --git a/fs/sysfs/dir.c b/fs/sysfs/dir.c
index e14512678c9b..e8e0e71b29d5 100644
--- a/fs/sysfs/dir.c
+++ b/fs/sysfs/dir.c
@@ -165,21 +165,8 @@ struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd)
        if (unlikely(!sd))
                return NULL;
-        while (1) {
+        if (!atomic_inc_unless_negative(&sd->s_active))
-                int v, t;
+                return NULL;
-                v = atomic_read(&sd->s_active);
-                if (unlikely(v < 0))
-                        return NULL;
-                t = atomic_cmpxchg(&sd->s_active, v, v + 1);
-                if (likely(t == v))
-                        break;
-                if (t < 0)
-                        return NULL;
-                cpu_relax();
-        }
        if (likely(!ignore_lockdep(sd)))
                rwsem_acquire_read(&sd->dep_map, 0, 1, _RET_IP_);
@@ -281,6 +268,10 @@ void release_sysfs_dirent(struct sysfs_dirent * sd)
         */
        parent_sd = sd->s_parent;
+        WARN(!(sd->s_flags & SYSFS_FLAG_REMOVED),
+                "sysfs: free using entry: %s/%s\n",
+                parent_sd ? parent_sd->s_name : "", sd->s_name);
        if (sysfs_type(sd) == SYSFS_KOBJ_LINK)
                sysfs_put(sd->s_symlink.target_sd);
        if (sysfs_type(sd) & SYSFS_COPY_NAME)
@@ -399,7 +390,7 @@ struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type)
        sd->s_name = name;
        sd->s_mode = mode;
-        sd->s_flags = type;
+        sd->s_flags = type | SYSFS_FLAG_REMOVED;
        return sd;
@@ -479,6 +470,9 @@ int __sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd)
                ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME;
        }
+        /* Mark the entry added into directory tree */
+        sd->s_flags &= ~SYSFS_FLAG_REMOVED;
        return 0;
 }
@@ -1012,6 +1006,7 @@ static int sysfs_readdir(struct file * filp, void * dirent, filldir_t filldir)
        enum kobj_ns_type type;
        const void *ns;
        ino_t ino;
+        loff_t off;
        type = sysfs_ns_type(parent_sd);
        ns = sysfs_info(dentry->d_sb)->ns[type];
@@ -1034,6 +1029,7 @@ static int sysfs_readdir(struct file * filp, void * dirent, filldir_t filldir)
                        return 0;
        }
        mutex_lock(&sysfs_mutex);
+        off = filp->f_pos;
        for (pos = sysfs_dir_pos(ns, parent_sd, filp->f_pos, pos);
             pos;
             pos = sysfs_dir_next_pos(ns, parent_sd, filp->f_pos, pos)) {
@@ -1045,19 +1041,24 @@ static int sysfs_readdir(struct file * filp, void * dirent, filldir_t filldir)
                len = strlen(name);
                ino = pos->s_ino;
                type = dt_type(pos);
-                filp->f_pos = pos->s_hash;
+                off = filp->f_pos = pos->s_hash;
                filp->private_data = sysfs_get(pos);
                mutex_unlock(&sysfs_mutex);
-                ret = filldir(dirent, name, len, filp->f_pos, ino, type);
+                ret = filldir(dirent, name, len, off, ino, type);
                mutex_lock(&sysfs_mutex);
                if (ret < 0)
                        break;
        }
        mutex_unlock(&sysfs_mutex);
-        if ((filp->f_pos > 1) && !pos) { /* EOF */
-                filp->f_pos = INT_MAX;
+        /* don't reference last entry if its refcount is dropped */
+        if (!pos) {
                filp->private_data = NULL;
+                /* EOF and not changed as 0 or 1 in read/write path */
+                if (off == filp->f_pos && off > 1)
+                        filp->f_pos = INT_MAX;
        }
        return 0;
 }
diff --git a/fs/ubifs/super.c b/fs/ubifs/super.c
index ac838b844936..f21acf0ef01f 100644
--- a/fs/ubifs/super.c
+++ b/fs/ubifs/super.c
@@ -1568,6 +1568,12 @@ static int ubifs_remount_rw(struct ubifs_info *c)
        c->remounting_rw = 1;
        c->ro_mount = 0;
+        if (c->space_fixup) {
+                err = ubifs_fixup_free_space(c);
+                if (err)
+                        return err;
+        }
        err = check_free_space(c);
        if (err)
                goto out;
@@ -1684,12 +1690,6 @@ static int ubifs_remount_rw(struct ubifs_info *c)
                err = dbg_check_space_info(c);
        }
-        if (c->space_fixup) {
-                err = ubifs_fixup_free_space(c);
-                if (err)
-                        goto out;
-        }
        mutex_unlock(&c->umount_mutex);
        return err;
diff --git a/fs/ufs/util.c b/fs/ufs/util.c
index 95425b59ce0a..b6c2f94e041e 100644
--- a/fs/ufs/util.c
+++ b/fs/ufs/util.c
@@ -26,8 +26,7 @@ struct ufs_buffer_head * _ubh_bread_ (struct ufs_sb_private_info * uspi,
        count = size >> uspi->s_fshift;
        if (count > UFS_MAXFRAG)
                return NULL;
-        ubh = (struct ufs_buffer_head *)
+        ubh = kmalloc (sizeof (struct ufs_buffer_head), GFP_NOFS);
-                kmalloc (sizeof (struct ufs_buffer_head), GFP_NOFS);
        if (!ubh)
                return NULL;
        ubh->fragment = fragment;