aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: chenjie <chenjie6@huawei.com> 2017-11-29 19:10:54 -0500
committer: Linus Torvalds <torvalds@linux-foundation.org> 2017-11-29 21:40:43 -0500
commit: 6ea8d958a2c95a1d514015d4e29ba21a8c0a1a91 (patch)
tree: ce8cb7704e78795e561d07aabb43f22718745f8f
parent: 04e35f4495dd560db30c25efca4eecae8ec8c375 (diff)
mm/madvise.c: fix madvise() infinite loop under special circumstances
MADV_WILLNEED has always been a no-op for DAX (formerly XIP) mappings. Unfortunately, madvise_willneed() doesn't communicate this information properly to the generic madvise syscall implementation. The calling convention is quite subtle there. madvise_vma() is supposed to either return an error or update &prev, otherwise the main loop will never advance to the next vma and it will keep looping forever without a way to get out of the kernel.

It seems this has been broken since introduction. Nobody has noticed because nobody seems to be using MADV_WILLNEED on these DAX mappings.

[mhocko@suse.com: rewrite changelog]
Link: http://lkml.kernel.org/r/20171127115318.911-1-guoxuenan@huawei.com
Fixes: fe77ba6f4f97 ("[PATCH] xip: madvice/fadvice: execute in place")
Signed-off-by: chenjie <chenjie6@huawei.com>
Signed-off-by: guoxuenan <guoxuenan@huawei.com>
Acked-by: Michal Hocko <mhocko@suse.com>
Cc: Minchan Kim <minchan@kernel.org>
Cc: zhangyi (F) <yi.zhang@huawei.com>
Cc: Miao Xie <miaoxie@huawei.com>
Cc: Mike Rapoport <rppt@linux.vnet.ibm.com>
Cc: Shaohua Li <shli@fb.com>
Cc: Andrea Arcangeli <aarcange@redhat.com>
Cc: Mel Gorman <mgorman@techsingularity.net>
Cc: Kirill A. Shutemov <kirill.shutemov@linux.intel.com>
Cc: David Rientjes <rientjes@google.com>
Cc: Anshuman Khandual <khandual@linux.vnet.ibm.com>
Cc: Rik van Riel <riel@redhat.com>
Cc: Carsten Otte <cotte@de.ibm.com>
Cc: Dan Williams <dan.j.williams@intel.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
-rw-r--r-- mm/madvise.c 4
1 file changed, 1 insertion, 3 deletions
diff --git a/mm/madvise.c b/mm/madvise.c
index 375cf32087e4..751e97aa2210 100644
--- a/mm/madvise.c
+++ b/mm/madvise.c
@@ -276,15 +276,14 @@ static long madvise_willneed(struct vm_area_struct *vma,
276{ 276{
277 struct file *file = vma->vm_file; 277 struct file *file = vma->vm_file;
278 278
279 *prev = vma;
279#ifdef CONFIG_SWAP 280#ifdef CONFIG_SWAP
280 if (!file) { 281 if (!file) {
281 *prev = vma;
282 force_swapin_readahead(vma, start, end); 282 force_swapin_readahead(vma, start, end);
283 return 0; 283 return 0;
284 } 284 }
285 285
286 if (shmem_mapping(file->f_mapping)) { 286 if (shmem_mapping(file->f_mapping)) {
287 *prev = vma;
288 force_shm_swapin_readahead(vma, start, end, 287 force_shm_swapin_readahead(vma, start, end,
289 file->f_mapping); 288 file->f_mapping);
290 return 0; 289 return 0;
@@ -299,7 +298,6 @@ static long madvise_willneed(struct vm_area_struct *vma,
299 return 0; 298 return 0;
300 } 299 }
301 300
302 *prev = vma;
303 start = ((start - vma->vm_start) >> PAGE_SHIFT) + vma->vm_pgoff; 301 start = ((start - vma->vm_start) >> PAGE_SHIFT) + vma->vm_pgoff;
304 if (end > vma->vm_end) 302 if (end > vma->vm_end)
305 end = vma->vm_end; 303 end = vma->vm_end;