aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorSai Praneeth Prakhya <sai.praneeth.prakhya@intel.com>2018-11-29 12:12:23 -0500
committerIngo Molnar <mingo@kernel.org>2018-11-30 03:10:30 -0500
commit7e0dabd3010d6041ee0a952c1146b2150a11f1be (patch)
tree82891e713ff528e931b284147e1da13b91acd172
parent8c25db0a5a67986106aa3da7ce165ff961aa7847 (diff)
x86/mm/pageattr: Introduce helper function to unmap EFI boot services
Ideally, after kernel assumes control of the platform, firmware shouldn't access EFI boot services code/data regions. But, it's noticed that this is not so true in many x86 platforms. Hence, during boot, kernel reserves EFI boot services code/data regions [1] and maps [2] them to efi_pgd so that call to set_virtual_address_map() doesn't fail. After returning from set_virtual_address_map(), kernel frees the reserved regions [3] but they still remain mapped. Hence, introduce kernel_unmap_pages_in_pgd() which will later be used to unmap EFI boot services code/data regions. While at it modify kernel_map_pages_in_pgd() by: 1. Adding __init modifier because it's always used *only* during boot. 2. Add a warning if it's used after SMP is initialized because it uses __flush_tlb_all() which flushes mappings only on current CPU. Unmapping EFI boot services code/data regions will result in clearing PAGE_PRESENT bit and it shouldn't bother L1TF cases because it's already handled by protnone_mask() at arch/x86/include/asm/pgtable-invert.h. [1] efi_reserve_boot_services() [2] efi_map_region() -> __map_region() -> kernel_map_pages_in_pgd() [3] efi_free_boot_services() Signed-off-by: Sai Praneeth Prakhya <sai.praneeth.prakhya@intel.com> Signed-off-by: Ard Biesheuvel <ard.biesheuvel@linaro.org> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Cc: Andy Lutomirski <luto@kernel.org> Cc: Arend van Spriel <arend.vanspriel@broadcom.com> Cc: Bhupesh Sharma <bhsharma@redhat.com> Cc: Borislav Petkov <bp@alien8.de> Cc: Dave Hansen <dave.hansen@intel.com> Cc: Eric Snowberg <eric.snowberg@oracle.com> Cc: Hans de Goede <hdegoede@redhat.com> Cc: Joe Perches <joe@perches.com> Cc: Jon Hunter <jonathanh@nvidia.com> Cc: Julien Thierry <julien.thierry@arm.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Marc Zyngier <marc.zyngier@arm.com> Cc: Matt Fleming <matt@codeblueprint.co.uk> Cc: Nathan Chancellor <natechancellor@gmail.com> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Sedat Dilek <sedat.dilek@gmail.com> Cc: YiFei Zhu <zhuyifei1999@gmail.com> Cc: linux-efi@vger.kernel.org Link: http://lkml.kernel.org/r/20181129171230.18699-5-ard.biesheuvel@linaro.org Signed-off-by: Ingo Molnar <mingo@kernel.org>
-rw-r--r--arch/x86/include/asm/pgtable_types.h8
-rw-r--r--arch/x86/mm/pageattr.c40
2 files changed, 44 insertions, 4 deletions
diff --git a/arch/x86/include/asm/pgtable_types.h b/arch/x86/include/asm/pgtable_types.h
index 106b7d0e2dae..d6ff0bbdb394 100644
--- a/arch/x86/include/asm/pgtable_types.h
+++ b/arch/x86/include/asm/pgtable_types.h
@@ -564,8 +564,12 @@ extern pte_t *lookup_address_in_pgd(pgd_t *pgd, unsigned long address,
564 unsigned int *level); 564 unsigned int *level);
565extern pmd_t *lookup_pmd_address(unsigned long address); 565extern pmd_t *lookup_pmd_address(unsigned long address);
566extern phys_addr_t slow_virt_to_phys(void *__address); 566extern phys_addr_t slow_virt_to_phys(void *__address);
567extern int kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn, unsigned long address, 567extern int __init kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn,
568 unsigned numpages, unsigned long page_flags); 568 unsigned long address,
569 unsigned numpages,
570 unsigned long page_flags);
571extern int __init kernel_unmap_pages_in_pgd(pgd_t *pgd, unsigned long address,
572 unsigned long numpages);
569#endif /* !__ASSEMBLY__ */ 573#endif /* !__ASSEMBLY__ */
570 574
571#endif /* _ASM_X86_PGTABLE_DEFS_H */ 575#endif /* _ASM_X86_PGTABLE_DEFS_H */
diff --git a/arch/x86/mm/pageattr.c b/arch/x86/mm/pageattr.c
index db7a10082238..bac35001d896 100644
--- a/arch/x86/mm/pageattr.c
+++ b/arch/x86/mm/pageattr.c
@@ -2338,8 +2338,8 @@ bool kernel_page_present(struct page *page)
2338 2338
2339#endif /* CONFIG_DEBUG_PAGEALLOC */ 2339#endif /* CONFIG_DEBUG_PAGEALLOC */
2340 2340
2341int kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn, unsigned long address, 2341int __init kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn, unsigned long address,
2342 unsigned numpages, unsigned long page_flags) 2342 unsigned numpages, unsigned long page_flags)
2343{ 2343{
2344 int retval = -EINVAL; 2344 int retval = -EINVAL;
2345 2345
@@ -2353,6 +2353,8 @@ int kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn, unsigned long address,
2353 .flags = 0, 2353 .flags = 0,
2354 }; 2354 };
2355 2355
2356 WARN_ONCE(num_online_cpus() > 1, "Don't call after initializing SMP");
2357
2356 if (!(__supported_pte_mask & _PAGE_NX)) 2358 if (!(__supported_pte_mask & _PAGE_NX))
2357 goto out; 2359 goto out;
2358 2360
@@ -2375,6 +2377,40 @@ out:
2375} 2377}
2376 2378
2377/* 2379/*
2380 * __flush_tlb_all() flushes mappings only on current CPU and hence this
2381 * function shouldn't be used in an SMP environment. Presently, it's used only
2382 * during boot (way before smp_init()) by EFI subsystem and hence is ok.
2383 */
2384int __init kernel_unmap_pages_in_pgd(pgd_t *pgd, unsigned long address,
2385 unsigned long numpages)
2386{
2387 int retval;
2388
2389 /*
2390 * The typical sequence for unmapping is to find a pte through
2391 * lookup_address_in_pgd() (ideally, it should never return NULL because
2392 * the address is already mapped) and change it's protections. As pfn is
2393 * the *target* of a mapping, it's not useful while unmapping.
2394 */
2395 struct cpa_data cpa = {
2396 .vaddr = &address,
2397 .pfn = 0,
2398 .pgd = pgd,
2399 .numpages = numpages,
2400 .mask_set = __pgprot(0),
2401 .mask_clr = __pgprot(_PAGE_PRESENT | _PAGE_RW),
2402 .flags = 0,
2403 };
2404
2405 WARN_ONCE(num_online_cpus() > 1, "Don't call after initializing SMP");
2406
2407 retval = __change_page_attr_set_clr(&cpa, 0);
2408 __flush_tlb_all();
2409
2410 return retval;
2411}
2412
2413/*
2378 * The testcases use internal knowledge of the implementation that shouldn't 2414 * The testcases use internal knowledge of the implementation that shouldn't
2379 * be exposed to the rest of the kernel. Include these directly here. 2415 * be exposed to the rest of the kernel. Include these directly here.
2380 */ 2416 */