author    Dave Hansen <dave.hansen@linux.intel.com>    2014-07-31 11:40:55 -0400
committer H. Peter Anvin <hpa@linux.intel.com>         2014-07-31 11:48:50 -0400
commit    e9f4e0a9fe2723078b7a1a1169828dd46a7b2f9e (patch)
tree      c16300d2f05f2fce6b7b70b2c6fed1ac58486129 /arch/x86/kernel/cpu/intel.c
parent    4995ab9cf512e9a6cc07dfd6b1d4e2fc48ce7fef (diff)
x86/mm: Rip out complicated, out-of-date, buggy TLB flushing
I think the flush_tlb_mm_range() code that tries to tune the flush sizes based on the CPU needs to get ripped out for several reasons:

1. It is obviously buggy. It uses mm->total_vm to judge the task's footprint in the TLB. It should certainly be using some measure of RSS, *NOT* ->total_vm, since only resident memory can populate the TLB.

2. Haswell and several other CPUs are missing from the intel_tlb_flushall_shift_set() function. Thus, it has been demonstrated to bitrot quickly in practice.

3. It is plain wrong in my VM:

	[ 0.037444] Last level iTLB entries: 4KB 0, 2MB 0, 4MB 0
	[ 0.037444] Last level dTLB entries: 4KB 0, 2MB 0, 4MB 0
	[ 0.037444] tlb_flushall_shift: 6

   which leads it to never use invlpg.

4. The assumptions about TLB refill costs are wrong:
   http://lkml.kernel.org/r/1337782555-8088-3-git-send-email-alex.shi@intel.com
   (more on this in later patches)

5. I cannot reproduce the original data: https://lkml.org/lkml/2012/5/17/59
   I believe the sample times were too short. Running the benchmark in a loop yields times that vary quite a bit.

Note that this leaves us with a static ceiling of 1 page. This is a conservative, dumb setting, and will be revised in a later patch.

This also removes the code which attempts to predict whether we are flushing data or instructions. We expect instruction flushes to be relatively rare and not worth tuning for explicitly.

Signed-off-by: Dave Hansen <dave.hansen@linux.intel.com>
Link: http://lkml.kernel.org/r/20140731154055.ABC88E89@viggo.jf.intel.com
Acked-by: Rik van Riel <riel@redhat.com>
Acked-by: Mel Gorman <mgorman@suse.de>
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
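For illustration, here is a minimal sketch of the decision flush_tlb_mm_range() is reduced to once the per-CPU-model tuning is gone: flush the whole TLB when the range exceeds the static one-page ceiling, otherwise invlpg each page. The constant FLUSH_ALL_CEILING_PAGES and the helper name sketch_flush_range() below are hypothetical names for this example only; the real logic lives in flush_tlb_mm_range() in arch/x86/mm/tlb.c.

#include <asm/tlbflush.h>	/* local_flush_tlb(), __flush_tlb_one() */

/*
 * Illustrative sketch only -- not the actual kernel code.  The
 * constant and function name are made up for this example.
 */
#define FLUSH_ALL_CEILING_PAGES	1	/* static, conservative ceiling */

static void sketch_flush_range(unsigned long start, unsigned long end)
{
	unsigned long nr_pages = (end - start) >> PAGE_SHIFT;

	if (nr_pages > FLUSH_ALL_CEILING_PAGES) {
		/* Range is too big to flush page-by-page: drop the whole TLB. */
		local_flush_tlb();
	} else {
		unsigned long addr;

		/* Small range: invlpg each page individually. */
		for (addr = start; addr < end; addr += PAGE_SIZE)
			__flush_tlb_one(addr);
	}
}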
Diffstat (limited to 'arch/x86/kernel/cpu/intel.c')
-rw-r--r--  arch/x86/kernel/cpu/intel.c  26
1 file changed, 0 insertions, 26 deletions
diff --git a/arch/x86/kernel/cpu/intel.c b/arch/x86/kernel/cpu/intel.c
index a80029035bf2..cd61755de49b 100644
--- a/arch/x86/kernel/cpu/intel.c
+++ b/arch/x86/kernel/cpu/intel.c
@@ -634,31 +634,6 @@ static void intel_tlb_lookup(const unsigned char desc)
 	}
 }
 
-static void intel_tlb_flushall_shift_set(struct cpuinfo_x86 *c)
-{
-	switch ((c->x86 << 8) + c->x86_model) {
-	case 0x60f: /* original 65 nm celeron/pentium/core2/xeon, "Merom"/"Conroe" */
-	case 0x616: /* single-core 65 nm celeron/core2solo "Merom-L"/"Conroe-L" */
-	case 0x617: /* current 45 nm celeron/core2/xeon "Penryn"/"Wolfdale" */
-	case 0x61d: /* six-core 45 nm xeon "Dunnington" */
-		tlb_flushall_shift = -1;
-		break;
-	case 0x63a: /* Ivybridge */
-		tlb_flushall_shift = 2;
-		break;
-	case 0x61a: /* 45 nm nehalem, "Bloomfield" */
-	case 0x61e: /* 45 nm nehalem, "Lynnfield" */
-	case 0x625: /* 32 nm nehalem, "Clarkdale" */
-	case 0x62c: /* 32 nm nehalem, "Gulftown" */
-	case 0x62e: /* 45 nm nehalem-ex, "Beckton" */
-	case 0x62f: /* 32 nm Xeon E7 */
-	case 0x62a: /* SandyBridge */
-	case 0x62d: /* SandyBridge, "Romely-EP" */
-	default:
-		tlb_flushall_shift = 6;
-	}
-}
-
 static void intel_detect_tlb(struct cpuinfo_x86 *c)
 {
 	int i, j, n;
@@ -683,7 +658,6 @@ static void intel_detect_tlb(struct cpuinfo_x86 *c)
 		for (j = 1 ; j < 16 ; j++)
 			intel_tlb_lookup(desc[j]);
 	}
-	intel_tlb_flushall_shift_set(c);
 }
 
 static const struct cpu_dev intel_cpu_dev = {