aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Peter Zijlstra <peterz@infradead.org>, 2013-11-28 13:38:42 -0500
committer: Ingo Molnar <mingo@kernel.org>, 2014-01-13 09:13:13 -0500
commit: 35af99e646c7f7ea46dc2977601e9e71a51dadd5 (patch)
tree: d999820d233844278549cd826c4bfd6c7aa1ecc8
parent: ef08f0fff87630d4f67ceb09514d8b444df833f8 (diff)
sched/clock, x86: Use a static_key for sched_clock_stable
In order to avoid the runtime condition and variable load, turn
sched_clock_stable into a static_key.

Also provide a shorter implementation of local_clock() and
cpu_clock(int) when sched_clock_stable==1.

                          MAINLINE   PRE        POST

    sched_clock_stable:   1          1          1
    (cold) sched_clock:   329841     221876     215295
    (cold) local_clock:   301773     234692     220773
    (warm) sched_clock:   38375      25602      25659
    (warm) local_clock:   100371     33265      27242
    (warm) rdtsc:         27340      24214      24208

    sched_clock_stable:   0          0          0
    (cold) sched_clock:   382634     235941     237019
    (cold) local_clock:   396890     297017     294819
    (warm) sched_clock:   38194      25233      25609
    (warm) local_clock:   143452     71234      71232
    (warm) rdtsc:         27345      24245      24243

Signed-off-by: Peter Zijlstra <peterz@infradead.org>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Link: http://lkml.kernel.org/n/tip-eummbdechzz37mwmpags1gjr@git.kernel.org
Signed-off-by: Ingo Molnar <mingo@kernel.org>
-rw-r--r--  arch/x86/kernel/cpu/amd.c         |  2
-rw-r--r--  arch/x86/kernel/cpu/intel.c       |  2
-rw-r--r--  arch/x86/kernel/cpu/perf_event.c  |  2
-rw-r--r--  arch/x86/kernel/tsc.c             |  6
-rw-r--r--  include/linux/sched.h             |  4
-rw-r--r--  kernel/sched/clock.c              | 41
-rw-r--r--  kernel/sched/debug.c              |  2
-rw-r--r--  kernel/time/tick-sched.c          |  2
-rw-r--r--  kernel/trace/ring_buffer.c        |  2
9 files changed, 46 insertions, 17 deletions
diff --git a/arch/x86/kernel/cpu/amd.c b/arch/x86/kernel/cpu/amd.c
index bca023bdd6b2..8bc79cddd9a2 100644
--- a/arch/x86/kernel/cpu/amd.c
+++ b/arch/x86/kernel/cpu/amd.c
@@ -487,7 +487,7 @@ static void early_init_amd(struct cpuinfo_x86 *c)
487 set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC); 487 set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC);
488 set_cpu_cap(c, X86_FEATURE_NONSTOP_TSC); 488 set_cpu_cap(c, X86_FEATURE_NONSTOP_TSC);
489 if (!check_tsc_unstable()) 489 if (!check_tsc_unstable())
490 sched_clock_stable = 1; 490 set_sched_clock_stable();
491 } 491 }
492 492
493#ifdef CONFIG_X86_64 493#ifdef CONFIG_X86_64
diff --git a/arch/x86/kernel/cpu/intel.c b/arch/x86/kernel/cpu/intel.c
index ea04b342c026..1a439c047ff3 100644
--- a/arch/x86/kernel/cpu/intel.c
+++ b/arch/x86/kernel/cpu/intel.c
@@ -93,7 +93,7 @@ static void early_init_intel(struct cpuinfo_x86 *c)
93 set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC); 93 set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC);
94 set_cpu_cap(c, X86_FEATURE_NONSTOP_TSC); 94 set_cpu_cap(c, X86_FEATURE_NONSTOP_TSC);
95 if (!check_tsc_unstable()) 95 if (!check_tsc_unstable())
96 sched_clock_stable = 1; 96 set_sched_clock_stable();
97 } 97 }
98 98
99 /* Penwell and Cloverview have the TSC which doesn't sleep on S3 */ 99 /* Penwell and Cloverview have the TSC which doesn't sleep on S3 */
diff --git a/arch/x86/kernel/cpu/perf_event.c b/arch/x86/kernel/cpu/perf_event.c
index 9f97bd03f74f..b88645191fe5 100644
--- a/arch/x86/kernel/cpu/perf_event.c
+++ b/arch/x86/kernel/cpu/perf_event.c
@@ -1890,7 +1890,7 @@ void arch_perf_update_userpage(struct perf_event_mmap_page *userpg, u64 now)
1890 userpg->cap_user_rdpmc = x86_pmu.attr_rdpmc; 1890 userpg->cap_user_rdpmc = x86_pmu.attr_rdpmc;
1891 userpg->pmc_width = x86_pmu.cntval_bits; 1891 userpg->pmc_width = x86_pmu.cntval_bits;
1892 1892
1893 if (!sched_clock_stable) 1893 if (!sched_clock_stable())
1894 return; 1894 return;
1895 1895
1896 data = cyc2ns_read_begin(); 1896 data = cyc2ns_read_begin();
diff --git a/arch/x86/kernel/tsc.c b/arch/x86/kernel/tsc.c
index 92b090b2b79e..53c123537245 100644
--- a/arch/x86/kernel/tsc.c
+++ b/arch/x86/kernel/tsc.c
@@ -822,7 +822,7 @@ static unsigned long long cyc2ns_suspend;
822 822
823void tsc_save_sched_clock_state(void) 823void tsc_save_sched_clock_state(void)
824{ 824{
825 if (!sched_clock_stable) 825 if (!sched_clock_stable())
826 return; 826 return;
827 827
828 cyc2ns_suspend = sched_clock(); 828 cyc2ns_suspend = sched_clock();
@@ -842,7 +842,7 @@ void tsc_restore_sched_clock_state(void)
842 unsigned long flags; 842 unsigned long flags;
843 int cpu; 843 int cpu;
844 844
845 if (!sched_clock_stable) 845 if (!sched_clock_stable())
846 return; 846 return;
847 847
848 local_irq_save(flags); 848 local_irq_save(flags);
@@ -984,7 +984,7 @@ void mark_tsc_unstable(char *reason)
984{ 984{
985 if (!tsc_unstable) { 985 if (!tsc_unstable) {
986 tsc_unstable = 1; 986 tsc_unstable = 1;
987 sched_clock_stable = 0; 987 clear_sched_clock_stable();
988 disable_sched_clock_irqtime(); 988 disable_sched_clock_irqtime();
989 pr_info("Marking TSC unstable due to %s\n", reason); 989 pr_info("Marking TSC unstable due to %s\n", reason);
990 /* Change only the rating, when not registered */ 990 /* Change only the rating, when not registered */
diff --git a/include/linux/sched.h b/include/linux/sched.h
index a196cb7fc6f2..a03875221663 100644
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -1994,7 +1994,9 @@ static inline void sched_clock_idle_wakeup_event(u64 delta_ns)
1994 * but then during bootup it turns out that sched_clock() 1994 * but then during bootup it turns out that sched_clock()
1995 * is reliable after all: 1995 * is reliable after all:
1996 */ 1996 */
1997extern int sched_clock_stable; 1997extern int sched_clock_stable(void);
1998extern void set_sched_clock_stable(void);
1999extern void clear_sched_clock_stable(void);
1998 2000
1999extern void sched_clock_tick(void); 2001extern void sched_clock_tick(void);
2000extern void sched_clock_idle_sleep_event(void); 2002extern void sched_clock_idle_sleep_event(void);
diff --git a/kernel/sched/clock.c b/kernel/sched/clock.c
index 59371549ddf0..c9b34c4e3ecc 100644
--- a/kernel/sched/clock.c
+++ b/kernel/sched/clock.c
@@ -58,6 +58,7 @@
58#include <linux/percpu.h> 58#include <linux/percpu.h>
59#include <linux/ktime.h> 59#include <linux/ktime.h>
60#include <linux/sched.h> 60#include <linux/sched.h>
61#include <linux/static_key.h>
61 62
62/* 63/*
63 * Scheduler clock - returns current time in nanosec units. 64 * Scheduler clock - returns current time in nanosec units.
@@ -74,7 +75,27 @@ EXPORT_SYMBOL_GPL(sched_clock);
74__read_mostly int sched_clock_running; 75__read_mostly int sched_clock_running;
75 76
76#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK 77#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
77__read_mostly int sched_clock_stable; 78static struct static_key __sched_clock_stable = STATIC_KEY_INIT;
79
80int sched_clock_stable(void)
81{
82 if (static_key_false(&__sched_clock_stable))
83 return false;
84 return true;
85}
86
87void set_sched_clock_stable(void)
88{
89 if (!sched_clock_stable())
90 static_key_slow_dec(&__sched_clock_stable);
91}
92
93void clear_sched_clock_stable(void)
94{
95 /* XXX worry about clock continuity */
96 if (sched_clock_stable())
97 static_key_slow_inc(&__sched_clock_stable);
98}
78 99
79struct sched_clock_data { 100struct sched_clock_data {
80 u64 tick_raw; 101 u64 tick_raw;
@@ -234,7 +255,7 @@ u64 sched_clock_cpu(int cpu)
234 struct sched_clock_data *scd; 255 struct sched_clock_data *scd;
235 u64 clock; 256 u64 clock;
236 257
237 if (sched_clock_stable) 258 if (sched_clock_stable())
238 return sched_clock(); 259 return sched_clock();
239 260
240 if (unlikely(!sched_clock_running)) 261 if (unlikely(!sched_clock_running))
@@ -257,7 +278,7 @@ void sched_clock_tick(void)
257 struct sched_clock_data *scd; 278 struct sched_clock_data *scd;
258 u64 now, now_gtod; 279 u64 now, now_gtod;
259 280
260 if (sched_clock_stable) 281 if (sched_clock_stable())
261 return; 282 return;
262 283
263 if (unlikely(!sched_clock_running)) 284 if (unlikely(!sched_clock_running))
@@ -308,7 +329,10 @@ EXPORT_SYMBOL_GPL(sched_clock_idle_wakeup_event);
308 */ 329 */
309u64 cpu_clock(int cpu) 330u64 cpu_clock(int cpu)
310{ 331{
311 return sched_clock_cpu(cpu); 332 if (static_key_false(&__sched_clock_stable))
333 return sched_clock_cpu(cpu);
334
335 return sched_clock();
312} 336}
313 337
314/* 338/*
@@ -320,7 +344,10 @@ u64 cpu_clock(int cpu)
320 */ 344 */
321u64 local_clock(void) 345u64 local_clock(void)
322{ 346{
323 return sched_clock_cpu(raw_smp_processor_id()); 347 if (static_key_false(&__sched_clock_stable))
348 return sched_clock_cpu(raw_smp_processor_id());
349
350 return sched_clock();
324} 351}
325 352
326#else /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */ 353#else /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */
@@ -340,12 +367,12 @@ u64 sched_clock_cpu(int cpu)
340 367
341u64 cpu_clock(int cpu) 368u64 cpu_clock(int cpu)
342{ 369{
343 return sched_clock_cpu(cpu); 370 return sched_clock();
344} 371}
345 372
346u64 local_clock(void) 373u64 local_clock(void)
347{ 374{
348 return sched_clock_cpu(0); 375 return sched_clock();
349} 376}
350 377
351#endif /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */ 378#endif /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */
diff --git a/kernel/sched/debug.c b/kernel/sched/debug.c
index 374fe04a5e6e..dd52e7ffb10e 100644
--- a/kernel/sched/debug.c
+++ b/kernel/sched/debug.c
@@ -371,7 +371,7 @@ static void sched_debug_header(struct seq_file *m)
371 PN(cpu_clk); 371 PN(cpu_clk);
372 P(jiffies); 372 P(jiffies);
373#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK 373#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
374 P(sched_clock_stable); 374 P(sched_clock_stable());
375#endif 375#endif
376#undef PN 376#undef PN
377#undef P 377#undef P
diff --git a/kernel/time/tick-sched.c b/kernel/time/tick-sched.c
index ea20f7d1ac2c..c833249ab0fb 100644
--- a/kernel/time/tick-sched.c
+++ b/kernel/time/tick-sched.c
@@ -177,7 +177,7 @@ static bool can_stop_full_tick(void)
177 * TODO: kick full dynticks CPUs when 177 * TODO: kick full dynticks CPUs when
178 * sched_clock_stable is set. 178 * sched_clock_stable is set.
179 */ 179 */
180 if (!sched_clock_stable) { 180 if (!sched_clock_stable()) {
181 trace_tick_stop(0, "unstable sched clock\n"); 181 trace_tick_stop(0, "unstable sched clock\n");
182 /* 182 /*
183 * Don't allow the user to think they can get 183 * Don't allow the user to think they can get
diff --git a/kernel/trace/ring_buffer.c b/kernel/trace/ring_buffer.c
index cc2f66f68dc5..294b8a271a04 100644
--- a/kernel/trace/ring_buffer.c
+++ b/kernel/trace/ring_buffer.c
@@ -2558,7 +2558,7 @@ rb_reserve_next_event(struct ring_buffer *buffer,
2558 if (unlikely(test_time_stamp(delta))) { 2558 if (unlikely(test_time_stamp(delta))) {
2559 int local_clock_stable = 1; 2559 int local_clock_stable = 1;
2560#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK 2560#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
2561 local_clock_stable = sched_clock_stable; 2561 local_clock_stable = sched_clock_stable();
2562#endif 2562#endif
2563 WARN_ONCE(delta > (1ULL << 59), 2563 WARN_ONCE(delta > (1ULL << 59),
2564 KERN_WARNING "Delta way too big! %llu ts=%llu write stamp = %llu\n%s", 2564 KERN_WARNING "Delta way too big! %llu ts=%llu write stamp = %llu\n%s",