path: root/arch/x86/kernel/ftrace.c
author     Steven Rostedt <rostedt@goodmis.org>  2008-08-14 18:05:05 -0400
committer  Ingo Molnar <mingo@elte.hu>           2008-10-14 04:35:01 -0400
commit     732f3ca7d4ba3c1be8d051d52302ef441ee7748b (patch)
tree       503f2c44e3a1617cb4aa45454071cb52330574b9 /arch/x86/kernel/ftrace.c
parent     0a37605c2261a06d8cafc62dee11374ad676c8c4 (diff)
ftrace: use only 5 byte nops for x86
Mathieu Desnoyers revealed a bug in the original code. The nop that is used to replace the mcount caller can be a two-part nop. This runs the risk that a process is preempted after executing the first part of the nop, but before the second part.

The ftrace code calls kstop_machine to keep multiple CPUs from executing code that is being modified, but it does not protect against a task being preempted in the middle of a two-part nop.

If that preemption happens while the tracer is being enabled, then after kstop_machine runs, all of those nops will have become calls to the trace function. When the task that was preempted between the two nops runs again, it will execute only half of the call to the trace function, which can crash the system.

This patch instead uses what both the latest Intel and AMD specs suggest: the P6_NOP5 sequence "0x0f 0x1f 0x44 0x00 0x00". Note that some older CPUs and QEMU might fault on this nop, so the nop is first executed with fault handling. If it faults, the code "0x66 0x66 0x66 0x66 0x90" is used instead. If that also faults, it defaults to a simple "jmp 1f; .byte 0x00 0x00 0x00; 1:". The jmp is not optimal, but it will do if the first two cannot be executed.

TODO: examine the cpuid to determine which nop to use.

Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
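For illustration only, here is a minimal user-space sketch (not part of the patch) of the byte patterns the changelog talks about: the 5-byte near call that an mcount call site occupies (0xe8 plus a 32-bit relative offset, the standard x86 encoding) and the three 5-byte nop candidates it can be replaced with. The encode_call() helper and the fake addresses are assumptions made up for this sketch.

    /* Hypothetical user-space sketch of the 5-byte patterns discussed above.
     * encode_call() and the addresses are illustrative only; they are not
     * taken from the kernel patch itself.
     */
    #include <stdint.h>
    #include <stdio.h>
    #include <string.h>

    #define MCOUNT_INSN_SIZE 5

    /* Preferred: P6_NOP5, a single 5-byte instruction (Intel/AMD recommended). */
    static const unsigned char p6_nop5[MCOUNT_INSN_SIZE]  = { 0x0f, 0x1f, 0x44, 0x00, 0x00 };
    /* Fallback: 0x66 operand-size prefixes plus 0x90, still one instruction. */
    static const unsigned char nop5_66[MCOUNT_INSN_SIZE]  = { 0x66, 0x66, 0x66, 0x66, 0x90 };
    /* Last resort: a 2-byte "jmp +3" that skips the remaining 3 padding bytes. */
    static const unsigned char jmp_nop5[MCOUNT_INSN_SIZE] = { 0xeb, 0x03, 0x00, 0x00, 0x00 };

    /* Encode a 5-byte near call (0xe8 + rel32) from `site` to `target`.
     * It is the same size as the nops above, so a call site can be rewritten
     * in place with a single 5-byte instruction in either direction. */
    static void encode_call(unsigned char insn[MCOUNT_INSN_SIZE],
                            uintptr_t site, uintptr_t target)
    {
            int32_t rel = (int32_t)(target - (site + MCOUNT_INSN_SIZE));

            insn[0] = 0xe8;
            memcpy(&insn[1], &rel, sizeof(rel));
    }

    int main(void)
    {
            unsigned char call[MCOUNT_INSN_SIZE];
            int i;

            encode_call(call, 0x1000, 0x2000);      /* fake addresses */

            printf("call mcount :");
            for (i = 0; i < MCOUNT_INSN_SIZE; i++)
                    printf(" %02x", call[i]);
            printf("\nP6_NOP5     : %02x %02x %02x %02x %02x\n",
                   p6_nop5[0], p6_nop5[1], p6_nop5[2], p6_nop5[3], p6_nop5[4]);
            printf("66-prefixed : %02x %02x %02x %02x %02x\n",
                   nop5_66[0], nop5_66[1], nop5_66[2], nop5_66[3], nop5_66[4]);
            printf("jmp-style   : %02x %02x %02x %02x %02x\n",
                   jmp_nop5[0], jmp_nop5[1], jmp_nop5[2], jmp_nop5[3], jmp_nop5[4]);
            return 0;
    }

Because every candidate is exactly MCOUNT_INSN_SIZE bytes, a task can never sit between two halves of the replacement: there is only one instruction at the call site at any time.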
Diffstat (limited to 'arch/x86/kernel/ftrace.c')
-rw-r--r--  arch/x86/kernel/ftrace.c  68
1 file changed, 61 insertions(+), 7 deletions(-)
diff --git a/arch/x86/kernel/ftrace.c b/arch/x86/kernel/ftrace.c
index 96aadbfedcc6..4151c91254e8 100644
--- a/arch/x86/kernel/ftrace.c
+++ b/arch/x86/kernel/ftrace.c
@@ -16,8 +16,8 @@
 #include <linux/init.h>
 #include <linux/list.h>
 
-#include <asm/alternative.h>
 #include <asm/ftrace.h>
+#include <asm/nops.h>
 
 
 /* Long is fine, even if it is only 4 bytes ;-) */
@@ -119,13 +119,67 @@ notrace int ftrace_mcount_set(unsigned long *data)
 
 int __init ftrace_dyn_arch_init(void *data)
 {
-        const unsigned char *const *noptable = find_nop_table();
-
-        /* This is running in kstop_machine */
-
-        ftrace_mcount_set(data);
+        extern const unsigned char ftrace_test_p6nop[];
+        extern const unsigned char ftrace_test_nop5[];
+        extern const unsigned char ftrace_test_jmp[];
+        int faulted = 0;
 
-        ftrace_nop = (unsigned long *)noptable[MCOUNT_INSN_SIZE];
+        /*
+         * There is no good nop for all x86 archs.
+         * We will default to using the P6_NOP5, but first we
+         * will test to make sure that the nop will actually
+         * work on this CPU. If it faults, we will then
+         * go to a lesser efficient 5 byte nop. If that fails
+         * we then just use a jmp as our nop. This isn't the most
+         * efficient nop, but we can not use a multi part nop
+         * since we would then risk being preempted in the middle
+         * of that nop, and if we enabled tracing then, it might
+         * cause a system crash.
+         *
+         * TODO: check the cpuid to determine the best nop.
+         */
+        asm volatile (
+                "jmp ftrace_test_jmp\n"
+                /* This code needs to stay around */
+                ".section .text, \"ax\"\n"
+                "ftrace_test_jmp:"
+                "jmp ftrace_test_p6nop\n"
+                ".byte 0x00,0x00,0x00\n"  /* 2 byte jmp + 3 bytes */
+                "ftrace_test_p6nop:"
+                P6_NOP5
+                "jmp 1f\n"
+                "ftrace_test_nop5:"
+                ".byte 0x66,0x66,0x66,0x66,0x90\n"
+                "jmp 1f\n"
+                ".previous\n"
+                "1:"
+                ".section .fixup, \"ax\"\n"
+                "2: movl $1, %0\n"
+                "   jmp ftrace_test_nop5\n"
+                "3: movl $2, %0\n"
+                "   jmp 1b\n"
+                ".previous\n"
+                _ASM_EXTABLE(ftrace_test_p6nop, 2b)
+                _ASM_EXTABLE(ftrace_test_nop5, 3b)
+                : "=r"(faulted) : "0" (faulted));
+
+        switch (faulted) {
+        case 0:
+                pr_info("ftrace: converting mcount calls to 0f 1f 44 00 00\n");
+                ftrace_nop = (unsigned long *)ftrace_test_p6nop;
+                break;
+        case 1:
+                pr_info("ftrace: converting mcount calls to 66 66 66 66 90\n");
+                ftrace_nop = (unsigned long *)ftrace_test_nop5;
+                break;
+        case 2:
+                pr_info("ftrace: converting mcount calls to jmp 1f\n");
+                ftrace_nop = (unsigned long *)ftrace_test_jmp;
+                break;
+        }
+
+        /* The return code is retured via data */
+        *(unsigned long *)data = 0;
 
         return 0;
 }
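As a rough analogy to the exception-table probing done in ftrace_dyn_arch_init() above, the following user-space sketch executes a 5-byte nop candidate from an executable buffer and reports whether it faults. This is an illustration only: the SIGILL/sigsetjmp approach and the nop_faults() helper are assumptions made for this example, not the kernel's mechanism (which relies on _ASM_EXTABLE fixups at early boot).

    /* User-space sketch: probe whether this CPU accepts a 5-byte nop
     * encoding by executing it and catching SIGILL. Loosely mirrors the
     * idea of the fixup sections in the patch; not kernel code. */
    #include <setjmp.h>
    #include <signal.h>
    #include <stdio.h>
    #include <string.h>
    #include <sys/mman.h>

    static sigjmp_buf probe_env;

    static void sigill_handler(int sig)
    {
            (void)sig;
            siglongjmp(probe_env, 1);       /* jump back: the nop faulted */
    }

    /* Copy a 5-byte nop plus a ret into executable memory and run it.
     * Returns 1 if it faulted, 0 if it executed, -1 on setup failure. */
    static int nop_faults(const unsigned char nop[5])
    {
            unsigned char *buf = mmap(NULL, 4096,
                                      PROT_READ | PROT_WRITE | PROT_EXEC,
                                      MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
            volatile int faulted;

            if (buf == MAP_FAILED)
                    return -1;

            memcpy(buf, nop, 5);
            buf[5] = 0xc3;                  /* ret, so the call returns */

            if (sigsetjmp(probe_env, 1) == 0) {
                    ((void (*)(void))buf)();        /* try the nop */
                    faulted = 0;
            } else {
                    faulted = 1;
            }
            munmap(buf, 4096);
            return faulted;
    }

    int main(void)
    {
            static const unsigned char p6_nop5[5] = { 0x0f, 0x1f, 0x44, 0x00, 0x00 };
            static const unsigned char nop5_66[5] = { 0x66, 0x66, 0x66, 0x66, 0x90 };
            struct sigaction sa;

            memset(&sa, 0, sizeof(sa));
            sa.sa_handler = sigill_handler;
            sigemptyset(&sa.sa_mask);
            sigaction(SIGILL, &sa, NULL);

            printf("P6_NOP5        : %s\n", nop_faults(p6_nop5) ? "faulted" : "ok");
            printf("66 66 66 66 90 : %s\n", nop_faults(nop5_66) ? "faulted" : "ok");
            return 0;
    }

On any reasonably modern CPU both probes print "ok", which is why the patch only falls back to the prefixed nop or the short jmp when the preferred P6_NOP5 actually faults.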