diff options
author | Lai Jiangshan <laijs@cn.fujitsu.com> | 2009-03-18 04:42:57 -0400 |
---|---|---|
committer | Steven Rostedt <srostedt@redhat.com> | 2009-03-18 20:36:59 -0400 |
commit | e9d9df44736d116726f4596f7e2f9ce2764ffc0a (patch) | |
tree | bca129639885fa7288b925e5053f3787fa7e625a /arch/x86 | |
parent | 4acd4d00f716873e27e7b60ae292cbdbfae674dd (diff) |
ftrace: protect running nmi (V3)
While reviewing the sensitive code in ftrace_nmi_enter(), I found that
the atomic variable nmi_running does protect an NMI against do_ftrace_mod_code(),
but it cannot protect an NMI that has already entered against another NMI that modifies code in ftrace_nmi_enter().
cpu#1 | cpu#2 | cpu#3
ftrace_nmi_enter() | do_ftrace_mod_code() |
not modify | |
------------------------|-----------------------|--
executing | set mod_code_write = 1|
executing --|-----------------------|--------------------
executing | | ftrace_nmi_enter()
executing | | do modify
------------------------|-----------------------|-----------------
ftrace_nmi_exit() | |
cpu#3 may be modifying code that is still being executed on cpu#1;
this has undefined results and may cause a GPF. This patch
prevents that from occurring.
Signed-off-by: Lai Jiangshan <laijs@cn.fujitsu.com>
LKML-Reference: <49C0B411.30003@cn.fujitsu.com>
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Diffstat (limited to 'arch/x86')
-rw-r--r-- | arch/x86/kernel/ftrace.c | 63 |
1 files changed, 40 insertions, 23 deletions
diff --git a/arch/x86/kernel/ftrace.c b/arch/x86/kernel/ftrace.c index 1d0d7f42efe3..57b33edb7ce3 100644 --- a/arch/x86/kernel/ftrace.c +++ b/arch/x86/kernel/ftrace.c | |||
@@ -79,11 +79,11 @@ static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr) | |||
79 | * | 79 | * |
80 | * 1) Put the instruction pointer into the IP buffer | 80 | * 1) Put the instruction pointer into the IP buffer |
81 | * and the new code into the "code" buffer. | 81 | * and the new code into the "code" buffer. |
82 | * 2) Set a flag that says we are modifying code | 82 | * 2) Wait for any running NMIs to finish and set a flag that says |
83 | * 3) Wait for any running NMIs to finish. | 83 | * we are modifying code, it is done in an atomic operation. |
84 | * 4) Write the code | 84 | * 3) Write the code |
85 | * 5) clear the flag. | 85 | * 4) clear the flag. |
86 | * 6) Wait for any running NMIs to finish. | 86 | * 5) Wait for any running NMIs to finish. |
87 | * | 87 | * |
88 | * If an NMI is executed, the first thing it does is to call | 88 | * If an NMI is executed, the first thing it does is to call |
89 | * "ftrace_nmi_enter". This will check if the flag is set to write | 89 | * "ftrace_nmi_enter". This will check if the flag is set to write |
@@ -95,9 +95,9 @@ static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr) | |||
95 | * are the same as what exists. | 95 | * are the same as what exists. |
96 | */ | 96 | */ |
97 | 97 | ||
98 | #define MOD_CODE_WRITE_FLAG (1 << 31) /* set when NMI should do the write */ | ||
98 | static atomic_t nmi_running = ATOMIC_INIT(0); | 99 | static atomic_t nmi_running = ATOMIC_INIT(0); |
99 | static int mod_code_status; /* holds return value of text write */ | 100 | static int mod_code_status; /* holds return value of text write */ |
100 | static int mod_code_write; /* set when NMI should do the write */ | ||
101 | static void *mod_code_ip; /* holds the IP to write to */ | 101 | static void *mod_code_ip; /* holds the IP to write to */ |
102 | static void *mod_code_newcode; /* holds the text to write to the IP */ | 102 | static void *mod_code_newcode; /* holds the text to write to the IP */ |
103 | 103 | ||
@@ -114,6 +114,20 @@ int ftrace_arch_read_dyn_info(char *buf, int size) | |||
114 | return r; | 114 | return r; |
115 | } | 115 | } |
116 | 116 | ||
117 | static void clear_mod_flag(void) | ||
118 | { | ||
119 | int old = atomic_read(&nmi_running); | ||
120 | |||
121 | for (;;) { | ||
122 | int new = old & ~MOD_CODE_WRITE_FLAG; | ||
123 | |||
124 | if (old == new) | ||
125 | break; | ||
126 | |||
127 | old = atomic_cmpxchg(&nmi_running, old, new); | ||
128 | } | ||
129 | } | ||
130 | |||
117 | static void ftrace_mod_code(void) | 131 | static void ftrace_mod_code(void) |
118 | { | 132 | { |
119 | /* | 133 | /* |
@@ -127,27 +141,39 @@ static void ftrace_mod_code(void) | |||
127 | 141 | ||
128 | /* if we fail, then kill any new writers */ | 142 | /* if we fail, then kill any new writers */ |
129 | if (mod_code_status) | 143 | if (mod_code_status) |
130 | mod_code_write = 0; | 144 | clear_mod_flag(); |
131 | } | 145 | } |
132 | 146 | ||
133 | void ftrace_nmi_enter(void) | 147 | void ftrace_nmi_enter(void) |
134 | { | 148 | { |
135 | atomic_inc(&nmi_running); | 149 | if (atomic_inc_return(&nmi_running) & MOD_CODE_WRITE_FLAG) { |
136 | /* Must have nmi_running seen before reading write flag */ | 150 | smp_rmb(); |
137 | smp_mb(); | ||
138 | if (mod_code_write) { | ||
139 | ftrace_mod_code(); | 151 | ftrace_mod_code(); |
140 | atomic_inc(&nmi_update_count); | 152 | atomic_inc(&nmi_update_count); |
141 | } | 153 | } |
154 | /* Must have previous changes seen before executions */ | ||
155 | smp_mb(); | ||
142 | } | 156 | } |
143 | 157 | ||
144 | void ftrace_nmi_exit(void) | 158 | void ftrace_nmi_exit(void) |
145 | { | 159 | { |
146 | /* Finish all executions before clearing nmi_running */ | 160 | /* Finish all executions before clearing nmi_running */ |
147 | smp_wmb(); | 161 | smp_mb(); |
148 | atomic_dec(&nmi_running); | 162 | atomic_dec(&nmi_running); |
149 | } | 163 | } |
150 | 164 | ||
165 | static void wait_for_nmi_and_set_mod_flag(void) | ||
166 | { | ||
167 | if (!atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)) | ||
168 | return; | ||
169 | |||
170 | do { | ||
171 | cpu_relax(); | ||
172 | } while (atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)); | ||
173 | |||
174 | nmi_wait_count++; | ||
175 | } | ||
176 | |||
151 | static void wait_for_nmi(void) | 177 | static void wait_for_nmi(void) |
152 | { | 178 | { |
153 | if (!atomic_read(&nmi_running)) | 179 | if (!atomic_read(&nmi_running)) |
@@ -167,14 +193,9 @@ do_ftrace_mod_code(unsigned long ip, void *new_code) | |||
167 | mod_code_newcode = new_code; | 193 | mod_code_newcode = new_code; |
168 | 194 | ||
169 | /* The buffers need to be visible before we let NMIs write them */ | 195 | /* The buffers need to be visible before we let NMIs write them */ |
170 | smp_wmb(); | ||
171 | |||
172 | mod_code_write = 1; | ||
173 | |||
174 | /* Make sure write bit is visible before we wait on NMIs */ | ||
175 | smp_mb(); | 196 | smp_mb(); |
176 | 197 | ||
177 | wait_for_nmi(); | 198 | wait_for_nmi_and_set_mod_flag(); |
178 | 199 | ||
179 | /* Make sure all running NMIs have finished before we write the code */ | 200 | /* Make sure all running NMIs have finished before we write the code */ |
180 | smp_mb(); | 201 | smp_mb(); |
@@ -182,13 +203,9 @@ do_ftrace_mod_code(unsigned long ip, void *new_code) | |||
182 | ftrace_mod_code(); | 203 | ftrace_mod_code(); |
183 | 204 | ||
184 | /* Make sure the write happens before clearing the bit */ | 205 | /* Make sure the write happens before clearing the bit */ |
185 | smp_wmb(); | ||
186 | |||
187 | mod_code_write = 0; | ||
188 | |||
189 | /* make sure NMIs see the cleared bit */ | ||
190 | smp_mb(); | 206 | smp_mb(); |
191 | 207 | ||
208 | clear_mod_flag(); | ||
192 | wait_for_nmi(); | 209 | wait_for_nmi(); |
193 | 210 | ||
194 | return mod_code_status; | 211 | return mod_code_status; |