diff options
| author | Lai Jiangshan <laijs@cn.fujitsu.com> | 2009-03-18 04:42:57 -0400 |
|---|---|---|
| committer | Steven Rostedt <srostedt@redhat.com> | 2009-03-18 20:36:59 -0400 |
| commit | e9d9df44736d116726f4596f7e2f9ce2764ffc0a (patch) | |
| tree | bca129639885fa7288b925e5053f3787fa7e625a | |
| parent | 4acd4d00f716873e27e7b60ae292cbdbfae674dd (diff) | |
ftrace: protect running nmi (V3)
While reviewing the sensitive code in ftrace_nmi_enter(), I found that
the atomic variable nmi_running does protect an NMI against do_ftrace_mod_code(),
but it cannot protect an NMI that has already entered against another NMI that is in ftrace_nmi_enter().
cpu#1                   | cpu#2                 | cpu#3
ftrace_nmi_enter()      | do_ftrace_mod_code()  |
  not modify            |                       |
------------------------|-----------------------|--
executing               | set mod_code_write = 1|
executing             --|-----------------------|--------------------
executing               |                       | ftrace_nmi_enter()
executing               |                       |    do modify
------------------------|-----------------------|-----------------
ftrace_nmi_exit()       |                       |
cpu#3 may be modifying code which is still being executed on cpu#1.
This has undefined results and may cause a GPF; this patch
prevents that from occurring.
Signed-off-by: Lai Jiangshan <laijs@cn.fujitsu.com>
LKML-Reference: <49C0B411.30003@cn.fujitsu.com>
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
| -rw-r--r-- | arch/x86/kernel/ftrace.c | 63 |
1 files changed, 40 insertions, 23 deletions
diff --git a/arch/x86/kernel/ftrace.c b/arch/x86/kernel/ftrace.c index 1d0d7f42efe3..57b33edb7ce3 100644 --- a/arch/x86/kernel/ftrace.c +++ b/arch/x86/kernel/ftrace.c | |||
| @@ -79,11 +79,11 @@ static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr) | |||
| 79 | * | 79 | * |
| 80 | * 1) Put the instruction pointer into the IP buffer | 80 | * 1) Put the instruction pointer into the IP buffer |
| 81 | * and the new code into the "code" buffer. | 81 | * and the new code into the "code" buffer. |
| 82 | * 2) Set a flag that says we are modifying code | 82 | * 2) Wait for any running NMIs to finish and set a flag that says |
| 83 | * 3) Wait for any running NMIs to finish. | 83 | * we are modifying code, it is done in an atomic operation. |
| 84 | * 4) Write the code | 84 | * 3) Write the code |
| 85 | * 5) clear the flag. | 85 | * 4) clear the flag. |
| 86 | * 6) Wait for any running NMIs to finish. | 86 | * 5) Wait for any running NMIs to finish. |
| 87 | * | 87 | * |
| 88 | * If an NMI is executed, the first thing it does is to call | 88 | * If an NMI is executed, the first thing it does is to call |
| 89 | * "ftrace_nmi_enter". This will check if the flag is set to write | 89 | * "ftrace_nmi_enter". This will check if the flag is set to write |
| @@ -95,9 +95,9 @@ static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr) | |||
| 95 | * are the same as what exists. | 95 | * are the same as what exists. |
| 96 | */ | 96 | */ |
| 97 | 97 | ||
| 98 | #define MOD_CODE_WRITE_FLAG (1 << 31) /* set when NMI should do the write */ | ||
| 98 | static atomic_t nmi_running = ATOMIC_INIT(0); | 99 | static atomic_t nmi_running = ATOMIC_INIT(0); |
| 99 | static int mod_code_status; /* holds return value of text write */ | 100 | static int mod_code_status; /* holds return value of text write */ |
| 100 | static int mod_code_write; /* set when NMI should do the write */ | ||
| 101 | static void *mod_code_ip; /* holds the IP to write to */ | 101 | static void *mod_code_ip; /* holds the IP to write to */ |
| 102 | static void *mod_code_newcode; /* holds the text to write to the IP */ | 102 | static void *mod_code_newcode; /* holds the text to write to the IP */ |
| 103 | 103 | ||
| @@ -114,6 +114,20 @@ int ftrace_arch_read_dyn_info(char *buf, int size) | |||
| 114 | return r; | 114 | return r; |
| 115 | } | 115 | } |
| 116 | 116 | ||
| 117 | static void clear_mod_flag(void) | ||
| 118 | { | ||
| 119 | int old = atomic_read(&nmi_running); | ||
| 120 | |||
| 121 | for (;;) { | ||
| 122 | int new = old & ~MOD_CODE_WRITE_FLAG; | ||
| 123 | |||
| 124 | if (old == new) | ||
| 125 | break; | ||
| 126 | |||
| 127 | old = atomic_cmpxchg(&nmi_running, old, new); | ||
| 128 | } | ||
| 129 | } | ||
| 130 | |||
| 117 | static void ftrace_mod_code(void) | 131 | static void ftrace_mod_code(void) |
| 118 | { | 132 | { |
| 119 | /* | 133 | /* |
| @@ -127,27 +141,39 @@ static void ftrace_mod_code(void) | |||
| 127 | 141 | ||
| 128 | /* if we fail, then kill any new writers */ | 142 | /* if we fail, then kill any new writers */ |
| 129 | if (mod_code_status) | 143 | if (mod_code_status) |
| 130 | mod_code_write = 0; | 144 | clear_mod_flag(); |
| 131 | } | 145 | } |
| 132 | 146 | ||
| 133 | void ftrace_nmi_enter(void) | 147 | void ftrace_nmi_enter(void) |
| 134 | { | 148 | { |
| 135 | atomic_inc(&nmi_running); | 149 | if (atomic_inc_return(&nmi_running) & MOD_CODE_WRITE_FLAG) { |
| 136 | /* Must have nmi_running seen before reading write flag */ | 150 | smp_rmb(); |
| 137 | smp_mb(); | ||
| 138 | if (mod_code_write) { | ||
| 139 | ftrace_mod_code(); | 151 | ftrace_mod_code(); |
| 140 | atomic_inc(&nmi_update_count); | 152 | atomic_inc(&nmi_update_count); |
| 141 | } | 153 | } |
| 154 | /* Must have previous changes seen before executions */ | ||
| 155 | smp_mb(); | ||
| 142 | } | 156 | } |
| 143 | 157 | ||
| 144 | void ftrace_nmi_exit(void) | 158 | void ftrace_nmi_exit(void) |
| 145 | { | 159 | { |
| 146 | /* Finish all executions before clearing nmi_running */ | 160 | /* Finish all executions before clearing nmi_running */ |
| 147 | smp_wmb(); | 161 | smp_mb(); |
| 148 | atomic_dec(&nmi_running); | 162 | atomic_dec(&nmi_running); |
| 149 | } | 163 | } |
| 150 | 164 | ||
| 165 | static void wait_for_nmi_and_set_mod_flag(void) | ||
| 166 | { | ||
| 167 | if (!atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)) | ||
| 168 | return; | ||
| 169 | |||
| 170 | do { | ||
| 171 | cpu_relax(); | ||
| 172 | } while (atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)); | ||
| 173 | |||
| 174 | nmi_wait_count++; | ||
| 175 | } | ||
| 176 | |||
| 151 | static void wait_for_nmi(void) | 177 | static void wait_for_nmi(void) |
| 152 | { | 178 | { |
| 153 | if (!atomic_read(&nmi_running)) | 179 | if (!atomic_read(&nmi_running)) |
| @@ -167,14 +193,9 @@ do_ftrace_mod_code(unsigned long ip, void *new_code) | |||
| 167 | mod_code_newcode = new_code; | 193 | mod_code_newcode = new_code; |
| 168 | 194 | ||
| 169 | /* The buffers need to be visible before we let NMIs write them */ | 195 | /* The buffers need to be visible before we let NMIs write them */ |
| 170 | smp_wmb(); | ||
| 171 | |||
| 172 | mod_code_write = 1; | ||
| 173 | |||
| 174 | /* Make sure write bit is visible before we wait on NMIs */ | ||
| 175 | smp_mb(); | 196 | smp_mb(); |
| 176 | 197 | ||
| 177 | wait_for_nmi(); | 198 | wait_for_nmi_and_set_mod_flag(); |
| 178 | 199 | ||
| 179 | /* Make sure all running NMIs have finished before we write the code */ | 200 | /* Make sure all running NMIs have finished before we write the code */ |
| 180 | smp_mb(); | 201 | smp_mb(); |
| @@ -182,13 +203,9 @@ do_ftrace_mod_code(unsigned long ip, void *new_code) | |||
| 182 | ftrace_mod_code(); | 203 | ftrace_mod_code(); |
| 183 | 204 | ||
| 184 | /* Make sure the write happens before clearing the bit */ | 205 | /* Make sure the write happens before clearing the bit */ |
| 185 | smp_wmb(); | ||
| 186 | |||
| 187 | mod_code_write = 0; | ||
| 188 | |||
| 189 | /* make sure NMIs see the cleared bit */ | ||
| 190 | smp_mb(); | 206 | smp_mb(); |
| 191 | 207 | ||
| 208 | clear_mod_flag(); | ||
| 192 | wait_for_nmi(); | 209 | wait_for_nmi(); |
| 193 | 210 | ||
| 194 | return mod_code_status; | 211 | return mod_code_status; |
